Fused affine + ReLU activation (uses cuBLASLt epilogue on GPU when available).
More...
|
| void | set (Index input_features, Index output_features, Type weight_type=Type::FP32) |
| | Configures the underlying CombinationOp; the activation function is fixed to ReLU.
|
| |
| vector< TensorSpec > | parameter_specs () const override |
| | Returns the tensor specs of trainable parameters owned by this operator.
|
| |
| void | link_parameters (span< const TensorView > views) override |
| | Binds parameter views provided by the hosting layer.
|
| |
| void | link_gradients (span< const TensorView > views) override |
| | Binds gradient views provided by the hosting layer.
|
| |
| void | set_parameters_random () override |
| | Initializes parameters with random values.
|
| |
| void | set_parameters_glorot () override |
| | Initializes parameters using Glorot (Xavier) initialization.
|
| |
| void | forward_propagate (ForwardPropagation &fp, size_t layer, bool is_training) noexcept override |
| | Runs the operator's forward computation.
|
| |
| void | back_propagate (ForwardPropagation &fp, BackPropagation &bp, size_t layer) const noexcept override |
| | Runs the operator's backward computation, accumulating into gradient/delta buffers.
|
| |
| virtual | ~Operator ()=default |
| |
| virtual vector< TensorSpec > | state_specs () const |
| | Returns the tensor specs of persistent state owned by this operator.
|
| |
| virtual void | link_states (span< const TensorView >) |
| | Binds state views provided by the hosting layer.
|
| |
| virtual void | to_JSON (JsonWriter &) const |
| | Serializes the operator configuration to a JSON writer.
|
| |
| virtual void | from_JSON (const Json *) |
| | Restores the operator configuration from a JSON node.
|
| |
| virtual void | load_state_from_JSON (const Json *) |
| | Restores persistent state (e.g. running statistics) from a JSON node.
|
| |
| virtual void | destroy_cuda () |
| | Releases CUDA resources owned by the operator; called from destructors.
|
| |
| TensorView & | get_input (ForwardPropagation &fp, size_t layer, size_t i=0) const noexcept |
| |
| vector< TensorView > & | get_inputs (ForwardPropagation &fp, size_t layer, size_t i=0) const noexcept |
| |
| TensorView & | get_output (ForwardPropagation &fp, size_t layer, size_t i=0) const noexcept |
| |
| TensorView & | get_output_delta (BackPropagation &bp, size_t layer, size_t i=0) const noexcept |
| |
| TensorView & | get_input_delta (BackPropagation &bp, size_t layer, size_t i=0) const noexcept |
| |
Fused affine + ReLU activation (uses cuBLASLt epilogue on GPU when available).