docs/elementwise_8hpp_source.html

 #pragma once
 #include <dlprim/operator.hpp>
 namespace dlprim {
     // Forward declarations only: within this header json::value is used solely
     // as a const-reference parameter and PointwiseOperationBroadcastReduce solely
     // as the pointee of std::unique_ptr members, so complete types are not needed.
     namespace json { class value; }
     namespace core {
         class PointwiseOperationBroadcastReduce;
     }
     /// Configuration for the Elementwise operator: which operation to apply,
     /// a pair of float coefficients and an activation selector.
     struct ElementwiseConfig {
         /// Selects the element-wise operation.
         /// NOTE(review): per the enumerator names these are sum, product and
         /// maximum of the inputs - confirm against the implementation.
         enum Operation {
             elementwise_sum,
             elementwise_prod,
             elementwise_max
         };

         /// Operation to perform; defaults to elementwise_sum.
         Operation op = elementwise_sum;
         /// Two coefficients, both defaulting to 1.0f.
         /// NOTE(review): presumably one scale factor per input (a and b) - confirm.
         float coeff[2] = {1.0f,1.0f};
         /// Activation selector; defaults to StandardActivations::identity.
         /// NOTE(review): presumably applied to the result of the operation - confirm.
         StandardActivations activation = StandardActivations::identity;

         /// Build a configuration from the JSON value \a v.
         /// Defined elsewhere; the accepted keys are not visible in this header.
         static ElementwiseConfig from_json(json::value const &v);
     };

     /// Operator configured by ElementwiseConfig. The private CPU/GPU helpers
     /// below take two input tensors (a, b) and a single output tensor.
     class Elementwise : public Operator {
     public:

         /// Create the operator for context \a ctx. \a config is taken by value and
         /// defaults to a default-constructed ElementwiseConfig.
         Elementwise(Context &ctx,ElementwiseConfig config = ElementwiseConfig());
         /// Declared here and defined out of line; note the class holds
         /// std::unique_ptr members whose pointee type is only forward-declared
         /// in this header.
         virtual ~Elementwise();

         /// Name of the operator type: always the literal "Elementwise".
         virtual char const *operator_type() const
         {
             return "Elementwise";
         }

         /// Configure the operator from the input tensor specs \a in.
         /// \a out, \a parameters and \a workspace are non-const references,
         /// i.e. output arguments.
         /// NOTE(review): presumably fills the output specs, the parameter specs
         /// and the required workspace size - confirm against Operator's contract.
                 virtual void setup(std::vector<TensorSpecs> const &in,
                            std::vector<TensorSpecs> &out,
                            std::vector<TensorSpecs> &parameters,
                            size_t &workspace);

         /// Recompute for new input shapes \a in; \a out and \a ws are output
         /// arguments.
         /// NOTE(review): presumably \a ws is the workspace size - confirm.
         virtual void reshape(std::vector<Shape> const &in,
                              std::vector<Shape> &out,
                              size_t &ws);

         /// Forward computation entry point taking input, output and parameter
         /// tensors, a workspace tensor and an execution context.
                 virtual void forward(std::vector<Tensor> &input,
                              std::vector<Tensor> &output,
                              std::vector<Tensor> &parameters,
                              Tensor &workspace,
                              ExecutionContext const &ctx);

         /// Backward computation entry point; same argument layout as forward()
         /// but each entry is a TensorAndGradient.
         virtual void backward(std::vector<TensorAndGradient> &input,
                               std::vector<TensorAndGradient> &output,
                               std::vector<TensorAndGradient> &parameters,
                               Tensor &workspace,
                               ExecutionContext const &ctx);


     private:
         /// Forward helpers for two inputs \a a, \a b and one \a output. Only the
         /// GPU variant takes an ExecutionContext.
                 void forward_gpu(Tensor &a,Tensor &b,Tensor &output,ExecutionContext const &ctx);
         void forward_cpu(Tensor &a,Tensor &b,Tensor &output);

         /// Helper template indexed by an integer; declared here, defined elsewhere.
         template<int index>
         struct StridePos;

         /// NOTE(review): presumably walks dimension \a dim of shape \a s, addressing
         /// \a a and \a b through their strides and writing to \a c via \a func -
         /// confirm against the implementation.
         template<int dim,typename F>
         void loop_strides_dim(Shape s,float *a,Shape a_strides,float *b,Shape b_strides,float *c,F const &func);

         /// Same arguments as loop_strides_dim without the compile-time dimension.
         /// NOTE(review): presumably dispatches to loop_strides_dim - confirm.
         template<typename F>
         void loop_strides(Shape s,float *a,Shape a_strides,float *b,Shape b_strides,float *c,F const &func);

         /// Overloads for one, two and three source buffers (each paired with a
         /// Shape argument), a result buffer \a r with \a rs, an element functor
         /// \a func and a \a reduce functor.
         /// NOTE(review): presumably the Shape arguments following each pointer are
         /// strides and \a reduce combines values into \a r - confirm.
         template<typename F,typename R>
         void loops_reduce(Shape s,float *a,Shape as,float *r,Shape rs,F const &func,R const &reduce);
         template<typename F,typename R>
         void loops_reduce(Shape s,float *a,Shape as,float *b,Shape bs,float *r,Shape rs,F const &func,R const &reduce);
         template<typename F,typename R>
         void loops_reduce(Shape s,float *a,Shape as,float *b,Shape bs,float *c,Shape cs,float *r,Shape rs,F const &func,R const &reduce);


         /// Variants of loops_reduce carrying a compile-time dimension \a dim,
         /// again for one, two and three source buffers.
         template<int dim,typename F,typename R>
         void loops_reduce_dim(Shape s,float *a,Shape as,float *r,Shape rs,F const &func,R const &reduce);
         template<int dim,typename F,typename R>
         void loops_reduce_dim(Shape s,float *a,Shape as,float *b,Shape bs,float *r,Shape rs,F const &func,R const &reduce);
         template<int dim,typename F,typename R>
         void loops_reduce_dim(Shape s,float *a,Shape as,float *b,Shape bs,float *c,Shape cs,float *r,Shape rs,F const &func,R const &reduce);


         /// CPU backward helper over tensor pairs (a,da), (b,db), (c,dc).
         /// NOTE(review): presumably d* are the gradients of a/b/c, \a l / \a r select
         /// whether the left/right input gradient is computed, and \a ba / \a bb
         /// are accumulation factors for da/db - confirm against the implementation.
         void backward_cpu(Tensor &a,Tensor &da,
                           Tensor &b,Tensor &db,
                           Tensor &c,Tensor &dc,
                           bool l,bool r,
                           float ba,float bb);

         /// GPU backward helper; same arguments as backward_cpu plus a workspace
         /// tensor \a ws and an execution context \a e.
         void backward_gpu(Tensor &a,Tensor &da,
                           Tensor &b,Tensor &db,
                           Tensor &c,Tensor &dc,
                           Tensor &ws,
                           bool l,bool r,
                           float ba,float bb,
                           ExecutionContext const &e);
         /// GPU backward setup helper taking the input specs; \a out and \a ws are
         /// non-const references.
         /// NOTE(review): presumably creates bwd_l_/bwd_r_/bwd_both_ and reports the
         /// workspace size through \a ws - confirm.
         void setup_bwd_gpu(std::vector<TensorSpecs> const &in,std::vector<TensorSpecs> &out,size_t &ws);

         /// Operator configuration (type ElementwiseConfig).
         ElementwiseConfig config_;
         /// Data type used by the operator.
         /// NOTE(review): where it is assigned is not visible in this header.
         DataType dtype_;
         /// Owned broadcast/reduce operations.
         /// NOTE(review): by name, backward for the left input, the right input and
         /// both inputs - confirm.
         std::unique_ptr<core::PointwiseOperationBroadcastReduce> bwd_l_,bwd_r_,bwd_both_;
     };
 } // namespace

dlprim::Shape
Tensor shape.
Definition: shape.hpp:18

dlprim::Elementwise::operator_type
virtual char const * operator_type() const
name of the operator type
Definition: elementwise.hpp:28

dlprim::ElementwiseConfig
Definition: elementwise.hpp:8

dlprim::Operator
Base class for backward/forward propagation calculations for internal network.
Definition: operator.hpp:15

dlprim::Context
This is the main object that represents the pair of OpenCL platform and device; all other objects use it...
Definition: context.hpp:302

dlprim::DataType
DataType
type definition
Definition: definitions.hpp:70

dlprim::json::value
This class is central representation of json objects.
Definition: json.hpp:652

dlprim
Main namespace.
Definition: context.hpp:9

dlprim::Tensor
Central Data Container - Tensor.
Definition: tensor.hpp:99

dlprim::StandardActivations
StandardActivations
Parameterless activations that can be embedded into general kernels like inner product or convolution...
Definition: definitions.hpp:266

dlprim::Elementwise
Definition: elementwise.hpp:22

dlprim::ExecutionContext
This class is used to pass cl::Events that the kernel should wait for and/or signal event completion...
Definition: context.hpp:121