onnx2versal/softmax_8h_source.html

#ifndef SOFTMAX_H_

#define SOFTMAX_H_


#include <adf.h>

#include <assert.h>


/**
 * @brief Fast exponential helper (declaration only; defined out of line).
 *
 * The project documentation refers to Schraudolph (1999) for the method:
 * https://nic.schraudolph.org/pubs/Schraudolph99.pdf
 *
 * @param val Single-precision input value.
 * @return Result as a double.
 *         NOTE(review): accuracy and valid input range are not visible from
 *         this declaration; confirm against the definition.
 */
double fastexp(float val);


/**
 * @brief Exponential approximation helper (declaration only; defined out of line).
 *
 * Per the project documentation this approximates exp(x) with
 * (1 + x/256)^256, and the error is small for inputs in [-512, 1.5].
 *
 * @param val       Single-precision input value.
 * @param precision NOTE(review): role not visible from this declaration;
 *                  presumably controls the number of refinement steps. Confirm
 *                  against the definition.
 * @return Single-precision result.
 */
float fastexp2(float val, int precision);


/**
 * @brief Scalar softmax kernel class (declaration only; member functions are
 *        defined out of line).
 *
 * @tparam INP_H     NOTE(review): presumably the number of input rows; confirm.
 * @tparam INP_W     NOTE(review): presumably the number of valid elements per row; confirm.
 * @tparam INP_W_PAD NOTE(review): presumably the padded row width; confirm.
 */
template <int INP_H, int INP_W, int INP_W_PAD>
class SoftmaxScalar {
    private:
        // Reciprocal factorials 1/k! for k = 1..10.
        // NOTE(review): presumably series coefficients consumed by fastexp3;
        // confirm against its definition.
        float coef[10] = {
            1,                      // 1/1!
            0.5,                    // 1/2!
            0.16666666666666666,    // 1/3!
            0.041666666666666664,   // 1/4!
            0.008333333333333333,   // 1/5!
            0.001388888888888889,   // 1/6!
            0.0001984126984126984,  // 1/7!
            2.48015873015873e-05,   // 1/8!
            2.7557319223985893e-06, // 1/9!
            2.755731922398589e-07   // 1/10!
        };

        /// Private exponential helper; its definition is not part of this header.
        float fastexp3(float val, int precision);

    public:
        /**
         * @brief Kernel entry point.
         * @param in  Window of float input samples.
         * @param out Window receiving float output samples.
         */
        void filter(input_window<float>* in, output_window<float>* out);

        /// Registers filter() as this class's kernel function via REGISTER_FUNCTION.
        static void registerKernelClass() {
            REGISTER_FUNCTION(SoftmaxScalar::filter);
        }
};


/**
 * @brief Vector softmax kernel class for a single axis (declaration only;
 *        filter() is defined out of line).
 *
 * Requires INP_W_PAD to be a multiple of 8; this is enforced at compile time
 * when registerKernelClass() is instantiated.
 *
 * @tparam INP_H     NOTE(review): presumably the number of input rows; confirm.
 * @tparam INP_W     NOTE(review): presumably the number of valid elements per row; confirm.
 * @tparam INP_W_PAD Padded width; must be divisible by 8.
 */
template <int INP_H, int INP_W, int INP_W_PAD>
class SoftmaxSingleaxis {
    public:
        /**
         * @brief Kernel entry point.
         * @param in  Window of float input samples.
         * @param out Window receiving float output samples.
         */
        void filter(input_window<float>* in, output_window<float>* out);

        /// Checks the width constraint, then registers filter() via REGISTER_FUNCTION.
        static void registerKernelClass() {
            static_assert(INP_W_PAD % 8 == 0);
            REGISTER_FUNCTION(SoftmaxSingleaxis::filter);
        }
};


/**
 * @brief Vector softmax kernel class for multiple axes (declaration only;
 *        filter() is defined out of line).
 *
 * Requires INP_H to be even and INP_W_PAD to be a multiple of 8; both are
 * enforced at compile time when registerKernelClass() is instantiated.
 *
 * @tparam INP_H     Must be divisible by 2.
 * @tparam INP_W     NOTE(review): presumably the number of valid elements per row; confirm.
 * @tparam INP_W_PAD Padded width; must be divisible by 8.
 */
template <int INP_H, int INP_W, int INP_W_PAD>
class SoftmaxMultiaxis {
    public:
        /**
         * @brief Kernel entry point.
         * @param in  Window of float input samples.
         * @param out Window receiving float output samples.
         */
        void filter(input_window<float>* in, output_window<float>* out);

        /// Checks the shape constraints, then registers filter() via REGISTER_FUNCTION.
        static void registerKernelClass() {
            static_assert(INP_H % 2 == 0);
            static_assert(INP_W_PAD % 8 == 0);
            REGISTER_FUNCTION(SoftmaxMultiaxis::filter);
        }
};


#endif // SOFTMAX_H_

SoftmaxMultiaxis
Vector implementation for multiple axis. SoftmaxMultiaxis<10,10,16> takes 1082 cycles; requires INP_H % 2 == 0 and INP_W_PAD % 8 == 0.
Definition softmax.h:90

SoftmaxScalar
Scalar implementation, SoftmaxScalar<10,10,16> takes.
Definition softmax.h:42

SoftmaxSingleaxis
Vector implementation for single axis. SoftmaxSingleaxis<10,10,16> takes 1241 cycles; requires INP_W_PAD % 8 == 0.
Definition softmax.h:70

fastexp2
float fastexp2(float val, int precision)
Approximation with (1 + x/256)^256. Error is small for inputs in [-512, 1.5].
Definition qlinearsoftmax.cc:11

fastexp
double fastexp(float val)
See https://nic.schraudolph.org/pubs/Schraudolph99.pdf.
Definition softmax.cc:9