onnx2versal/qlinearsoftmax_8h_source.html

#ifndef QLINEARSOFTMAX_H_

#define QLINEARSOFTMAX_H_


#include <adf.h>

#include <assert.h>


/**
 * @brief Scalar implementation of the QLinearSoftmax kernel.
 *
 * Stores the quantization parameters handed to the constructor and declares
 * filter() as the kernel entry point. Only the declaration of filter() is
 * visible in this header.
 *
 * @tparam TT         Element type of the input window and output stream;
 *                    registerKernelClass() requires int8_t or uint8_t.
 * @tparam INP_H      NOTE(review): presumably the number of input rows -- confirm against filter().
 * @tparam INP_W      NOTE(review): presumably the unpadded row width -- confirm against filter().
 * @tparam INP_W_PAD  NOTE(review): presumably the padded row width -- confirm against filter().
 */
template <typename TT, int INP_H, int INP_W, int INP_W_PAD>
class QLinearSoftmaxScalar {
  private:
    // Quantization parameters, copied unchanged from the constructor arguments.
    float x_scale;
    float y_scale;
    TT x_zero;
    TT y_zero;

    // Not initialized by the constructor in this header.
    // NOTE(review): presumably written by filter() before it is read -- confirm.
    float scale;

  public:
    /**
     * @brief Stores the four quantization parameters; `scale` is left untouched.
     *
     * @param x_scale  NOTE(review): presumably the input tensor scale -- confirm.
     * @param y_scale  NOTE(review): presumably the output tensor scale -- confirm.
     * @param x_zero   NOTE(review): presumably the input zero point -- confirm.
     * @param y_zero   NOTE(review): presumably the output zero point -- confirm.
     */
    QLinearSoftmaxScalar(float x_scale, float y_scale, TT x_zero, TT y_zero)
      : x_scale(x_scale),
        y_scale(y_scale),
        x_zero(x_zero),
        y_zero(y_zero)
    {}

    /**
     * @brief Kernel entry point (declared only in this header).
     *
     * @param in   Input window of TT elements.
     * @param out  Output stream of TT elements.
     */
    void filter(input_window<TT>* in, output_stream<TT>* out);

    /**
     * @brief Checks the element type at compile time and passes filter()
     *        to the REGISTER_FUNCTION macro.
     */
    static void registerKernelClass() {
      static_assert(std::is_same<TT, int8_t>::value || std::is_same<TT, uint8_t>::value);
      REGISTER_FUNCTION(QLinearSoftmaxScalar::filter);
    }
};


/**
 * @brief Vector implementation of the QLinearSoftmax kernel using the
 *        fastexp2 method, with float multiplication for the exp estimation.
 *
 * The constructor and filter() are declared only in this header.
 *
 * @tparam TT         Element type of the input window and output stream;
 *                    registerKernelClass() requires int8_t or uint8_t.
 * @tparam INP_H      NOTE(review): presumably the number of input rows -- confirm against filter().
 * @tparam INP_W      NOTE(review): presumably the unpadded row width -- confirm against filter().
 * @tparam INP_W_PAD  Must be a multiple of 16 (checked in registerKernelClass()).
 *                    NOTE(review): presumably the padded row width -- confirm.
 */
template <typename TT, int INP_H, int INP_W, int INP_W_PAD>
class QLinearSoftmaxFloatmul {
  private:
    // Quantization parameters.
    // NOTE(review): presumably stored by the out-of-view constructor -- confirm.
    float x_scale;
    float y_scale;
    TT x_zero;
    TT y_zero;

    // Shift amounts with in-class defaults.
    // NOTE(review): presumably fixed-point shifts for the exp and output stages -- confirm.
    int EXP_BITSHIFT = 18;
    int OUT_BITSHIFT = 10;

    // Precomputed values.
    // NOTE(review): presumably filled in by the constructor -- confirm.
    float fastexp_scale;
    int16_t min_value;

  public:
    /**
     * @brief Constructor (declared only in this header).
     *
     * @param x_scale  NOTE(review): presumably the input tensor scale -- confirm.
     * @param y_scale  NOTE(review): presumably the output tensor scale -- confirm.
     * @param x_zero   NOTE(review): presumably the input zero point -- confirm.
     * @param y_zero   NOTE(review): presumably the output zero point -- confirm.
     */
    QLinearSoftmaxFloatmul(float x_scale, float y_scale, TT x_zero, TT y_zero);

    /**
     * @brief Kernel entry point (declared only in this header).
     *
     * @param in   Input window of TT elements.
     * @param out  Output stream of TT elements.
     */
    void filter(input_window<TT>* in, output_stream<TT>* out);

    /**
     * @brief Checks the element type and the INP_W_PAD alignment at compile
     *        time, then passes filter() to the REGISTER_FUNCTION macro.
     */
    static void registerKernelClass() {
      static_assert(std::is_same<TT, int8_t>::value || std::is_same<TT, uint8_t>::value);
      static_assert(INP_W_PAD % 16 == 0);
      REGISTER_FUNCTION(QLinearSoftmaxFloatmul::filter);
    }
};


/**
 * @brief Vector implementation of the QLinearSoftmax kernel using the
 *        fastexp2 method for a single axis.
 *
 * The constructor and filter() are declared only in this header.
 *
 * @tparam TT         Element type of the input window and output stream;
 *                    registerKernelClass() requires int8_t or uint8_t.
 * @tparam INP_H      NOTE(review): presumably the number of input rows -- confirm against filter().
 * @tparam INP_W      NOTE(review): presumably the unpadded row width -- confirm against filter().
 * @tparam INP_W_PAD  Must be a multiple of 16 (checked in registerKernelClass()).
 *                    NOTE(review): presumably the padded row width -- confirm.
 */
template <typename TT, int INP_H, int INP_W, int INP_W_PAD>
class QLinearSoftmaxSingleaxis {
  private:
    // Quantization parameters.
    // NOTE(review): presumably stored by the out-of-view constructor -- confirm.
    float x_scale;
    float y_scale;
    TT x_zero;
    TT y_zero;

    // EXP_BITSHIFT has no in-class default.
    // NOTE(review): presumably chosen by the constructor -- confirm.
    int EXP_BITSHIFT;
    int OUT_BITSHIFT = 4;

    // Precomputed values.
    // NOTE(review): presumably filled in by the constructor -- confirm.
    int16_t fastexp_scale;
    int32_t expsum_offset;
    int16_t min_value;

  public:
    /**
     * @brief Constructor (declared only in this header).
     *
     * @param x_scale  NOTE(review): presumably the input tensor scale -- confirm.
     * @param y_scale  NOTE(review): presumably the output tensor scale -- confirm.
     * @param x_zero   NOTE(review): presumably the input zero point -- confirm.
     * @param y_zero   NOTE(review): presumably the output zero point -- confirm.
     */
    QLinearSoftmaxSingleaxis(float x_scale, float y_scale, TT x_zero, TT y_zero);

    /**
     * @brief Kernel entry point (declared only in this header).
     *
     * @param in   Input window of TT elements.
     * @param out  Output stream of TT elements.
     */
    void filter(input_window<TT>* in, output_stream<TT>* out);

    /**
     * @brief Checks the element type and the INP_W_PAD alignment at compile
     *        time, then passes filter() to the REGISTER_FUNCTION macro.
     */
    static void registerKernelClass() {
      static_assert(std::is_same<TT, int8_t>::value || std::is_same<TT, uint8_t>::value);
      static_assert(INP_W_PAD % 16 == 0);
      REGISTER_FUNCTION(QLinearSoftmaxSingleaxis::filter);
    }
};


#endif // QLINEARSOFTMAX_H_

QLinearSoftmaxFloatmul
Vector implementation using fastexp2 method, float multiplication for exp estimation QLinearSoftmaxFl...
Definition qlinearsoftmax.h:65

QLinearSoftmaxScalar
Scalar implementation. QLinearSoftmaxScalar<10,20,32> takes 517922 cycles for expf,...
Definition qlinearsoftmax.h:29

QLinearSoftmaxSingleaxis
Vector implementation using fastexp2 method for single axis, QLinearSoftmaxSingleaxis<10,...
Definition qlinearsoftmax.h:107