1#ifndef TMVA_SOFIE_ROPERATOR_Softmax
2#define TMVA_SOFIE_ROPERATOR_Softmax
30 ROperator_Softmax(int64_t attr_axis, std::string nameX, std::string nameY,
bool logSoftmax =
false)
39 std::vector<ETensorType>
TypeInference(std::vector<ETensorType> input)
override {
return input; }
41 std::vector<std::vector<size_t>>
ShapeInference(std::vector<std::vector<size_t>> input)
override {
47 if (model.CheckIfTensorAlreadyExist(
fNX) ==
49 throw std::runtime_error(
"TMVA SOFIE Softmax Op Input Tensor is not found in model");
52 model.AddIntermediateTensor(
fNY, model.GetTensorType(
fNX),
fShape);
54 if (model.Verbose()) {
59 model.AddNeededCustomHeader(
"vdt/exp.h");
61 model.AddNeededCustomHeader(
"vdt/log.h");
65 std::string
Generate(std::string OpName)
override {
66 OpName =
"op_" + OpName;
68 throw std::runtime_error(
"TMVA SOFIE Operator Softmax called to Generate without being initialized first");
70 std::stringstream out;
75 std::string expFunction = (
fUseVDT) ?
"vdt::fast_expf" :
"std::exp";
76 std::string logFunction = (
fUseVDT) ?
"vdt::fast_logf" :
"std::log";
79 if (axis ==
size - 1) {
80 std::string axis_size =
fShape[axis].GetVal();
83 num_rows = std::to_string(std::stoul(length_str) / std::stoul(axis_size));
85 num_rows =
"(" + length_str +
") / (" + axis_size +
")";
88 out <<
"\n" <<
SP <<
"//------ SOFTMAX - " <<
size <<
" " << length_str <<
" " << axis <<
"\n";
89 out <<
SP <<
"for (int i = 0; i < " << num_rows <<
"; ++i) {\n";
90 out <<
SP <<
SP <<
"size_t offset = i * " << axis_size <<
";\n";
91 out <<
SP <<
SP <<
fType <<
" const * x_ptr = &tensor_" <<
fNX <<
"[offset];\n";
92 out <<
SP <<
SP <<
fType <<
" * y_ptr = &tensor_" <<
fNY <<
"[offset];\n";
94 out <<
SP <<
SP <<
fType <<
" vmax = x_ptr[0];\n";
95 out <<
SP <<
SP <<
"for (int j = 1; j < " << axis_size <<
"; ++j) {\n";
96 out <<
SP <<
SP <<
SP <<
"if (x_ptr[j] > vmax) vmax = x_ptr[j];\n";
97 out <<
SP <<
SP <<
"}\n";
99 out <<
SP <<
SP <<
fType <<
" sum = 0.0;\n";
100 out <<
SP <<
SP <<
"for (int j = 0; j < " << axis_size <<
"; ++j) {\n";
101 out <<
SP <<
SP <<
SP <<
"y_ptr[j] = " << expFunction <<
"(x_ptr[j] - vmax);\n";
102 out <<
SP <<
SP <<
SP <<
"sum += y_ptr[j];\n";
103 out <<
SP <<
SP <<
"}\n";
105 out <<
SP <<
SP <<
fType <<
" inv_sum = 1.0f / sum;\n";
106 out <<
SP <<
SP <<
"for (int j = 0; j < " << axis_size <<
"; ++j) {\n";
107 out <<
SP <<
SP <<
SP <<
"y_ptr[j] *= inv_sum;\n";
109 out <<
SP <<
SP <<
SP <<
"y_ptr[j] = " << logFunction <<
"(y_ptr[j]);\n";
110 out <<
SP <<
SP <<
"}\n";
116 std::vector<std::string>
l(
size);
117 for (
size_t i = 0; i <
size; i++) {
119 for (
size_t j = 0; j < k; j++) out <<
SP;
120 l[i] = std::string(
"i") + std::to_string(i);
121 out <<
"for (int " <<
l[i] <<
" = 0; " <<
l[i] <<
" < " <<
fShape[i] <<
"; " <<
l[i] <<
"++) {\n";
125 for (
size_t j = 0; j <
size-1; j++) out <<
SP;
126 out <<
fType <<
" sum = 0.;\n";
127 for (
size_t j = 0; j <
size-1; j++) out <<
SP;
128 out <<
"size_t index = ";
130 for (
size_t i = 0; i <
size; i++) {
131 if (i == axis)
continue;
132 if (!first) out <<
" + ";
133 if (stride[i].GetVal() !=
"1")
134 out << stride[i] <<
"*";
140 for (
size_t j = 0; j <
size-1; j++) out <<
SP;
141 out <<
fType <<
" vmax = tensor_" <<
fNX <<
"[index];\n";
142 for (
size_t j = 0; j <
size-1; j++) out <<
SP;
143 out <<
"for (int i = 1; i < " <<
fShape[axis] <<
"; i++) {\n";
144 for (
size_t j = 0; j <
size; j++) out <<
SP;
145 out <<
fType <<
" x = tensor_" <<
fNX <<
"[index + i";
146 if (stride[axis].GetVal() !=
"1") out <<
"*(" << stride[axis] <<
")";
148 for (
size_t j = 0; j <
size; j++) out <<
SP;
149 out <<
"if (x > vmax) vmax = x;\n";
150 for (
size_t j = 0; j <
size-1; j++) out <<
SP;
153 for (
size_t j = 0; j <
size-1; j++) out <<
SP;
154 out <<
"for (int i = 0; i < " <<
fShape[axis] <<
"; i++) {\n";
155 for (
size_t j = 0; j <
size; j++) out <<
SP;
156 out <<
"size_t id = index + i";
157 if (stride[axis].GetVal() !=
"1") out <<
"*(" << stride[axis] <<
")";
159 for (
size_t j = 0; j <
size; j++) out <<
SP;
160 out <<
"tensor_" <<
fNY <<
"[id] = " << expFunction <<
"(tensor_" <<
fNX <<
"[id] - vmax);\n";
161 for (
size_t j = 0; j <
size; j++) out <<
SP;
162 out <<
"sum += tensor_" <<
fNY <<
"[id];\n";
163 for (
size_t j = 0; j <
size-1; j++) out <<
SP;
166 for (
size_t j = 0; j <
size-1; j++) out <<
SP;
167 out <<
"for (int i = 0; i < " <<
fShape[axis] <<
"; i++) {\n";
168 for (
size_t j = 0; j <
size; j++) out <<
SP;
169 out <<
"size_t id = index + i";
170 if (stride[axis].GetVal() !=
"1") out <<
"*(" << stride[axis] <<
");\n";
171 for (
size_t j = 0; j <
size; j++) out <<
SP;
172 out <<
"tensor_" <<
fNY <<
"[id] /= sum;\n";
174 for (
size_t j = 0; j <
size; j++) out <<
SP;
175 out <<
"tensor_" <<
fNY <<
"[id] = " << logFunction <<
"(tensor_" <<
fNY <<
"[id]);\n";
177 for (
size_t j = 0; j <
size-1; j++) out <<
SP;
180 for (
int i =
static_cast<int>(k) - 1; i >= 0; i--) {
181 for (
int j = 0; j < i; j++) out <<
SP;
187 std::vector<std::string>
GetStdLibs()
override {
return { std::string(
"cmath") }; }
size_t size(const MatrixT &matrix)
retrieve the size of a square matrix
std::vector< std::vector< size_t > > ShapeInference(std::vector< std::vector< size_t > > input) override
std::vector< ETensorType > TypeInference(std::vector< ETensorType > input) override
std::string Generate(std::string OpName) override
std::vector< std::string > GetStdLibs() override
void Initialize(RModel &model) override
ROperator_Softmax(int64_t attr_axis, std::string nameX, std::string nameY, bool logSoftmax=false)
std::vector< Dim > fShape
std::vector< std::string_view > fInputTensorNames
const std::string SP
space used to correctly indent the generated C++ code
std::vector< std::string_view > fOutputTensorNames
std::vector< size_t > ComputeStrideFromShape(const std::vector< size_t > &shape)
compute stride of a tensor given its shape (assume layout is row-major)
std::string ConvertDimShapeToString(const std::vector< Dim > &shape)
std::string ConvertTypeToString(ETensorType type)
std::string ConvertDimShapeToLength(const std::vector< Dim > &shape)
bool IsInteger(const std::string &s)
create variable transformations