Logo ROOT  
Reference Guide
 
Loading...
Searching...
No Matches
RModel.cxx
Go to the documentation of this file.
1#include <limits>
2#include <algorithm>
3#include <cctype>
4#include <memory>
5#include <string>
6
7#ifdef SOFIE_SUPPORT_ROOT_BINARY
8#include "TFile.h"
9#endif
10
11#include "TMVA/RModel.hxx"
12#include "TMVA/SOFIE_common.hxx"
13
14namespace TMVA {
15namespace Experimental {
16namespace SOFIE {
17
18namespace {
// Single-space separator/indent unit used when emitting generated code (see e.g. GenerateDynamicTensorInfo).
19const std::string SP = " ";
20}
21
22std::underlying_type_t<Options> operator|(Options opA, Options opB) {
23 return static_cast<std::underlying_type_t<Options>>(opA) | static_cast<std::underlying_type_t<Options>>(opB);
24}
25std::underlying_type_t<Options> operator|(std::underlying_type_t<Options> opA, Options opB) {
26 return opA | static_cast<std::underlying_type_t<Options>>(opB);
27}
28
29std::vector<size_t> RModel::GetTensorShape(const std::string & name) const {
30 auto f = fReadyInputTensorInfos.find(name);
31 if (f != fReadyInputTensorInfos.end()) {
32 return f->second.shape;
33 }
34 auto f2 = fInitializedTensors.find(name);
35 if (f2 != fInitializedTensors.end()) {
36 return f2->second.shape();
37 }
38 auto f3 = fInputTensorInfos.find(name);
39 if (f3 != fInputTensorInfos.end()) {
40 throw std::runtime_error("TMVA SOFIE tensor [" + name + "] is an input tensor with unspecified dimension parameter");
41 }
42 auto f4 = fIntermediateTensorInfos.find(name);
43 if (f4 != fIntermediateTensorInfos.end()) {
44 return f4->second.shape;
45 }
46 // case of shape tensors
47 auto f5 = fShapeTensors.find(name);
48 if (f5 != fShapeTensors.end()) {
49 // shape is vector of size 1 with size of shape values or just a scalar
50 if (f5->second.second) // check scalar flag
51 return std::vector<size_t>{};
52 else
53 return std::vector<size_t>{f5->second.first.size()};
54 }
55
57 throw std::runtime_error("TMVA SOFIE tensor [" + name + "] is a dynamic tensor. Use GetDynamicTensorShape instead of GetTensorShape");
58
61
62 throw std::runtime_error("TMVA SOFIE tensor [" + name + "] for which the shape is requested is not found");
63}
64
65std::vector<Dim> RModel::GetDimTensorShape(const std::string & name) const {
66 if (auto f = fDynamicTensorInfos.find(name); f != fDynamicTensorInfos.end()) {
67 return f->second.shape;
68 }
69 if (auto f = fInputTensorInfos.find(name); f != fInputTensorInfos.end()) {
70 return f->second.shape;
71 }
72 // in case is not a dynamic tensor convert normal shape to Dim one
73 // for this we need to return the vector by value
75}
76std::vector<Dim> RModel::GetDynamicTensorShape(const std::string & name) const {
77 if (auto f = fDynamicTensorInfos.find(name); f != fDynamicTensorInfos.end()) {
78 return f->second.shape;
79 }
80 if (auto f = fInputTensorInfos.find(name); f != fInputTensorInfos.end()) {
81 return f->second.shape;
82 }
83 // throw error if shape is not dynamic
85 throw std::runtime_error("TMVA SOFIE tensor [" + name + "] for which the shape is requested is not dynamic");
86
87 throw std::runtime_error("TMVA SOFIE tensor [" + name + "] for which the shape is requested is not found");
88}
89
// NOTE(review): the function signature line (source line 90, presumably
// "ETensorType RModel::GetTensorType(...)") was dropped by the page
// extraction — restore it from the original file / RModel.hxx.
// Purpose: look up the element type of a tensor by searching, in order, the
// ready-input, initialized, parametric-input, intermediate and dynamic tensor
// maps; shape tensors are always INT64. Throws if the name is unknown.
91 auto f = fReadyInputTensorInfos.find(name);
92 if (f != fReadyInputTensorInfos.end()) {
93 return f->second.type;
94 }
95 auto f2 = fInitializedTensors.find(name);
96 if (f2 != fInitializedTensors.end()) {
97 return f2->second.type();
98 }
99 auto f3 = fInputTensorInfos.find(name);
100 if (f3 != fInputTensorInfos.end()) {
101 return f3->second.type;
102 }
103 auto f4 = fIntermediateTensorInfos.find(name);
104 if (f4 != fIntermediateTensorInfos.end()) {
105 return f4->second.type;
106 }
107 auto f5 = fDynamicTensorInfos.find(name);
108 if (f5 != fDynamicTensorInfos.end()){
109 return f5->second.type;
110 }
111 // case of shape tensor type is INT64
112 if (fShapeTensors.find(name) != fShapeTensors.end()){
113 return ETensorType::INT64;
114 }
115
// NOTE(review): source lines 116-117 are missing here (extraction gap) —
// possibly an alias-tensor lookup; verify against the original file.
118
119 throw std::runtime_error("TMVA SOFIE tensor [" + name + "] for which the type is requested is not found, model name: " + fName);
120}
121
// Return true if a tensor with this (already cleaned) name is registered in
// any of the model's tensor maps: ready inputs, parametric inputs,
// initialized/constant, intermediate, dynamic or shape tensors.
122bool RModel::CheckIfTensorAlreadyExist(std::string tensor_name) {
123 if (fReadyInputTensorInfos.find(tensor_name) != fReadyInputTensorInfos.end()) return true;
124 if (fInputTensorInfos.find(tensor_name) != fInputTensorInfos.end()) return true;
125 if (fInitializedTensors.find(tensor_name) != fInitializedTensors.end()) return true;
126 if (fIntermediateTensorInfos.find(tensor_name) != fIntermediateTensorInfos.end()) return true;
127 if (fDynamicTensorInfos.find(tensor_name) != fDynamicTensorInfos.end()) return true;
128 if (fShapeTensors.find(tensor_name) != fShapeTensors.end()) return true;
// NOTE(review): source line 129 is missing (extraction gap) — possibly an
// alias-tensor check; verify against the original file.
130 return false;
131}
132
133void RModel::AddInputTensorInfo(std::string input_name, ETensorType type, std::vector<Dim> shape) {
136 throw std::runtime_error("TMVA-SOFIE: input tensor with name " + input_name + " already exists \n");
137 }
138
139 InputTensorInfo inputInfo { type, shape };
141}
142
143void RModel::AddInputTensorInfo(std::string input_name, ETensorType type, std::vector<size_t> shape) {
146 throw std::runtime_error("TMVA-SOFIE: input tensor with name " + input_name + " already exists \n");
147 }
148 TensorInfo inputInfo { type, shape };
150}
151
155
// Append (or insert at a given execution position) an operator to the model.
// Also records the operator's required BLAS routines and standard libraries,
// and tracks the last usage index of its input tensors.
156void RModel::AddOperator(std::unique_ptr<ROperator> op, int order_execution) {
157 AddBlasRoutines(op->GetBlasRoutines());
158 auto libs = op->GetStdLibs();
159 auto op_input_tensors = op->GetOpInputTensors();
// NOTE(review): the body of this loop (source line 161, presumably adding each
// stdlib to a member set) is missing — extraction gap; verify upstream.
160 for (auto& stdlib : libs) {
162 }
163 if (order_execution >= 0) {
164 fOperators.insert(fOperators.begin() + order_execution, std::move(op));
165 } else {
166 fOperators.push_back(std::move(op));
167 order_execution = fOperators.size()-1;
168 }
169
170 // storing the last usage of tensors which are input to the operator
171 // (excluding tensors which are inputs to the model or the initialized (weights) tensors)
172 // We call this function during parsing so we don't have yet initialized the operators
// NOTE(review): the loop condition (lines 174, 176) and body (line 179/180 —
// presumably recording order_execution in a frequency-lookup map) were dropped
// by the extraction; verify against the original file.
173 for(size_t index = 0; index<op_input_tensors.size() &&
175 std::find(fInputTensorNames.begin(), fInputTensorNames.end(),
177 ++index)
178 {
180 }
181}
182
183void RModel::AddInitializedTensor(std::string tensor_name, ETensorType type, std::vector<std::size_t> shape, std::shared_ptr<void> data) {
184 tensor_name = UTILITY::Clean_name(tensor_name);
185 //NB: own data
186 if (CheckIfTensorAlreadyExist(tensor_name)) {
187 throw std::runtime_error("TMVA-SOFIE: initialized tensor with name " + tensor_name + " already exists \n");
188 }
190 fInitializedTensors[tensor_name] = new_tensor;
191}
192
193void RModel::AddConstantTensor(std::string tensor_name, ETensorType type, std::vector<std::size_t> shape, std::shared_ptr<void> data) {
194 tensor_name = UTILITY::Clean_name(tensor_name);
195 //NB: own data
196 if (CheckIfTensorAlreadyExist(tensor_name)) {
197 throw std::runtime_error("TMVA-SOFIE: constant tensor with name " + tensor_name + " already exists \n");
198 }
199 InitializedTensor new_tensor {type, shape, data, true}; // add here flag to specify is a constant tensor
200 fInitializedTensors[tensor_name] = new_tensor;
201}
202
203void RModel::AddShapeTensor(const std::string & name, const std::vector<Dim> & shape_values, bool scalar){
204 auto tensor_name = UTILITY::Clean_name(name);
205 if (fShapeTensors.count(tensor_name) != 0) {
206 throw std::runtime_error("TMVA-SOFIE: shape tensor with name " + tensor_name + " already exists \n");
207 }
208 fShapeTensors[tensor_name] = std::make_pair(shape_values, scalar);
209}
210
211void RModel::AddAliasTensor(const std::string & name, const std::string & origin){
212 // add an alias tensor to origin
213 auto tensor_name = UTILITY::Clean_name(name);
215 if (fAliasTensors.count(tensor_name) != 0) {
216 throw std::runtime_error("TMVA-SOFIE: alias tensor with name " + tensor_name + " already exists \n");
217 }
218 fAliasTensors[tensor_name] = origin_name;
219}
220
221bool RModel::IsShapeTensor(const std::string & tensor_name) const {
222 return fShapeTensors.count(tensor_name) != 0;
223}
224
225bool RModel::IsAliasTensor(const std::string & tensor_name) const {
226 return fAliasTensors.count(tensor_name) != 0;
227}
228
229const std::vector<Dim> & RModel::GetShapeTensorValues(const std::string & tensor_name) const {
230 //if (!IsShapeTensor(tensor_name) ) return std::vector<Dim>{};
231 return fShapeTensors.at(tensor_name).first;
232}
233
234bool RModel::IsInitializedTensor(const std::string& tensorName) const {
235 std::string name = UTILITY::Clean_name(tensorName);
236 return fInitializedTensors.find(name) != fInitializedTensors.end();
237}
238bool RModel::IsConstantTensor(const std::string& tensorName) const {
239 // a constant tensor is an initialized tensor but has the constant flag set
240 std::string name = UTILITY::Clean_name(tensorName);
241 auto itr = fInitializedTensors.find(name);
242 if (itr == fInitializedTensors.end()) return false;
243 return itr->second.IsConstantTensor();
244}
245
246// dynamic tensors include also Dim input tensors
247bool RModel::IsDynamicTensor(const std::string& tensorName) const {
248 std::string name = UTILITY::Clean_name(tensorName);
250 return (ret) ? true : IsDimInputTensor(tensorName);
251}
252bool RModel::IsDimInputTensor(const std::string& tensorName) const {
253 std::string name = UTILITY::Clean_name(tensorName);
254 return fInputTensorInfos.find(name) != fInputTensorInfos.end();
255}
256bool RModel::IsReadyInputTensor(const std::string& tensorName) const {
257 std::string name = UTILITY::Clean_name(tensorName);
259}
260
261// generic addition of a tensor
262void RModel::AddIntermediateTensor(std::string tensor_name, ETensorType type, std::vector<Dim> dim_shape) {
264 if (!int_shape.empty())
265 AddIntermediateTensor(tensor_name, type, int_shape);
266 else
267 AddDynamicTensor(tensor_name, type, dim_shape);
268}
269
270void RModel::AddIntermediateTensor(std::string tensor_name, ETensorType type, std::vector<std::size_t> shape) {
271 tensor_name = UTILITY::Clean_name(tensor_name);
272 if (CheckIfTensorAlreadyExist(tensor_name)) {
273 throw std::runtime_error("TMVA-SOFIE: intermediate tensor with name " + tensor_name + " already exists \n");
274 }
275 TensorInfo new_tensor {type, shape};
277}
278
279void RModel::AddDynamicTensor(std::string tensor_name, ETensorType type, std::vector<Dim> shape){
280 tensor_name = UTILITY::Clean_name(tensor_name);
281 if (CheckIfTensorAlreadyExist(tensor_name)){
282 throw std::runtime_error("TMVA-SOFIE: intermediate tensor with name " + tensor_name + " already exists \n");
283 }
285 fDynamicTensorInfos[tensor_name] = new_tensor;
286 // store shape parameter if not existing
287 for (auto &d : shape) {
288 if (d.isParam) {
289 if (d.dim != size_t(-1)) {
290 AddShapeParam(d.param, d.dim);
291 }
292 }
293 }
294}
295
296void RModel::AddShapeParam(const std::string & param, size_t default_value) {
297 if (fShapeParams.count(param) == 0) {
298 fShapeParams[param] = std::to_string(default_value);
299 // add also in the vector list (used to keep the order)
300 fDimShapeNames.push_back(param);
301 }
302}
303
305 fOutputTensorNames.clear();
306 for(auto& it : outputtensornames) {
307 fOutputTensorNames.emplace_back(UTILITY::Clean_name(it));
308 }
309}
310
311void RModel::UpdateOutputTensorList(std::vector<std::string> curr_output_tensors, std::vector<std::string> new_output_tensors) {
312 for(auto& it:curr_output_tensors) {
313 fOutputTensorNames.erase(std::remove(fOutputTensorNames.begin(), fOutputTensorNames.end(), it), fOutputTensorNames.end());
314 }
316}
317
318void RModel::UpdateInitializedTensor(std::string tensor_name, ETensorType type, std::vector<std::size_t> shape, std::shared_ptr<void> data) {
319 tensor_name = UTILITY::Clean_name(tensor_name);
320 if (!CheckIfTensorAlreadyExist(tensor_name)) {
321 throw std::runtime_error("TMVA-SOFIE: tensor " + tensor_name + " not found when trying to update it");
322 }
324 fInitializedTensors[tensor_name] = new_tensor;
325}
326
327std::shared_ptr<void> RModel::GetInitializedTensorData(std::string tensor_name) {
328 auto f = fInitializedTensors.find(tensor_name);
329 if (f == fInitializedTensors.end()) {
330 throw std::runtime_error("TMVA-SOFIE: tensor " + tensor_name + " not found when trying to get its data");
331 } else {
332 return f->second.sharedptr();
333 }
334}
335
336void RModel::SetNotWritableInitializedTensor(const std::string & tensor_name) {
337 auto t = fInitializedTensors.find(tensor_name);
338 if (t == fInitializedTensors.end()) {
339 throw std::runtime_error("TMVA-SOFIE: initialized tensor " + tensor_name + " not found when trying to get its info");
340 }
341 t->second.SetNotWritable();
342 }
343
// Generate the code that maps each operator output tensor onto the shared
// intermediate memory pool, reusing/splitting previously freed chunks when
// possible (largest tensors are placed first). Returns the generated C++ code.
// NOTE(review): several source lines were dropped by the page extraction
// (e.g. 350, 369-370, 378, 383, 393-394, 403, 405, 414, 423, 433, 438, 440);
// loop headers and some statements below are therefore incomplete — compare
// with the original RModel.cxx before editing this function.
344std::string RModel::AllocateIntermediateMemory(std::span<const std::string_view> op_output_tensors)
345{
346 std::stringstream code;
347
348 if (fVerbose) {
349 std::cout << "Total chunks allocated\n";
// NOTE(review): the loop header over the allocated chunks (line 350) is missing.
351 std::cout << "..... chunk " << chunk->first << " size " << chunk->second.tensor_size << " " << chunk->second.tensor_name << std::endl;
352 }
353 }
354
// Helper emitting the declaration of one intermediate tensor as a typed
// pointer into fIntermediateMemoryPool at the given byte offset.
355 auto declareIntermediateTensor = [this, &code](std::string const &name, size_t size, size_t location) {
356 std::string typeName = ConvertTypeToString(GetTensorType(name));
357 code << "\n // Allocating memory for intermediate tensor " << name << " with size " << size << " bytes";
358 code << "\n"
359 << typeName << "* tensor_" << name << " = reinterpret_cast<" << typeName
360 << "*>(fIntermediateMemoryPool.data() + " << location << ");\n";
361 };
362
363 if (fVerbose) std::cout << "*** AllocateIntermediateMemory: Loop on op output tensors\n";
364 // order output tensors by size
365 std::vector<TensorMemoryInfo> ordered_output_tensors;
366
367 for (auto &it : op_output_tensors) {
368 auto name = std::string(it);
// NOTE(review): the skip condition guarding this `continue` (lines 369-370) is missing.
371 continue;
372
373 // case of alias tensor
374 if (IsAliasTensor(name)) {
375 continue;
376 }
377
// NOTE(review): the tensor_size computation (line 378) is missing.
379 // important fill the pair in the ordered output tensors with the string view and not the string
380 TensorMemoryInfo tmi = {it, tensor_size};
381 ordered_output_tensors.push_back(tmi);
382 }
// NOTE(review): the std::sort call (line 383) preceding this comparator is missing.
384 [](const TensorMemoryInfo &a, const TensorMemoryInfo &b) { return a.tensor_size > b.tensor_size; });
385
386 for (auto &it : ordered_output_tensors) {
387 bool allocated = false;
388 std::string name = std::string{it.tensor_name};
389 size_t tensor_size = it.tensor_size;
390 if (fVerbose)
391 std::cout << "output tensor " << name << " size " << tensor_size << std::endl;
392
// NOTE(review): the loop header over the available chunks (lines 393-395) is missing.
395
396 if (fVerbose) std::cout << ".. available chunk " << chunk->first << " with size = " << chunk->second;
397 // check if available memory chunks can accommodate the tensor
398 if (chunk->second >= tensor_size) {
399 // need to use here string_view (i.e it.tensor_name)
400 // split returns the new chunk with size of new tensor. The free chunk is before the used one
401 auto new_chunk = fIntermediateMemoryInfo.total_stack[chunk->first].split(it.tensor_name, tensor_size);
402 auto new_chunk_location = chunk->first + chunk->second - tensor_size;
// NOTE(review): lines 403-405 (presumably inserting the new chunk and
// declaring the tensor) are missing.
404
406 chunk->second -= tensor_size;
407
408 allocated = true;
409
410 if (fVerbose) std::cout << " is re-used and split in a new of size " << new_chunk.tensor_size << " at " << new_chunk_location;
411
412 if (chunk->second == 0) {
413 if (fVerbose) std::cout << " and deleted since size matches";
// NOTE(review): the erase of the exhausted chunk (line 414) is missing.
415 }
416 if (fVerbose) std::cout << std::endl;
417 break;
418 } else if (chunk->first == fIntermediateMemoryInfo.available_stack.rbegin()->first &&
419 fIntermediateMemoryInfo.total_stack.rbegin()->first == chunk->first) {
420 // case last available chunk is the last in the memory, we can increase that one
421 fIntermediateMemoryInfo.total_stack[chunk->first] = {it.tensor_name, tensor_size};
422 declareIntermediateTensor(name, tensor_size, chunk->first);
// NOTE(review): line 423 (presumably erasing the chunk from available_stack) is missing.
424 allocated = true;
425 if (fVerbose) std::cout << " is extended with a bigger one of size " << tensor_size << std::endl;
426 break;
427 }
428 ++chunk;
429 if (fVerbose) std::cout << std::endl;
430 }
431
432 if (!allocated) {
// NOTE(review): the start of the chunk_idx computation (line 433) is missing.
434 ? 0
435 : fIntermediateMemoryInfo.total_stack.rbegin()->first +
436 fIntermediateMemoryInfo.total_stack.rbegin()->second.tensor_size;
437
// NOTE(review): lines 438-441 (appending the new chunk and declaring the tensor) are partly missing.
439
441
442 if (fVerbose) std::cout << "no chunk available - add in total stack a new chunk with size of tensor and idx : " << chunk_idx
443 << std::endl;
444 }
445 }
446 return code.str();
447}
448
// For each input tensor of the operator at op_idx, if this is the tensor's
// last use, release its chunk of the intermediate memory pool back to the
// available stack, coalescing with adjacent free chunks where possible.
// NOTE(review): many source lines were dropped by the page extraction
// (e.g. 453-454, 465, 468, 473-476, 481, 485, 487, 491-495, 498, 501,
// 508-513); conditions and loop headers below are incomplete — compare with
// the original RModel.cxx before editing.
449void RModel::CheckAndFlushIntermediateMemory(std::span<const std::string_view> op_input_tensors, const size_t& op_idx){
450 if (fVerbose) std::cout << "*** CheckAndFlushIntermediateMemory: Loop on input tensors for op " << op_idx << "\n";
451 //print available chunks
452 if (fVerbose) std::cout << "available chunks before freeing them : \n";
// NOTE(review): the loop header over available chunks (lines 453-454) is missing.
455 if (fVerbose) std::cout << "-- free chunk " << chunk->first << " size = " << chunk->second << std::endl;
456 }
457 for (auto &iv : op_input_tensors) {
458 // last occurrence of the tensor is reached => flush it from memory
459 if (fVerbose) std::cout << ".. input tensors : " << iv;
460
461 // for alias tensors replace name with its alias
462 std::string it{iv}; // convert view to string
463 if (IsAliasTensor(it))
464 it = fAliasTensors[it];
// NOTE(review): the last-usage ("flush") condition (line 465) is missing.
466 if (fVerbose) std::cout << " flash condition is met - looping on chunks to find matching one \n";
467 for (auto chunk = fIntermediateMemoryInfo.total_stack.begin();
// NOTE(review): the loop condition/increment (line 468) is missing.
469 if (fVerbose) std::cout << "--- chunk " << chunk->first << " , " << chunk->second.tensor_name << " size " << chunk->second.tensor_size;
470 if (chunk->second.tensor_name == it) {
471 if (fVerbose) std::cout << " -- Found chunk corresponding to input tensor: " << chunk->first;
472 // check if nearby chunks in available memory can coalesce
// NOTE(review): the declarations of first_greater/last_smaller (lines 473-476) are partly missing.
474 chunk->first); // smallest element greater than the flushed chunk idx
477 : std::prev(first_greater); // largest element smaller than the flushed chunk idx
478
479 // check if the next stack entry is actually adjacent in memory
480
// NOTE(review): the enclosing condition (line 481) is missing.
482 last_smaller->first + last_smaller->second == chunk->first) {
483 // merge chunk with previous one
484 last_smaller->second += chunk->second.tensor_size;
// NOTE(review): line 485 (presumably merging in total_stack) is missing.
486 if (fVerbose) std::cout << " is adjacent in memory with previous one - merge ";
// NOTE(review): the condition opening this branch (line 487) is missing.
488 last_smaller->first + last_smaller->second == first_greater->first) {
489 // merge also with following one
490 last_smaller->second += first_greater->second;
// NOTE(review): lines 491-492 (total_stack merge) are missing.
493 // delete merged one in available stack and in total stack
// NOTE(review): lines 494-495 (the actual erases) are missing.
496 if (fVerbose) std::cout << " merge also with following that is free ";
497 }
// NOTE(review): line 498 (presumably erasing the merged chunk) is missing.
499 if (fVerbose) std::cout << std::endl;
500 break;
// NOTE(review): the condition opening this branch (line 501) is missing.
502 chunk->first + chunk->second.tensor_size == first_greater->first) {
503 // merge with first greater
504 if (fVerbose) std::cout << " is adjacent in memory with following one - merge \n";
505 // cannot modify idx of first_greter. Insert a new one and delete previous one
506 size_t new_size = chunk->second.tensor_size + first_greater->second;
507 size_t first_greater_idx = first_greater->first;
// NOTE(review): line 508 (the erase of first_greater) is missing.
509 // cannot use anymore first_greater
// NOTE(review): lines 510-513 (inserting the merged chunk) are missing.
514 } else {
515 fIntermediateMemoryInfo.available_stack.insert({chunk->first, chunk->second.tensor_size});
516 if (fVerbose) std::cout << " insert in the available stack the chunk with size " << chunk->second.tensor_size << std::endl;
517 }
518 chunk->second.tensor_name = "free";
519 break;
520 }
521 }
522 } else {
523 if (fVerbose) std::cout << std::endl;
524 }
525 }
526}
527
// Convenience overload: initialize the model resolving the common batch-size
// shape parameters ("input_size", "batch_size", "bs") to the given value.
// A non-positive batchSize leaves all shape parameters unresolved.
528void RModel::Initialize(int batchSize, bool verbose) {
529 std::map<std::string, size_t> inputParams;
530 if (batchSize > 0) {
531 inputParams["input_size"] = batchSize;
532 inputParams["batch_size"] = batchSize;
533 inputParams["bs"] = batchSize;
534 }
535 Initialize(inputParams, verbose);
// NOTE(review): source line 536 is missing here (extraction gap); verify
// against the original file whether a statement was dropped.
537}
// Main initialization: resolve parametric input shapes using the provided
// parameter values, move fully-specified inputs into the ready-input map,
// initialize every operator, classify integer weights as constants, and decide
// whether a weight file is needed.
// NOTE(review): several source lines were dropped by the page extraction
// (e.g. 547, 584, 601-602, 619, 621, 623, 651-653, 656); some conditions and
// statements below are incomplete — compare with the original RModel.cxx.
538void RModel::Initialize(const std::map<std::string, size_t> & inputParams, bool verbose) {
539
540 fVerbose = int(verbose);
541
542 if (fIsInitialized) {
543 if (verbose)
544 std::cout << "Model is already initialized - skip initialization " << std::endl;
545 return;
546 }
// NOTE(review): line 547 (presumably clearing fIntermediateTensorInfos) is missing.
548 fDynamicTensorInfos.clear();
549
550
551 // loop on inputs and see if shape can be full specified
552 // if the batch size is provided it can be used to specify the full shape
553 // Add the full specified tensors in fReadyInputTensors collection
554 auto originalInputTensorInfos = fInputTensorInfos; // need to copy because we may delete elements
555 for (auto &input : originalInputTensorInfos) {
556 if (verbose) std::cout << "looking at the tensor " << input.first << std::endl;
557 // if a parameter (e.g. batch_size) is specified use for converting parametric shape in defined one
558 if (!inputParams.empty()) {
559 for (auto &d : input.second.shape) {
560 if (d.isParam) {
561 std::string pname = d.param;
562 if (pname == input.first + "_size") pname = "input_size";
563 auto itr = inputParams.find(pname);
564 if (itr != inputParams.end() ) {
565 d = Dim{ itr->second };
566 if (verbose)
567 std::cout << "Tensor: " << input.first << " - fix parametric shape " << itr->first << " to " << itr->second << std::endl;
568 }
569 }
570 }
571 }
572 // see if shape now is fully defined
573 auto shape = ConvertShapeToInt(input.second.shape);
574 if (verbose)
575 std::cout << "converting input shape for " << input.first << " " << ConvertShapeToString(shape) << " from "
576 << ConvertShapeToString(input.second.shape) << std::endl;
577 if (!shape.empty()) {
578 // case shape is defined (not parametric) we add the tensor in the fReadyInputTensorInfos map and
579 // we remove the tensor from the fInputTensorInfo where th eold parametric shape was stored
580 fInputTensorInfos.erase(input.first);
581 // add to the ready input tensor information the new fixed shape
582 AddInputTensorInfo(input.first, input.second.type, shape);
583 // check consistency
// NOTE(review): the consistency check itself (line 584) is missing.
585 }
586 // store the parameters of the input tensors
587 else {
588 // store the found parametric shape parameters
589 for (auto &d : input.second.shape) {
590 if (d.isParam) {
591 if (fShapeParams.count(d.param) == 0) {
592 fDimShapeNames.push_back(d.param);
593 fShapeParams[d.param] = std::to_string(d.dim);
594 }
595 }
596 }
597 }
598 }
599
600 if (verbose) {
// NOTE(review): the verbose printout body (lines 601-602) is missing.
603 }
604
605 // Go through model and initialize each operator
606 int i = 0;
607
608 std::vector<size_t> temp_available_stack; // vector stores individual chunks of available memory that maybe reused
609
610 for(size_t op_idx = 0; op_idx < fOperators.size(); ++op_idx){
611 if (verbose) {
612 auto& r = *fOperators[op_idx].get();
613 std::cout << "Initializing operator " << i << " " << typeid(r).name() << std::endl;
614 }
615 fOperators[op_idx]->Initialize(*this);
616 for(auto &it:fOperators[op_idx]->GetOpOutputTensors()){
617 std::string name = std::string{it};
618 // check if tensor is not an initialized or output tensor and it is not already in the list
// NOTE(review): parts of this condition (lines 619, 621) and the loop body
// (line 623) are missing — extraction gap.
620 std::find(fOutputTensorNames.begin(), fOutputTensorNames.end(), name) == fOutputTensorNames.end() &&
622 {
624 }
625 }
626 i++;
627 }
628
629 // loop on initialized tensors and make the integers as constant to be
630 // not written in a weight file
631 for (auto &it : fInitializedTensors) {
632 if (it.second.IsWeightTensor() && it.second.type() != ETensorType::FLOAT)
633 it.second.SetConstant();
634 }
635
636 // check if there are initialized tensors to write in a weight file
637 if (fUseWeightFile) {
638 bool modelHasWeights = false;
639 for (auto &it : fInitializedTensors) {
640 if (it.second.IsWeightTensor()) {
641 modelHasWeights = true;
642 break;
643 }
644 }
645 if (!modelHasWeights)
646 fUseWeightFile = false;
647 }
648
649 // update fIntermediateTensorFrequencyLookup for alias tensors
650 for (auto & it : fAliasTensors) {
// NOTE(review): lines 651-653 (the if-branch of this update) and 656 are missing.
654 else {
655 // take the largest one
657 }
658 }
659
660 fIsInitialized = true;
661}
662
// Register and initialize a subgraph model: links it to this parent, copies
// the parent's weight-file/session options, merges the subgraph's needed BLAS
// routines and std libs into the parent, and shares the parent input names.
663void RModel::InitializeSubGraph(std::shared_ptr<RModel> graph) {
664 // add the subgraph to the list
665 fSubGraphs.push_back(graph);
666 //this needs to be done before initializing
667 graph->fParentGraph = this;
668 graph->fIsSubGraph = true;
669
670 graph->Initialize(fBatchSize, fVerbose);
671 // set the same options as parent model
672 graph->fWeightFile = fWeightFile;
673 graph->fUseWeightFile = fUseWeightFile;
674 graph->fUseSession = fUseSession;
675 // add needed blas routines and libs
676 std::vector<std::string> blasRoutines;
677 for (auto & e : graph->fNeededBlasRoutines)
678 blasRoutines.push_back(e);
// NOTE(review): line 679 (presumably AddBlasRoutines(blasRoutines)) and the
// body of the loop below (line 681) are missing — extraction gap.
680 for (auto e : graph->fNeededStdLib)
682
683 // add parent input tensors to current graph
684 for (auto & name : fInputTensorNames)
685 graph->fInputTensorNames.emplace_back(name);
686
687 // clean graph name
688 graph->fName = UTILITY::Clean_name(graph->fName);
689
690}
691
692// Function to generate the code for declaring and initializing constant tensors
693// This is for tensors which are not part of weight files and can be created from the Constant operator
694template <typename T>
695std::string GenerateConstantTensorCode(const std::pair<std::string, InitializedTensor> &t)
696{
697 std::stringstream strs;
698 std::string type = ConvertTypeToString(t.second.type());
699 size_t length = ConvertShapeToLength(t.second.shape());
700 // avoid using stack sizes for constant tensors to reduce compilation time
701 // also for weights which can be broadcasted do not use stack but allocate as a std::vector
702 bool allocateOnStack = (length > 100 || t.second.IsWeightTensor()) ? false : true;
703
704 const T *data = t.second.data<T>();
705
706 // and check if all values are the same
707 bool sameData = false;
708 // for non stack allocation check if data are the same
709 if (!allocateOnStack && length > 1) {
710 size_t idx = 1;
711 do {
712 sameData = (data[idx] == data[idx - 1]);
713 idx++;
714 } while (sameData && idx < length);
715 }
716 if (allocateOnStack) {
717 strs << type << " tensor_" << t.first << "[" << length << "] = " << ConvertValuesToString(length, data) << ";\n";
718 } else {
719 strs << "std::vector<" << type << "> fTensor_" << t.first << " = ";
720 if (sameData)
721 strs << "std::vector<" << type << ">(" << length << ", " << ConvertValToString(data[0]) << ");\n";
722 else {
724 }
725 strs << type << " * tensor_" + t.first + " = fTensor_" + t.first + ".data();\n";
726 }
727 return strs.str();
728}
729
// NOTE(review): the function signature (source line 730) was dropped by the
// page extraction — this body emits the declarations of initialized (weight
// and constant) tensors into fGC; restore the signature from the original file.
731{
732 if (!fInitializedTensors.empty())
733 fGC += "// initialized (weights and constant) tensors\n";
734
735 // here are constant tensor or initialized ones which are not weights (e.g. int64_t tensors )
736 for (auto &i : fInitializedTensors) {
737 if (i.second.IsNotWritable()) continue;
738 if (!fUseWeightFile || i.second.IsConstantTensor() || !i.second.IsWeightTensor() ) {
739 if (i.second.type() == ETensorType::FLOAT) {
// NOTE(review): lines 740 and 743 (presumably fGC += GenerateConstantTensorCode<float>/<int64_t>(i))
// are missing — extraction gap.
741 fConstantTensorSize += ConvertShapeToLength(i.second.shape()) * 4;
742 } else if (i.second.type() == ETensorType::INT64) {
744 fConstantTensorSize += ConvertShapeToLength(i.second.shape()) * 8;
745 }
746
747 } else {
748 // case of tensors which are read from a file
749 size_t length = ConvertShapeToLength(i.second.shape());
750 if (i.second.type() == ETensorType::FLOAT) {
751 fGC += "std::vector<float> fTensor_" + i.first + " = std::vector<float>(" + std::to_string(length) + ");\n";
752 fGC += "float * tensor_" + i.first + " = fTensor_" + i.first + ".data();\n";
753 fWeightsTensorSize += ConvertShapeToLength(i.second.shape()) * 4;
754 }
755 }
756 }
757}
758
// NOTE(review): the function signature (source line 759) and the declaration
// of `totalStack` (line 765, presumably a reference to
// fIntermediateMemoryInfo.total_stack) were dropped by the extraction.
// Purpose: emit the fIntermediateMemoryPool byte buffer sized to cover the
// highest chunk offset plus its tensor size.
760 if (fIntermediateMemoryInfo.total_stack.empty()) return;
761 fGC += "\n//--- Allocating session memory pool to be used for allocating intermediate tensors\n";
762
763 // char memory block is allocated since char takes 1 byte, thus easier to allocate tensors
764 // of other data types
766 const size_t memPoolSize = totalStack.rbegin()->first + totalStack.rbegin()->second.tensor_size;
767 fGC += "std::vector<char> fIntermediateMemoryPool = std::vector<char>(" + std::to_string(memPoolSize) + ");\n\n";
768}
769
// NOTE(review): the function signature (source line 770) was dropped by the
// page extraction, together with lines 780, 782-783, 786, 792, 797, 802.
// Purpose: emit member declarations for intermediate tensors (bool tensors as
// uint8_t vectors; float/double/int64 tensors as std::vector members with a
// raw-pointer accessor; alias and dynamic tensors as null pointers).
771 if (!fIntermediateTensorInfos.empty()) {
772 std::string tensor_declaration_block = "";
773 for (auto &i : fIntermediateTensorInfos) {
774 bool is_alias = (IsAliasTensor(i.first));
775 if (i.second.type == ETensorType::BOOL && !is_alias) {
776 tensor_declaration_block += "std::vector<std::uint8_t> fTensor_" + i.first + " = std::vector<std::uint8_t>(" + std::to_string(ConvertShapeToLength(i.second.shape)) + ");\n";
777 tensor_declaration_block += "std::uint8_t * tensor_" + i.first + " = fTensor_" + i.first + ".data();\n";
778 continue;
779 }
// NOTE(review): the start of this condition (lines 780, 782-783) is missing.
781 bool not_in_freq_map =
784 (std::find(fOutputTensorNames.begin(), fOutputTensorNames.end(), i.first) == fOutputTensorNames.end());
785
// NOTE(review): the guard using not_in_freq_map (line 786) is missing.
787 size_t length = ConvertShapeToLength(i.second.shape);
788
789 if (i.second.type == ETensorType::FLOAT) {
790 tensor_declaration_block += "std::vector<float> fTensor_" + i.first + " = std::vector<float>(" + std::to_string(length) + ");\n";
791 tensor_declaration_block += "float * tensor_" + i.first + " = fTensor_" + i.first + ".data();\n";
793 }
794 else if (i.second.type == ETensorType::DOUBLE) {
795 tensor_declaration_block += "std::vector<double> fTensor_" + i.first + " = std::vector<double>(" + std::to_string(length) + ");\n";
796 tensor_declaration_block += "double * tensor_" + i.first + " = fTensor_" + i.first + ".data();\n";
798 }
799 else if (i.second.type == ETensorType::INT64) {
800 tensor_declaration_block += "std::vector<int64_t> fTensor_" + i.first + " = std::vector<int64_t>(" + std::to_string(length) + ");\n";
801 tensor_declaration_block += "int64_t * tensor_" + i.first + " = fTensor_" + i.first + ".data();\n";
803 }
804 }
805 if (is_alias) {
806 tensor_declaration_block += ConvertTypeToString(i.second.type) + " * tensor_" + i.first + " = nullptr;\n";
807 }
808
809 }
810
811 if (tensor_declaration_block.length()) {
812 fGC += "\n//--- declare and allocate the intermediate tensors\n" + tensor_declaration_block;
813 }
814 }
815 // add also the dynamic tensors (only declarations, allocation will be done later)
816 if (!fDynamicTensorInfos.empty()) {
817 fGC += "//--- declare the dynamic tensors\n";
818 for (auto &i : fDynamicTensorInfos) {
819 fGC += ConvertTypeToString(i.second.type) + " * tensor_" + i.first + " = nullptr;\n";
820 }
821 fGC += "//--- dynamic tensors pool\n";
822 fGC += "std::vector<char> fDynamicMemoryPool;\n";
823 }
824}
825
826// generate code for specific operator declarations to be defined in the Session class
// NOTE(review): the function signature (source line 827) was dropped by the
// page extraction — restore it from the original file. Purpose: concatenate
// each operator's declaration code into fGC, skipping the section entirely if
// no operator contributes anything.
828 std::string strcode;
829 for (auto & op : fOperators) {
830 strcode += op->GenerateDeclCode();
831 }
832 if (strcode.empty()) return;
833 fGC += "\n//---- operator declarations \n";
834 fGC += strcode;
835 fGC += "\n";
836}
837
// NOTE(review): the function signature (source line 838, presumably
// "void RModel::GenerateDynamicTensorInfo()" given the error messages below)
// was dropped by the page extraction, together with lines 846, 867-868,
// 874-875. Purpose: emit code that computes begin/end lifetimes for every
// dynamic tensor, calls OrganizeMemory to pack them, and binds each tensor
// pointer into the resulting fDynamicMemoryPool.
839{
840 // generate code for allocating dynamic tensors using the greedy memory allocations
841 if (fDynamicTensorInfos.empty())
842 return;
843
844 if (fVerbose) {
845 std::cout << "generating code for dynamic tensor management" << std::endl;
// NOTE(review): line 846 of the verbose block is missing.
847 }
848
849 std::stringstream out;
850 out << "// dynamic tensor memory management\n";
851 out << SP << "std::vector<TMVA::Experimental::SOFIE::TensorLifeInfo> dynamicTensorInfos;\n";
852 out << SP << "dynamicTensorInfos.reserve(" << fDynamicTensorInfos.size() << ");\n";
853
854 // loop on all the operators to find begin/end life of the tensors
855 int op_index = 0;
856 std::vector<std::pair<std::string, ETensorType>> tensors;
857 tensors.reserve(fDynamicTensorInfos.size());
858 for (auto & op : fOperators) {
859 // loop on output tensors -
860 for (auto &it : op->GetOpOutputTensors()) {
861 if (fVerbose) {
862 auto op_ptr = op.get();
863 std::cout << "Looping on operator " << op_index << " " << typeid(*op_ptr).name() << std::endl;
864 }
865 // check if is a dynamic tensor and not an alias tensor
866 std::string name = std::string(it);
// NOTE(review): the dynamic/alias guard and tensor_size computation
// (lines 867-868) are missing — extraction gap.
869 auto type = GetTensorType(name);
870 size_t type_size = GetTypeSize(type);
871 int begin = op_index;
872 int end = fOperators.size();
873 // look for end
// NOTE(review): the frequency-lookup find (lines 874-875) guarding this
// assignment is missing.
876 end = it_lookup->second + 1; // end is last time used + 1
877 // // some tensors (like xcol in convolutions) are just used within the operators
878 // if (end == 0 && begin > 0) end = begin+1;
879
880 if (begin> end) {
881 std::cout << "op " << op_index << "tensor_" << name << " begin " << begin << " " << " end " << end << std::endl;
882 throw std::runtime_error("TMVA-SOFIE: RModel::GenerateDynamicTensorInfo: tensor_" + name + " has end before begin");
883 }
884
885 // write in code
886 out << SP << "dynamicTensorInfos.push_back( {" << begin << ", " << end << ", " << type_size << "* (" << tensor_size << ") });"
887 << " // tensor_" << name << std::endl;
888 tensors.push_back({name,type});
889 }
890 }
891 op_index++; // increment operator index
892 }
893 out << "\n" << SP << "auto memory_result = OrganizeMemory(dynamicTensorInfos);\n\n";
894 out << "// allocating now the memory\n";
895 out << SP << "fDynamicMemoryPool = std::vector<char>(memory_result.total_bytes);\n";
896 out << SP << "int idx = 0;\n";
897 for (auto & it : tensors) {
898 out << SP << "tensor_" << it.first << " = reinterpret_cast<" << ConvertTypeToString(it.second) << " *>(fDynamicMemoryPool.data() + memory_result.offsets[idx++]);\n";
899 }
900 // check that all dynamic tensors are covered
901 bool missingTensor = false;
902 for (auto &i : fDynamicTensorInfos) {
903 if (IsAliasTensor(i.first)) continue;
904 if (std::find(tensors.begin(), tensors.end(), std::pair<std::string,ETensorType>{i.first, i.second.type}) == tensors.end()) {
905 std::cout << "Dynamic tensors " << i.first << " is not in list of operator input/output " << std::endl;
906 missingTensor = true;
907 }
908 }
909 if (missingTensor)
910 throw std::runtime_error("TMVA-SOFIE: RModel::GenerateDynamicTensorInfo - some tensors are not in input/output list");
911
912 fGC += out.str();
913}
914
// Builds the parameter list for the generated infer() function: first any shape
// parameters of dim-parameterized input tensors (each emitted once, tracked via
// inputParams), then one "<type> const* tensor_<name>" per input tensor.
// With isdecl=false only the call-site argument names are produced.
// NOTE(review): doxygen extract — line 915 (signature, per the index:
// std::string RModel::GenerateInferSignature(bool isdecl)), line 931
// (presumably recording pName into inputParams) and line 936 (presumably
// `std::string type = ConvertTypeToString(GetTensorType(name));`) are elided.
 916 // generate the infer signature given the inputs: eg. "float * tensor1, float * tensor2"
 917 // if (decl = false) generate only calling signature (tensor1,tensor2,....)
 918 std::string rGC;
 919 std::unordered_map<std::string, int> inputParams;
 920 int i_input = 0;
 921 for (auto &name : fInputTensorNames) {
 922 // if is a dynamic tensor pass initial parameters
 923 if (IsDimInputTensor(name)) {
 924 auto shape = GetDynamicTensorShape(name);
 925 for (auto &d : shape) {
 926 std::string pName = d.param;
 927 // need to check if the input parameters is already existing in another input tensor
 928 if (d.isParam && inputParams.count(pName) == 0) {
 929 if (isdecl) rGC += "size_t ";
 930 rGC += d.param + ",";
 932 }
 933 }
 934 }
 935 if (isdecl) {
 937 if (type == "other")
 938 throw std::runtime_error("TMVA-SOFIE: input tensor " + name +
 939 " is of a data type which is not yet supported.");
 940 rGC += type + " const* ";
 941 }
 942 rGC += "tensor_" + name + ",";
 943 i_input++;
 944 }
 945
 946 if (fInputTensorNames.size() > 0) rGC.pop_back();// remove last ","
 947 return rGC;
 948}
949
// File-local helper: maps a tensor type to the element type used for generated
// output std::vector<>s.
// NOTE(review): line 955 is elided — presumably the special case that avoids
// std::vector<bool> (see comment below) by returning a byte-sized type for
// BOOL tensors; confirm against the full source.
950namespace {
 951
 952std::string typeForOutput(ETensorType t) {
 953 // The std::vector<bool> is a special type that is not wrapping continuous memory.
 954 // We don't want to use it as a return type.
 956 return ConvertTypeToString(t);
 957}
 958
 959}
960
// Generates the public infer(...) convenience overload: chooses the return type
// (single vector / vector-of-vectors when all outputs share a type / std::tuple
// otherwise), declares one output vector per output tensor, forwards everything
// to doInfer(), and returns the filled vectors.
// NOTE(review): doxygen extract — line 961 (signature), line 968 (definition of
// `eFirstOutputType`), line 975 (the per-output type comparison that can clear
// sameOutputTypes) and line 988 (presumably `fGC += inferReturnType;` — without
// it the tuple return type built below would never be emitted) are elided.
962{
 963 size_t outputSize = fOutputTensorNames.size();
 964 // assume output types are all the same
 965
 966 bool sameOutputTypes = true;
 967 std::string inferReturnType; // type return by infer function
 969 fGC += "\n\n";
 970 if (outputSize == 1) {
 971 fGC += "std::vector<" + typeForOutput(eFirstOutputType) + ">";
 972 } else {
 973 // if all output types are the same we return an std::vector - otherwise a tuple
 974 for (std::string const &name : fOutputTensorNames) {
 976 sameOutputTypes = false;
 977 }
 978 if (sameOutputTypes)
 979 fGC += "std::vector<std::vector<" + typeForOutput(eFirstOutputType) + ">>";
 980 else {
 981 inferReturnType = "std::tuple<";
 982 for (size_t i = 0; i < outputSize; i++) {
 983 inferReturnType += "std::vector<" + typeForOutput(GetTensorType(fOutputTensorNames[i])) + ">";
 984 if (i < outputSize - 1)
 985 inferReturnType += ",";
 986 }
 987 inferReturnType += ">";
 989 }
 990 }
 991
 992 fGC += " infer(" + GenerateInferSignature() + "){\n";
 993
 994 std::string doInferArgs = GenerateInferSignature(false);
 995 if (!doInferArgs.empty())
 996 doInferArgs += ",";
 997 for (std::string const &name : fOutputTensorNames) {
 998 fGC += SP + "std::vector<" + typeForOutput(GetTensorType(name)) + " > output_tensor_" + name + ";\n";
 999 doInferArgs += " output_tensor_" + name + ",";
 1000 }
 1001 if (!doInferArgs.empty())
 1002 doInferArgs.back() = ' ';
 1003
 1004 fGC += SP + "doInfer(" + doInferArgs + ");\n";
 1005
 1006 fGC += SP + "return {";
 1007 for (size_t i = 0; i < fOutputTensorNames.size(); i++) {
 1008 fGC += "output_tensor_" + fOutputTensorNames[i];
 1009 if (i < fOutputTensorNames.size() - 1)
 1010 fGC += ",";
 1011 }
 1012 fGC += "};\n";
 1013 fGC += "}\n"; // end of infer function scope
 1014}
1015
// Generates the Session struct (or Session_<name> for subgraphs): member
// declarations, subgraph sessions, the constructor (weight loading, shape
// parameters, operator init code), the doInfer(...) body with per-operator
// inference code, and finally the infer() overload.
// NOTE(review): doxygen extract — many lines are elided (1016 signature, 1019
// initialization of `doInferSignature` via GenerateInferSignature(), 1038/1040,
// 1050-1051 the per-operator intermediate-memory allocation calls, 1060, 1063,
// 1067 intermediate tensor declarations, 1069, 1094/1097 the WeightFileType
// checks selecting .dat/.root, 1120 the read-weights call, 1126 the dynamic
// tensor allocation call, 1157/1159 definition of `isIntermediate` and the
// else-branch of `n`, 1166 the output-struct overload call). Do not edit this
// block without the full source.
1017{
 1018 // Determine the signature of the actual inference function
 1020 if (!doInferSignature.empty())
 1021 doInferSignature += ", ";
 1022 for (auto const &name : fOutputTensorNames) {
 1023 doInferSignature += " std::vector<" + typeForOutput(GetTensorType(name)) + "> &output_tensor_" + name + ",";
 1024 }
 1025 doInferSignature.back() = ' ';
 1026
 1027 doInferSignature = "void doInfer(" + doInferSignature + ")";
 1028
 1029 // define the Session struct (for GNN this is generated in RModel_GNN)
 1030 if (fUseSession && !fIsGNNComponent) {
 1031 if (!fIsSubGraph)
 1032 fGC += "struct Session {\n";
 1033 else
 1034 fGC += "struct Session_" + fName + " {\n";
 1035 }
 1036
 1037 // generate code for declaring the initialized tensors
 1039
 1041 // evaluate total intermediate memory and position intermediate tensor addresses
 1042 std::string intermediate_memory_alloc_string = "";
 1043 intermediate_memory_alloc_string += "\n// --- Positioning intermediate tensor memory --";
 1044 for (size_t op_idx = 0; op_idx < fOperators.size(); ++op_idx) {
 1045 if (fVerbose) {
 1046 auto op = fOperators[op_idx].get();
 1047 std::cout << "\n******************\n analyzing input/output operator " << op_idx << " "
 1048 << typeid(*op).name() << std::endl;
 1049 }
 1052 }
 1053
 1054 // to check remaining unused fragments after memory allocation (lesser the better)
 1055 // for (const auto &it: fIntermediateMemoryInfo.available_stack){
 1056 // std::cout<<"chunk_idx: "<<it.first<<", chunk_size: "<<it.second<<"\n";
 1057 // }
 1058
 1059 // generate the memory pool to be used by intermediate tensors
 1061
 1062 // position intermediate tensors
 1064 }
 1065
 1066 // generate the declaring the intermediate tensors
 1068 // generate code for declarations of some specific operators
 1070
 1071
 1072
 1073 // add subgraph session
 1074 if (!fSubGraphs.empty()) fGC += "// subgraph sessions\n";
 1075 for (auto & graph : fSubGraphs) {
 1076 fGC += "Session_" + graph->fName + " fSession_" + graph->fName + ";\n";
 1077 }
 1078
 1079 // Generate code for Session constructor
 1080 if (fUseSession) {
 1081 std::string sessionName = "Session";
 1082 if (fIsSubGraph)
 1083 sessionName += "_" + fName;
 1084 // add here specific operator code that needs to define session data members
 1085 fGC += "\n";
 1086 for (size_t id = 0; id < fOperators.size(); id++) {
 1087 std::string opName = std::to_string(id);
 1088 fGC += fOperators[id]->GenerateSessionMembersCode(opName);
 1089 }
 1090 fGC += "\n";
 1091 // here add initialization and reading of weight tensors
 1092 if (fUseWeightFile) {
 1093 std::string fileName = fName;
 1095 fileName += ".dat";
 1096 }
 1098 fileName += ".root";
 1099 }
 1100 fGC += sessionName + "(std::string filename =\"" + fileName + "\"";
 1101 } else {
 1102 // no need to pass weight file since it is not used
 1103 // keep passing a string for compatibility
 1104 fGC += sessionName + "(std::string = \"\"";
 1105 }
 1106 // add initialization of shape parameters
 1107 // assume all parameters are of type size_t
 1108 if (!fDimShapeNames.empty()) {
 1109 // sort first the shape parameters in alphabetical order to avoid a random order
 1110 std::sort(fDimShapeNames.begin(), fDimShapeNames.end() );
 1111 for (auto &p : fDimShapeNames) {
 1112 fGC += ",\n";
 1113 fGC += " size_t " + p + " = " + fShapeParams[p];
 1114 }
 1115 }
 1116 fGC += ") {\n";
 1117
 1118 if (fUseWeightFile) {
 1119 fGC += "\n//--- reading weights from file\n";
 1121 fGC += "\n";
 1122 // fUseWeightFile = fUseWeightFile;
 1123 }
 1124
 1125 // now we have passed the parameters we can allocate the dynamic tensors
 1127
 1128 // add here initialization code for operator
 1129 for (size_t id = 0; id < fOperators.size(); id++) {
 1130 fGC += fOperators[id]->GenerateInitCode();
 1131 }
 1132
 1133 fGC += "}\n\n";
 1134 }
 1135
 1136 fGC += doInferSignature + "{\n";
 1137 fGC += "\n";
 1138
 1139 // generate the inference code
 1140 if (fVerbose)
 1141 std::cout << "Generating main inference code for " << fName << std::endl;
 1142
 1143 if (fOutputTensorNames.size() == 0)
 1144 throw std::runtime_error("TMVA-SOFIE: output size=0 are not supported");
 1145
 1146 for (size_t op_idx = 0; op_idx < fOperators.size(); ++op_idx) {
 1147 if (fVerbose)
 1148 std::cout << "Generating code for operator .... " << op_idx << std::endl;
 1149 fGC += (fOperators[op_idx]->Generate(std::to_string(op_idx)));
 1150 }
 1151
 1152 fGC += SP + "using TMVA::Experimental::SOFIE::UTILITY::FillOutput;\n\n";
 1153
 1154 for (std::string const &name : fOutputTensorNames) {
 1155 // need to check is size is the same (don't want to return a vector with
 1156 // larger size) in that case better to copy
 1158 std::string n = isIntermediate ? std::to_string(ConvertShapeToLength(GetTensorShape(name)))
 1160 fGC += SP + "FillOutput(tensor_" + name + ", output_tensor_" + name + ", " + n + ");\n";
 1161 }
 1162
 1163 fGC += "}\n\n";
 1164
 1165 // generate the inference overload that returns an output struct
 1167
 1168 // end of session
 1169 if (fUseSession && !fIsGNNComponent) {
 1170 fGC += "}; // end of Session\n\n";
 1171 }
 1172}
1173
// Top-level code generation entry point: applies the option flags, initializes
// the model (operators and subgraphs), generates the subgraph sessions first
// and then the main session code, wrapping everything in a header guard unless
// this is a GNN component or a subgraph.
// NOTE(review): doxygen extract — lines 1183/1187/1191 (presumably the
// corresponding fWeightFile = WeightFileType::... assignments), 1216
// (presumably GenerateHeaderInfo(hgname), which fills `hgname` used below) and
// 1231 (presumably GenerateSessionCode()) are elided.
1174void RModel::Generate(std::underlying_type_t<Options> options, int batchSize, long pos, bool verbose)
1175{
 1176 fVerbose = verbose;
 1177 fBatchSize = batchSize;
 1178 fReadPos = pos;
 1179
 1180 // session flag is used in operator initialize
 1181 if (static_cast<std::underlying_type_t<Options>>(Options::kNoSession) & options) {
 1182 fUseSession = false;
 1184 }
 1185 if (static_cast<std::underlying_type_t<Options>>(Options::kNoWeightFile) & options) {
 1186 fUseWeightFile = false;
 1188 }
 1189 if (static_cast<std::underlying_type_t<Options>>(Options::kRootBinaryWeightFile) & options) {
 1190 fUseWeightFile = true;
 1192 }
 1193 if (fUseWeightFile && !fUseSession) {
 1194 throw std::runtime_error(
 1195 "TMVA-SOFIE: RModel::Generate: cannot use a separate weight file without generating a Session class");
 1196 }
 1197
 1198 if (static_cast<std::underlying_type_t<Options>>(Options::kGNN) & options)
 1199 fIsGNN = true;
 1200 if (static_cast<std::underlying_type_t<Options>>(Options::kGNNComponent) & options)
 1201 fIsGNNComponent = true;
 1202
 1203 // initialize the model including all operators and sub-graphs
 1204 Initialize(batchSize, verbose);
 1205
 1206 // if having dynamic tensor we need to have a Session
 1207 if (!fDynamicTensorInfos.empty()) {
 1208 fUseSession = true;
 1209 if (verbose)
 1210 std::cout << "Warning: Force having a Session since model has dynamic tensors " << std::endl;
 1211 }
 1212
 1213 std::string hgname;
 1214 if (!fIsGNNComponent && !fIsSubGraph) {
 1215 fGC.clear();
 1217 }
 1218
 1219 // generate first code for the subgraphs
 1220 for (auto &graph : fSubGraphs) {
 1221 if (fVerbose)
 1222 std::cout << "generate session code for subgraph " << graph->fName << std::endl;
 1223 graph->GenerateSessionCode();
 1224 fGC += graph->fGC;
 1225 }
 1226
 1227 if (fVerbose)
 1228 std::cout << "generate Main session code - model " << fName << std::endl;
 1229
 1230 // generate main session code
 1232
 1233 if (!fIsGNNComponent && !fIsSubGraph) {
 1234 fGC += ("} //TMVA_SOFIE_" + fName + "\n");
 1235 fGC += "\n#endif // " + hgname + "\n";
 1236 }
1237}
1238
// Emits into fGC the code that loads weight tensors at Session construction:
// either parsing the .dat text file via ReadTensorFromStream (text branch), or
// reading std::vector objects back from a ROOT file directory "<name>_weights"
// (ROOT branch, only when SOFIE_SUPPORT_ROOT_BINARY is defined).
// NOTE(review): doxygen extract — lines 1239 (signature, presumably
// RModel::ReadInitializedTensorsFromFile(long pos)), 1241 and 1274 (presumably
// the if/else on fWeightFile selecting the text vs ROOT branch) are elided;
// the indented closing braces below belong to those elided conditionals.
 1240 // generate the code to read initialized tensors from a text data file
 1242 // check if there are tensors to write
 1243
 1244 if (!fUseWeightFile) return;
 1245
 1246 fGC += " std::ifstream f;\n";
 1247 fGC += " f.open(filename);\n";
 1248 fGC += " if (!f.is_open()) {\n";
 1249 fGC += " throw std::runtime_error(\"tmva-sofie failed to open file \" + filename + \" for input weights\");\n";
 1250 fGC += " }\n";
 1251
 1252 if(fIsGNNComponent) {
 1253 fGC += " f.seekg(" + std::to_string(pos) + ");\n";
 1254 }
 1255
 1256 fGC += " using TMVA::Experimental::SOFIE::ReadTensorFromStream;\n";
 1257
 1258 // loop on tensors and parse the file
 1259 for (auto& i: fInitializedTensors) {
 1260 // skip Constant and shape tensors (not written in a file)
 1261 if (!i.second.IsWeightTensor()) continue;
 1262 std::string tensor_name = "tensor_" + i.first;
 1263 if (i.second.type() == ETensorType::FLOAT) {
 1264 std::string length = std::to_string(ConvertShapeToLength(i.second.shape()));
 1265 fGC += " ReadTensorFromStream(f, " + tensor_name + ", \"" + tensor_name + "\", " + length + ");\n";
 1266 } else {
 1267 throw std::runtime_error("tmva-sofie tensor " + tensor_name + " with type " + ConvertTypeToString(i.second.type()) + " cannot be read from a file");
 1268 }
 1269 }
 1270 fGC += " f.close();\n";
 1271 }
 1272
 1273 // generate the code to read initialized tensors from a ROOT data file
 1275#ifdef SOFIE_SUPPORT_ROOT_BINARY
 1276 fGC += " {\n";
 1277 fGC += " std::unique_ptr<TFile> rootFile(TFile::Open(filename.c_str(), \"READ\"));\n";
 1278 fGC += " if (!rootFile->IsOpen()) {\n";
 1279 fGC += " throw std::runtime_error(\"tmva-sofie failed to open ROOT file for input weights\");\n";
 1280 fGC += " }\n";
 1281
 1282 std::string dirName = fName + "_weights";
 1283 fGC += " if (!rootFile->GetKey(\"" + dirName + "\")) {\n";
 1284 fGC += " throw std::runtime_error(\"tmva-sofie failed to open ROOT directory for input weights\");\n";
 1285 fGC += " }\n";
 1286
 1287 for (auto &i : fInitializedTensors) {
 1288 // skip Constant and shape tensors
 1289 if (!i.second.IsWeightTensor()) continue;
 1290 fGC += " {\n";
 1291 std::string tensor_name = "tensor_" + i.first;
 1292 if (i.second.type() == ETensorType::FLOAT) {
 1293 fGC += " fTensor_" + i.first + " = *reinterpret_cast<std::vector<float>*>(rootFile->Get(\"";
 1294 fGC += dirName + "/" + tensor_name + "\"));\n";
 1295 } else if (i.second.type() == ETensorType::DOUBLE) {
// NOTE(review): `dirName + + "/"` below contains a stray unary '+' applied to
// the string literal — harmless but should be cleaned up to match the FLOAT
// and INT64 branches.
 1296 fGC += " fTensor_" + i.first + " = *reinterpret_cast<std::vector<double>*>(rootFile->Get(\"";
 1297 fGC += dirName + + "/" + tensor_name + "\"));\n";
 1298 } else if (i.second.type() == ETensorType::INT64) {
 1299 fGC += " fTensor_" + i.first + " = *reinterpret_cast<std::vector<int64_t>*>(rootFile->Get(\"";
 1300 fGC += dirName + "/" + tensor_name + "\"));\n";
 1301 } else {
// NOTE(review): BUG — the std::runtime_error below is constructed but never
// thrown (missing `throw`), so unsupported tensor types are silently ignored.
 1302 std::runtime_error("tmva-sofie tensor " + tensor_name + " with type " + ConvertTypeToString(i.second.type()) + " cannot be read from a ROOT file");
 1303 }
 1304 fGC += " }\n";
 1305 }
 1306 fGC += " }\n";
 1307#else
 1308 throw std::runtime_error("SOFIE was not built with ROOT file support.");
 1309#endif // SOFIE_SUPPORT_ROOT_BINARY
 1310 }
1311}
1312
// Writes all weight tensors either into a ROOT file (directory "<name>_weights",
// one std::vector object per tensor) or into a text .dat file ("name length"
// header line followed by the values). Returns the text-file write position
// (used to concatenate GNN components), or -1 otherwise.
// NOTE(review): doxygen extract — the switch case labels (lines 1317/1320/1323),
// line 1330 (presumably `filename = fName + fileExtension;`) and line 1334
// (presumably the `if (fWeightFile == WeightFileType::RootBinary) {` guard that
// the `} else if` below closes) are elided.
 1314 // Determine the file extension based on the weight file type
 1315 std::string fileExtension;
 1316 switch (fWeightFile) {
 1318 fileExtension = ".dat";
 1319 break;
 1321 fileExtension = ".root";
 1322 break;
 1324 fileExtension = ".dat";
 1325 break;
 1326 }
 1327
 1328 // If filename is empty, use the model name as the base filename
 1329 if (filename.empty()) {
 1331 }
 1332
 1333 // Write the initialized tensors to the file
 1335#ifdef SOFIE_SUPPORT_ROOT_BINARY
 1336 if(fIsGNNComponent || fIsGNN) {
 1337 throw std::runtime_error("SOFIE-GNN yet not supports writing to a ROOT file.");
 1338 }
 1339 std::unique_ptr<TFile> outputFile(TFile::Open(filename.c_str(), "UPDATE"));
 1340
 1341 std::string dirName = fName + "_weights";
 1342 // check if directory exists, in case delete to replace with new one
 1343 if (outputFile->GetKey(dirName.c_str()))
 1344 outputFile->rmdir(dirName.c_str());
 1345
 1346 auto outputDir = outputFile->mkdir(dirName.c_str());
 1347
 1348 for (const auto& item : fInitializedTensors) {
 1349 // skip Constant tensors and tensors which are not writable (e.g. shape tensors)
 1350 if (!item.second.IsWeightTensor()) continue;
 1351 std::string tensorName = "tensor_" + item.first;
 1352 size_t length = 1;
 1353 length = ConvertShapeToLength(item.second.shape());
 1354 if(item.second.type() == ETensorType::FLOAT) {
 1355 const float* data = item.second.data<float>();
 1356 std::vector<float> tensorDataVector(data, data + length);
 1357 outputDir->WriteObjectAny(&tensorDataVector, "std::vector<float>", tensorName.c_str());
 1358 }
 1359 else if(item.second.type() == ETensorType::DOUBLE) {
 1360 const double* data = item.second.data<double>();
 1361 std::vector<double> tensorDataVector(data, data + length);
 1362 outputDir->WriteObjectAny(&tensorDataVector, "std::vector<double>", tensorName.c_str());
 1363 }
 1364 else if(item.second.type() == ETensorType::INT64) {
 1365 const int64_t* data = item.second.data<int64_t>();
 1366 std::vector<int64_t> tensorDataVector(data, data + length);
 1367 outputDir->WriteObjectAny(&tensorDataVector, "std::vector<int64_t>", tensorName.c_str());
 1368 }
 1369 else {
// NOTE(review): BUG — std::runtime_error constructed but not thrown (missing
// `throw`); unsupported tensor types are silently skipped.
 1370 std::runtime_error("tmva-sofie tensor " + tensorName + " with type " + ConvertTypeToString(item.second.type()) +
 1371 " cannot be written to a ROOT file");
 1372 }
 1373 }
 1374 outputFile->Write(filename.c_str());
 1375
 1376 // this needs to be changed, similar to the text file
 1377 return -1;
 1378
 1379#else
 1380 throw std::runtime_error("SOFIE was not built with ROOT file support.");
 1381#endif // SOFIE_SUPPORT_ROOT_BINARY
 1382 } else if (fWeightFile == WeightFileType::Text) {
 1383 std::ofstream f;
 1384 if(fIsGNNComponent) {
 1385 // appending all GNN components into the same file
 1386 f.open(filename, std::ios::app);
 1387 } else {
 1388 f.open(filename);
 1389 }
 1390 if (!f.is_open())
 1391 throw
 1392 std::runtime_error("tmva-sofie failed to open file " + filename + " for tensor weight data");
 1393 for (auto& i: fInitializedTensors) {
 1394 // skip Constant tensors and not writable tensors (e.g. shape tensors)
 1395 if (!i.second.IsWeightTensor()) {
 1396 continue;
 1397 }
 1398 size_t length = ConvertShapeToLength(i.second.shape());
 1399 std::string tensor_name = "tensor_" + i.first;
 1400 f << tensor_name << " " << length << "\n";
 1401 if (i.second.type() == ETensorType::FLOAT) {
 1402 const float * data = i.second.data<float>();
 1403 for (size_t idx = 0; idx < length; idx++) {
 1404 // round to zero sub-normal values
 1405 float value = data[idx];
 1406 if (value != 0. && std::abs(value) < std::numeric_limits<float>::min() ) value = 0;
 1407 f << std::setprecision(std::numeric_limits<float>::max_digits10) << value;
 1408 f << ( (idx < length-1) ? " " : "\n" );
 1409 }
 1410 }
 1411 else {
 1412 throw std::runtime_error("tmva-sofie tensor " + tensor_name + " with type " + ConvertTypeToString(i.second.type()) + " cannot be written to a file");
 1413 }
// NOTE(review): BUG — std::runtime_error constructed but not thrown below;
// stream write failures are silently ignored.
 1414 if (f.fail())
 1415 std::runtime_error("tmva-sofie failed to write tensor data to file for " + tensor_name);
 1416 }
 1417 long curr_pos = f.tellp();
 1418 f.close();
 1419 return curr_pos;
 1420 } else {
 1421 return -1;
 1422 }
1423}
1424
// Debug dump of the model inputs: first the parameterized-shape inputs
// (fInputTensorInfos, printing the symbolic parameter or the concrete dim),
// then the fully-specified inputs (fReadyInputTensorInfos).
// NOTE(review): line 1425 (signature, RModel::PrintRequiredInputTensors())
// is elided from this extract.
 1426 std::cout << "Model requires following inputs:\n";
 1427 for (auto& inputInfo: fInputTensorInfos) {
 1428 std::cout << "Parametrised Tensor name: " << inputInfo.first << "\t";
 1429 std::cout << "type: " << ConvertTypeToString(inputInfo.second.type) << "\t";
 1430 std::cout << "shape: [";
 1431 for (size_t i = 0; i < inputInfo.second.shape.size(); i++) {
 1432 if (inputInfo.second.shape[i].isParam) {
 1433 std::cout << inputInfo.second.shape[i].param;
 1434 } else {
 1435 std::cout << inputInfo.second.shape[i].dim ;
 1436 }
 1437 if (i < inputInfo.second.shape.size() - 1) std::cout << ",";
 1438 }
 1439 std::cout << "]" << std::endl;
 1440 }
 1441
 1442 for (auto& inputInfo: fReadyInputTensorInfos) {
 1443 std::cout << "Fully Specified Tensor name: " << inputInfo.first << "\t";
 1444 std::cout << "type: " << ConvertTypeToString(inputInfo.second.type) << "\t";
 1445 std::cout << "shape: [";
 1446 for (size_t i = 0; i < inputInfo.second.shape.size(); i++) {
 1447 std::cout << inputInfo.second.shape[i];
 1448 if (i < inputInfo.second.shape.size() - 1) std::cout << ",";
 1449 }
 1450 std::cout << "]" << std::endl;
 1451 }
 1452 std::cout << "\n";
1453}
1454
// Debug dump of all initialized (weight/constant) tensors with type, shape and
// a marker for Constant or non-writable tensors.
// NOTE(review): line 1455 (signature, RModel::PrintInitializedTensors()) is
// elided from this extract.
 1456 std::cout << "Model initialized the following tensors:\n";
 1457 for (auto& it: fInitializedTensors) {
 1458 std::cout << "Tensor name: \"" << it.first << "\"\t";
 1459 std::cout << "type: " << ConvertTypeToString(it.second.type()) << "\t";
 1460 std::cout << "shape: [";
 1461 for (size_t i = 0; i < it.second.shape().size(); i++) {
 1462 std::cout << it.second.shape()[i];
 1463 if (i < it.second.shape().size() - 1) std::cout << ",";
 1464 }
 1465 std::cout << "]";
 1466 if (it.second.IsConstantTensor()) std::cout << " (Constant)";
 1467 else if (!it.second.IsWeightTensor()) std::cout << " (Not Writable)";
 1468 std::cout << std::endl;
 1469 }
 1470 std::cout << "\n";
1471}
1472
// Debug dump of intermediate tensors (fIntermediateTensorInfos) with type and
// static shape.
// NOTE(review): line 1473 (signature, RModel::PrintIntermediateTensors()) is
// elided from this extract.
 1474 std::cout << "Model specify the following intermediate tensors:\n";
 1475 for (auto& it: fIntermediateTensorInfos) {
 1476 std::cout << "Tensor name: \"" << it.first << "\"\t";
 1477 std::cout << "type: " << ConvertTypeToString(it.second.type) << "\t";
 1478 std::cout << "shape: [";
 1479 for (size_t i = 0; i < it.second.shape.size(); i++) {
 1480 std::cout << it.second.shape[i];
 1481 if (i < it.second.shape.size() - 1) std::cout << ",";
 1482 }
 1483 std::cout << "]" << std::endl;
 1484 }
 1485 std::cout << "\n";
1486}
1487
// Debug dump of dynamic tensors (fDynamicTensorInfos); dims may be symbolic,
// hence shape[i].GetVal() which renders either the value or the parameter.
// NOTE(review): line 1488 (signature, RModel::PrintDynamicTensors()) is elided
// from this extract.
 1489 std::cout << "Model specify the following dynamic tensors:\n";
 1490 for (auto& it: fDynamicTensorInfos) {
 1491 std::cout << "Tensor name: \"" << it.first << "\"\t";
 1492 std::cout << "type: " << ConvertTypeToString(it.second.type) << "\t";
 1493 std::cout << "shape: [";
 1494 for (size_t i = 0; i < it.second.shape.size(); i++) {
 1495 std::cout << it.second.shape[i].GetVal();
 1496 if (i < it.second.shape.size() - 1) std::cout << ",";
 1497 }
 1498 std::cout << "]" << std::endl;
 1499 }
 1500 std::cout << "\n";
1501}
1502
// Debug dump of the output tensor names; GetDimTensorShape may throw for
// not-yet-defined shapes, which is reported instead of propagated.
// NOTE(review): line 1503 (signature, RModel::PrintOutputTensors()) is elided
// from this extract.
 1504 std::cout << "Model specify the following output tensors:\n";
 1505 for (auto& it: fOutputTensorNames) {
 1506 std::cout << "Tensor name: \"" << it << "\"\t";
 1507 try {
 1508 auto shape = GetDimTensorShape(it);
 1509 std::cout << "with shape: " << ConvertShapeToString(shape) << std::endl;
 1510 } catch (...) {
 1511 std::cout << "with shape not yet defined" << std::endl;
 1512 }
 1513 }
 1514 std::cout << "\n";
1515}
1516
// Prints metadata and the first n_print data values of one initialized tensor
// (FLOAT only; other types print an empty data list).
// NOTE(review): line 1517 (signature, per the index:
// void HeadInitializedTensors(std::string name, int n_print=50)) is elided.
 1518 auto it = fInitializedTensors.find(name);
 1519 if (it == fInitializedTensors.end()) {
 1520 std::cout << "Tensor " << name << " not found in model's initialized tensor list" << std::endl;
 1521 return;
 1522 }
 1523
 1524 std::cout << "Tensor name: " << it->first << "\t";
 1525 std::cout << "type: " << ConvertTypeToString(it->second.type()) << "\t";
 1526 int length =1;
 1527 std::cout << "shape: [";
 1528 for (size_t i = 0; i < it->second.shape().size(); i++) {
 1529 std::cout << it->second.shape()[i];
 1530 length *= it->second.shape()[i];
 1531 if (i < it->second.shape().size() - 1) std::cout << ",";
 1532 }
 1533 std::cout << "]" << std::endl;
// NOTE(review): when n_print == length, ellipsis stays true and ", ..." is
// printed although all elements were shown — the condition below should
// arguably be `>=`.
 1534 bool ellipsis = true;
 1535 if (n_print > length) {
 1536 n_print = length;
 1537 ellipsis = false;
 1538 }
 1539
 1540 std::cout << "data: [" << std::endl;
 1541 if (it->second.type() == ETensorType::FLOAT) {
 1542 auto converted_data = it->second.data<float>();
 1543 for (int i =0; i < n_print; i++) {
 1544 std::cout << converted_data[i];
 1545 if (i < n_print - 1) std::cout << " ,";
 1546 }
 1547 }
 1548 if (ellipsis) std::cout << ", ...";
 1549 std::cout << "]" << std::endl;
 1550
 1551}
1552
// Writes the generated code and, if weights are used, writes the weight file:
// the weight filename is derived from the code filename (".hxx" replaced by
// ".dat" or ".root") or from the model name when no filename is given.
// NOTE(review): doxygen extract — lines 1555 (presumably the base-class/helper
// call writing fGC itself), 1561/1563 (the WeightFileType checks guarding the
// two filename rewrites) and 1571 (presumably WriteInitializedTensorsToFile)
// are elided; verify against the full source before editing.
1553void RModel::OutputGenerated(std::string filename, bool append) {
 1554
 1556
 1557 // write weights in a text file
 1558 if (fUseWeightFile) {
 1559 if (!filename.empty()) {
 1560 size_t pos = filename.find(".hxx");
 1562 filename.replace(pos, 4, ".dat");
 1564 filename = filename.erase(pos, 4);
 1565 filename += ".root";
 1566 }
 1567 } else {
 1568 filename = fName;
 1569 filename += fWeightFile == WeightFileType::Text ? ".dat" : ".root";
 1570 }
 1572 }
1573}
1574
1575void RModel::Streamer(TBuffer &R__b) {
1576 if (R__b.IsReading()) {
1577 RModel::Class()->ReadBuffer(R__b, this);
1578 for (auto & i : fInitializedTensors) {
1579 i.second.CastPersistentToShared();
1580 }
1581 }
1582 else {
1583 for (auto & i : fInitializedTensors) {
1584 i.second.CastSharedToPersistent();
1585 }
1586 RModel::Class()->WriteBuffer(R__b, this);
1587 }
1588}
1589
1590}//SOFIE
1591}//Experimental
1592}//TMVA
#define d(i)
Definition RSha256.hxx:102
#define b(i)
Definition RSha256.hxx:100
#define f(i)
Definition RSha256.hxx:104
#define a(i)
Definition RSha256.hxx:99
#define e(i)
Definition RSha256.hxx:103
size_t size(const MatrixT &matrix)
retrieve the size of a square matrix
ROOT::Detail::TRangeCast< T, true > TRangeDynCast
TRangeDynCast is an adapter class that allows the typed iteration through a TCollection.
winID h TVirtualViewer3D TVirtualGLPainter p
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void data
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void input
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t Int_t Int_t Window_t TString Int_t GCValues_t GetPrimarySelectionOwner GetDisplay GetScreen GetColormap GetNativeEvent const char const char dpyName wid window const char font_name cursor keysym reg const char only_if_exist regb h Point_t winding char text const char depth char const char Int_t count const char ColorStruct_t color const char filename
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t r
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t index
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t Int_t Int_t Window_t TString Int_t GCValues_t GetPrimarySelectionOwner GetDisplay GetScreen GetColormap GetNativeEvent const char const char dpyName wid window const char font_name cursor keysym reg const char only_if_exist regb h Point_t winding char text const char depth char const char Int_t count const char ColorStruct_t color const char Pixmap_t Pixmap_t PictureAttributes_t attr const char char ret_data h unsigned char height h length
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize id
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void value
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t Int_t Int_t Window_t TString Int_t GCValues_t GetPrimarySelectionOwner GetDisplay GetScreen GetColormap GetNativeEvent const char const char dpyName wid window const char font_name cursor keysym reg const char only_if_exist regb h Point_t winding char text const char depth char const char Int_t count const char ColorStruct_t color const char Pixmap_t Pixmap_t PictureAttributes_t attr const char char ret_data h unsigned char height h Atom_t Int_t ULong_t ULong_t unsigned char prop_list Atom_t Atom_t Atom_t Time_t type
char name[80]
Definition TGX11.cxx:110
const_iterator begin() const
const_iterator end() const
Buffer base class used for serializing objects.
Definition TBuffer.h:43
static TFile * Open(const char *name, Option_t *option="", const char *ftitle="", Int_t compress=ROOT::RCompressionSetting::EDefaults::kUseCompiledDefault, Int_t netopt=0)
Create / open a file.
Definition TFile.cxx:3764
void GenerateHeaderInfo(std::string &hgname)
void OutputGenerated(std::string filename="", bool append=false)
void AddBlasRoutines(std::vector< std::string > routines)
void AddNeededStdLib(std::string libname)
void AddShapeParam(const std::string &name, size_t def_value=0)
Definition RModel.cxx:296
std::vector< size_t > GetTensorShape(const std::string &name) const
Definition RModel.cxx:29
std::vector< Dim > GetDimTensorShape(const std::string &name) const
Definition RModel.cxx:65
std::unordered_map< std::string, DynamicTensorInfo > fDynamicTensorInfos
Definition RModel.hxx:30
bool IsDynamicTensor(const std::string &name) const
Definition RModel.cxx:247
void AddAliasTensor(const std::string &tensor_name, const std::string &orig_tensor_name)
Definition RModel.cxx:211
void AddIntermediateTensor(std::string tensor_name, ETensorType type, std::vector< Dim > dim_shape)
Definition RModel.cxx:262
std::string GenerateInferSignature(bool isdecl=true)
Definition RModel.cxx:915
bool CheckIfTensorAlreadyExist(std::string tensor_name)
Definition RModel.cxx:122
std::vector< std::unique_ptr< ROperator > > fOperators
Definition RModel.hxx:40
void OutputGenerated(std::string filename="", bool append=false)
Definition RModel.cxx:1553
std::unordered_map< std::string, std::string > fAliasTensors
Definition RModel.hxx:33
void AddInputTensorInfo(std::string input_name, ETensorType type, std::vector< Dim > shape)
Definition RModel.cxx:133
std::unordered_map< std::string, TensorInfo > fIntermediateTensorInfos
Definition RModel.hxx:29
void AddOutputTensorNameList(std::vector< std::string > output_tensor_names)
Definition RModel.cxx:304
std::unordered_map< std::string, TensorInfo > fReadyInputTensorInfos
Definition RModel.hxx:27
void AddConstantTensor(std::string tensor_name, ETensorType type, std::vector< std::size_t > shape, std::shared_ptr< void > data)
Definition RModel.cxx:193
void AddDynamicTensor(std::string tensor_name, ETensorType type, std::vector< Dim > shape)
Definition RModel.cxx:279
std::vector< std::string > fDimShapeNames
Definition RModel.hxx:34
void AddInitializedTensor(std::string tensor_name, ETensorType type, std::vector< std::size_t > shape, std::shared_ptr< void > data)
Definition RModel.cxx:183
std::unordered_map< std::string_view, size_t > fIntermediateTensorFrequencyLookup
! lookup table for intermediate tensor frequency (transient)
Definition RModel.hxx:47
void AddInputTensorName(std::string name)
Definition RModel.cxx:152
std::vector< std::string > fOutputTensorNames
Definition RModel.hxx:35
bool IsDimInputTensor(const std::string &name) const
Definition RModel.cxx:252
bool IsShapeTensor(const std::string &name) const
check if a tensor is a shape tensor
Definition RModel.cxx:221
bool IsInitializedTensor(const std::string &name) const
Definition RModel.cxx:234
bool IsAliasTensor(const std::string &name) const
check if a tensor is an alias tensor
Definition RModel.cxx:225
void CheckAndFlushIntermediateMemory(std::span< const std::string_view > op_output_tensors, const size_t &op_idx)
Definition RModel.cxx:449
void AddOperator(std::unique_ptr< ROperator > op, int order_execution=-1)
Definition RModel.cxx:156
void HeadInitializedTensors(std::string name, int n_print=50)
Definition RModel.cxx:1517
bool IsConstantTensor(const std::string &name) const
Definition RModel.cxx:238
void Initialize(int batchSize=-1, bool verbose=false)
Definition RModel.cxx:528
long WriteInitializedTensorsToFile(std::string filename="")
Definition RModel.cxx:1313
OptimizationLevel fOptimizationLevel
Definition RModel.hxx:24
void Generate(std::underlying_type_t< Options > options, int batchSize=-1, long pos=0, bool verbose=false)
Definition RModel.cxx:1174
std::vector< Dim > GetDynamicTensorShape(const std::string &name) const
Definition RModel.cxx:76
std::unordered_map< std::string, InputTensorInfo > fInputTensorInfos
Definition RModel.hxx:26
std::shared_ptr< void > GetInitializedTensorData(std::string tensor_name)
Definition RModel.cxx:327
MemoryPoolInfo fIntermediateMemoryInfo
! intermediate memory info (transient)
Definition RModel.hxx:46
std::string AllocateIntermediateMemory(std::span< const std::string_view > op_output_tensors)
Definition RModel.cxx:344
std::unordered_map< std::string, std::pair< std::vector< Dim >, bool > > fShapeTensors
Definition RModel.hxx:31
void InitializeSubGraph(std::shared_ptr< RModel > graph)
Definition RModel.cxx:663
std::unordered_map< std::string, std::string > fShapeParams
Definition RModel.hxx:32
void SetNotWritableInitializedTensor(const std::string &tensor_name)
Definition RModel.cxx:336
ETensorType GetTensorType(std::string name) const
Definition RModel.cxx:90
std::vector< std::string > fInputTensorNames
Definition RModel.hxx:36
std::unordered_map< std::string, InitializedTensor > fInitializedTensors
Definition RModel.hxx:28
void UpdateInitializedTensor(std::string tensor_name, ETensorType type, std::vector< std::size_t > shape, std::shared_ptr< void > data)
Definition RModel.cxx:318
const std::vector< Dim > & GetShapeTensorValues(const std::string &tensor_name) const
Definition RModel.cxx:229
std::vector< std::shared_ptr< RModel > > fSubGraphs
! sub-graph models (transient)
Definition RModel.hxx:42
bool IsReadyInputTensor(const std::string &name) const
Definition RModel.cxx:256
void UpdateOutputTensorList(std::vector< std::string > curr_output_tensor, std::vector< std::string > modify_output_tensor)
Definition RModel.cxx:311
void AddShapeTensor(const std::string &name, const std::vector< Dim > &shapeValues, bool scalar=false)
Definition RModel.cxx:203
const Int_t n
Definition legend1.C:16
std::string Clean_name(std::string input_tensor_name)
std::size_t ConvertShapeToLength(const std::vector< size_t > &shape)
std::vector< Dim > ConvertShapeToDim(const std::vector< size_t > &shape)
Convert shape from integer format to dynamic one (based on Dim)
constexpr size_t GetTypeSize(ETensorType type)
std::string ConvertValuesToString(size_t n, const T *data)
std::string GenerateConstantTensorCode(const std::pair< std::string, InitializedTensor > &t)
Definition RModel.cxx:695
std::vector< size_t > ConvertShapeToInt(const std::vector< Dim > &shape)
Convert shape based on Dim to integer format.
std::string ConvertTypeToString(ETensorType type)
std::underlying_type_t< Options > operator|(Options opA, Options opB)
Definition RModel.cxx:22
std::string ConvertDimShapeToLength(const std::vector< Dim > &shape)
std::string ConvertShapeToString(const std::vector< size_t > &shape)
std::string ConvertValToString(T value)
create variable transformations
std::map< size_t, TensorMemoryInfo > total_stack
std::map< size_t, size_t > available_stack