ROOT Reference Guide
 
RModel.cxx
1#include <limits>
2#include <algorithm>
3#include <cctype>
4#include <memory>
5
6#include "TFile.h"
7
8#include "TMVA/RModel.hxx"
10
11namespace TMVA {
12namespace Experimental {
13namespace SOFIE {
14
15std::underlying_type_t<Options> operator|(Options opA, Options opB) {
16 return static_cast<std::underlying_type_t<Options>>(opA) | static_cast<std::underlying_type_t<Options>>(opB);
17}
18std::underlying_type_t<Options> operator|(std::underlying_type_t<Options> opA, Options opB) {
19 return opA | static_cast<std::underlying_type_t<Options>>(opB);
20}
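// Usage note (hypothetical caller code, a minimal sketch): these operator| overloads
// let several SOFIE::Options flags be combined into the std::underlying_type_t<Options>
// value that RModel::Generate expects, e.g.
//
//   using TMVA::Experimental::SOFIE::Options;
//   // generate standalone code: no Session class and no separate weight file
//   model.Generate(Options::kNoSession | Options::kNoWeightFile);
//
// where `model` stands for an existing RModel instance.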
21
22RModel::RModel(RModel&& other) {
23 fInputTensorInfos = std::move(other.fInputTensorInfos);
24 fReadyInputTensorInfos = std::move(other.fReadyInputTensorInfos);
25 fOutputTensorNames = other.fOutputTensorNames;
26 fInputTensorNames = other.fInputTensorNames;
27 fOperators = std::move(other.fOperators);
28 fInitializedTensors = std::move(other.fInitializedTensors);
29 fIntermediateTensorInfos = std::move(other.fIntermediateTensorInfos);
30 fName = other.fName;
31 fFileName = other.fFileName;
32 fParseTime = other.fParseTime;
33 fGC = other.fGC;
34 fNeededBlasRoutines = other.fNeededBlasRoutines;
35 fNeededStdLib = other.fNeededStdLib;
36}
37
38RModel& RModel::operator=(RModel&& other) {
39 fInputTensorInfos = std::move(other.fInputTensorInfos);
40 fReadyInputTensorInfos = std::move(other.fReadyInputTensorInfos);
41 fOutputTensorNames = other.fOutputTensorNames;
42 fInputTensorNames = other.fInputTensorNames;
43 fOperators = std::move(other.fOperators);
44 fInitializedTensors = std::move(other.fInitializedTensors);
45 fIntermediateTensorInfos = std::move(other.fIntermediateTensorInfos);
46 fName = other.fName;
47 fFileName = other.fFileName;
48 fParseTime = other.fParseTime;
49 fGC = other.fGC;
50 fNeededBlasRoutines = other.fNeededBlasRoutines;
51 fNeededStdLib = other.fNeededStdLib;
52 return *this;
53}
54
55const std::vector<size_t>& RModel::GetTensorShape(std::string name) {
56 auto f = fReadyInputTensorInfos.find(name);
57 if (f != fReadyInputTensorInfos.end()) {
58 return f->second.shape;
59 }
60 auto f2 = fInitializedTensors.find(name);
61 if (f2 != fInitializedTensors.end()) {
62 return f2->second.fShape;
63 }
64 auto f3 = fInputTensorInfos.find(name);
65 if (f3 != fInputTensorInfos.end()) {
66 throw std::runtime_error("TMVA SOFIE tensor [" + name + "] is an input tensor with unspecified dimension parameter");
67 }
68 auto f4 = fIntermediateTensorInfos.find(name);
69 if (f4 != fIntermediateTensorInfos.end()) {
70 return f4->second.shape;
71 }
72
73 throw std::runtime_error("TMVA SOFIE tensor [" + name + "] for which the shape is requested is not found");
74}
75
76const ETensorType& RModel::GetTensorType(std::string name) {
77 auto f = fReadyInputTensorInfos.find(name);
78 if (f != fReadyInputTensorInfos.end()) {
79 return f->second.type;
80 }
81 auto f2 = fInitializedTensors.find(name);
82 if (f2 != fInitializedTensors.end()) {
83 return f2->second.fType;
84 }
85 auto f3 = fInputTensorInfos.find(name);
86 if (f3 != fInputTensorInfos.end()) {
87 return f3->second.type;
88 }
89 auto f4 = fIntermediateTensorInfos.find(name);
90 if (f4 != fIntermediateTensorInfos.end()) {
91 return f4->second.type;
92 }
93
94 throw std::runtime_error("TMVA SOFIE tensor [" + name + "] for which the type is requested is not found");
95}
96
97bool RModel::CheckIfTensorAlreadyExist(std::string tensor_name) {
98 if (fReadyInputTensorInfos.find(tensor_name) != fReadyInputTensorInfos.end()) return true;
99 if (fInitializedTensors.find(tensor_name) != fInitializedTensors.end()) return true;
100 if (fIntermediateTensorInfos.find(tensor_name) != fIntermediateTensorInfos.end()) return true;
101 return false;
102}
103
104void RModel::AddInputTensorInfo(std::string input_name, ETensorType type, std::vector<Dim> shape) {
105 input_name = UTILITY::Clean_name(input_name);
106 if (CheckIfTensorAlreadyExist(input_name)) {
107 throw std::runtime_error("TMVA-SOFIE: input tensor with name " + input_name + " already exists \n");
108 }
109
110 InputTensorInfo inputInfo { type, shape };
111 fInputTensorInfos[input_name] = inputInfo;
112}
113
114void RModel::AddInputTensorInfo(std::string input_name, ETensorType type, std::vector<size_t> shape) {
115 input_name = UTILITY::Clean_name(input_name);
116 if (CheckIfTensorAlreadyExist(input_name)) {
117 throw std::runtime_error("TMVA-SOFIE: input tensor with name " + input_name + " already exists \n");
118 }
119 TensorInfo inputInfo { type, shape };
120 fReadyInputTensorInfos[input_name] = inputInfo;
121}
122
123void RModel::AddInputTensorName(std::string input_name) {
124 fInputTensorNames.push_back(UTILITY::Clean_name(input_name));
125}
126
127void RModel::AddOperator(std::unique_ptr<ROperator> op, int order_execution) {
128 AddBlasRoutines(op->GetBlasRoutines());
129 auto libs = op->GetStdLibs();
130 for (auto& stdlib : libs) {
131 AddNeededStdLib(stdlib);
132 }
133 if (order_execution >= 0) {
134 fOperators.insert(fOperators.begin() + order_execution, std::move(op));
135 } else {
136 fOperators.push_back(std::move(op));
137 }
138}
139
140void RModel::AddInitializedTensor(std::string tensor_name, ETensorType type, std::vector<std::size_t> shape, std::shared_ptr<void> data) {
141 tensor_name = UTILITY::Clean_name(tensor_name);
142 //NB: own data
143 if (CheckIfTensorAlreadyExist(tensor_name)) {
144 throw std::runtime_error("TMVA-SOFIE: initialized tensor with name " + tensor_name + " already exists \n");
145 }
146 InitializedTensor new_tensor {type, shape, data};
147 fInitializedTensors[tensor_name] = new_tensor;
148
149}
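// Usage note (hypothetical caller code, a minimal sketch): AddInitializedTensor keeps
// the weight data alive through the std::shared_ptr<void>, so callers allocate a typed
// buffer and type-erase it, e.g. for a 2x3 FLOAT weight tensor:
//
//   std::shared_ptr<void> data(malloc(6 * sizeof(float)), free);
//   // ... fill static_cast<float*>(data.get()) with the 6 weight values ...
//   model.AddInitializedTensor("dense1/kernel:0", ETensorType::FLOAT, {2, 3}, data);
//
// The tensor name is passed through UTILITY::Clean_name before being stored.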
150
151bool RModel::IsInitializedTensor(const std::string& tensorName) const {
152 std::string name = UTILITY::Clean_name(tensorName);
153 return fInitializedTensors.find(name) != fInitializedTensors.end();
154}
155
156void RModel::AddIntermediateTensor(std::string tensor_name, ETensorType type, std::vector<std::size_t> shape) {
157 tensor_name = UTILITY::Clean_name(tensor_name);
158 if (CheckIfTensorAlreadyExist(tensor_name)) {
159 throw std::runtime_error("TMVA-SOFIE: intermediate tensor with name " + tensor_name + " already exists \n");
160 }
161 TensorInfo new_tensor {type, shape};
162 fIntermediateTensorInfos[tensor_name] = new_tensor;
163}
164
165void RModel::AddOutputTensorNameList(std::vector<std::string> outputtensornames) {
166 fOutputTensorNames.clear();
167 for(auto& it : outputtensornames) {
168 fOutputTensorNames.push_back(UTILITY::Clean_name(it));
169 }
170}
171
172void RModel::UpdateOutputTensorList(std::vector<std::string> curr_output_tensors, std::vector<std::string> new_output_tensors) {
173 for(auto& it:curr_output_tensors) {
174 fOutputTensorNames.erase(std::remove(fOutputTensorNames.begin(), fOutputTensorNames.end(), it), fOutputTensorNames.end());
175 }
176 fOutputTensorNames.insert(fOutputTensorNames.end(), new_output_tensors.begin(), new_output_tensors.end());
177}
178
179void RModel::UpdateInitializedTensor(std::string tensor_name, ETensorType type, std::vector<std::size_t> shape, std::shared_ptr<void> data) {
180 tensor_name = UTILITY::Clean_name(tensor_name);
181 if (!CheckIfTensorAlreadyExist(tensor_name)) {
182 throw std::runtime_error("TMVA-SOFIE: tensor " + tensor_name + " not found when trying to update it");
183 }
184 InitializedTensor new_tensor {type, shape, data};
185 fInitializedTensors[tensor_name] = new_tensor;
186}
187
188std::shared_ptr<void> RModel::GetInitializedTensorData(std::string tensor_name) {
189 auto f = fInitializedTensors.find(tensor_name);
190 if (f == fInitializedTensors.end()) {
191 throw std::runtime_error("TMVA-SOFIE: tensor " + tensor_name + " not found when trying to get its data");
192 } else {
193 return f->second.fData;
194 }
195}
196
197void RModel::Initialize(int batchSize) {
198 // check if there are only parametrized input tensor and convert in
199 // ready input tensor according to batch size
200 // convert parametric shape to a dimensional shape
202 if (fReadyInputTensorInfos.size() != fInputTensorNames.size()) {
203 if ( fReadyInputTensorInfos.size() + fInputTensorInfos.size() != fInputTensorNames.size())
204 throw std::runtime_error("TMVA-SOFIE: RModel::Initialize: invalid inputs");
205 for (auto & input : fInputTensorInfos) {
206 std::vector<size_t> shape;
207 shape.reserve(input.second.shape.size());
208 for (auto & d : input.second.shape) {
209 if (d.isParam)
210 shape.push_back(batchSize);
211 else
212 shape.push_back(d.dim);
213 }
214 AddInputTensorInfo(input.first, input.second.type, shape);
215 }
216 }
217 // check if there are initialized tensors to write in a weight file
218 // support for the time being only weight of FLOAT type
219 if (fUseWeightFile) {
220 bool modelHasWeights = false;
221 for (auto& i: fInitializedTensors) {
222 if (i.second.fType == ETensorType::FLOAT) {
223 modelHasWeights = true;
224 break;
225 }
226 }
227 if (!modelHasWeights) fUseWeightFile = false;
228 }
229
230 for (auto& i : fOperators) {
231 i->Initialize(*this);
232 }
233}
234
236 for (auto& i: fInitializedTensors) {
237 if (i.second.fType == ETensorType::FLOAT) {
238 size_t length = 1;
239 for (auto & dim: i.second.fShape) {
240 length *= dim;
241 }
242 if (!fUseWeightFile) {
243 fGC += "float tensor_" + i.first + "[" + std::to_string(length) + "] = {";
244 std::shared_ptr<float> data = std::static_pointer_cast<float>(i.second.fData);
245 std::stringstream floats;
246 for (size_t idx = 0; idx < length-1; idx++) {
247 floats << std::setprecision(std::numeric_limits<float>::max_digits10) << data.get()[idx] << ", ";
248 }
249 floats << std::setprecision(std::numeric_limits<float>::max_digits10) << data.get()[length-1];
250 fGC += floats.str();
251 fGC += "};\n";
252 }
253 else {
254 fGC += "std::vector<float> fTensor_" + i.first + " = std::vector<float>(" + std::to_string(length) + ");\n";
255 fGC += "float * tensor_" + i.first + " = fTensor_" + i.first + ".data();\n";
256 }
257
258 }
259 }
260}
261
263 for (auto&i: fIntermediateTensorInfos) {
264 size_t length = ConvertShapeToLength(i.second.shape);
265 if (i.second.type == ETensorType::FLOAT) {
266 fGC += "std::vector<float> fTensor_" + i.first + " = std::vector<float>(" + std::to_string(length) + ");\n";
267 fGC += "float * tensor_" + i.first + " = fTensor_" + i.first + ".data();\n";
268 }
269 if (i.second.type == ETensorType::DOUBLE) {
270 fGC += "std::vector<double> fTensor_" + i.first + " = std::vector<double>(" + std::to_string(length) + ");\n";
271 fGC += "double * tensor_" + i.first + " = fTensor_" + i.first + ".data();\n";
272 }
273 if (i.second.type == ETensorType::INT64) {
274 fGC += "std::vector<int64_t> fTensor_" + i.first + " = std::vector<int64_t>(" + std::to_string(length) + ");\n";
275 fGC += "int64_t * tensor_" + i.first + " = fTensor_" + i.first + ".data();\n";
276 }
277 }
278}
279
281 size_t outputSize = fOutputTensorNames.size();
282 // assume output types are all the same
283 std::string outputType;
284 if (outputSize == 1) {
285 auto f = fIntermediateTensorInfos.find(fOutputTensorNames[0]);
286 if (f == fIntermediateTensorInfos.end()) {
287 throw std::runtime_error("TMVA-SOFIE: output tensor " + fOutputTensorNames[0] + " not found when trying to get its info");
288 } else {
289 outputType = ConvertTypeToString(f->second.type);
290 fGC += "std::vector<" + outputType + "> ";
291 }
292 } else {
293 std::vector<ETensorType> outputTensorsTypes(outputSize);
294 for (size_t i = 0; i < outputSize; i++) {
295 auto f = fIntermediateTensorInfos.find(fOutputTensorNames[i]);
296 if (f == fIntermediateTensorInfos.end()) {
297 throw std::runtime_error("TMVA-SOFIE: output tensor " + fOutputTensorNames[i]
298 + " not found when trying to get its info");
299 } else {
300 outputTensorsTypes[i] = f->second.type;
301 }
302 }
303 // assume all output types are the same
304 outputType = ConvertTypeToString(outputTensorsTypes[0]);
305 for (size_t i = 0; i < outputSize; i++) {
306 if (outputTensorsTypes[i] != outputTensorsTypes[0]) {
307 throw std::runtime_error("TMVA-SOFIE: output tensor " + fOutputTensorNames[i] + " is of different type.");
308 }
309 }
310 fGC += "std::vector<std::vector<" + outputType + ">> ";
311 }
312
313 fGC += "infer(";
314
315 for(size_t i = 0; i<fInputTensorNames.size(); ++i) {
316 switch (GetTensorType(fInputTensorNames[i])) {
317 case ETensorType::FLOAT : {
318 fGC += "float* tensor_" + fInputTensorNames[i] + ",";
319 break;
320 }
321 case ETensorType::INT32 : {
322 fGC += "int32_t* tensor_" + fInputTensorNames[i] + ",";
323 break;
324 }
325 case ETensorType::INT64 : {
326 fGC += "int64_t* tensor_" + fInputTensorNames[i] + ",";
327 break;
328 }
329 case ETensorType::DOUBLE : {
330 fGC += "double* tensor_" + fInputTensorNames[i] + ",";
331 break;
332 }
333 default: {
334 throw std::runtime_error("TMVA-SOFIE: input tensor " + fInputTensorNames[i] + " is of a data type which is not yet supported.");
335 }
336 }
337 }
338
339 fGC.pop_back(); //remove last ","
340 fGC += "){\n";
341
342 const std::string SP = " ";
343
344 for (size_t id = 0; id < fOperators.size() ; id++) {
345 fGC+= (fOperators[id]->Generate(std::to_string(id)));
346 }
347
348 if (outputSize == 1) {
349 size_t outputLength = ConvertShapeToLength(GetTensorShape(fOutputTensorNames[0]));
350
351 fGC += SP + "std::vector<" + outputType + "> ret (tensor_" + fOutputTensorNames[0] + ", tensor_" + fOutputTensorNames[0] + " + " +
352 std::to_string(outputLength) + ");\n";
353 } else {
354 for (size_t i = 0; i < outputSize; i++) {
355 if (!fOutputTensorNames[i].empty()) {
356 size_t outputLength = ConvertShapeToLength(GetTensorShape(fOutputTensorNames[i]));
357 fGC += SP + "std::vector<" + outputType + "> ret_";
358 fGC += std::to_string(i);
359 fGC += " (tensor_" + fOutputTensorNames[i] + ", tensor_" + fOutputTensorNames[i] + " + " +
360 std::to_string(outputLength) + ");\n";
361 }
362 }
363 fGC += SP + "std::vector<std::vector<" + outputType + ">> ret({";
364 for (size_t i = 0; i < outputSize; i++) {
365 if (fOutputTensorNames[i].empty()) {
366 fGC += "{}";
367 } else {
368 fGC += "ret_";
369 fGC += std::to_string(i);
370 }
371 if (i < outputSize - 1) {
372 fGC += ",";
373 }
374 }
375 fGC += "});\n";
376 }
377 fGC += SP + "return ret;\n";
378 fGC += "}\n";
379}
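// Note (sketch of the emitted code, single-output FLOAT case): the function above
// assembles an inference routine of roughly this shape in fGC,
//
//   std::vector<float> infer(float* tensor_input){
//      // ... code emitted by each ROperator::Generate call ...
//      std::vector<float> ret (tensor_output, tensor_output + N);
//      return ret;
//   }
//
// where "input"/"output" stand for the cleaned tensor names and N is the output length;
// with several outputs a std::vector<std::vector<T>> is returned instead, with an empty
// entry for every empty output name.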
380
381void RModel::Generate(std::underlying_type_t<Options> options, int batchSize, long pos) {
382 // session flag is used in operator initialize
383 if (static_cast<std::underlying_type_t<Options>>(Options::kNoSession) & options) {
384 fUseSession = false;
385 fWeightFile = WeightFileType::None;
386 }
387 if (static_cast<std::underlying_type_t<Options>>(Options::kNoWeightFile) & options) {
388 fUseWeightFile = false;
389 fWeightFile = WeightFileType::None;
390 }
391 if (static_cast<std::underlying_type_t<Options>>(Options::kRootBinaryWeightFile) & options) {
392 fUseWeightFile = true;
393 fWeightFile = WeightFileType::RootBinary;
394 }
395 if (fUseWeightFile && !fUseSession) {
396 throw
397 std::runtime_error("TMVA-SOFIE: RModel::Generate: cannot use a separate weight file without generating a Session class");
398 }
399
400 if (static_cast<std::underlying_type_t<Options>>(Options::kGNN) & options)
401 fIsGNN = true;
402 if (static_cast<std::underlying_type_t<Options>>(Options::kGNNComponent) & options)
403 fIsGNNComponent = true;
404
405 Initialize(batchSize);
406 std::string hgname;
407 if(!fIsGNNComponent) {
408 fGC.clear();
409 GenerateHeaderInfo(hgname);
410 if (fUseSession) {
411 fGC += "struct Session {\n";
412 }
413 }
414
417
418 if (fUseSession) {
419 // add here specific operator code that needs to define session data members
420 fGC += "\n";
421 for (size_t id = 0; id < fOperators.size(); id++) {
422 std::string opName = std::to_string(id);
423 fGC += fOperators[id]->GenerateSessionMembersCode(opName);
424 }
425 fGC += "\n";
426 // here add initialization and reading of weight tensors
427 if (fUseWeightFile) {
428 fGC += "Session(std::string filename =\"\") {\n";
429 fGC += " if (filename.empty()) filename = \"" + fName;
430 if (fWeightFile == WeightFileType::Text) {
431 fGC += ".dat\";\n";
432 }
433 if (fWeightFile == WeightFileType::RootBinary) {
434 fGC += ".root\";\n";
435 }
436 ReadInitializedTensorsFromFile(pos);
437 //fUseWeightFile = fUseWeightFile;
438 } else {
439 // no need to pass weight file since it is not used
440 // keep passing a string for compatibility
441 fGC += "Session(std::string = \"\") {\n";
442 }
443
444 // add here initialization code
445 for (size_t id = 0; id < fOperators.size() ; id++) {
446 fGC += fOperators[id]->GenerateInitCode();
447 }
448
449 fGC += "}\n\n";
450 }
451
453
454 if(!fIsGNNComponent) {
455 if (fUseSession) {
456 fGC += "};\n";
457 }
458 fGC += ("} //TMVA_SOFIE_" + fName + "\n");
459 fGC += "\n#endif // " + hgname + "\n";
460 }
461}
462
463void RModel::ReadInitializedTensorsFromFile(long pos) {
464 // generate the code to read initialized tensors from a text data file
465 if (fWeightFile == WeightFileType::Text) {
466 if (fInitializedTensors.empty()) return;
467
468 fGC += " std::ifstream f;\n";
469 fGC += " f.open(filename);\n";
470 fGC += " if (!f.is_open()) {\n";
471 fGC += " throw std::runtime_error(\"tmva-sofie failed to open file for input weights\");\n";
472 fGC += " }\n";
473
474 if(fIsGNNComponent) {
475 fGC += " f.seekg(" + std::to_string(pos) + ");\n";
476 }
477
478 fGC += " std::string tensor_name;\n";
479 fGC += " size_t length;\n";
480
481 // loop on tensors and parse the file
482 for (auto& i: fInitializedTensors) {
483 if (i.second.fType == ETensorType::FLOAT) {
484 size_t length = 1;
485 length = ConvertShapeToLength(i.second.fShape);
486 std::string tensor_name = "tensor_" + i.first;
487 std::string slength = std::to_string(length);
488 fGC += " f >> tensor_name >> length;\n";
489 fGC += " if (tensor_name != \"" + tensor_name + "\" ) {\n";
490 fGC += " std::string err_msg = \"TMVA-SOFIE failed to read the correct tensor name; expected name is " +
491 tensor_name + " , read \" + tensor_name;\n";
492 fGC += " throw std::runtime_error(err_msg);\n";
493 fGC += " }\n";
494 fGC += " if (length != " + slength + ") {\n";
495 fGC += " std::string err_msg = \"TMVA-SOFIE failed to read the correct tensor size; expected size is " +
496 slength + " , read \" + std::to_string(length) ;\n";
497 fGC += " throw std::runtime_error(err_msg);\n";
498 fGC += " }\n";
499 fGC += " for (size_t i = 0; i < length; ++i)\n";
500 fGC += " f >> " + tensor_name + "[i];\n";
501 }
502 }
503 fGC += " f.close();\n";
504 }
505
506 // generate the code to read initialized tensors from a ROOT data file
507 if (fWeightFile == WeightFileType::RootBinary) {
508 fGC += " {\n";
509 fGC += " std::unique_ptr<TFile> rootFile(TFile::Open(filename.c_str(), \"READ\"));\n";
510 fGC += " if (!rootFile->IsOpen()) {\n";
511 fGC += " throw std::runtime_error(\"tmva-sofie failed to open ROOT file for input weights\");\n";
512 fGC += " }\n";
513
514 std::string dirName = fName + "_weights";
515 fGC += " if (!rootFile->GetKey(\"" + dirName + "\")) {\n";
516 fGC += " throw std::runtime_error(\"tmva-sofie failed to open ROOT directory for input weights\");\n";
517 fGC += " }\n";
518
519 for (auto &i : fInitializedTensors) {
520 fGC += " {\n";
521 std::string tensor_name = "tensor_" + i.first;
522 if (i.second.fType == ETensorType::FLOAT) {
523 fGC += " fTensor_" + i.first + " = *reinterpret_cast<std::vector<float>*>(rootFile->Get(\"";
524 fGC += dirName + "/" + tensor_name + "\"));\n";
525 } else if (i.second.fType == ETensorType::DOUBLE) {
526 fGC += " fTensor_" + i.first + " = *reinterpret_cast<std::vector<double>*>(rootFile->Get(\"";
527 fGC += dirName + "/" + tensor_name + "\"));\n";
528 } else if (i.second.fType == ETensorType::INT64) {
529 fGC += " fTensor_" + i.first + " = *reinterpret_cast<std::vector<int64_t>*>(rootFile->Get(\"";
530 fGC += dirName + "/" + tensor_name + "\"));\n";
531 }
532 fGC += " }\n";
533 }
534 fGC += " }\n";
535 }
536}
537
538long RModel::WriteInitializedTensorsToFile(std::string filename) {
539 // Determine the file extension based on the weight file type
540 std::string fileExtension;
541 switch (fWeightFile) {
542 case WeightFileType::None:
543 fileExtension = ".dat";
544 break;
545 case WeightFileType::RootBinary:
546 fileExtension = ".root";
547 break;
548 case WeightFileType::Text:
549 fileExtension = ".dat";
550 break;
551 }
552
553 // If filename is empty, use the model name as the base filename
554 if (filename.empty()) {
555 filename = fFileName + fileExtension;
556 }
557
558 // Write the initialized tensors to the file
559 if (fWeightFile == WeightFileType::RootBinary) {
560 if(fIsGNNComponent || fIsGNN) {
561 throw std::runtime_error("SOFIE-GNN does not yet support writing to a ROOT file.");
562 }
563 std::unique_ptr<TFile> outputFile(TFile::Open(filename.c_str(), "UPDATE"));
564
565 std::string dirName = fName + "_weights";
566 // check if directory exists, in case delete to replace with new one
567 if (outputFile->GetKey(dirName.c_str()))
568 outputFile->rmdir(dirName.c_str());
569
570 auto outputDir = outputFile->mkdir(dirName.c_str());
571
572 for (const auto& item : fInitializedTensors) {
573 std::string tensorName = "tensor_" + item.first;
574 size_t length = 1;
575 length = ConvertShapeToLength(item.second.fShape);
576 if(item.second.fType == ETensorType::FLOAT) {
577 const std::shared_ptr<void> ptr = item.second.fData; // shared_ptr<void> instance
578 const float* data = (std::static_pointer_cast<float>(item.second.fData)).get();
579 std::vector<float> tensorDataVector(data, data + length);
580 outputDir->WriteObjectAny(&tensorDataVector, "std::vector<float>", tensorName.c_str());
581 }
582 else if(item.second.fType == ETensorType::DOUBLE) {
583 const std::shared_ptr<void> ptr = item.second.fData; // shared_ptr<void> instance
584 const double* data = (std::static_pointer_cast<double>(item.second.fData)).get();
585 std::vector<double> tensorDataVector(data, data + length);
586 outputDir->WriteObjectAny(&tensorDataVector, "std::vector<double>", tensorName.c_str());
587 }
588 else if(item.second.fType == ETensorType::INT64) {
589 const std::shared_ptr<void> ptr = item.second.fData; // shared_ptr<void> instance
590 const int64_t* data = (std::static_pointer_cast<int64_t>(item.second.fData)).get();
591 std::vector<int64_t> tensorDataVector(data, data + length);
592 outputDir->WriteObjectAny(&tensorDataVector, "std::vector<int64_t>", tensorName.c_str());
593 }
594 }
595 outputFile->Write(filename.c_str());
596
597 // this needs to be changed, similar to the text file
598 return -1;
599
600 } else if (fWeightFile == WeightFileType::Text) {
601 std::ofstream f;
602 if(fIsGNNComponent) {
603 // appending all GNN components into the same file
604 f.open(filename, std::ios::app);
605 } else {
606 f.open(filename);
607 }
608 if (!f.is_open())
609 throw
610 std::runtime_error("tmva-sofie failed to open file for tensor weight data");
611 for (auto& i: fInitializedTensors) {
612 if (i.second.fType == ETensorType::FLOAT) {
613 size_t length = 1;
614 for (auto &dim : i.second.fShape) {
615 length *= dim;
616 }
617 std::string tensor_name = "tensor_" + i.first;
618 f << tensor_name << " " << length << "\n";
619 const float * data = (std::static_pointer_cast<float>(i.second.fData)).get();
620 for (size_t idx = 0; idx < length - 1; idx++) {
621 f << std::setprecision(std::numeric_limits<float>::max_digits10) << data[idx] << " ";
622 }
623 f << std::setprecision(std::numeric_limits<float>::max_digits10) << data[length - 1];
624 f << "\n";
625 }
626 }
627 long curr_pos = f.tellp();
628 f.close();
629 return curr_pos;
630 } else {
631 return -1;
632 }
633}
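// Note (illustrative sample, assuming a FLOAT tensor named "dense_bias" of length 3):
// with WeightFileType::Text each tensor is written as a "tensor_<name> <length>" header
// line followed by its space-separated values, which is the format parsed back by the
// reading code generated earlier in this file, e.g.
//
//   tensor_dense_bias 3
//   0.1 -0.25 0.33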
634
635void RModel::PrintRequiredInputTensors() {
636 std::cout << "Model requires the following inputs:\n";
637 for (auto& inputInfo: fInputTensorInfos) {
638 std::cout << "Parameterised Tensor name: " << inputInfo.first << "\t";
639 std::cout << "type: " << ConvertTypeToString(inputInfo.second.type) << "\t";
640 std::cout << "shape: [";
641 for (size_t i = 0; i < inputInfo.second.shape.size(); i++) {
642 if (inputInfo.second.shape[i].isParam) {
643 std::cout << inputInfo.second.shape[i].param;
644 } else {
645 std::cout << inputInfo.second.shape[i].dim ;
646 }
647 if (i < inputInfo.second.shape.size() - 1) std::cout << ",";
648 }
649 std::cout << "]" << std::endl;
650 }
651
652 for (auto& inputInfo: fReadyInputTensorInfos) {
653 std::cout << "Fully Specified Tensor name: " << inputInfo.first << "\t";
654 std::cout << "type: " << ConvertTypeToString(inputInfo.second.type) << "\t";
655 std::cout << "shape: [";
656 for (size_t i = 0; i < inputInfo.second.shape.size(); i++) {
657 std::cout << inputInfo.second.shape[i];
658 if (i < inputInfo.second.shape.size() - 1) std::cout << ",";
659 }
660 std::cout << "]" << std::endl;
661 }
662
663}
664
665void RModel::PrintInitializedTensors() {
666 std::cout << "Model initialized the following tensors:\n";
667 for (auto& it: fInitializedTensors) {
668 std::cout << "Tensor name: \"" << it.first << "\"\t";
669 std::cout << "type: " << ConvertTypeToString(it.second.fType) << "\t";
670 std::cout << "shape: [";
671 for (size_t i = 0; i < it.second.fShape.size(); i++) {
672 std::cout << it.second.fShape[i];
673 if (i < it.second.fShape.size() - 1) std::cout << ",";
674 }
675 std::cout << "]" << std::endl;
676 }
677}
678
679void RModel::PrintIntermediateTensors() {
680 std::cout << "Model specifies the following intermediate tensors:\n";
681 for (auto& it: fIntermediateTensorInfos) {
682 std::cout << "Tensor name: \"" << it.first << "\"\t";
683 std::cout << "type: " << ConvertTypeToString(it.second.type) << "\t";
684 std::cout << "shape: [";
685 for (size_t i = 0; i < it.second.shape.size(); i++) {
686 std::cout << it.second.shape[i];
687 if (i < it.second.shape.size() - 1) std::cout << ",";
688 }
689 std::cout << "]" << std::endl;
690 }
691}
692
693void RModel::PrintOutputTensors() {
694 std::cout << "Model specifies the following output tensors:\n";
695 for (auto& it: fOutputTensorNames) {
696 std::cout << "Tensor name: \"" << it << "\"\t";
697 std::cout << "shape: " << ConvertShapeToString(GetTensorShape(it)) << std::endl;
698 }
699}
700
701void RModel::HeadInitializedTensors(std::string name, int n_print) {
702 auto it = fInitializedTensors.find(name);
703 if (it == fInitializedTensors.end()) {
704 std::cout << "Tensor " << name << " not found in model's initialized tensor list" << std::endl;
705 return;
706 }
707
708 std::cout << "Tensor name: " << it->first << "\t";
709 std::cout << "type: " << ConvertTypeToString(it->second.fType) << "\t";
710 int length =1;
711 std::cout << "shape: [";
712 for (size_t i = 0; i < it->second.fShape.size(); i++) {
713 std::cout << it->second.fShape[i];
714 length *= it->second.fShape[i];
715 if (i < it->second.fShape.size() - 1) std::cout << ",";
716 }
717 std::cout << "]" << std::endl;
718 bool ellipsis = true;
719 if (n_print > length) {
720 n_print = length;
721 ellipsis = false;
722 }
723
724 std::cout << "data: [" << std::endl;
725 if (it->second.fType == ETensorType::FLOAT) {
726 auto converted_data = std::static_pointer_cast<float>(it->second.fData).get();
727 for (int i =0; i < n_print; i++) {
728 std::cout << converted_data[i];
729 if (i < n_print - 1) std::cout << " ,";
730 }
731 }
732 if (ellipsis) std::cout << ", ...";
733 std::cout << "]" << std::endl;
734
735}
736
737void RModel::OutputGenerated(std::string filename, bool append) {
738
740
741 // write weights in a text file
742 if (fUseWeightFile) {
743 if (!filename.empty()) {
744 size_t pos = filename.find(".hxx");
745 if (fWeightFile == WeightFileType::Text)
746 filename.replace(pos, 4, ".dat");
747 if (fWeightFile == WeightFileType::RootBinary) {
748 filename = filename.erase(pos, 4);
749 filename += ".root";
750 }
751 } else {
752 filename = fName;
753 filename += fWeightFile == WeightFileType::Text ? ".dat" : ".root";
754 }
754 }
755 WriteInitializedTensorsToFile(filename);
756 }
757}
758
759void RModel::Streamer(TBuffer &R__b) {
760 if (R__b.IsReading()) {
761 RModel::Class()->ReadBuffer(R__b, this);
762 for(auto i=RModel::fInitializedTensors.begin(); i!=RModel::fInitializedTensors.end(); ++i) {
763 i->second.CastPersistentToShared();
764 }
765 }
766 else {
767 for(auto i=RModel::fInitializedTensors.begin(); i!=RModel::fInitializedTensors.end(); ++i) {
768 i->second.CastSharedToPersistent();
769 }
770 RModel::Class()->WriteBuffer(R__b, this);
771 }
772}
773
774}//SOFIE
775}//Experimental
776}//TMVA
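A minimal end-to-end sketch (hypothetical caller code; it assumes an RModel instance named `model`, e.g. obtained from one of the SOFIE parsers such as RModelParser_ONNX):

   using namespace TMVA::Experimental::SOFIE;
   model.PrintRequiredInputTensors();                          // inspect the expected inputs
   model.Generate(Options::kNoSession | Options::kNoWeightFile, /*batchSize=*/1);
   model.OutputGenerated("MyModel.hxx");                       // write the generated header

With the default options, Generate() instead produces a Session class plus a separate weight file, and the generated code lives in the namespace TMVA_SOFIE_<model name> built by GenerateHeaderInfo and the closing braces emitted above.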
Buffer base class used for serializing objects.
Definition TBuffer.h:43
Bool_t IsReading() const
Definition TBuffer.h:86
Int_t ReadBuffer(TBuffer &b, void *pointer, Int_t version, UInt_t start, UInt_t count)
Function called by the Streamer functions to deserialize information from buffer b into object at p.
Definition TClass.cxx:6758
Int_t WriteBuffer(TBuffer &b, void *pointer, const char *info="")
Function called by the Streamer functions to serialize object at p to buffer b.
Definition TClass.cxx:6779
static TFile * Open(const char *name, Option_t *option="", const char *ftitle="", Int_t compress=ROOT::RCompressionSetting::EDefaults::kUseCompiledDefault, Int_t netopt=0)
Create / open a file.
Definition TFile.cxx:4075
void GenerateHeaderInfo(std::string &hgname)
std::unordered_set< std::string > fNeededBlasRoutines
void OutputGenerated(std::string filename="", bool append=false)
std::unordered_set< std::string > fNeededStdLib
void AddBlasRoutines(std::vector< std::string > routines)
void AddNeededStdLib(std::string libname)
void AddOutputTensorNameList(std::vector< std::string > outputtensornames)
Definition RModel.cxx:165
const ETensorType & GetTensorType(std::string name)
Definition RModel.cxx:76
void AddIntermediateTensor(std::string tensor_name, ETensorType type, std::vector< std::size_t > shape)
Definition RModel.cxx:156
bool CheckIfTensorAlreadyExist(std::string tensor_name)
Definition RModel.cxx:97
std::vector< std::unique_ptr< ROperator > > fOperators
Definition RModel.hxx:23
void OutputGenerated(std::string filename="", bool append=false)
Definition RModel.cxx:737
void AddInputTensorInfo(std::string input_name, ETensorType type, std::vector< Dim > shape)
Definition RModel.cxx:104
void Initialize(int batchSize=1)
Definition RModel.cxx:197
std::unordered_map< std::string, TensorInfo > fIntermediateTensorInfos
Definition RModel.hxx:19
std::unordered_map< std::string, TensorInfo > fReadyInputTensorInfos
Definition RModel.hxx:17
void AddInitializedTensor(std::string tensor_name, ETensorType type, std::vector< std::size_t > shape, std::shared_ptr< void > data)
Definition RModel.cxx:140
RModel & operator=(RModel &&other)
Definition RModel.cxx:38
void AddInputTensorName(std::string name)
Definition RModel.cxx:123
std::vector< std::string > fOutputTensorNames
Definition RModel.hxx:20
bool IsInitializedTensor(const std::string &name) const
Definition RModel.cxx:151
void AddOperator(std::unique_ptr< ROperator > op, int order_execution=-1)
Definition RModel.cxx:127
void HeadInitializedTensors(std::string name, int n_print=50)
Definition RModel.cxx:701
const std::vector< size_t > & GetTensorShape(std::string name)
Definition RModel.cxx:55
long WriteInitializedTensorsToFile(std::string filename="")
Definition RModel.cxx:538
void Generate(std::underlying_type_t< Options > options, int batchSize=1, long pos=0)
Definition RModel.cxx:381
std::unordered_map< std::string, InputTensorInfo > fInputTensorInfos
Definition RModel.hxx:16
std::shared_ptr< void > GetInitializedTensorData(std::string tensor_name)
Definition RModel.cxx:188
std::vector< std::string > fInputTensorNames
Definition RModel.hxx:21
std::unordered_map< std::string, InitializedTensor > fInitializedTensors
Definition RModel.hxx:18
void UpdateInitializedTensor(std::string tensor_name, ETensorType type, std::vector< std::size_t > shape, std::shared_ptr< void > data)
Definition RModel.cxx:179
void UpdateOutputTensorList(std::vector< std::string > curr_output_tensor, std::vector< std::string > modify_output_tensor)
Definition RModel.cxx:172
virtual void Streamer(TBuffer &)
Stream an object of class TObject.
Definition TObject.cxx:888
static TClass * Class()
std::string Clean_name(std::string input_tensor_name)
std::string ConvertShapeToString(std::vector< size_t > shape)
std::string ConvertTypeToString(ETensorType type)
std::underlying_type_t< Options > operator|(Options opA, Options opB)
Definition RModel.cxx:15
std::size_t ConvertShapeToLength(std::vector< size_t > shape)