Logo ROOT  
Reference Guide
 
Loading...
Searching...
No Matches
CodegenContext.cxx
Go to the documentation of this file.
1/*
2 * Project: RooFit
3 * Authors:
4 * Garima Singh, CERN 2023
5 * Jonas Rembser, CERN 2023
6 *
7 * Copyright (c) 2023, CERN
8 *
9 * Redistribution and use in source and binary forms,
10 * with or without modification, are permitted according to the terms
11 * listed in LICENSE (http://roofit.sourceforge.net/license.txt)
12 */
13
15#include <RooAbsArg.h>
16
17#include "RooFitImplHelpers.h"
18
19#include <TInterpreter.h>
20
21#include <algorithm>
22#include <cctype>
23#include <charconv>
24#include <fstream>
25#include <type_traits>
26#include <unordered_map>
27
28namespace {
29
/// Check whether `str` begins with the character sequence `prefix`.
/// An empty prefix matches every string, including the empty one.
bool startsWith(std::string_view str, std::string_view prefix)
{
   // A prefix longer than the string itself can never match.
   if (prefix.size() > str.size()) {
      return false;
   }
   return str.substr(0, prefix.size()) == prefix;
}
34
35} // namespace
36
37namespace RooFit {
38namespace Experimental {
39
40/// @brief Adds (or overwrites) the string representing the result of a node.
41/// @param key The name of the node to add the result for.
42/// @param value The new name to assign/overwrite.
43void CodegenContext::addResult(const char *key, std::string const &value)
44{
45 const TNamed *namePtr = RooNameReg::known(key);
46 if (namePtr)
47 addResult(namePtr, value);
48}
49
50void CodegenContext::addResult(TNamed const *key, std::string const &value)
51{
52 _nodeNames[key] = value;
53}
54
55/// @brief Gets the result for the given node using the node name. This node also performs the necessary
56/// code generation through recursive calls to 'translate'. A call to this function modifies the already
57/// existing code body.
58/// @param key The node to get the result string for.
59/// @return String representing the result of this node.
60std::string const &CodegenContext::getResult(RooAbsArg const &arg)
61{
62 // If the result has already been recorded, just return the result.
63 // It is usually the responsibility of each translate function to assign
64 // the proper result to its class. Hence, if a result has already been recorded
65 // for a particular node, it means the node has already been 'translate'd and we
66 // dont need to visit it again.
67 auto found = _nodeNames.find(arg.namePtr());
68 if (found != _nodeNames.end())
69 return found->second;
70
71 // The result for vector observables should already be in the map if you
72 // opened the loop scope. This is just to check if we did not request the
73 // result of a vector-valued observable outside of the scope of a loop.
74 auto foundVecObs = _vecObsIndices.find(arg.namePtr());
75 if (foundVecObs != _vecObsIndices.end()) {
76 throw std::runtime_error("You requested the result of a vector observable outside a loop scope for it!");
77 }
78
79 auto RAII(OutputScopeRangeComment(&arg));
80
81 // Now, recursively call translate into the current argument to load the correct result.
82 codegen(const_cast<RooAbsArg &>(arg), *this);
83
84 return _nodeNames.at(arg.namePtr());
85}
86
87/// @brief Adds the given string to the string block that will be emitted at the top of the squashed function. Useful
88/// for variable declarations.
89/// @param str The string to add to the global scope.
90void CodegenContext::addToGlobalScope(std::string const &str)
91{
92 // Introduce proper indentation for multiline strings.
93 _code[0] += str;
94}
95
96/// @brief Since the squashed code represents all observables as a single flattened array, it is important
97/// to keep track of the start index for a vector valued observable which can later be expanded to access the correct
98/// element. For example, a vector valued variable x with 10 entries will be squashed to obs[start_idx + i].
99/// @param key The name of the node representing the vector valued observable.
100/// @param idx The start index (or relative position of the observable in the set of all observables).
101void CodegenContext::addVecObs(const char *key, int idx)
102{
103 const TNamed *namePtr = RooNameReg::known(key);
104 if (namePtr)
105 _vecObsIndices[namePtr] = idx;
106}
107
109{
110 auto it = _vecObsIndices.find(arg.namePtr());
111 if (it != _vecObsIndices.end()) {
112 return it->second;
113 }
114
115 return -1; // Not found
116}
117/// @brief Adds the input string to the squashed code body. If a class implements a translate function that wants to
118/// emit something to the squashed code body, it must call this function with the code it wants to emit. In case of
119/// loops, automatically determines if code needs to be stored inside or outside loop scope.
120/// @param klass The class requesting this addition, usually 'this'.
121/// @param in String to add to the squashed code.
122void CodegenContext::addToCodeBody(RooAbsArg const *klass, std::string const &in)
123{
124 // If we are in a loop and the value is scope independent, save it at the top of the loop.
125 // else, just save it in the current scope.
127}
128
129/// @brief A variation of the previous addToCodeBody that takes in a bool value that determines
130/// if input is independent. This overload exists because there might be other ways to determine if
131/// a value/collection of values is scope independent.
132/// @param in String to add to the squashed code.
133/// @param isScopeIndep The value determining if the input is scope dependent.
134void CodegenContext::addToCodeBody(std::string const &in, bool isScopeIndep /* = false */)
135{
137 indented = indented.Strip(TString::kBoth); // trim
138
139 std::string indent_str = "";
140 for (unsigned i = 0; i < _indent; ++i)
141 indent_str += " ";
142 indented = indented.Prepend(indent_str);
143
144 // FIXME: Multiline input.
145 // indent_str += "\n";
146 // indented = indented.ReplaceAll("\n", indent_str);
147
148 // If we are in a loop and the value is scope independent, save it at the top of the loop.
149 // else, just save it in the current scope.
150 if (_code.size() > 2 && isScopeIndep) {
151 _code[_code.size() - 2] += indented;
152 } else {
153 _code.back() += indented;
154 }
155}
156
157/// @brief Create a RAII scope for iterating over vector observables. You can't use the result of vector observables
158/// outside these loop scopes.
159/// @param in A pointer to the calling class, used to determine the loop dependent variables.
160std::unique_ptr<CodegenContext::LoopScope> CodegenContext::beginLoop(RooAbsArg const *in)
161{
162 pushScope();
163 unsigned loopLevel = _code.size() - 2; // subtract global + function scope.
164 std::string idx = "loopIdx" + std::to_string(loopLevel);
165
166 std::vector<TNamed const *> vars;
167 // set the results of the vector observables
168 for (auto const &it : _vecObsIndices) {
169 if (!in->dependsOn(it.first))
170 continue;
171
172 vars.push_back(it.first);
173 _nodeNames[it.first] = "obs[" + std::to_string(it.second) + " + " + idx + "]";
174 }
175
176 // TODO: we are using the size of the first loop variable to the the number
177 // of iterations, but it should be made sure that all loop vars are either
178 // scalar or have the same size.
179 std::size_t numEntries = 1;
180 for (auto &it : vars) {
181 std::size_t n = outputSize(it);
182 if (n > 1 && numEntries > 1 && n != numEntries) {
183 throw std::runtime_error("Trying to loop over variables with different sizes!");
184 }
185 numEntries = std::max(n, numEntries);
186 }
187
188 // Make sure that the name of this variable doesn't clash with other stuff
189 addToCodeBody(in, "#pragma clad checkpoint loop\n");
190 addToCodeBody(in, "for(int " + idx + " = 0; " + idx + " < " + std::to_string(numEntries) + "; " + idx + "++) {\n");
191
192 return std::make_unique<LoopScope>(*this, std::move(vars));
193}
194
196{
197 addToCodeBody("}\n");
198
199 // clear the results of the loop variables if they were vector observables
200 for (auto const &ptr : scope.vars()) {
201 if (_vecObsIndices.find(ptr) != _vecObsIndices.end())
202 _nodeNames.erase(ptr);
203 }
204 popScope();
205}
206
207/// @brief Get a unique variable name to be used in the generated code.
209{
210 return "t" + std::to_string(_tmpVarIdx++);
211}
212
213/// @brief A function to save an expression that includes/depends on the result of the input node.
214/// @param in The node on which the valueToSave depends on/belongs to.
215/// @param valueToSave The actual string value to save as a temporary.
216void CodegenContext::addResult(RooAbsArg const *in, std::string const &valueToSave)
217{
218 // std::string savedName = RooFit::Detail::makeValidVarName(in->GetName());
219 std::string savedName = getTmpVarName();
220
221 // Only save values if they contain operations or they are numerals. Otherwise, we can use them directly.
222
223 // Check if string is numeric.
224 char *end;
225 std::strtod(valueToSave.c_str(), &end);
226 bool isNumeric = (*end == '\0');
227
228 const bool hasOperations = valueToSave.find_first_of(":-+/*") != std::string::npos;
229
230 // If the name is not empty and this value is worth saving, save it to the correct scope.
231 // otherwise, just return the actual value itself
232 if (hasOperations || isNumeric) {
233 std::string outVarDecl = "const double " + savedName + " = " + valueToSave + ";\n";
235 } else {
237 }
238
239 addResult(in->namePtr(), savedName);
240}
241
242/// @brief Function to save a RooListProxy as an array in the squashed code.
243/// @param in The list to convert to array.
244/// @return Name of the array that stores the input list in the squashed code.
245std::string CodegenContext::buildArg(RooAbsCollection const &in, std::string const &arrayType)
246{
247 if (in.empty()) {
248 return "nullptr";
249 }
250
251 auto it = _listNames.find(in.uniqueId().value());
252 if (it != _listNames.end())
253 return it->second;
254
255 std::string savedName = getTmpVarName();
256 bool canSaveOutside = true;
257
258 std::stringstream declStrm;
259 declStrm << arrayType << " " << savedName << "[]{";
260 for (const auto arg : in) {
261 declStrm << getResult(*arg) << ",";
263 }
264 declStrm.seekp(-1, declStrm.cur);
265 declStrm << "};\n";
266
268
269 _listNames.insert({in.uniqueId().value(), savedName});
270 return savedName;
271}
272
273std::string CodegenContext::buildArg(std::span<const double> arr)
274{
275 unsigned int n = arr.size();
276 std::string offset = std::to_string(_xlArr.size());
277 _xlArr.reserve(_xlArr.size() + n);
278 for (unsigned int i = 0; i < n; i++) {
279 _xlArr.push_back(arr[i]);
280 }
281 return "xlArr + " + offset;
282}
283
284CodegenContext::ScopeRAII::ScopeRAII(RooAbsArg const *arg, CodegenContext &ctx) : _ctx(ctx), _arg(arg)
285{
286 std::ostringstream os;
287 Option_t *opts = nullptr;
289 _fn = os.str();
290 const std::string info = "// Begin -- " + _fn;
291 _ctx._indent++;
293}
294
296{
297 const std::string info = "// End -- " + _fn + "\n";
298 _ctx.addToCodeBody(_arg, info);
299 _ctx._indent--;
300}
301
303{
304 _code.push_back("");
305}
306
308{
309 std::string active_scope = _code.back();
310 _code.pop_back();
311 _code.back() += active_scope;
312}
313
315{
316 return !in->isReducerNode() && outputSize(in->namePtr()) == 1;
317}
318
319/// @brief Register a function that is only know to the interpreter to the context.
320/// This is useful to dump the standalone C++ code for the computation graph.
321void CodegenContext::collectFunction(std::string const &name)
322{
323 _collectedFunctions.emplace_back(name);
324}
325
326/// @brief Assemble and return the final code with the return expression and global statements.
327/// @param returnExpr The string representation of what the squashed function should return, usually the head node.
328/// @return The name of the declared function.
329std::string
330CodegenContext::buildFunction(RooAbsArg const &arg, std::map<RooFit::Detail::DataKey, std::size_t> const &outputSizes)
331{
332 CodegenContext ctx;
333 ctx.pushScope(); // push our global scope.
336 // We only want to take over parameters and observables
337 for (auto const &item : _nodeNames) {
338 if (startsWith(item.second, "params[") || startsWith(item.second, "obs[")) {
339 ctx._nodeNames.insert(item);
340 }
341 }
342 ctx._xlArr = _xlArr;
345
346 static int iCodegen = 0;
347 auto funcName = "roo_codegen_" + std::to_string(iCodegen++);
348
349 ctx.pushScope();
350 std::string funcBody = ctx.getResult(arg);
351 ctx.popScope();
352 funcBody = ctx._code[0] + "\n return " + funcBody + ";\n";
353
354 // Declare the function
355 std::stringstream bodyWithSigStrm;
356 bodyWithSigStrm << "double " << funcName << "(double* params, double const* obs, double const* xlArr) {\n"
357 << "constexpr double inf = std::numeric_limits<double>::infinity();\n"
358 << funcBody << "\n}\n\n";
359 ctx._collectedFunctions.emplace_back(funcName);
360 ctx._collectedCode += bodyWithSigStrm.str();
361
362 _xlArr = ctx._xlArr;
365
366 return funcName;
367}
368
369void declareDispatcherCode(std::string const &funcName)
370{
371 std::string dispatcherCode = R"(
372namespace RooFit {
373namespace Experimental {
374
375template <class Arg_t, int P>
376auto FUNC_NAME(Arg_t &arg, CodegenContext &ctx, Prio<P> p)
377{
378 if constexpr (std::is_same<Prio<P>, PrioLowest>::value) {
379 return FUNC_NAME(arg, ctx);
380 } else {
381 return FUNC_NAME(arg, ctx, p.next());
382 }
383}
384
385template <class Arg_t>
386struct Caller_FUNC_NAME {
387
388 static auto call(RooAbsArg &arg, CodegenContext &ctx)
389 {
390 return FUNC_NAME(static_cast<Arg_t &>(arg), ctx, PrioHighest{});
391 }
392};
393
394} // namespace Experimental
395} // namespace RooFit
396 )";
397
399 gInterpreter->Declare(dispatcherCode.c_str());
400}
401
403{
404 static bool codeDeclared = false;
405 if (!codeDeclared) {
406 declareDispatcherCode("codegenImpl");
407 codeDeclared = true;
408 }
409
410 using Func = void (*)(RooAbsArg &, CodegenContext &);
411
412 Func func;
413
414 TClass *tclass = arg.IsA();
415
416 // Cache the overload resolutions
417 static std::unordered_map<TClass *, Func> dispatchMap;
418
419 auto found = dispatchMap.find(tclass);
420
421 if (found != dispatchMap.end()) {
422 func = found->second;
423 } else {
424 // Can probably be done with CppInterop in the future to avoid string manipulation.
425 std::stringstream cmd;
426 cmd << "&RooFit::Experimental::Caller_codegenImpl<" << tclass->GetName() << ">::call;";
427 func = reinterpret_cast<Func>(gInterpreter->ProcessLine(cmd.str().c_str()));
428 dispatchMap[tclass] = func;
429 }
430
431 return func(arg, ctx);
432}
433
434} // namespace Experimental
435} // namespace RooFit
bool startsWith(std::string_view str, std::string_view prefix)
const char Option_t
Option string (const char)
Definition RtypesCore.h:80
ROOT::Detail::TRangeCast< T, true > TRangeDynCast
TRangeDynCast is an adapter class that allows the typed iteration through a TCollection.
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t Int_t Int_t Window_t TString Int_t GCValues_t GetPrimarySelectionOwner GetDisplay GetScreen GetColormap GetNativeEvent const char const char dpyName wid window const char font_name cursor keysym reg const char only_if_exist regb h Point_t winding char text const char depth char const char Int_t count const char ColorStruct_t color const char Pixmap_t Pixmap_t PictureAttributes_t attr const char char ret_data h unsigned char height h offset
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void value
char name[80]
Definition TGX11.cxx:110
#define gInterpreter
const_iterator end() const
Common abstract base class for objects that represent a value and a "shape" in RooFit.
Definition RooAbsArg.h:76
TClass * IsA() const override
Definition RooAbsArg.h:678
const TNamed * namePtr() const
De-duplicated pointer to this object's name.
Definition RooAbsArg.h:502
Int_t defaultPrintContents(Option_t *opt) const override
Define default contents to print.
Abstract container object that can hold multiple RooAbsArg objects.
A class to manage loop scopes using the RAII technique.
A class to maintain the context for squashing of RooFit models into code.
std::unordered_map< RooFit::UniqueId< RooAbsCollection >::Value_t, std::string > _listNames
A map to keep track of list names as assigned by addResult.
void addToGlobalScope(std::string const &str)
Adds the given string to the string block that will be emitted at the top of the squashed function.
std::string const & getResult(RooAbsArg const &arg)
Gets the result for the given node using the node name.
std::string getTmpVarName() const
Get a unique variable name to be used in the generated code.
void addResult(RooAbsArg const *key, std::string const &value)
A function to save an expression that includes/depends on the result of the input node.
void addToCodeBody(RooAbsArg const *klass, std::string const &in)
Adds the input string to the squashed code body.
std::unique_ptr< LoopScope > beginLoop(RooAbsArg const *in)
Create a RAII scope for iterating over vector observables.
void collectFunction(std::string const &name)
Register a function that is only known to the interpreter to the context.
void addVecObs(const char *key, int idx)
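Since the squashed code represents all observables as a single flattened array, it is important to keep track of the start index for a vector valued observable which can later be expanded to access the correct element.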
std::unordered_map< const TNamed *, int > _vecObsIndices
A map to keep track of the observable indices if they are non scalar.
int observableIndexOf(const RooAbsArg &arg) const
std::map< RooFit::Detail::DataKey, std::size_t > _nodeOutputSizes
Map of node output sizes.
std::string buildFunction(RooAbsArg const &arg, std::map< RooFit::Detail::DataKey, std::size_t > const &outputSizes={})
Assemble and return the final code with the return expression and global statements.
std::string buildArg(RooAbsCollection const &x, std::string const &arrayType="double")
Function to save a RooListProxy as an array in the squashed code.
void endLoop(LoopScope const &scope)
std::vector< std::string > _collectedFunctions
bool isScopeIndependent(RooAbsArg const *in) const
std::vector< std::string > _code
The code layered by lexical scopes used as a stack.
unsigned _indent
The indentation level for pretty-printing.
std::unordered_map< const TNamed *, std::string > _nodeNames
Map of node names to their result strings.
std::size_t outputSize(RooFit::Detail::DataKey key) const
Figure out the output size of a node.
ScopeRAII OutputScopeRangeComment(RooAbsArg const *arg)
int _tmpVarIdx
Index to get unique names for temporary variables.
static const TNamed * known(const char *stringPtr)
If the name is already known, return its TNamed pointer. Otherwise return 0 (don't register the name)...
virtual StyleOption defaultPrintStyle(Option_t *opt) const
virtual void printStream(std::ostream &os, Int_t contents, StyleOption style, TString indent="") const
Print description of object on ostream, printing contents set by contents integer,...
TClass instances represent classes, structs and namespaces in the ROOT type system.
Definition TClass.h:84
The TNamed class is the base class for all named ROOT classes.
Definition TNamed.h:29
const char * GetName() const override
Returns name of object.
Definition TNamed.h:49
Basic string class.
Definition TString.h:138
@ kBoth
Definition TString.h:284
const Int_t n
Definition legend1.C:16
void replaceAll(std::string &inOut, std::string_view what, std::string_view with)
void declareDispatcherCode(std::string const &funcName)
void codegen(RooAbsArg &arg, CodegenContext &ctx)
The namespace RooFit contains mostly switches that change the behaviour of functions of PDFs (or othe...
Definition CodegenImpl.h:67
ScopeRAII(RooAbsArg const *arg, CodegenContext &ctx)