34 return (leaves.find(leaf) != leaves.end());
41 const std::string &friendName)
44 if (!friendName.empty()) {
46 const auto friendBName = friendName +
"." + branchName;
47 if (bNamesReg.insert(friendBName).second)
48 bNames.push_back(friendBName);
51 if (bNamesReg.insert(branchName).second)
52 bNames.push_back(branchName);
58 const std::string &friendName, std::set<TLeaf *> &foundLeaves,
TLeaf *leaf,
bool allowDuplicates)
60 const bool canAdd = allowDuplicates ? true : !
ContainsLeaf(foundLeaves, leaf);
65 UpdateList(bNamesReg, bNames, branchName, friendName);
67 foundLeaves.insert(leaf);
71 std::string &friendName)
73 for (
auto sb : *
b->GetListOfBranches()) {
75 auto subBranchName = std::string(subBranch->
GetName());
76 auto fullName = prefix + subBranchName;
78 std::string newPrefix;
80 newPrefix = fullName +
".";
82 ExploreBranch(t, bNamesReg, bNames, subBranch, newPrefix, friendName);
85 UpdateList(bNamesReg, bNames, fullName, friendName);
88 UpdateList(bNamesReg, bNames, subBranchName, friendName);
93 std::set<TTree *> &analysedTrees, std::string &friendName,
bool allowDuplicates)
95 std::set<TLeaf *> foundLeaves;
96 if (!analysedTrees.insert(&t).second) {
105 std::string err(
"GetBranchNames: error in opening the tree ");
107 throw std::runtime_error(err);
110 for (
auto b : *branches) {
112 const auto branchName = std::string(branch->
GetName());
116 if (listOfLeaves->GetEntries() == 1) {
117 auto leaf =
static_cast<TLeaf *
>(listOfLeaves->At(0));
118 const auto leafName = std::string(leaf->GetName());
119 if (leafName == branchName) {
120 UpdateList(bNamesReg, bNames, branchName, friendName, foundLeaves, leaf, allowDuplicates);
124 for (
auto leaf : *listOfLeaves) {
125 auto castLeaf =
static_cast<TLeaf *
>(leaf);
126 const auto leafName = std::string(leaf->GetName());
127 const auto fullName = branchName +
"." + leafName;
128 UpdateList(bNamesReg, bNames, fullName, friendName, foundLeaves, castLeaf, allowDuplicates);
132 ExploreBranch(t, bNamesReg, bNames, branch, branchName +
".", friendName);
133 UpdateList(bNamesReg, bNames, branchName, friendName);
138 bool dotIsImplied =
false;
141 throw std::runtime_error(
"GetBranchNames: unsupported branch type");
143 if (be->GetType() == 3 || be->GetType() == 4)
146 if (dotIsImplied || branchName.back() ==
'.')
149 ExploreBranch(t, bNamesReg, bNames, branch, branchName +
".", friendName);
151 UpdateList(bNamesReg, bNames, branchName, friendName);
161 for (
auto friendTreeObj : *friendTrees) {
166 if (alias !=
nullptr)
167 frName = std::string(alias);
169 frName = std::string(friendTree->GetName());
171 GetBranchNamesImpl(*friendTree, bNamesReg, bNames, analysedTrees, frName, allowDuplicates);
179 std::set<std::string> bNamesSet;
181 std::set<TTree *> analysedTrees;
182 std::string emptyFrName =
"";
183 GetBranchNamesImpl(t, bNamesSet, bNames, analysedTrees, emptyFrName, allowDuplicates);
189 : fTree(std::shared_ptr<
TTree>(
tree, [](
TTree *) {})), fDefaultColumns(defaultBranches),
204 fDataSource(std::move(ds))
212 auto friends =
fTree->GetListOfFriends();
215 for (
auto friendElObj : *friends) {
217 auto friendTree = friendEl->
GetTree();
218 if (friendTree && friendTree->GetTreeIndex()) {
219 std::string err =
fTree->GetName();
220 err +=
" has a friend, \"";
221 err += friendTree->GetName();
222 err +=
"\", which has an index. This is not supported.";
223 throw std::runtime_error(err);
237 std::vector<std::pair<ULong64_t, ULong64_t>> entryRanges;
245 entryRanges.emplace_back(start, end);
250 auto genFunction = [
this, &slotStack](
const std::pair<ULong64_t, ULong64_t> &range) {
251 auto slot = slotStack.
GetSlot();
253 for (
auto currEntry = range.first; currEntry < range.second; ++currEntry) {
261 pool.
Foreach(genFunction, entryRanges);
283 auto tp = std::make_unique<ROOT::TTreeProcessorMT>(*
fTree, entryList);
285 std::atomic<ULong64_t> entryCount(0ull);
287 tp->Process([
this, &slotStack, &entryCount](
TTreeReader &
r) ->
void {
288 auto slot = slotStack.
GetSlot();
290 const auto entryRange =
r.GetEntriesRange();
291 const auto nEntries = entryRange.second - entryRange.first;
292 auto count = entryCount.fetch_add(nEntries);
308 if (0 ==
fTree->GetEntriesFast())
326 while (!ranges.empty()) {
329 for (
const auto &range : ranges) {
330 auto end = range.second;
331 for (
auto entry = range.first; entry < end; ++entry) {
353 auto runOnRange = [
this, &slotStack](
const std::pair<ULong64_t, ULong64_t> &range) {
354 const auto slot = slotStack.
GetSlot();
357 const auto end = range.second;
358 for (
auto entry = range.first; entry < end; ++entry) {
370 while (!ranges.empty()) {
371 pool.
Foreach(runOnRange, ranges);
383 actionPtr->Run(slot, entry);
385 namedFilterPtr->CheckFilters(slot, entry);
398 ptr->InitSlot(
r, slot);
400 ptr->InitSlot(
r, slot);
438 ptr->ResetChildrenCount();
440 ptr->ResetChildrenCount();
450 ptr->FinalizeSlot(slot);
452 ptr->ClearTask(slot);
487 actionPtr->TriggerChildrenCount();
489 namedFilterPtr->TriggerChildrenCount();
494 static unsigned int id = 0;
576 fPtr->FillReport(rep);
581 if (everyNEvents == 0ull)
589 std::vector<std::string>
filters;
591 auto name = (filter->HasName() ? filter->GetName() :
"Unnamed Filter");
599 std::vector<RDFInternal::RActionBase *> actions;
616 auto thisNode = std::make_shared<ROOT::Internal::RDF::GraphDrawing::GraphNode>(
name);
618 thisNode->SetCounter(0);
void GetBranchNamesImpl(TTree &t, std::set< std::string > &bNamesReg, ColumnNames_t &bNames, std::set< TTree * > &analysedTrees, std::string &friendName, bool allowDuplicates)
void UpdateList(std::set< std::string > &bNamesReg, ColumnNames_t &bNames, const std::string &branchName, const std::string &friendName)
This overload does not perform any check on the duplicates.
void ExploreBranch(TTree &t, std::set< std::string > &bNamesReg, ColumnNames_t &bNames, TBranch *b, std::string prefix, std::string &friendName)
bool ContainsLeaf(const std::set< TLeaf * > &leaves, TLeaf *leaf)
unsigned long long ULong64_t
RLoopManager(TTree *tree, const ColumnNames_t &defaultBranches)
bool CheckFilters(unsigned int, Long64_t) final
void EvalChildrenCounts()
Trigger counting of number of children nodes for each node of the functional graph.
void CleanUpNodes()
Perform clean-up operations. To be called at the end of each event loop.
void RunEmptySource()
Run event loop with no source files, in sequence.
void Report(ROOT::RDF::RCutFlowReport &rep) const final
Call FillReport on all booked filters.
std::vector< RFilterBase * > fBookedNamedFilters
Contains a subset of fBookedFilters, i.e. only the named filters.
void RunEmptySourceMT()
Run event loop with no source files, in parallel.
const ColumnNames_t & GetBranchNames()
Return all valid TTree::Branch names (caching results for subsequent calls).
bool fMustRunNamedFilters
std::shared_ptr< TTree > fTree
Shared pointer to the input TTree.
const ULong64_t fNEmptyEntries
std::string fToJitExec
Code that should be just-in-time executed right before the event loop.
void RunTreeReader()
Run event loop over one or multiple ROOT files, in sequence.
std::vector< RDFInternal::RActionBase * > GetAllActions()
For all the actions, either booked or run.
void CleanUpTask(unsigned int slot)
Perform clean-up operations. To be called at the end of each task execution.
std::vector< RDFInternal::RActionBase * > fRunActions
Non-owning pointers to actions already run.
void Run()
Start the event loop with a different mechanism depending on IMT/no IMT, data source/no data source.
std::vector< RRangeBase * > fBookedRanges
std::vector< TCallback > fCallbacks
Registered callbacks.
void RunAndCheckFilters(unsigned int slot, Long64_t entry)
Execute actions and make sure named filters are called for each event.
std::vector< RFilterBase * > fBookedFilters
void CheckIndexedFriends()
std::vector< RDFInternal::RActionBase * > fBookedActions
Non-owning pointers to actions to be run.
void JitDeclarations()
Declare to the interpreter type aliases and other entities required by RDF jitted nodes.
std::shared_ptr< ROOT::Internal::RDF::GraphDrawing::GraphNode > GetGraph()
const ELoopType fLoopType
The kind of event loop that is going to be run (e.g. on ROOT files, on no files)
ColumnNames_t fValidBranchNames
Cache of the tree/chain branch names. Never access directy, always use GetBranchNames().
std::vector< RCustomColumnBase * > fCustomColumns
Non-owning container of all custom columns created so far.
const unsigned int fNSlots
const ColumnNames_t & GetDefaultColumnNames() const
Return the list of default columns – empty if none was provided when constructing the RDataFrame.
std::vector< TOneTimeCallback > fCallbacksOnce
Registered callbacks to invoke just once before running the loop.
void RunDataSourceMT()
Run event loop over data accessed through a DataSource, in parallel.
std::string fToJitDeclare
Code that should be just-in-time declared right before the event loop.
std::vector< std::string > GetFiltersNames()
For each booked filter, returns either the name or "Unnamed Filter".
const std::unique_ptr< RDataSource > fDataSource
Owning pointer to a data-source object. Null if no data-source.
static unsigned int GetNextID()
const ColumnNames_t fDefaultColumns
void Book(RDFInternal::RActionBase *actionPtr)
void InitNodeSlots(TTreeReader *r, unsigned int slot)
Build TTreeReaderValues for all nodes This method loops over all filters, actions and other booked ob...
void RegisterCallback(ULong64_t everyNEvents, std::function< void(unsigned int)> &&f)
void RunDataSource()
Run event loop over data accessed through a DataSource, in sequence.
void Jit()
Add RDF nodes that require just-in-time compilation to the computation graph.
void RunTreeProcessorMT()
Run event loop over one or multiple ROOT files, in parallel.
void Deregister(RDFInternal::RActionBase *actionPtr)
void InitNodes()
Initialize all nodes of the functional graph before running the event loop.
unsigned int fNStopsReceived
Number of times that a children node signaled to stop processing entries.
unsigned int fNChildren
Number of nodes of the functional graph hanging from this object.
This is an helper class to allow to pick a slot resorting to a map indexed by thread ids.
void ReturnSlot(unsigned int slotNumber)
This class provides a simple interface to execute the same task multiple times in parallel,...
void Foreach(F func, unsigned nTimes, unsigned nChunks=0)
Execute func (with no arguments) nTimes in parallel.
A Branch for the case of an object.
A TTree is a list of TBranches.
TObjArray * GetListOfLeaves()
A List of entry numbers in a TTree or TChain.
A TFriendElement TF describes a TTree object TF in a file.
virtual TTree * GetTree()
Return pointer to friend TTree.
A TLeaf describes individual elements of a TBranch See TBranch structure in TTree.
virtual const char * GetName() const
Returns name of object.
A simple, robust and fast interface to read values from ROOT columnar datasets such as TTree,...
A TTree represents a columnar dataset.
virtual TBranch * FindBranch(const char *name)
Return the branch that correspond to the path 'branchname', which can include the name of the tree or...
virtual TBranch * GetBranch(const char *name)
Return pointer to the branch with the given name in this tree or its friends.
virtual TObjArray * GetListOfBranches()
virtual TTree * GetTree() const
virtual TList * GetListOfFriends() const
virtual const char * GetFriendAlias(TTree *) const
If the 'tree' is a friend, this method returns its alias name.
ColumnNames_t GetBranchNames(TTree &t, bool allowDuplicates=true)
Get all the branches names, including the ones of the friend trees.
Long64_t InterpreterCalc(const std::string &code, const std::string &context)
void InterpreterDeclare(const std::string &code)
void function(const Char_t *name_, T fun, const Char_t *docstring=0)
Bool_t IsImplicitMTEnabled()
Returns true if the implicit multi-threading in ROOT is enabled.
ROOT::Detail::RDF::ColumnNames_t ColumnNames_t