23from datetime
import datetime
28from dask_lxplus
import CernCluster
Creates a connection to the HTCondor cluster offered by the CERN batch service.
Returns a Dask client that RDataFrame will use to distribute computations.
49 container_runtime=
'none',
55 'MY.JobFlavour':
'"espresso"',
71 client = Client(cluster)
78 print(f
"Waiting for {n_workers} workers to start.")
82 print(f
"All workers are ready, took {round(end - start, 2)} seconds.")
Run a simple example with RDataFrame, using the previously created
connection to the HTCondor cluster.
93 "x",
"gRandom->Rndm() * 100")
100 print(f
"Dataset has {nentries.GetValue()} entries")
101 print(
"Column x stats:")
102 print(f
"\tmean: {meanv.GetValue()}")
103 print(f
"\tmax: {maxv.GetValue()}")
104 print(f
"\tmin: {minv.GetValue()}")
107if __name__ ==
"__main__":
109 print(f
"Starting the computations at {datetime.now()}")
113 print(f
"Computations ended at {datetime.now()}, "
114 f
"took {round(end - start, 2)} seconds.")
ROOT::Detail::TRangeCast< T, true > TRangeDynCast
TRangeDynCast is an adapter class that allows the typed iteration through a TCollection.
ROOT's RDataFrame offers a modern, high-level interface for analysis of data stored in TTree, CSV and other data formats, in C++ or Python.