25if "imt" in ROOT.gROOT.GetConfigFeatures():
28 ROOT.gSystem.Setenv(
"OMP_NUM_THREADS",
"1")
31 print(
"Running in serial mode since ROOT does not support MT")
48def MakeTimeData(n, ntime, ndim):
52 fname =
"time_data_t" + str(ntime) +
"_d" + str(ndim) +
".root"
56 for i
in range(ntime):
57 v1.append(ROOT.TH1D(
"h1_" + str(i),
"h1", ndim, 0, 10))
58 v2.append(ROOT.TH1D(
"h2_" + str(i),
"h2", ndim, 0, 10))
60 f1 = ROOT.TF1(
"f1",
"gaus")
61 f2 = ROOT.TF1(
"f2",
"gaus")
63 sgn = ROOT.TTree(
"sgn",
"sgn")
64 bkg = ROOT.TTree(
"bkg",
"bkg")
65 f =
TFile(fname,
"RECREATE")
70 for i
in range(ntime):
71 x1.append(ROOT.std.vector[
"float"](ndim))
72 x2.append(ROOT.std.vector[
"float"](ndim))
74 for i
in range(ntime):
75 bkg.Branch(
"vars_time" + str(i),
"std::vector<float>", x1[i])
76 sgn.Branch(
"vars_time" + str(i),
"std::vector<float>", x2[i])
80 ROOT.gRandom.SetSeed(0)
82 mean1 = ROOT.std.vector[
"double"](ntime)
83 mean2 = ROOT.std.vector[
"double"](ntime)
84 sigma1 = ROOT.std.vector[
"double"](ntime)
85 sigma2 = ROOT.std.vector[
"double"](ntime)
87 for j
in range(ntime):
88 mean1[j] = 5.0 + 0.2 * ROOT.TMath.Sin(ROOT.TMath.Pi() * j / float(ntime))
89 mean2[j] = 5.0 + 0.2 * ROOT.TMath.Cos(ROOT.TMath.Pi() * j / float(ntime))
90 sigma1[j] = 4 + 0.3 * ROOT.TMath.Sin(ROOT.TMath.Pi() * j / float(ntime))
91 sigma2[j] = 4 + 0.3 * ROOT.TMath.Cos(ROOT.TMath.Pi() * j / float(ntime))
95 print(
"Generating event ... %d", i)
97 for j
in range(ntime):
103 f1.SetParameters(1, mean1[j], sigma1[j])
104 f2.SetParameters(1, mean2[j], sigma2[j])
106 h1.FillRandom(f1, 1000)
107 h2.FillRandom(f2, 1000)
109 for k
in range(ntime):
111 x1[j][k] = h1.GetBinContent(k + 1) + ROOT.gRandom.Gaus(0, 10)
112 x2[j][k] = h2.GetBinContent(k + 1) + ROOT.gRandom.Gaus(0, 10)
120 for j
in range(ntime):
123 for j
in range(ntime):
159if ROOT.gSystem.GetFromPipe(
"root-config --has-tmva-pymva") ==
"yes":
166 ROOT.Warning(
"TMVA_RNN_Classification",
"Skip using Keras since tensorflow cannot be imported")
170rnn_types = [
"RNN",
"LSTM",
"GRU"]
171use_rnn_type = [1, 1, 1]
174 use_rnn_type = [0, 0, 0]
175 use_rnn_type[use_type] = 1
179useGPU =
"tmva-gpu" in ROOT.gROOT.GetConfigFeatures()
180useTMVA_RNN = (
"tmva-cpu" in ROOT.gROOT.GetConfigFeatures())
or useGPU
184 "TMVA_RNN_Classification",
185 "TMVA is not build with GPU or CPU multi-thread support. Cannot use TMVA Deep Learning for RNN",
188archString =
"GPU" if useGPU
else "CPU"
190writeOutputFile =
True
194if "tmva-pymva" in ROOT.gROOT.GetConfigFeatures():
201inputFileName =
"time_data_t10_d30.root"
203fileDoesNotExist = ROOT.gSystem.AccessPathName(inputFileName)
207 MakeTimeData(nTotEvts, ntime, ninput)
212 raise ROOT.Error(
"Error opening input file %s - exit", inputFileName.Data())
215print(
"--- RNNClassification : Using input file: {}".format(inputFile.GetName()))
218outfileName =
"data_RNN_" + archString +
".root"
223 outputFile =
TFile.Open(outfileName,
"RECREATE")
247 "TMVAClassification",
252 DrawProgressBar=
True,
253 Transformations=
None,
255 AnalysisType=
"Classification",
256 ModelPersistence=
True,
260signalTree = inputFile.Get(
"sgn")
261background = inputFile.Get(
"bkg")
266for i
in range(ntime):
267 dataloader.AddVariablesArray(
"vars_time" + str(i), ninput)
270dataloader.AddSignalTree(signalTree, 1.0)
271dataloader.AddBackgroundTree(background, 1.0)
274datainfo = dataloader.GetDataSetInfo()
275vars = datainfo.GetListOfVariables()
276print(
"number of variables is {}".format(vars.size()))
282nTrainSig = 0.8 * nTotEvts
283nTrainBkg = 0.8 * nTotEvts
290dataloader.PrepareTrainingAndTestTree(
293 nTrain_Signal=nTrainSig,
294 nTrain_Background=nTrainBkg,
297 NormMode=
"NumEvents",
299 CalcCorrelations=
False,
302print(
"prepared DATA LOADER ")
312 if not use_rnn_type[i]:
315 rnn_type = rnn_types[i]
319 rnnLayout = str(rnn_type) +
"|10|" + str(ninput) +
"|" + str(ntime) +
"|0|1,RESHAPE|FLAT,DENSE|64|TANH,LINEAR"
322 trainingString1 =
"LearningRate=1e-3,Momentum=0.0,Repetitions=1,ConvergenceSteps=5,BatchSize=" + str(batchSize)
323 trainingString1 +=
",TestRepetitions=1,WeightDecay=1e-2,Regularization=None,MaxEpochs=" + str(maxepochs)
324 trainingString1 +=
"Optimizer=ADAM,DropConfig=0.0+0.+0.+0."
332 rnnName =
"TMVA_" + str(rnn_type)
339 ErrorStrategy=
"CROSSENTROPY",
341 WeightInitialization=
"XAVIERUNIFORM",
344 InputLayout=str(ntime) +
"|" + str(ninput),
346 TrainingStrategy=trainingString1,
347 Architecture=archString
355 trainingString1 = ROOT.TString(
356 "LearningRate=1e-3,Momentum=0.0,Repetitions=1,"
357 "ConvergenceSteps=10,BatchSize=256,TestRepetitions=1,"
358 "WeightDecay=1e-4,Regularization=None,MaxEpochs=20"
359 "DropConfig=0.0+0.+0.+0.,Optimizer=ADAM:"
362 trainingString1.Append(archString)
370 ErrorStrategy=
"CROSSENTROPY",
372 WeightInitialization=
"XAVIER",
374 InputLayout=
"1|1|" + str(ntime * ninput),
375 Layout=
"DENSE|64|TANH,DENSE|TANH|64,DENSE|TANH|64,LINEAR",
376 TrainingStrategy=trainingString1
388 modelName =
"model_" + rnn_types[i] +
".keras"
389 trainedModelName =
"trained_" + modelName
390 print(
"Building recurrent keras model using a", rnn_types[i],
"layer")
395 from tensorflow.keras.layers
import (
403 from tensorflow.keras.models
import Sequential
404 from tensorflow.keras.optimizers
import Adam
407 model.add(Reshape((10, 30), input_shape=(10 * 30,)))
409 if rnn_types[i] ==
"LSTM":
410 model.add(LSTM(units=10, return_sequences=
True))
411 elif rnn_types[i] ==
"GRU":
412 model.add(GRU(units=10, return_sequences=
True))
414 model.add(SimpleRNN(units=10, return_sequences=
True))
417 model.add(Dense(64, activation=
"tanh"))
418 model.add(Dense(2, activation=
"sigmoid"))
419 model.compile(loss=
"binary_crossentropy", optimizer=Adam(learning_rate=0.001), weighted_metrics=[
"accuracy"])
420 model.save(modelName)
422 print(
"saved recurrent model", modelName)
424 if not os.path.exists(modelName):
426 print(
"Error creating Keras recurrent model file - Skip using Keras")
429 print(
"Booking Keras model ", rnn_types[i])
433 "PyKeras_" + rnn_types[i],
437 FilenameModel=modelName,
438 FilenameTrainedModel=
"trained_" + modelName,
445if not useKeras
or not useTMVA_BDT:
464 BaggedSampleFraction=0.5,
471factory.TrainAllMethods()
476factory.TestAllMethods()
479factory.EvaluateAllMethods()
484c1 = factory.GetROCCurve(dataloader)
A file, usually with extension .root, that stores data and code in the form of serialized objects in ...
static TFile * Open(const char *name, Option_t *option="", const char *ftitle="", Int_t compress=ROOT::RCompressionSetting::EDefaults::kUseCompiledDefault, Int_t netopt=0)
Create / open a file.
static Config & Instance()
static function: returns TMVA instance
This is the main MVA steering class.
static void PyInitialize()
Initialize Python interpreter.
void EnableImplicitMT(UInt_t numthreads=0)
Enable ROOT's implicit multi-threading for all objects and methods that provide an internal paralleli...
UInt_t GetThreadPoolSize()
Returns the size of ROOT's thread pool.