#include <stdlib.h>
#include <fcntl.h>
#include <errno.h>
#ifdef WIN32
# include <io.h>
# include <sys/stat.h>
# include <sys/types.h>
# include "snprintf.h"
#else
# include <unistd.h>
#endif
#include <vector>
#include "RConfigure.h"
#include "Riostream.h"
#include "Getline.h"
#include "TBrowser.h"
#include "TChain.h"
#include "TCondor.h"
#include "TDSet.h"
#include "TError.h"
#include "TEnv.h"
#include "TEntryList.h"
#include "TEventList.h"
#include "TFile.h"
#include "TFileInfo.h"
#include "TFunction.h"
#include "TFTP.h"
#include "THashList.h"
#include "TInterpreter.h"
#include "TKey.h"
#include "TMap.h"
#include "TMath.h"
#include "TMessage.h"
#include "TMethodArg.h"
#include "TMethodCall.h"
#include "TMonitor.h"
#include "TMutex.h"
#include "TObjArray.h"
#include "TObjString.h"
#include "TParameter.h"
#include "TProof.h"
#include "TProofNodeInfo.h"
#include "TProofOutputFile.h"
#include "TVirtualProofPlayer.h"
#include "TVirtualPacketizer.h"
#include "TProofServ.h"
#include "TPluginManager.h"
#include "TQueryResult.h"
#include "TRandom.h"
#include "TRegexp.h"
#include "TROOT.h"
#include "TSemaphore.h"
#include "TSlave.h"
#include "TSocket.h"
#include "TSortedList.h"
#include "TSystem.h"
#include "TThread.h"
#include "TTree.h"
#include "TUrl.h"
#include "TFileCollection.h"
#include "TDataSetManager.h"
#include "TDataSetManagerFile.h"
#include "TMacro.h"
#include "TSelector.h"
#include "TPRegexp.h"
TProof *gProof = 0;
TVirtualMutex *gProofMutex = 0;
char TProofMergePrg::fgCr[4] = {'-', '\\', '|', '/'};
TList *TProof::fgProofEnvList = 0;
TPluginHandler *TProof::fgLogViewer = 0;
ClassImp(TProof)
Bool_t TProofInterruptHandler::Notify()
{
if (!fProof->IsTty() || fProof->GetRemoteProtocol() < 22) {
fProof->StopProcess(kTRUE);
} else {
const char *a = 0;
if (fProof->GetRemoteProtocol() < 22) {
a = Getline("\nSwitch to asynchronous mode not supported remotely:"
"\nEnter S/s to stop, Q/q to quit, any other key to continue: ");
} else {
a = Getline("\nEnter A/a to switch asynchronous, S/s to stop, Q/q to quit,"
" any other key to continue: ");
}
if (a[0] == 'Q' || a[0] == 'S' || a[0] == 'q' || a[0] == 's') {
Info("Notify","Processing interrupt signal ... %c", a[0]);
Bool_t abort = (a[0] == 'Q' || a[0] == 'q') ? kTRUE : kFALSE;
fProof->StopProcess(abort);
} else if ((a[0] == 'A' || a[0] == 'a') && fProof->GetRemoteProtocol() >= 22) {
fProof->GoAsynchronous();
}
}
return kTRUE;
}
TProofInputHandler::TProofInputHandler(TProof *p, TSocket *s)
: TFileHandler(s->GetDescriptor(),1),
fSocket(s), fProof(p)
{
}
Bool_t TProofInputHandler::Notify()
{
fProof->CollectInputFrom(fSocket);
return kTRUE;
}
ClassImp(TSlaveInfo)
Int_t TSlaveInfo::Compare(const TObject *obj) const
{
if (!obj) return 1;
const TSlaveInfo *si = dynamic_cast<const TSlaveInfo*>(obj);
if (!si) return fOrdinal.CompareTo(obj->GetName());
const char *myord = GetOrdinal();
const char *otherord = si->GetOrdinal();
while (myord && otherord) {
Int_t myval = atoi(myord);
Int_t otherval = atoi(otherord);
if (myval < otherval) return 1;
if (myval > otherval) return -1;
myord = strchr(myord, '.');
if (myord) myord++;
otherord = strchr(otherord, '.');
if (otherord) otherord++;
}
if (myord) return -1;
if (otherord) return 1;
return 0;
}
Bool_t TSlaveInfo::IsEqual(const TObject* obj) const
{
if (!obj) return kFALSE;
const TSlaveInfo *si = dynamic_cast<const TSlaveInfo*>(obj);
if (!si) return kFALSE;
return (strcmp(GetOrdinal(), si->GetOrdinal()) == 0);
}
void TSlaveInfo::Print(Option_t *opt) const
{
TString stat = fStatus == kActive ? "active" :
fStatus == kBad ? "bad" :
"not active";
Bool_t newfmt = kFALSE;
TString oo(opt);
if (oo.Contains("N")) {
newfmt = kTRUE;
oo.ReplaceAll("N","");
}
if (oo == "active" && fStatus != kActive) return;
if (oo == "notactive" && fStatus != kNotActive) return;
if (oo == "bad" && fStatus != kBad) return;
if (newfmt) {
TString msd, si, datadir;
if (!(fMsd.IsNull())) msd.Form("| msd: %s ", fMsd.Data());
if (!(fDataDir.IsNull())) datadir.Form("| datadir: %s ", fDataDir.Data());
if (fSysInfo.fCpus > 0) {
si.Form("| %s, %d cores, %d MB ram", fHostName.Data(),
fSysInfo.fCpus, fSysInfo.fPhysRam);
} else {
si.Form("| %s", fHostName.Data());
}
Printf("Worker: %9s %s %s%s| %s", fOrdinal.Data(), si.Data(), msd.Data(), datadir.Data(), stat.Data());
} else {
TString msd = fMsd.IsNull() ? "<null>" : fMsd.Data();
std::cout << "Slave: " << fOrdinal
<< " hostname: " << fHostName
<< " msd: " << msd
<< " perf index: " << fPerfIndex
<< " " << stat
<< std::endl;
}
}
void TSlaveInfo::SetSysInfo(SysInfo_t si)
{
fSysInfo.fOS = si.fOS;
fSysInfo.fModel = si.fModel;
fSysInfo.fCpuType = si.fCpuType;
fSysInfo.fCpus = si.fCpus;
fSysInfo.fCpuSpeed = si.fCpuSpeed;
fSysInfo.fBusSpeed = si.fBusSpeed;
fSysInfo.fL2Cache = si.fL2Cache;
fSysInfo.fPhysRam = si.fPhysRam;
}
ClassImp(TProof)
TSemaphore *TProof::fgSemaphore = 0;
TMergerInfo::~TMergerInfo()
{
if (fWorkers) {
fWorkers->SetOwner(kFALSE);
SafeDelete(fWorkers);
}
}
void TMergerInfo::SetMergedWorker()
{
if (AreAllWorkersMerged())
Error("SetMergedWorker", "all workers have been already merged before!");
else
fMergedWorkers++;
}
void TMergerInfo::AddWorker(TSlave *sl)
{
if (!fWorkers)
fWorkers = new TList();
if (fWorkersToMerge == fWorkers->GetSize()) {
Error("AddWorker", "all workers have been already assigned to this merger");
return;
}
fWorkers->Add(sl);
}
Bool_t TMergerInfo::AreAllWorkersMerged()
{
return (fWorkersToMerge == fMergedWorkers);
}
Bool_t TMergerInfo::AreAllWorkersAssigned()
{
if (!fWorkers)
return kFALSE;
return (fWorkers->GetSize() == fWorkersToMerge);
}
static Int_t PoDCheckUrl(TString *_cluster)
{
if ( !_cluster )
return 0;
*_cluster = _cluster->Strip( TString::kBoth );
const TString pod_prot("pod");
TUrl url( _cluster->Data() );
if( pod_prot.CompareTo(url.GetProtocol(), TString::kIgnoreCase) )
return 0;
*_cluster = gSystem->GetFromPipe("pod-info -c -b");
if( 0 == _cluster->Length() ) {
Error("PoDCheckUrl", "PoD server is not running");
return -1;
}
return 0;
}
TProof::TProof(const char *masterurl, const char *conffile, const char *confdir,
Int_t loglevel, const char *alias, TProofMgr *mgr)
: fUrl(masterurl)
{
InitMembers();
fManager = mgr;
fServType = TProofMgr::kXProofd;
fQueryMode = kSync;
ResetBit(TProof::kIsClient);
ResetBit(TProof::kIsMaster);
if (!masterurl || strlen(masterurl) <= 0) {
fUrl.SetProtocol("proof");
fUrl.SetHost("__master__");
} else if (!(strstr(masterurl, "://"))) {
fUrl.SetProtocol("proof");
}
if (fUrl.GetPort() == TUrl(" ").GetPort())
fUrl.SetPort(TUrl("proof:// ").GetPort());
if (!strcmp(fUrl.GetHost(), "__master__"))
fMaster = fUrl.GetHost();
else if (!strlen(fUrl.GetHost()))
fMaster = gSystem->GetHostByName(gSystem->HostName()).GetHostName();
else
fMaster = gSystem->GetHostByName(fUrl.GetHost()).GetHostName();
if (strlen(fUrl.GetOptions()) > 0) {
TString opts(fUrl.GetOptions());
if (!(strncmp(fUrl.GetOptions(),"std",3))) {
fServType = TProofMgr::kProofd;
opts.Remove(0,3);
fUrl.SetOptions(opts.Data());
} else if (!(strncmp(fUrl.GetOptions(),"lite",4))) {
fServType = TProofMgr::kProofLite;
opts.Remove(0,4);
fUrl.SetOptions(opts.Data());
}
}
fMasterServ = kFALSE;
SetBit(TProof::kIsClient);
ResetBit(TProof::kIsMaster);
if (fMaster == "__master__") {
fMasterServ = kTRUE;
ResetBit(TProof::kIsClient);
SetBit(TProof::kIsMaster);
} else if (fMaster == "prooflite") {
fMasterServ = kTRUE;
SetBit(TProof::kIsMaster);
}
if (TestBit(TProof::kIsClient))
if (!gSystem->Getenv("ROOTPROOFCLIENT")) gSystem->Setenv("ROOTPROOFCLIENT","");
Init(masterurl, conffile, confdir, loglevel, alias);
if (strlen(fUrl.GetUser()) <= 0) {
TString usr, emsg;
if (Exec("gProofServ->GetUser()", "0", kTRUE) == 0) {
TObjString *os = fMacroLog.GetLineWith("const char");
if (os) {
Ssiz_t fst = os->GetString().First('\"');
Ssiz_t lst = os->GetString().Last('\"');
usr = os->GetString()(fst+1, lst-fst-1);
} else {
emsg = "could not find 'const char *' string in macro log";
}
} else {
emsg = "could not retrieve user info";
}
if (!emsg.IsNull()) {
UserGroup_t *pw = gSystem->GetUserInfo();
if (pw) {
usr = pw->fUser;
delete pw;
}
Warning("TProof", "%s: using local default %s", emsg.Data(), usr.Data());
}
fUrl.SetUser(usr.Data());
}
if (mgr) {
R__LOCKGUARD2(gROOTMutex);
gROOT->GetListOfSockets()->Remove(mgr);
gROOT->GetListOfSockets()->Add(mgr);
}
if (IsProofd() || TestBit(TProof::kIsMaster))
if (!gROOT->GetListOfProofs()->FindObject(this))
gROOT->GetListOfProofs()->Add(this);
gProof = this;
}
TProof::TProof() : fUrl(""), fServType(TProofMgr::kXProofd)
{
InitMembers();
if (!gROOT->GetListOfProofs()->FindObject(this))
gROOT->GetListOfProofs()->Add(this);
gProof = this;
}
void TProof::InitMembers()
{
fValid = kFALSE;
fTty = kFALSE;
fRecvMessages = 0;
fSlaveInfo = 0;
fMasterServ = kFALSE;
fSendGroupView = kFALSE;
fIsPollingWorkers = kFALSE;
fLastPollWorkers_s = -1;
fActiveSlaves = 0;
fInactiveSlaves = 0;
fUniqueSlaves = 0;
fAllUniqueSlaves = 0;
fNonUniqueMasters = 0;
fActiveMonitor = 0;
fUniqueMonitor = 0;
fAllUniqueMonitor = 0;
fCurrentMonitor = 0;
fBytesRead = 0;
fRealTime = 0;
fCpuTime = 0;
fIntHandler = 0;
fProgressDialog = 0;
fProgressDialogStarted = kFALSE;
SetBit(kUseProgressDialog);
fPlayer = 0;
fFeedback = 0;
fChains = 0;
fDSet = 0;
fNotIdle = 0;
fSync = kTRUE;
fRunStatus = kRunning;
fIsWaiting = kFALSE;
fRedirLog = kFALSE;
fLogFileW = 0;
fLogFileR = 0;
fLogToWindowOnly = kFALSE;
fSaveLogToMacro = kFALSE;
fMacroLog.SetName("ProofLogMacro");
fWaitingSlaves = 0;
fQueries = 0;
fOtherQueries = 0;
fDrawQueries = 0;
fMaxDrawQueries = 1;
fSeqNum = 0;
fSessionID = -1;
fEndMaster = kFALSE;
fGlobalPackageDirList = 0;
fPackageLock = 0;
fEnabledPackagesOnClient = 0;
fInputData = 0;
fPrintProgress = 0;
fLoadedMacros = 0;
fProtocol = -1;
fSlaves = 0;
fTerminatedSlaveInfos = 0;
fBadSlaves = 0;
fAllMonitor = 0;
fDataReady = kFALSE;
fBytesReady = 0;
fTotalBytes = 0;
fAvailablePackages = 0;
fEnabledPackages = 0;
fRunningDSets = 0;
fCollectTimeout = -1;
fManager = 0;
fQueryMode = kSync;
fDynamicStartup = kFALSE;
fCloseMutex = 0;
fMergersSet = kFALSE;
fMergersByHost = kFALSE;
fMergers = 0;
fMergersCount = -1;
fLastAssignedMerger = 0;
fWorkersToMerge = 0;
fFinalizationRunning = kFALSE;
fPerfTree = "";
fWrksOutputReady = 0;
fSelector = 0;
if (gSystem->Getenv("PROOF_ENVVARS")) {
TString envs(gSystem->Getenv("PROOF_ENVVARS")), env, envsfound;
Int_t from = 0;
while (envs.Tokenize(env, from, ",")) {
if (!env.IsNull()) {
if (!gSystem->Getenv(env)) {
Warning("Init", "request for sending over undefined environemnt variable '%s' - ignoring", env.Data());
} else {
if (!envsfound.IsNull()) envsfound += ",";
envsfound += env;
TProof::DelEnvVar(env);
TProof::AddEnvVar(env, gSystem->Getenv(env));
}
}
}
if (envsfound.IsNull()) {
Warning("Init", "none of the requested env variables were found: '%s'", envs.Data());
} else {
Info("Init", "the following environment variables have been added to the list to be sent to the nodes: '%s'", envsfound.Data());
}
}
return;
}
TProof::~TProof()
{
if (fChains) {
while (TChain *chain = dynamic_cast<TChain*> (fChains->First()) ) {
chain->SetProof(0);
RemoveChain(chain);
}
}
if (TestBit(TProof::kIsClient)) {
TIter nextpackage(fEnabledPackagesOnClient);
while (TObjString *package = dynamic_cast<TObjString*>(nextpackage())) {
FileStat_t stat;
if (gSystem->GetPathInfo(package->String(), stat) == 0) {
if (stat.fIsLink)
gSystem->Unlink(package->String());
}
}
}
Close();
SafeDelete(fIntHandler);
SafeDelete(fSlaves);
SafeDelete(fActiveSlaves);
SafeDelete(fInactiveSlaves);
SafeDelete(fUniqueSlaves);
SafeDelete(fAllUniqueSlaves);
SafeDelete(fNonUniqueMasters);
SafeDelete(fTerminatedSlaveInfos);
SafeDelete(fBadSlaves);
SafeDelete(fAllMonitor);
SafeDelete(fActiveMonitor);
SafeDelete(fUniqueMonitor);
SafeDelete(fAllUniqueMonitor);
SafeDelete(fSlaveInfo);
SafeDelete(fChains);
SafeDelete(fPlayer);
SafeDelete(fFeedback);
SafeDelete(fWaitingSlaves);
SafeDelete(fAvailablePackages);
SafeDelete(fEnabledPackages);
SafeDelete(fEnabledPackagesOnClient);
SafeDelete(fLoadedMacros);
SafeDelete(fPackageLock);
SafeDelete(fGlobalPackageDirList);
SafeDelete(fRecvMessages);
SafeDelete(fInputData);
SafeDelete(fRunningDSets);
SafeDelete(fCloseMutex);
if (fWrksOutputReady) {
fWrksOutputReady->SetOwner(kFALSE);
delete fWrksOutputReady;
}
if (TestBit(TProof::kIsClient)) {
if (fLogFileR)
fclose(fLogFileR);
if (fLogFileW)
fclose(fLogFileW);
if (fLogFileName.Length() > 0)
gSystem->Unlink(fLogFileName);
}
gROOT->GetListOfProofs()->Remove(this);
if (fManager && fManager->IsValid())
fManager->DiscardSession(this);
if (gProof && gProof == this) {
TIter pvp(gROOT->GetListOfProofs(), kIterBackward);
while ((gProof = (TProof *)pvp())) {
if (gProof->InheritsFrom(TProof::Class()))
break;
}
}
Emit("~TProof()");
Emit("CloseWindow()");
}
Int_t TProof::Init(const char *, const char *conffile,
const char *confdir, Int_t loglevel, const char *alias)
{
R__ASSERT(gSystem);
fValid = kFALSE;
fTty = (isatty(0) == 0 || isatty(1) == 0) ? kFALSE : kTRUE;
Bool_t attach = kFALSE;
if (strlen(fUrl.GetOptions()) > 0) {
attach = kTRUE;
TString opts = fUrl.GetOptions();
if (opts.Contains("GUI")) {
SetBit(TProof::kUsingSessionGui);
opts.Remove(opts.Index("GUI"));
fUrl.SetOptions(opts);
}
}
if (TestBit(TProof::kIsMaster)) {
if (!conffile || !conffile[0])
fConfFile = kPROOF_ConfFile;
if (!confdir || !confdir[0])
fConfDir = kPROOF_ConfDir;
if (gProofServ) fGroup = gProofServ->GetGroup();
} else {
fConfDir = confdir;
fConfFile = conffile;
}
if (fConfFile.Contains("workers=0")) fConfFile.ReplaceAll("workers=0", "masteronly");
ParseConfigField(fConfFile);
fWorkDir = gSystem->WorkingDirectory();
fLogLevel = loglevel;
fProtocol = kPROOF_Protocol;
fSendGroupView = kTRUE;
fImage = fMasterServ ? "" : "<local>";
fIntHandler = 0;
fStatus = 0;
fRecvMessages = new TList;
fRecvMessages->SetOwner(kTRUE);
fSlaveInfo = 0;
fChains = new TList;
fAvailablePackages = 0;
fEnabledPackages = 0;
fRunningDSets = 0;
fEndMaster = TestBit(TProof::kIsMaster) ? kTRUE : kFALSE;
fInputData = 0;
ResetBit(TProof::kNewInputData);
fPrintProgress = 0;
fCollectTimeout = gEnv->GetValue("Proof.CollectTimeout", -1);
fDynamicStartup = gEnv->GetValue("Proof.DynamicStartup", kFALSE);
if (TestBit(TProof::kIsClient))
fDataPoolUrl.Form("root://%s", fMaster.Data());
else
fDataPoolUrl = "";
fProgressDialog = 0;
fProgressDialogStarted = kFALSE;
TString al = (alias) ? alias : fMaster.Data();
SetAlias(al);
fRedirLog = kFALSE;
if (TestBit(TProof::kIsClient)) {
fLogFileName.Form("%s/ProofLog_%d", gSystem->TempDirectory(), gSystem->GetPid());
if ((fLogFileW = fopen(fLogFileName, "w")) == 0)
Error("Init", "could not create temporary logfile");
if ((fLogFileR = fopen(fLogFileName, "r")) == 0)
Error("Init", "could not open temp logfile for reading");
}
fLogToWindowOnly = kFALSE;
fNotIdle = 0;
fSync = (attach) ? kFALSE : kTRUE;
fIsWaiting = kFALSE;
fBytesRead = 0;
fRealTime = 0;
fCpuTime = 0;
fQueries = 0;
fOtherQueries = 0;
fDrawQueries = 0;
fMaxDrawQueries = 1;
fSeqNum = 0;
fSessionID = -1;
fWaitingSlaves = 0;
fPlayer = 0;
MakePlayer();
fFeedback = new TList;
fFeedback->SetOwner();
fFeedback->SetName("FeedbackList");
AddInput(fFeedback);
fSlaves = new TSortedList(kSortDescending);
fActiveSlaves = new TList;
fInactiveSlaves = new TList;
fUniqueSlaves = new TList;
fAllUniqueSlaves = new TList;
fNonUniqueMasters = new TList;
fBadSlaves = new TList;
fAllMonitor = new TMonitor;
fActiveMonitor = new TMonitor;
fUniqueMonitor = new TMonitor;
fAllUniqueMonitor = new TMonitor;
fCurrentMonitor = 0;
fTerminatedSlaveInfos = new TList;
fTerminatedSlaveInfos->SetOwner(kTRUE);
fPackageLock = 0;
fEnabledPackagesOnClient = 0;
fLoadedMacros = 0;
fGlobalPackageDirList = 0;
Bool_t enableSchemaEvolution = gEnv->GetValue("Proof.SchemaEvolution",1);
if (enableSchemaEvolution) {
TMessage::EnableSchemaEvolutionForAll();
} else {
Info("TProof", "automatic schema evolution in TMessage explicitly disabled");
}
if (IsMaster()) {
fPackageDir = gProofServ->GetPackageDir();
} else {
TString sandbox;
if (GetSandbox(sandbox, kTRUE) != 0) {
Error("Init", "failure asserting sandbox directory %s", sandbox.Data());
return 0;
}
fPackageDir = gEnv->GetValue("Proof.PackageDir", "");
if (fPackageDir.IsNull())
fPackageDir.Form("%s/%s", sandbox.Data(), kPROOF_PackDir);
if (AssertPath(fPackageDir, kTRUE) != 0) {
Error("Init", "failure asserting directory %s", fPackageDir.Data());
return 0;
}
}
if (!IsMaster()) {
TString globpack = gEnv->GetValue("Proof.GlobalPackageDirs","");
if (globpack.Length() > 0) {
Int_t ng = 0;
Int_t from = 0;
TString ldir;
while (globpack.Tokenize(ldir, from, ":")) {
TProofServ::ResolveKeywords(ldir);
if (gSystem->AccessPathName(ldir, kReadPermission)) {
Warning("Init", "directory for global packages %s does not"
" exist or is not readable", ldir.Data());
} else {
TString key = TString::Format("G%d", ng++);
if (!fGlobalPackageDirList) {
fGlobalPackageDirList = new THashList();
fGlobalPackageDirList->SetOwner();
}
fGlobalPackageDirList->Add(new TNamed(key,ldir));
}
}
}
TString lockpath(fPackageDir);
lockpath.ReplaceAll("/", "%");
lockpath.Insert(0, TString::Format("%s/%s",
gSystem->TempDirectory(), kPROOF_PackageLockFile));
fPackageLock = new TProofLockPath(lockpath.Data());
fEnabledPackagesOnClient = new TList;
fEnabledPackagesOnClient->SetOwner();
}
if (fDynamicStartup) {
if (!IsMaster()) {
if (!StartSlaves(attach))
return 0;
}
} else {
Bool_t masterOnly = gEnv->GetValue("Proof.MasterOnly", kFALSE);
if (!IsMaster() || !masterOnly) {
if (!StartSlaves(attach))
return 0;
if (!IsMaster()) {
Int_t dyn;
GetRC("Proof.DynamicStartup", dyn);
if (dyn != 0) fDynamicStartup = kTRUE;
}
}
}
if (fgSemaphore)
SafeDelete(fgSemaphore);
fValid = kTRUE;
fAllMonitor->DeActivateAll();
Int_t nwrk = GetRemoteProtocol() > 35 ? -1 : 9999;
TNamed *n = 0;
if (TProof::GetEnvVars() &&
(n = (TNamed *) TProof::GetEnvVars()->FindObject("PROOF_NWORKERS"))) {
TString s(n->GetTitle());
if (s.IsDigit()) nwrk = s.Atoi();
}
GoParallel(nwrk, attach);
if (!attach)
SendInitialState();
else if (!IsIdle())
fRedirLog = kTRUE;
if (TestBit(TProof::kIsClient))
SetAlias(al);
SetActive(kFALSE);
if (IsValid()) {
ActivateAsyncInput();
R__LOCKGUARD2(gROOTMutex);
gROOT->GetListOfSockets()->Add(this);
}
AskParallel();
return fActiveSlaves->GetSize();
}
Int_t TProof::GetSandbox(TString &sb, Bool_t assert, const char *rc)
{
if (rc && strlen(rc)) sb = gEnv->GetValue(rc, sb);
if (sb.IsNull()) sb = gEnv->GetValue("Proof.Sandbox", "");
if (sb.IsNull()) sb.Form("~/%s", kPROOF_WorkDir);
if (sb == ".") {
sb = gSystem->pwd();
} else if (sb == "..") {
sb = gSystem->DirName(gSystem->pwd());
}
gSystem->ExpandPathName(sb);
if (assert && AssertPath(sb, kTRUE) != 0) return -1;
return 0;
}
void TProof::ParseConfigField(const char *config)
{
TString sconf(config), opt;
Ssiz_t from = 0;
Bool_t cpuPin = kFALSE;
const char *cq = (IsLite()) ? "\"" : "";
while (sconf.Tokenize(opt, from, ",")) {
if (opt.IsNull()) continue;
if (opt.BeginsWith("valgrind")) {
TString mst, top, sub, wrk, all;
TList *envs = fgProofEnvList;
TNamed *n = 0;
if (envs) {
if ((n = (TNamed *) envs->FindObject("PROOF_WRAPPERCMD")))
all = n->GetTitle();
if ((n = (TNamed *) envs->FindObject("PROOF_MASTER_WRAPPERCMD")))
mst = n->GetTitle();
if ((n = (TNamed *) envs->FindObject("PROOF_TOPMASTER_WRAPPERCMD")))
top = n->GetTitle();
if ((n = (TNamed *) envs->FindObject("PROOF_SUBMASTER_WRAPPERCMD")))
sub = n->GetTitle();
if ((n = (TNamed *) envs->FindObject("PROOF_SLAVE_WRAPPERCMD")))
wrk = n->GetTitle();
}
if (all != "" && mst == "") mst = all;
if (all != "" && top == "") top = all;
if (all != "" && sub == "") sub = all;
if (all != "" && wrk == "") wrk = all;
if (all != "" && all.BeginsWith("valgrind_opts:")) {
Info("ParseConfigField","valgrind run: resetting 'PROOF_WRAPPERCMD':"
" must be set again for next run , if any");
TProof::DelEnvVar("PROOF_WRAPPERCMD");
}
TString var, cmd;
cmd.Form("%svalgrind -v --suppressions=<rootsys>/etc/valgrind-root.supp", cq);
TString mstlab("NO"), wrklab("NO");
Bool_t doMaster = (opt == "valgrind" || (opt.Contains("master") &&
!opt.Contains("topmaster") && !opt.Contains("submaster")))
? kTRUE : kFALSE;
if (doMaster) {
if (!IsLite()) {
if (mst == "" || mst.BeginsWith("valgrind_opts:")) {
mst.ReplaceAll("valgrind_opts:","");
var.Form("%s --log-file=<logfilemst>.valgrind.log %s", cmd.Data(), mst.Data());
TProof::AddEnvVar("PROOF_MASTER_WRAPPERCMD", var);
mstlab = "YES";
} else if (mst != "") {
mstlab = "YES";
}
} else {
if (opt.Contains("master")) {
Warning("ParseConfigField",
"master valgrinding does not make sense for PROOF-Lite: ignoring");
opt.ReplaceAll("master", "");
if (!opt.Contains("workers")) return;
}
if (opt == "valgrind" || opt == "valgrind=") opt = "valgrind=workers";
}
}
if (opt.Contains("topmaster")) {
if (top == "" || top.BeginsWith("valgrind_opts:")) {
top.ReplaceAll("valgrind_opts:","");
var.Form("%s --log-file=<logfilemst>.valgrind.log %s", cmd.Data(), top.Data());
TProof::AddEnvVar("PROOF_TOPMASTER_WRAPPERCMD", var);
mstlab = "YES";
} else if (top != "") {
mstlab = "YES";
}
}
if (opt.Contains("submaster")) {
if (sub == "" || sub.BeginsWith("valgrind_opts:")) {
sub.ReplaceAll("valgrind_opts:","");
var.Form("%s --log-file=<logfilemst>.valgrind.log %s", cmd.Data(), sub.Data());
TProof::AddEnvVar("PROOF_SUBMASTER_WRAPPERCMD", var);
mstlab = "YES";
} else if (sub != "") {
mstlab = "YES";
}
}
if (opt.Contains("=workers") || opt.Contains("+workers")) {
if (wrk == "" || wrk.BeginsWith("valgrind_opts:")) {
wrk.ReplaceAll("valgrind_opts:","");
var.Form("%s --log-file=<logfilewrk>.__valgrind__.log %s%s", cmd.Data(), wrk.Data(), cq);
TProof::AddEnvVar("PROOF_SLAVE_WRAPPERCMD", var);
TString nwrks("2");
Int_t inw = opt.Index('#');
if (inw != kNPOS) {
nwrks = opt(inw+1, opt.Length());
if (!nwrks.IsDigit()) nwrks = "2";
}
if (!IsLite()) {
TProof::AddEnvVar("PROOF_NWORKERS", nwrks);
} else {
gEnv->SetValue("ProofLite.Workers", nwrks.Atoi());
}
wrklab = nwrks;
TProof::AddEnvVar("PROOF_ADDITIONALLOG", "__valgrind__.log*");
} else if (wrk != "") {
wrklab = "ALL";
}
}
if (!IsLite()) {
TProof::AddEnvVar("PROOF_INTWAIT", "5000");
gEnv->SetValue("Proof.SocketActivityTimeout", 6000);
} else {
gEnv->SetValue("ProofLite.StartupTimeOut", 5000);
}
Printf(" ");
if (!IsLite()) {
Printf(" ---> Starting a debug run with valgrind (master:%s, workers:%s)", mstlab.Data(), wrklab.Data());
} else {
Printf(" ---> Starting a debug run with valgrind (workers:%s)", wrklab.Data());
}
Printf(" ---> Please be patient: startup may be VERY slow ...");
Printf(" ---> Logs will be available as special tags in the log window (from the progress dialog or TProof::LogViewer()) ");
Printf(" ---> (Reminder: this debug run makes sense only if you are running a debug version of ROOT)");
Printf(" ");
} else if (opt.BeginsWith("igprof-pp")) {
Printf("*** Requested IgProf performance profiling ***");
TString addLogExt = "__igprof.pp__.log";
TString addLogFmt = "igprof -pk -pp -t proofserv.exe -o %s.%s";
TString tmp;
if (IsLite()) {
addLogFmt.Append("\"");
addLogFmt.Prepend("\"");
}
tmp.Form(addLogFmt.Data(), "<logfilemst>", addLogExt.Data());
TProof::AddEnvVar("PROOF_MASTER_WRAPPERCMD", tmp.Data());
tmp.Form(addLogFmt.Data(), "<logfilewrk>", addLogExt.Data());
TProof::AddEnvVar("PROOF_SLAVE_WRAPPERCMD", tmp.Data() );
TProof::AddEnvVar("PROOF_ADDITIONALLOG", addLogExt.Data());
} else if (opt.BeginsWith("cpupin=")) {
opt.Remove(0, 7);
for (Ssiz_t i=0; i<opt.Length(); i++) {
Char_t c = opt[i];
if ((c != '+') && ((c < '0') || (c > '9')))
opt[i] = '_';
}
opt.ReplaceAll("_", "");
TProof::AddEnvVar("PROOF_SLAVE_CPUPIN_ORDER", opt);
cpuPin = kTRUE;
} else if (opt.BeginsWith("workers=")) {
opt.ReplaceAll("workers=","");
TProof::AddEnvVar("PROOF_NWORKERS", opt);
}
}
#ifdef R__LINUX
if (IsLite() && cpuPin) {
Printf("*** Requested CPU pinning ***");
const TList *ev = GetEnvVars();
const char *pinCmd = "taskset -c <cpupin>";
TString val;
TNamed *p;
if (ev && (p = dynamic_cast<TNamed *>(ev->FindObject("PROOF_SLAVE_WRAPPERCMD")))) {
val = p->GetTitle();
val.Insert(val.Length()-1, " ");
val.Insert(val.Length()-1, pinCmd);
}
else {
val.Form("\"%s\"", pinCmd);
}
TProof::AddEnvVar("PROOF_SLAVE_WRAPPERCMD", val.Data());
}
#endif
}
Int_t TProof::AssertPath(const char *inpath, Bool_t writable)
{
if (!inpath || strlen(inpath) <= 0) {
Error("AssertPath", "undefined input path");
return -1;
}
TString path(inpath);
gSystem->ExpandPathName(path);
if (gSystem->AccessPathName(path, kFileExists)) {
if (gSystem->mkdir(path, kTRUE) != 0) {
Error("AssertPath", "could not create path %s", path.Data());
return -1;
}
}
if (gSystem->AccessPathName(path, kWritePermission) && writable) {
if (gSystem->Chmod(path, 0666) != 0) {
Error("AssertPath", "could not make path %s writable", path.Data());
return -1;
}
}
return 0;
}
void TProof::SetManager(TProofMgr *mgr)
{
fManager = mgr;
if (mgr) {
R__LOCKGUARD2(gROOTMutex);
gROOT->GetListOfSockets()->Remove(mgr);
gROOT->GetListOfSockets()->Add(mgr);
}
}
Int_t TProof::AddWorkers(TList *workerList)
{
if (!IsMaster()) {
Error("AddWorkers", "AddWorkers can only be called on the master!");
return -1;
}
if (!workerList || !(workerList->GetSize())) {
Error("AddWorkers", "empty list of workers!");
return -2;
}
fImage = gProofServ->GetImage();
if (fImage.IsNull())
fImage.Form("%s:%s", TUrl(gSystem->HostName()).GetHostFQDN(), gProofServ->GetWorkDir());
UInt_t nSlaves = workerList->GetSize();
UInt_t nSlavesDone = 0;
Int_t ord = 0;
Bool_t goMoreParallel = (fSlaves->GetEntries() > 0);
TList *addedWorkers = new TList();
if (!addedWorkers) {
Error("AddWorkers", "cannot create new list for the workers to be added");
return -2;
}
addedWorkers->SetOwner(kFALSE);
TListIter next(workerList);
TObject *to;
TProofNodeInfo *worker;
TSlaveInfo *dummysi = new TSlaveInfo();
while ((to = next())) {
worker = (TProofNodeInfo *)to;
const Char_t *image = worker->GetImage().Data();
const Char_t *workdir = worker->GetWorkDir().Data();
Int_t perfidx = worker->GetPerfIndex();
Int_t sport = worker->GetPort();
if (sport == -1)
sport = fUrl.GetPort();
TString fullord;
if (worker->GetOrdinal().Length() > 0) {
fullord.Form("%s.%s", gProofServ->GetOrdinal(), worker->GetOrdinal().Data());
} else {
fullord.Form("%s.%d", gProofServ->GetOrdinal(), ord);
}
dummysi->SetOrdinal(fullord);
TSlaveInfo *rmsi = (TSlaveInfo *)fTerminatedSlaveInfos->Remove(dummysi);
if (rmsi) SafeDelete(rmsi);
TString wn(worker->GetNodeName());
if (wn == "localhost" || wn.BeginsWith("localhost.")) wn = gSystem->HostName();
TUrl u(TString::Format("%s:%d", wn.Data(), sport));
if (strlen(gProofServ->GetGroup()) > 0) {
if (strlen(u.GetUser()) <= 0)
u.SetUser(gProofServ->GetUser());
u.SetPasswd(gProofServ->GetGroup());
}
TSlave *slave = 0;
if (worker->IsWorker()) {
slave = CreateSlave(u.GetUrl(), fullord, perfidx, image, workdir);
} else {
slave = CreateSubmaster(u.GetUrl(), fullord,
image, worker->GetMsd(), worker->GetNWrks());
}
Bool_t slaveOk = kTRUE;
fSlaves->Add(slave);
if (slave->IsValid()) {
addedWorkers->Add(slave);
} else {
slaveOk = kFALSE;
fBadSlaves->Add(slave);
Warning("AddWorkers", "worker '%s' is invalid", slave->GetOrdinal());
}
PDB(kGlobal,3)
Info("AddWorkers", "worker on host %s created"
" and added to list (ord: %s)", worker->GetName(), slave->GetOrdinal());
nSlavesDone++;
TMessage m(kPROOF_SERVERSTARTED);
m << TString("Opening connections to workers") << nSlaves
<< nSlavesDone << slaveOk;
gProofServ->GetSocket()->Send(m);
ord++;
}
SafeDelete(dummysi);
SafeDelete(workerList);
nSlavesDone = 0;
TIter nxsl(addedWorkers);
TSlave *sl = 0;
while ((sl = (TSlave *) nxsl())) {
if (sl->IsValid())
sl->SetupServ(TSlave::kSlave, 0);
Bool_t slaveOk = kTRUE;
if (sl->IsValid()) {
fAllMonitor->Add(sl->GetSocket());
PDB(kGlobal,3)
Info("AddWorkers", "worker on host %s finalized"
" and added to list", sl->GetOrdinal());
} else {
slaveOk = kFALSE;
fBadSlaves->Add(sl);
}
nSlavesDone++;
TMessage m(kPROOF_SERVERSTARTED);
m << TString("Setting up worker servers") << nSlaves
<< nSlavesDone << slaveOk;
gProofServ->GetSocket()->Send(m);
}
Int_t nwrk = GetRemoteProtocol() > 35 ? -1 : 9999;
TNamed *n = 0;
if (TProof::GetEnvVars() &&
(n = (TNamed *) TProof::GetEnvVars()->FindObject("PROOF_NWORKERS"))) {
TString s(n->GetTitle());
if (s.IsDigit()) nwrk = s.Atoi();
}
if (fDynamicStartup && goMoreParallel) {
PDB(kGlobal, 3)
Info("AddWorkers", "Will invoke GoMoreParallel()");
Int_t nw = GoMoreParallel(nwrk);
PDB(kGlobal, 3)
Info("AddWorkers", "GoMoreParallel()=%d", nw);
}
else {
PDB(kGlobal, 3)
Info("AddWorkers", "Will invoke GoParallel()");
GoParallel(nwrk, kFALSE, 0);
}
if (gProofServ && gProofServ->GetEnabledPackages() &&
gProofServ->GetEnabledPackages()->GetSize() > 0) {
TIter nxp(gProofServ->GetEnabledPackages());
TPair *pck = 0;
while ((pck = (TPair *) nxp())) {
if (fDynamicStartup && goMoreParallel) {
PDB(kGlobal, 3)
Info("AddWorkers", "Will invoke UploadPackage() and EnablePackage() on added workers");
if (UploadPackage(pck->GetName(), kUntar, addedWorkers) >= 0)
EnablePackage(pck->GetName(), (TList *) pck->Value(), kTRUE, addedWorkers);
}
else {
PDB(kGlobal, 3)
Info("AddWorkers", "Will invoke UploadPackage() and EnablePackage() on all workers");
if (UploadPackage(pck->GetName()) >= 0)
EnablePackage(pck->GetName(), (TList *) pck->Value(), kTRUE);
}
}
}
if (fLoadedMacros) {
TIter nxp(fLoadedMacros);
TObjString *os = 0;
while ((os = (TObjString *) nxp())) {
PDB(kGlobal, 3)
Info("AddWorkers", "Will invoke Load() on selected workers");
Printf("Loading a macro : %s", os->GetName());
Load(os->GetName(), kTRUE, kTRUE, addedWorkers);
}
}
TString dyn = gSystem->GetDynamicPath();
dyn.ReplaceAll(":", " ");
dyn.ReplaceAll("\"", " ");
PDB(kGlobal, 3)
Info("AddWorkers", "Will invoke AddDynamicPath() on selected workers");
AddDynamicPath(dyn, kFALSE, addedWorkers, fDynamicStartup);
TString inc = gSystem->GetIncludePath();
inc.ReplaceAll("-I", " ");
inc.ReplaceAll("\"", " ");
PDB(kGlobal, 3)
Info("AddWorkers", "Will invoke AddIncludePath() on selected workers");
AddIncludePath(inc, kFALSE, addedWorkers, fDynamicStartup);
PDB(kGlobal, 3)
Info("AddWorkers", "Will invoke SaveWorkerInfo()");
SaveWorkerInfo();
if (fDynamicStartup && gProofServ) {
PDB(kGlobal, 3)
Info("AddWorkers", "Will invoke SendParallel()");
gProofServ->SendParallel(kTRUE);
if (goMoreParallel && fPlayer) {
PDB(kGlobal, 3)
Info("AddWorkers", "Will send the PROCESS message to selected workers");
fPlayer->JoinProcess(addedWorkers);
}
}
delete addedWorkers;
return 0;
}
Int_t TProof::RemoveWorkers(TList *workerList)
{
if (!IsMaster()) {
Error("RemoveWorkers", "RemoveWorkers can only be called on the master!");
return -1;
}
fFileMap.clear();
if (!workerList) {
TIter nxsl(fSlaves);
TSlave *sl = 0;
while ((sl = (TSlave *) nxsl())) {
TerminateWorker(sl);
}
} else {
if (!(workerList->GetSize())) {
Error("RemoveWorkers", "The list of workers should not be empty!");
return -2;
}
TListIter next(workerList);
TObject *to;
TProofNodeInfo *worker;
while ((to = next())) {
TSlave *sl = 0;
if (!strcmp(to->ClassName(), "TProofNodeInfo")) {
worker = (TProofNodeInfo *)to;
TIter nxsl(fSlaves);
while ((sl = (TSlave *) nxsl())) {
if (sl->GetName() == worker->GetNodeName())
break;
}
} else if (to->InheritsFrom(TSlave::Class())) {
sl = (TSlave *) to;
} else {
Warning("RemoveWorkers","unknown object type: %s - it should be"
" TProofNodeInfo or inheriting from TSlave", to->ClassName());
}
if (sl) {
if (gDebug > 0)
Info("RemoveWorkers","terminating worker %s", sl->GetOrdinal());
TerminateWorker(sl);
}
}
}
if (gProofServ && fSlaves->GetSize() <= 0) gProofServ->ReleaseWorker("master");
return 0;
}
Bool_t TProof::StartSlaves(Bool_t attach)
{
if (TestBit(TProof::kIsMaster)) {
Int_t pc = 0;
TList *workerList = new TList;
if (gProofServ->GetWorkers(workerList, pc) == TProofServ::kQueryStop) {
TString emsg("no resource currently available for this session: please retry later");
if (gDebug > 0) Info("StartSlaves", "%s", emsg.Data());
gProofServ->SendAsynMessage(emsg.Data());
return kFALSE;
}
if (AddWorkers(workerList) < 0)
return kFALSE;
} else {
Printf("Starting master: opening connection ...");
TSlave *slave = CreateSubmaster(fUrl.GetUrl(), "0", "master", 0);
if (slave->IsValid()) {
fprintf(stderr,"Starting master:"
" connection open: setting up server ... \r");
StartupMessage("Connection to master opened", kTRUE, 1, 1);
if (!attach) {
slave->SetInterruptHandler(kTRUE);
slave->SetupServ(TSlave::kMaster, fConfFile);
if (slave->IsValid()) {
Printf("Starting master: OK ");
StartupMessage("Master started", kTRUE, 1, 1);
if (fProtocol == 1) {
Error("StartSlaves",
"client and remote protocols not compatible (%d and %d)",
kPROOF_Protocol, fProtocol);
slave->Close("S");
delete slave;
return kFALSE;
}
fSlaves->Add(slave);
fAllMonitor->Add(slave->GetSocket());
slave->SetInterruptHandler(kFALSE);
fIntHandler = new TProofInterruptHandler(this);
Int_t rc = Collect(slave, 300);
Int_t slStatus = slave->GetStatus();
if (slStatus == -99 || slStatus == -98 || rc == 0) {
fSlaves->Remove(slave);
fAllMonitor->Remove(slave->GetSocket());
if (slStatus == -99)
Error("StartSlaves", "no resources available or problems setting up workers (check logs)");
else if (slStatus == -98)
Error("StartSlaves", "could not setup output redirection on master");
else
Error("StartSlaves", "setting up master");
slave->Close("S");
delete slave;
return 0;
}
if (!slave->IsValid()) {
fSlaves->Remove(slave);
fAllMonitor->Remove(slave->GetSocket());
slave->Close("S");
delete slave;
Error("StartSlaves",
"failed to setup connection with PROOF master server");
return kFALSE;
}
if (!gROOT->IsBatch() && TestBit(kUseProgressDialog)) {
if ((fProgressDialog =
gROOT->GetPluginManager()->FindHandler("TProofProgressDialog")))
if (fProgressDialog->LoadPlugin() == -1)
fProgressDialog = 0;
}
} else {
Printf("Starting master: failure");
}
} else {
Printf("Starting master: OK ");
StartupMessage("Master attached", kTRUE, 1, 1);
if (!gROOT->IsBatch() && TestBit(kUseProgressDialog)) {
if ((fProgressDialog =
gROOT->GetPluginManager()->FindHandler("TProofProgressDialog")))
if (fProgressDialog->LoadPlugin() == -1)
fProgressDialog = 0;
}
fSlaves->Add(slave);
fIntHandler = new TProofInterruptHandler(this);
}
} else {
delete slave;
if (gDebug > 0)
Error("StartSlaves", "failed to create (or connect to) the PROOF master server");
return kFALSE;
}
}
return kTRUE;
}
void TProof::Close(Option_t *opt)
{
{ R__LOCKGUARD2(fCloseMutex);
fValid = kFALSE;
if (fSlaves) {
if (fIntHandler)
fIntHandler->Remove();
TIter nxs(fSlaves);
TSlave *sl = 0;
while ((sl = (TSlave *)nxs()))
sl->Close(opt);
fActiveSlaves->Clear("nodelete");
fUniqueSlaves->Clear("nodelete");
fAllUniqueSlaves->Clear("nodelete");
fNonUniqueMasters->Clear("nodelete");
fBadSlaves->Clear("nodelete");
fInactiveSlaves->Clear("nodelete");
fSlaves->Delete();
}
}
{
R__LOCKGUARD2(gROOTMutex);
gROOT->GetListOfSockets()->Remove(this);
if (fChains) {
while (TChain *chain = dynamic_cast<TChain*> (fChains->First()) ) {
chain->SetProof(0);
RemoveChain(chain);
}
}
if (IsProofd()) {
gROOT->GetListOfProofs()->Remove(this);
if (gProof && gProof == this) {
TIter pvp(gROOT->GetListOfProofs(), kIterBackward);
while ((gProof = (TProof *)pvp())) {
if (gProof->IsProofd())
break;
}
}
}
}
}
TSlave *TProof::CreateSlave(const char *url, const char *ord,
Int_t perf, const char *image, const char *workdir)
{
TSlave* sl = TSlave::Create(url, ord, perf, image,
this, TSlave::kSlave, workdir, 0);
if (sl->IsValid()) {
sl->SetInputHandler(new TProofInputHandler(this, sl->GetSocket()));
sl->fParallel = 1;
}
return sl;
}
TSlave *TProof::CreateSubmaster(const char *url, const char *ord,
const char *image, const char *msd, Int_t nwk)
{
TSlave *sl = TSlave::Create(url, ord, 100, image, this,
TSlave::kMaster, 0, msd, nwk);
if (sl->IsValid()) {
sl->SetInputHandler(new TProofInputHandler(this, sl->GetSocket()));
}
return sl;
}
TSlave *TProof::FindSlave(TSocket *s) const
{
TSlave *sl;
TIter next(fSlaves);
while ((sl = (TSlave *)next())) {
if (sl->IsValid() && sl->GetSocket() == s)
return sl;
}
return 0;
}
void TProof::FindUniqueSlaves()
{
fUniqueSlaves->Clear();
fUniqueMonitor->RemoveAll();
fAllUniqueSlaves->Clear();
fAllUniqueMonitor->RemoveAll();
fNonUniqueMasters->Clear();
TIter next(fActiveSlaves);
while (TSlave *sl = dynamic_cast<TSlave*>(next())) {
if (fImage == sl->fImage) {
if (sl->GetSlaveType() == TSlave::kMaster) {
fNonUniqueMasters->Add(sl);
fAllUniqueSlaves->Add(sl);
fAllUniqueMonitor->Add(sl->GetSocket());
}
continue;
}
TIter next2(fUniqueSlaves);
TSlave *replace_slave = 0;
Bool_t add = kTRUE;
while (TSlave *sl2 = dynamic_cast<TSlave*>(next2())) {
if (sl->fImage == sl2->fImage) {
add = kFALSE;
if (sl->GetSlaveType() == TSlave::kMaster) {
if (sl2->GetSlaveType() == TSlave::kSlave) {
replace_slave = sl2;
add = kTRUE;
} else if (sl2->GetSlaveType() == TSlave::kMaster) {
fNonUniqueMasters->Add(sl);
fAllUniqueSlaves->Add(sl);
fAllUniqueMonitor->Add(sl->GetSocket());
} else {
Error("FindUniqueSlaves", "TSlave is neither Master nor Slave");
R__ASSERT(0);
}
}
break;
}
}
if (add) {
fUniqueSlaves->Add(sl);
fAllUniqueSlaves->Add(sl);
fUniqueMonitor->Add(sl->GetSocket());
fAllUniqueMonitor->Add(sl->GetSocket());
if (replace_slave) {
fUniqueSlaves->Remove(replace_slave);
fAllUniqueSlaves->Remove(replace_slave);
fUniqueMonitor->Remove(replace_slave->GetSocket());
fAllUniqueMonitor->Remove(replace_slave->GetSocket());
}
}
}
fUniqueMonitor->DeActivateAll();
fAllUniqueMonitor->DeActivateAll();
}
Int_t TProof::GetNumberOfSlaves() const
{
return fSlaves->GetSize();
}
Int_t TProof::GetNumberOfActiveSlaves() const
{
return fActiveSlaves->GetSize();
}
Int_t TProof::GetNumberOfInactiveSlaves() const
{
return fInactiveSlaves->GetSize();
}
Int_t TProof::GetNumberOfUniqueSlaves() const
{
return fUniqueSlaves->GetSize();
}
Int_t TProof::GetNumberOfBadSlaves() const
{
return fBadSlaves->GetSize();
}
void TProof::AskStatistics()
{
if (!IsValid()) return;
Broadcast(kPROOF_GETSTATS, kActive);
Collect(kActive, fCollectTimeout);
}
void TProof::GetStatistics(Bool_t verbose)
{
if (fProtocol > 27) {
AskStatistics();
} else {
RedirectHandle_t rh;
gSystem->RedirectOutput(fLogFileName, "a", &rh);
Print();
gSystem->RedirectOutput(0, 0, &rh);
TMacro *mp = GetLastLog();
if (mp) {
TIter nxl(mp->GetListOfLines());
TObjString *os = 0;
while ((os = (TObjString *) nxl())) {
TString s(os->GetName());
if (s.Contains("Total MB's processed:")) {
s.ReplaceAll("Total MB's processed:", "");
if (s.IsFloat()) fBytesRead = (Long64_t) s.Atof() * (1024*1024);
} else if (s.Contains("Total real time used (s):")) {
s.ReplaceAll("Total real time used (s):", "");
if (s.IsFloat()) fRealTime = s.Atof();
} else if (s.Contains("Total CPU time used (s):")) {
s.ReplaceAll("Total CPU time used (s):", "");
if (s.IsFloat()) fCpuTime = s.Atof();
}
}
delete mp;
}
}
if (verbose) {
Printf(" Real/CPU time (s): %.3f / %.3f; workers: %d; processed: %.2f MBs",
GetRealTime(), GetCpuTime(), GetParallel(), float(GetBytesRead())/(1024*1024));
}
}
void TProof::AskParallel()
{
if (!IsValid()) return;
Broadcast(kPROOF_GETPARALLEL, kActive);
Collect(kActive, fCollectTimeout);
}
TList *TProof::GetListOfQueries(Option_t *opt)
{
if (!IsValid() || TestBit(TProof::kIsMaster)) return (TList *)0;
Bool_t all = ((strchr(opt,'A') || strchr(opt,'a'))) ? kTRUE : kFALSE;
TMessage m(kPROOF_QUERYLIST);
m << all;
Broadcast(m, kActive);
Collect(kActive, fCollectTimeout);
return fQueries;
}
Int_t TProof::GetNumberOfQueries()
{
if (fQueries)
return fQueries->GetSize() - fOtherQueries;
return 0;
}
void TProof::SetMaxDrawQueries(Int_t max)
{
if (max > 0) {
if (fPlayer)
fPlayer->SetMaxDrawQueries(max);
fMaxDrawQueries = max;
}
}
void TProof::GetMaxQueries()
{
TMessage m(kPROOF_MAXQUERIES);
m << kFALSE;
Broadcast(m, kActive);
Collect(kActive, fCollectTimeout);
}
TList *TProof::GetQueryResults()
{
return (fPlayer ? fPlayer->GetListOfResults() : (TList *)0);
}
TQueryResult *TProof::GetQueryResult(const char *ref)
{
return (fPlayer ? fPlayer->GetQueryResult(ref) : (TQueryResult *)0);
}
void TProof::ShowQueries(Option_t *opt)
{
Bool_t help = ((strchr(opt,'H') || strchr(opt,'h'))) ? kTRUE : kFALSE;
if (help) {
Printf("+++");
Printf("+++ Options: \"A\" show all queries known to server");
Printf("+++ \"L\" show retrieved queries");
Printf("+++ \"F\" full listing of query info");
Printf("+++ \"H\" print this menu");
Printf("+++");
Printf("+++ (case insensitive)");
Printf("+++");
Printf("+++ Use Retrieve(<#>) to retrieve the full"
" query results from the master");
Printf("+++ e.g. Retrieve(8)");
Printf("+++");
return;
}
if (!IsValid()) return;
Bool_t local = ((strchr(opt,'L') || strchr(opt,'l'))) ? kTRUE : kFALSE;
TObject *pq = 0;
if (!local) {
GetListOfQueries(opt);
if (!fQueries) return;
TIter nxq(fQueries);
if (fOtherQueries > 0) {
Printf("+++");
Printf("+++ Queries processed during other sessions: %d", fOtherQueries);
Int_t nq = 0;
while (nq++ < fOtherQueries && (pq = nxq()))
pq->Print(opt);
}
Printf("+++");
Printf("+++ Queries processed during this session: selector: %d, draw: %d",
GetNumberOfQueries(), fDrawQueries);
while ((pq = nxq()))
pq->Print(opt);
} else {
Printf("+++");
Printf("+++ Queries processed during this session: selector: %d, draw: %d",
GetNumberOfQueries(), fDrawQueries);
TList *listlocal = fPlayer ? fPlayer->GetListOfResults() : (TList *)0;
if (listlocal) {
Printf("+++");
Printf("+++ Queries available locally: %d", listlocal->GetSize());
TIter nxlq(listlocal);
while ((pq = nxlq()))
pq->Print(opt);
}
}
Printf("+++");
}
Bool_t TProof::IsDataReady(Long64_t &totalbytes, Long64_t &bytesready)
{
if (!IsValid()) return kFALSE;
TList submasters;
TIter nextSlave(GetListOfActiveSlaves());
while (TSlave *sl = dynamic_cast<TSlave*>(nextSlave())) {
if (sl->GetSlaveType() == TSlave::kMaster) {
submasters.Add(sl);
}
}
fDataReady = kTRUE;
fBytesReady = 0;
fTotalBytes = 0;
if (submasters.GetSize() > 0) {
Broadcast(kPROOF_DATA_READY, &submasters);
Collect(&submasters);
}
bytesready = fBytesReady;
totalbytes = fTotalBytes;
EmitVA("IsDataReady(Long64_t,Long64_t)", 2, totalbytes, bytesready);
PDB(kGlobal,2)
Info("IsDataReady", "%lld / %lld (%s)",
bytesready, totalbytes, fDataReady?"READY":"NOT READY");
return fDataReady;
}
void TProof::Interrupt(EUrgent type, ESlaves list)
{
if (!IsValid()) return;
TList *slaves = 0;
if (list == kAll) slaves = fSlaves;
if (list == kActive) slaves = fActiveSlaves;
if (list == kUnique) slaves = fUniqueSlaves;
if (list == kAllUnique) slaves = fAllUniqueSlaves;
if (slaves->GetSize() == 0) return;
TSlave *sl;
TIter next(slaves);
while ((sl = (TSlave *)next())) {
if (sl->IsValid()) {
sl->Interrupt((Int_t)type);
}
}
}
Int_t TProof::GetParallel() const
{
if (!IsValid()) return -1;
TIter nextSlave(GetListOfActiveSlaves());
Int_t nparallel = 0;
while (TSlave* sl = dynamic_cast<TSlave*>(nextSlave()))
if (sl->GetParallel() >= 0)
nparallel += sl->GetParallel();
return nparallel;
}
TList *TProof::GetListOfSlaveInfos()
{
if (!IsValid()) return 0;
if (fSlaveInfo == 0) {
fSlaveInfo = new TSortedList(kSortDescending);
fSlaveInfo->SetOwner();
} else {
fSlaveInfo->Delete();
}
TList masters;
TIter next(GetListOfSlaves());
TSlave *slave;
while ((slave = (TSlave *) next()) != 0) {
if (slave->GetSlaveType() == TSlave::kSlave) {
const char *name = IsLite() ? gSystem->HostName() : slave->GetName();
TSlaveInfo *slaveinfo = new TSlaveInfo(slave->GetOrdinal(),
name,
slave->GetPerfIdx());
fSlaveInfo->Add(slaveinfo);
TIter nextactive(GetListOfActiveSlaves());
TSlave *activeslave;
while ((activeslave = (TSlave *) nextactive())) {
if (TString(slaveinfo->GetOrdinal()) == activeslave->GetOrdinal()) {
slaveinfo->SetStatus(TSlaveInfo::kActive);
break;
}
}
TIter nextbad(GetListOfBadSlaves());
TSlave *badslave;
while ((badslave = (TSlave *) nextbad())) {
if (TString(slaveinfo->GetOrdinal()) == badslave->GetOrdinal()) {
slaveinfo->SetStatus(TSlaveInfo::kBad);
break;
}
}
if (slave->IsValid()) {
if (slave->GetSocket()->Send(kPROOF_GETSLAVEINFO) == -1)
MarkBad(slave, "could not send kPROOF_GETSLAVEINFO message");
else
masters.Add(slave);
}
} else if (slave->GetSlaveType() == TSlave::kMaster) {
if (slave->IsValid()) {
if (slave->GetSocket()->Send(kPROOF_GETSLAVEINFO) == -1)
MarkBad(slave, "could not send kPROOF_GETSLAVEINFO message");
else
masters.Add(slave);
}
} else {
Error("GetSlaveInfo", "TSlave is neither Master nor Slave");
R__ASSERT(0);
}
}
if (masters.GetSize() > 0) Collect(&masters);
return fSlaveInfo;
}
void TProof::Activate(TList *slaves)
{
TMonitor *mon = fAllMonitor;
mon->DeActivateAll();
slaves = !slaves ? fActiveSlaves : slaves;
TIter next(slaves);
TSlave *sl;
while ((sl = (TSlave*) next())) {
if (sl->IsValid())
mon->Activate(sl->GetSocket());
}
}
void TProof::SetMonitor(TMonitor *mon, Bool_t on)
{
TMonitor *m = (mon) ? mon : fCurrentMonitor;
if (m) {
if (on)
m->ActivateAll();
else
m->DeActivateAll();
}
}
Int_t TProof::BroadcastGroupPriority(const char *grp, Int_t priority, TList *workers)
{
if (!IsValid()) return -1;
if (workers->GetSize() == 0) return 0;
int nsent = 0;
TIter next(workers);
TSlave *wrk;
while ((wrk = (TSlave *)next())) {
if (wrk->IsValid()) {
if (wrk->SendGroupPriority(grp, priority) == -1)
MarkBad(wrk, "could not send group priority");
else
nsent++;
}
}
return nsent;
}
Int_t TProof::BroadcastGroupPriority(const char *grp, Int_t priority, ESlaves list)
{
TList *workers = 0;
if (list == kAll) workers = fSlaves;
if (list == kActive) workers = fActiveSlaves;
if (list == kUnique) workers = fUniqueSlaves;
if (list == kAllUnique) workers = fAllUniqueSlaves;
return BroadcastGroupPriority(grp, priority, workers);
}
void TProof::ResetMergePrg()
{
fMergePrg.Reset(fActiveSlaves->GetSize());
}
Int_t TProof::Broadcast(const TMessage &mess, TList *slaves)
{
if (!IsValid()) return -1;
if (!slaves || slaves->GetSize() == 0) return 0;
int nsent = 0;
TIter next(slaves);
TSlave *sl;
while ((sl = (TSlave *)next())) {
if (sl->IsValid()) {
if (sl->GetSocket()->Send(mess) == -1)
MarkBad(sl, "could not broadcast request");
else
nsent++;
}
}
return nsent;
}
Int_t TProof::Broadcast(const TMessage &mess, ESlaves list)
{
TList *slaves = 0;
if (list == kAll) slaves = fSlaves;
if (list == kActive) slaves = fActiveSlaves;
if (list == kUnique) slaves = fUniqueSlaves;
if (list == kAllUnique) slaves = fAllUniqueSlaves;
return Broadcast(mess, slaves);
}
Int_t TProof::Broadcast(const char *str, Int_t kind, TList *slaves)
{
TMessage mess(kind);
if (str) mess.WriteString(str);
return Broadcast(mess, slaves);
}
Int_t TProof::Broadcast(const char *str, Int_t kind, ESlaves list)
{
TMessage mess(kind);
if (str) mess.WriteString(str);
return Broadcast(mess, list);
}
Int_t TProof::BroadcastObject(const TObject *obj, Int_t kind, TList *slaves)
{
TMessage mess(kind);
mess.WriteObject(obj);
return Broadcast(mess, slaves);
}
Int_t TProof::BroadcastObject(const TObject *obj, Int_t kind, ESlaves list)
{
TMessage mess(kind);
mess.WriteObject(obj);
return Broadcast(mess, list);
}
Int_t TProof::BroadcastRaw(const void *buffer, Int_t length, TList *slaves)
{
if (!IsValid()) return -1;
if (slaves->GetSize() == 0) return 0;
int nsent = 0;
TIter next(slaves);
TSlave *sl;
while ((sl = (TSlave *)next())) {
if (sl->IsValid()) {
if (sl->GetSocket()->SendRaw(buffer, length) == -1)
MarkBad(sl, "could not send broadcast-raw request");
else
nsent++;
}
}
return nsent;
}
Int_t TProof::BroadcastRaw(const void *buffer, Int_t length, ESlaves list)
{
TList *slaves = 0;
if (list == kAll) slaves = fSlaves;
if (list == kActive) slaves = fActiveSlaves;
if (list == kUnique) slaves = fUniqueSlaves;
if (list == kAllUnique) slaves = fAllUniqueSlaves;
return BroadcastRaw(buffer, length, slaves);
}
Int_t TProof::BroadcastFile(const char *file, Int_t opt, const char *rfile, TList *wrks)
{
if (!IsValid()) return -1;
if (wrks->GetSize() == 0) return 0;
int nsent = 0;
TIter next(wrks);
TSlave *wrk;
while ((wrk = (TSlave *)next())) {
if (wrk->IsValid()) {
if (SendFile(file, opt, rfile, wrk) < 0)
Error("BroadcastFile",
"problems sending file to worker %s (%s)",
wrk->GetOrdinal(), wrk->GetName());
else
nsent++;
}
}
return nsent;
}
Int_t TProof::BroadcastFile(const char *file, Int_t opt, const char *rfile, ESlaves list)
{
TList *wrks = 0;
if (list == kAll) wrks = fSlaves;
if (list == kActive) wrks = fActiveSlaves;
if (list == kUnique) wrks = fUniqueSlaves;
if (list == kAllUnique) wrks = fAllUniqueSlaves;
return BroadcastFile(file, opt, rfile, wrks);
}
void TProof::ReleaseMonitor(TMonitor *mon)
{
if (mon && (mon != fAllMonitor) && (mon != fActiveMonitor)
&& (mon != fUniqueMonitor) && (mon != fAllUniqueMonitor)) {
delete mon;
}
}
Int_t TProof::Collect(const TSlave *sl, Long_t timeout, Int_t endtype, Bool_t deactonfail)
{
Int_t rc = 0;
TMonitor *mon = 0;
if (!sl->IsValid()) return 0;
if (fCurrentMonitor == fAllMonitor) {
mon = new TMonitor;
} else {
mon = fAllMonitor;
mon->DeActivateAll();
}
mon->Activate(sl->GetSocket());
rc = Collect(mon, timeout, endtype, deactonfail);
ReleaseMonitor(mon);
return rc;
}
Int_t TProof::Collect(TList *slaves, Long_t timeout, Int_t endtype, Bool_t deactonfail)
{
Int_t rc = 0;
TMonitor *mon = 0;
if (fCurrentMonitor == fAllMonitor) {
mon = new TMonitor;
} else {
mon = fAllMonitor;
mon->DeActivateAll();
}
TIter next(slaves);
TSlave *sl;
while ((sl = (TSlave*) next())) {
if (sl->IsValid())
mon->Activate(sl->GetSocket());
}
rc = Collect(mon, timeout, endtype, deactonfail);
ReleaseMonitor(mon);
return rc;
}
Int_t TProof::Collect(ESlaves list, Long_t timeout, Int_t endtype, Bool_t deactonfail)
{
Int_t rc = 0;
TMonitor *mon = 0;
if (list == kAll) mon = fAllMonitor;
if (list == kActive) mon = fActiveMonitor;
if (list == kUnique) mon = fUniqueMonitor;
if (list == kAllUnique) mon = fAllUniqueMonitor;
if (fCurrentMonitor == mon) {
mon = new TMonitor(*mon);
}
mon->ActivateAll();
rc = Collect(mon, timeout, endtype, deactonfail);
ReleaseMonitor(mon);
return rc;
}
Int_t TProof::Collect(TMonitor *mon, Long_t timeout, Int_t endtype, Bool_t deactonfail)
{
Int_t collectId = gRandom->Integer(9999);
PDB(kCollect, 3)
Info("Collect", ">>>>>> Entering collect responses #%04d", collectId);
fStatus = 0;
fRecvMessages->Clear();
Long_t actto = (Long_t)(gEnv->GetValue("Proof.SocketActivityTimeout", -1) * 1000);
if (!mon->GetActive(actto)) return 0;
DeActivateAsyncInput();
TMonitor *savedMonitor = 0;
if (fCurrentMonitor) {
savedMonitor = fCurrentMonitor;
fCurrentMonitor = mon;
} else {
fCurrentMonitor = mon;
fBytesRead = 0;
fRealTime = 0.0;
fCpuTime = 0.0;
}
Bool_t saveRedirLog = fRedirLog;
if (!IsIdle() && !IsSync())
fRedirLog = kFALSE;
int cnt = 0, rc = 0;
Long_t nto = timeout;
PDB(kCollect, 2)
Info("Collect","active: %d", mon->GetActive());
if (fIntHandler)
fIntHandler->Add();
Int_t nact = 0;
Long_t sto = -1;
Int_t nsto = 60;
mon->ResetInterrupt();
while ((nact = mon->GetActive(sto)) && (nto < 0 || nto > 0)) {
PDB(kCollect, 2) {
if (nact < 4) {
TList *al = mon->GetListOfActives();
if (al && al->GetSize() > 0) {
Info("Collect"," %d node(s) still active:", al->GetSize());
TIter nxs(al);
TSocket *xs = 0;
while ((xs = (TSocket *)nxs())) {
TSlave *wrk = FindSlave(xs);
if (wrk)
Info("Collect"," %s (%s)", wrk->GetName(), wrk->GetOrdinal());
else
Info("Collect"," %p: %s:%d", xs, xs->GetInetAddress().GetHostName(),
xs->GetInetAddress().GetPort());
}
}
}
}
if (TestBit(TProof::kIsMaster) && !IsIdle() && fDynamicStartup && !fIsPollingWorkers &&
((fLastPollWorkers_s == -1) || (time(0)-fLastPollWorkers_s >= kPROOF_DynWrkPollInt_s))) {
fIsPollingWorkers = kTRUE;
PollForNewWorkers();
fLastPollWorkers_s = time(0);
fIsPollingWorkers = kFALSE;
}
PDB(kCollect, 3)
Info("Collect", "Will invoke Select() #%04d", collectId);
TSocket *s = mon->Select(1000);
if (s && s != (TSocket *)(-1)) {
rc = CollectInputFrom(s, endtype, deactonfail);
if (rc == 1 || (rc == 2 && !savedMonitor)) {
mon->DeActivate(s);
PDB(kCollect, 2)
Info("Collect","deactivating %p (active: %d, %p)",
s, mon->GetActive(),
mon->GetListOfActives()->First());
} else if (rc == 2) {
if (savedMonitor) {
savedMonitor->DeActivate(s);
PDB(kCollect, 2)
Info("Collect","save monitor: deactivating %p (active: %d, %p)",
s, savedMonitor->GetActive(),
savedMonitor->GetListOfActives()->First());
}
}
if (rc >= 0)
cnt++;
} else {
if (!s)
if (fPlayer && (fPlayer->GetExitStatus() == TVirtualProofPlayer::kFinished))
mon->DeActivateAll();
if (s == (TSocket *)(-1) && nto > 0)
nto--;
}
if (IsMaster() && fWrksOutputReady && fWrksOutputReady->GetSize() > 0) {
Int_t mxws = gEnv->GetValue("Proof.ControlSendOutput", 1);
if (TProof::GetParameter(fPlayer->GetInputList(), "PROOF_ControlSendOutput", mxws) != 0)
mxws = gEnv->GetValue("Proof.ControlSendOutput", 1);
TIter nxwr(fWrksOutputReady);
TSlave *wrk = 0;
while (mxws && (wrk = (TSlave *) nxwr())) {
if (!wrk->TestBit(TSlave::kOutputRequested)) {
TMessage sendoutput(kPROOF_SENDOUTPUT);
PDB(kCollect, 2)
Info("Collect", "worker %s was asked to send its output to master",
wrk->GetOrdinal());
if (wrk->GetSocket()->Send(sendoutput) != 1) {
wrk->SetBit(TSlave::kOutputRequested);
mxws--;
}
} else {
mxws--;
}
}
}
sto = -1;
if (--nsto <= 0) {
sto = (Long_t) actto;
nsto = 60;
}
}
if (nto == 0) {
TList *al = mon->GetListOfActives();
if (al && al->GetSize() > 0) {
Info("Collect"," %d node(s) went in timeout:", al->GetSize());
TIter nxs(al);
TSocket *xs = 0;
while ((xs = (TSocket *)nxs())) {
TSlave *wrk = FindSlave(xs);
if (wrk)
Info("Collect"," %s", wrk->GetName());
else
Info("Collect"," %p: %s:%d", xs, xs->GetInetAddress().GetHostName(),
xs->GetInetAddress().GetPort());
}
}
mon->DeActivateAll();
}
if (fIntHandler)
fIntHandler->Remove();
SendGroupView();
fRedirLog = saveRedirLog;
fCurrentMonitor = savedMonitor;
ActivateAsyncInput();
PDB(kCollect, 3)
Info("Collect", "<<<<<< Exiting collect responses #%04d", collectId);
return cnt;
}
Int_t TProof::PollForNewWorkers()
{
Int_t dummy = 0;
TList *reqWorkers = new TList();
reqWorkers->SetOwner(kFALSE);
if (!TestBit(TProof::kIsMaster)) {
Error("PollForNewWorkers", "Can't invoke: not on a master -- should not happen!");
return -1;
}
if (!gProofServ) {
Error("PollForNewWorkers", "No ProofServ available -- should not happen!");
return -1;
}
gProofServ->GetWorkers(reqWorkers, dummy, kTRUE);
TList *newWorkers = new TList();
newWorkers->SetOwner(kTRUE);
TIter next(reqWorkers);
TProofNodeInfo *ni;
TString fullOrd;
while (( ni = dynamic_cast<TProofNodeInfo *>(next()) )) {
fullOrd.Form("%s.%s", gProofServ->GetOrdinal(), ni->GetOrdinal().Data());
TIter nextInner(fSlaves);
TSlave *sl;
Bool_t found = kFALSE;
while (( sl = dynamic_cast<TSlave *>(nextInner()) )) {
if ( strcmp(sl->GetOrdinal(), fullOrd.Data()) == 0 ) {
found = kTRUE;
break;
}
}
if (found) delete ni;
else {
newWorkers->Add(ni);
PDB(kGlobal, 1)
Info("PollForNewWorkers", "New worker found: %s:%s",
ni->GetNodeName().Data(), fullOrd.Data());
}
}
delete reqWorkers;
Int_t nNewWorkers = newWorkers->GetEntries();
if (nNewWorkers > 0) {
PDB(kGlobal, 1)
Info("PollForNewWorkers", "Requesting to add %d new worker(s)", newWorkers->GetEntries());
Int_t rv = AddWorkers(newWorkers);
if (rv < 0) {
Error("PollForNewWorkers", "Call to AddWorkers() failed (got %d < 0)", rv);
return -1;
}
}
else {
PDB(kGlobal, 2)
Info("PollForNewWorkers", "No new worker found");
delete newWorkers;
}
return nNewWorkers;
}
void TProof::CleanGDirectory(TList *ol)
{
if (ol) {
TIter nxo(ol);
TObject *o = 0;
while ((o = nxo()))
gDirectory->RecursiveRemove(o);
}
}
Int_t TProof::CollectInputFrom(TSocket *s, Int_t endtype, Bool_t deactonfail)
{
TMessage *mess;
Int_t recvrc = 0;
if ((recvrc = s->Recv(mess)) < 0) {
PDB(kCollect,2)
Info("CollectInputFrom","%p: got %d from Recv()", s, recvrc);
Bool_t bad = kTRUE;
if (recvrc == -5) {
if (fCurrentMonitor) fCurrentMonitor->Remove(s);
if (s->Reconnect() == 0) {
if (fCurrentMonitor) fCurrentMonitor->Add(s);
bad = kFALSE;
}
}
if (bad)
MarkBad(s, "problems receiving a message in TProof::CollectInputFrom(...)");
return -1;
}
if (!mess) {
MarkBad(s, "undefined message in TProof::CollectInputFrom(...)");
return -1;
}
Int_t rc = 0;
Int_t what = mess->What();
TSlave *sl = FindSlave(s);
rc = HandleInputMessage(sl, mess, deactonfail);
if (rc == 1 && (endtype >= 0) && (what != endtype))
rc = 2;
return rc;
}
Int_t TProof::HandleInputMessage(TSlave *sl, TMessage *mess, Bool_t deactonfail)
{
char str[512];
TObject *obj;
Int_t rc = 0;
if (!mess || !sl) {
Warning("HandleInputMessage", "given an empty message or undefined worker");
return -1;
}
Bool_t delete_mess = kTRUE;
TSocket *s = sl->GetSocket();
if (!s) {
Warning("HandleInputMessage", "worker socket is undefined");
return -1;
}
Int_t what = mess->What();
PDB(kCollect,3)
Info("HandleInputMessage", "got type %d from '%s'", what, sl->GetOrdinal());
switch (what) {
case kMESS_OK:
fRecvMessages->Add(mess);
delete_mess = kFALSE;
break;
case kMESS_OBJECT:
if (fPlayer) fPlayer->HandleRecvHisto(mess);
break;
case kPROOF_FATAL:
{ TString msg;
if ((mess->BufferSize() > mess->Length()))
(*mess) >> msg;
if (msg.IsNull()) {
MarkBad(s, "received kPROOF_FATAL");
} else {
MarkBad(s, msg);
}
}
if (fProgressDialogStarted) {
Emit("StopProcess(Bool_t)", kTRUE);
}
break;
case kPROOF_STOP:
Info("HandleInputMessage", "received kPROOF_STOP from %s: disabling any further collection this worker",
sl->GetOrdinal());
rc = 1;
break;
case kPROOF_GETTREEHEADER:
fRecvMessages->Add(mess);
delete_mess = kFALSE;
rc = 1;
break;
case kPROOF_TOUCH:
{
sl->Touch();
}
break;
case kPROOF_GETOBJECT:
mess->ReadString(str, sizeof(str));
obj = gDirectory->Get(str);
if (obj)
s->SendObject(obj);
else
s->Send(kMESS_NOTOK);
break;
case kPROOF_GETPACKET:
{
TDSetElement *elem = 0;
elem = fPlayer ? fPlayer->GetNextPacket(sl, mess) : 0;
if (elem != (TDSetElement*) -1) {
TMessage answ(kPROOF_GETPACKET);
answ << elem;
s->Send(answ);
while (fWaitingSlaves != 0 && fWaitingSlaves->GetSize()) {
TPair *p = (TPair*) fWaitingSlaves->First();
s = (TSocket*) p->Key();
TMessage *m = (TMessage*) p->Value();
elem = fPlayer ? fPlayer->GetNextPacket(sl, m) : 0;
if (elem != (TDSetElement*) -1) {
TMessage a(kPROOF_GETPACKET);
a << elem;
s->Send(a);
fWaitingSlaves->Remove(fWaitingSlaves->FirstLink());
delete p;
delete m;
} else {
break;
}
}
} else {
if (fWaitingSlaves == 0) fWaitingSlaves = new TList;
fWaitingSlaves->Add(new TPair(s, mess));
delete_mess = kFALSE;
}
}
break;
case kPROOF_LOGFILE:
{
Int_t size;
(*mess) >> size;
PDB(kGlobal,2)
Info("HandleInputMessage","%s: kPROOF_LOGFILE: size: %d", sl->GetOrdinal(), size);
RecvLogFile(s, size);
}
break;
case kPROOF_LOGDONE:
(*mess) >> sl->fStatus >> sl->fParallel;
PDB(kCollect,2)
Info("HandleInputMessage","%s: kPROOF_LOGDONE: status %d parallel %d",
sl->GetOrdinal(), sl->fStatus, sl->fParallel);
if (sl->fStatus != 0) {
fStatus = sl->fStatus;
if (deactonfail) DeactivateWorker(sl->fOrdinal);
}
if (fWrksOutputReady && fWrksOutputReady->FindObject(sl)) {
sl->ResetBit(TSlave::kOutputRequested);
fWrksOutputReady->Remove(sl);
}
rc = 1;
break;
case kPROOF_GETSTATS:
{
(*mess) >> sl->fBytesRead >> sl->fRealTime >> sl->fCpuTime
>> sl->fWorkDir >> sl->fProofWorkDir;
TString img;
if ((mess->BufferSize() > mess->Length()))
(*mess) >> img;
if (img.IsNull()) {
if (sl->fImage.IsNull())
sl->fImage.Form("%s:%s", TUrl(sl->fName).GetHostFQDN(),
sl->fProofWorkDir.Data());
} else {
sl->fImage = img;
}
PDB(kGlobal,2)
Info("HandleInputMessage",
"kPROOF_GETSTATS:%s image: %s", sl->GetOrdinal(), sl->GetImage());
fBytesRead += sl->fBytesRead;
fRealTime += sl->fRealTime;
fCpuTime += sl->fCpuTime;
rc = 1;
}
break;
case kPROOF_GETPARALLEL:
{
Bool_t async = kFALSE;
(*mess) >> sl->fParallel;
if ((mess->BufferSize() > mess->Length()))
(*mess) >> async;
rc = (async) ? 0 : 1;
}
break;
case kPROOF_CHECKFILE:
{
if ((mess->BufferSize() > mess->Length())) {
(*mess) >> fCheckFileStatus;
} else {
fCheckFileStatus = 1;
}
rc = 1;
}
break;
case kPROOF_SENDFILE:
{
rc = 1;
}
break;
case kPROOF_PACKAGE_LIST:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_PACKAGE_LIST: enter");
Int_t type = 0;
(*mess) >> type;
switch (type) {
case TProof::kListEnabledPackages:
SafeDelete(fEnabledPackages);
fEnabledPackages = (TList *) mess->ReadObject(TList::Class());
if (fEnabledPackages) {
fEnabledPackages->SetOwner();
} else {
Error("HandleInputMessage",
"kPROOF_PACKAGE_LIST: kListEnabledPackages: TList not found in message!");
}
break;
case TProof::kListPackages:
SafeDelete(fAvailablePackages);
fAvailablePackages = (TList *) mess->ReadObject(TList::Class());
if (fAvailablePackages) {
fAvailablePackages->SetOwner();
} else {
Error("HandleInputMessage",
"kPROOF_PACKAGE_LIST: kListPackages: TList not found in message!");
}
break;
default:
Error("HandleInputMessage", "kPROOF_PACKAGE_LIST: unknown type: %d", type);
}
}
break;
case kPROOF_SENDOUTPUT:
{
sl->ResetBit(TSlave::kOutputRequested);
PDB(kGlobal,2)
Info("HandleInputMessage","kPROOF_SENDOUTPUT: enter (%s)", sl->GetOrdinal());
if (!fWrksOutputReady) {
fWrksOutputReady = new TList;
fWrksOutputReady->SetOwner(kFALSE);
}
fWrksOutputReady->Add(sl);
}
break;
case kPROOF_OUTPUTOBJECT:
{
PDB(kGlobal,2)
Info("HandleInputMessage","kPROOF_OUTPUTOBJECT: enter");
Int_t type = 0;
const char *prefix = gProofServ ? gProofServ->GetPrefix() : "Lite-0";
if (!TestBit(TProof::kIsClient) && !fMergersSet && !fFinalizationRunning) {
Info("HandleInputMessage", "finalization on %s started ...", prefix);
fFinalizationRunning = kTRUE;
}
while ((mess->BufferSize() > mess->Length())) {
(*mess) >> type;
if (fPlayer) {
if (type == 0) {
TQueryResult *pq =
(TQueryResult *) mess->ReadObject(TQueryResult::Class());
if (pq) {
fPlayer->AddQueryResult(pq);
fPlayer->SetCurrentQuery(pq);
if (fPlayer->GetOutputList())
fPlayer->GetOutputList()->Clear();
TString qid = TString::Format("%s:%s",pq->GetTitle(),pq->GetName());
if (fPlayer->GetInputList()->FindObject("PROOF_QueryTag"))
fPlayer->GetInputList()->Remove(fPlayer->GetInputList()->FindObject("PROOF_QueryTag"));
fPlayer->AddInput(new TNamed("PROOF_QueryTag", qid.Data()));
} else {
Warning("HandleInputMessage","kPROOF_OUTPUTOBJECT: query result missing");
}
} else if (type > 0) {
TObject *o = mess->ReadObject(TObject::Class());
fMergePrg.IncreaseIdx();
TString msg;
Bool_t changed = kFALSE;
msg.Form("%s: merging output objects ... %s", prefix, fMergePrg.Export(changed));
if (gProofServ) {
gProofServ->SendAsynMessage(msg.Data(), kFALSE);
} else if (IsTty() || changed) {
fprintf(stderr, "%s\r", msg.Data());
}
if ((fPlayer->AddOutputObject(o) == 1)) {
SafeDelete(o);
}
if (type > 1) {
fMergePrg.DecreaseNWrks();
if (TestBit(TProof::kIsClient) && !IsLite()) {
TQueryResult *pq = fPlayer->GetCurrentQuery();
if (pq) {
pq->SetOutputList(fPlayer->GetOutputList(), kFALSE);
TObject *xo = 0;
TIter nxin(fPlayer->GetInputList());
if (!pq->GetInputList()) pq->SetInputList(new TList());
while ((xo = nxin()))
if (!pq->GetInputList()->FindObject(xo->GetName()))
pq->AddInput(xo->Clone());
QueryResultReady(TString::Format("%s:%s", pq->GetTitle(), pq->GetName()));
}
UpdateDialog();
}
}
}
} else {
Warning("HandleInputMessage", "kPROOF_OUTPUTOBJECT: player undefined!");
}
}
}
break;
case kPROOF_OUTPUTLIST:
{
PDB(kGlobal,2)
Info("HandleInputMessage","%s: kPROOF_OUTPUTLIST: enter", sl->GetOrdinal());
TList *out = 0;
if (fPlayer) {
if (TestBit(TProof::kIsMaster) || fProtocol < 7) {
out = (TList *) mess->ReadObject(TList::Class());
} else {
TQueryResult *pq =
(TQueryResult *) mess->ReadObject(TQueryResult::Class());
if (pq) {
fPlayer->AddQueryResult(pq);
fPlayer->SetCurrentQuery(pq);
out = pq->GetOutputList();
CleanGDirectory(out);
out = (TList *) out->Clone();
QueryResultReady(TString::Format("%s:%s", pq->GetTitle(), pq->GetName()));
} else {
PDB(kGlobal,2)
Info("HandleInputMessage",
"%s: kPROOF_OUTPUTLIST: query result missing", sl->GetOrdinal());
}
}
if (out) {
out->SetOwner();
fPlayer->AddOutput(out);
SafeDelete(out);
} else {
PDB(kGlobal,2)
Info("HandleInputMessage",
"%s: kPROOF_OUTPUTLIST: outputlist is empty", sl->GetOrdinal());
}
} else {
Warning("HandleInputMessage",
"%s: kPROOF_OUTPUTLIST: player undefined!", sl->GetOrdinal());
}
if (TestBit(TProof::kIsClient) && !IsLite())
UpdateDialog();
}
break;
case kPROOF_QUERYLIST:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_QUERYLIST: enter");
(*mess) >> fOtherQueries >> fDrawQueries;
if (fQueries) {
fQueries->Delete();
delete fQueries;
fQueries = 0;
}
fQueries = (TList *) mess->ReadObject(TList::Class());
}
break;
case kPROOF_RETRIEVE:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_RETRIEVE: enter");
TQueryResult *pq =
(TQueryResult *) mess->ReadObject(TQueryResult::Class());
if (pq && fPlayer) {
fPlayer->AddQueryResult(pq);
QueryResultReady(TString::Format("%s:%s", pq->GetTitle(), pq->GetName()));
} else {
PDB(kGlobal,2)
Info("HandleInputMessage",
"kPROOF_RETRIEVE: query result missing or player undefined");
}
}
break;
case kPROOF_MAXQUERIES:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_MAXQUERIES: enter");
Int_t max = 0;
(*mess) >> max;
Printf("Number of queries fully kept remotely: %d", max);
}
break;
case kPROOF_SERVERSTARTED:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_SERVERSTARTED: enter");
UInt_t tot = 0, done = 0;
TString action;
Bool_t st = kTRUE;
(*mess) >> action >> tot >> done >> st;
if (TestBit(TProof::kIsClient)) {
if (tot) {
TString type = (action.Contains("submas")) ? "submasters"
: "workers";
Int_t frac = (Int_t) (done*100.)/tot;
char msg[512] = {0};
if (frac >= 100) {
snprintf(msg, 512, "%s: OK (%d %s) \n",
action.Data(),tot, type.Data());
} else {
snprintf(msg, 512, "%s: %d out of %d (%d %%)\r",
action.Data(), done, tot, frac);
}
if (fSync)
fprintf(stderr,"%s", msg);
else
NotifyLogMsg(msg, 0);
}
StartupMessage(action.Data(), st, (Int_t)done, (Int_t)tot);
} else {
TMessage m(kPROOF_SERVERSTARTED);
m << action << tot << done << st;
gProofServ->GetSocket()->Send(m);
}
}
break;
case kPROOF_DATASET_STATUS:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_DATASET_STATUS: enter");
UInt_t tot = 0, done = 0;
TString action;
Bool_t st = kTRUE;
(*mess) >> action >> tot >> done >> st;
if (TestBit(TProof::kIsClient)) {
if (tot) {
TString type = "files";
Int_t frac = (Int_t) (done*100.)/tot;
char msg[512] = {0};
if (frac >= 100) {
snprintf(msg, 512, "%s: OK (%d %s) \n",
action.Data(),tot, type.Data());
} else {
snprintf(msg, 512, "%s: %d out of %d (%d %%)\r",
action.Data(), done, tot, frac);
}
if (fSync)
fprintf(stderr,"%s", msg);
else
NotifyLogMsg(msg, 0);
}
DataSetStatus(action.Data(), st, (Int_t)done, (Int_t)tot);
} else {
TMessage m(kPROOF_DATASET_STATUS);
m << action << tot << done << st;
gProofServ->GetSocket()->Send(m);
}
}
break;
case kPROOF_STARTPROCESS:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_STARTPROCESS: enter");
if (!IsLite()) {
fNotIdle = 1;
fIsWaiting = kFALSE;
}
fRedirLog = (fSync) ? fRedirLog : kTRUE;
if (!TestBit(TProof::kIsMaster)) {
TString selec;
Int_t dsz = -1;
Long64_t first = -1, nent = -1;
(*mess) >> selec >> dsz >> first >> nent;
if (!gROOT->IsBatch()) {
if (fProgressDialog &&
!TestBit(kUsingSessionGui) && TestBit(kUseProgressDialog)) {
if (!fProgressDialogStarted) {
fProgressDialog->ExecPlugin(5, this,
selec.Data(), dsz, first, nent);
fProgressDialogStarted = kTRUE;
} else {
ResetProgressDialog(selec, dsz, first, nent);
}
}
ResetBit(kUsingSessionGui);
}
}
}
break;
case kPROOF_ENDINIT:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_ENDINIT: enter");
if (TestBit(TProof::kIsMaster)) {
if (fPlayer)
fPlayer->SetInitTime();
}
}
break;
case kPROOF_SETIDLE:
{
PDB(kGlobal,2)
Info("HandleInputMessage","kPROOF_SETIDLE: enter");
if (IsLite()) {
if (fNotIdle > 0) {
fNotIdle--;
PDB(kGlobal,2)
Info("HandleInputMessage", "%s: got kPROOF_SETIDLE", sl->GetOrdinal());
} else {
Warning("HandleInputMessage",
"%s: got kPROOF_SETIDLE but no running workers ! protocol error?",
sl->GetOrdinal());
}
} else {
fNotIdle = 0;
if ((mess->BufferSize() > mess->Length()))
(*mess) >> fIsWaiting;
}
}
break;
case kPROOF_QUERYSUBMITTED:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_QUERYSUBMITTED: enter");
(*mess) >> fSeqNum;
Bool_t sync = fSync;
if ((mess->BufferSize() > mess->Length()))
(*mess) >> sync;
if (sync != fSync && fSync) {
Activate();
fSync = kFALSE;
}
DisableGoAsyn();
fIsWaiting = kTRUE;
if (!IsLite())
fNotIdle = 1;
rc = 1;
}
break;
case kPROOF_SESSIONTAG:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_SESSIONTAG: enter");
TString stag;
(*mess) >> stag;
SetName(stag);
sl->SetSessionTag(stag);
if ((mess->BufferSize() > mess->Length()))
(*mess) >> fGroup;
if ((mess->BufferSize() > mess->Length())) {
TString usr;
(*mess) >> usr;
if (!usr.IsNull()) fUrl.SetUser(usr.Data());
}
}
break;
case kPROOF_FEEDBACK:
{
PDB(kGlobal,2)
Info("HandleInputMessage","kPROOF_FEEDBACK: enter");
TList *out = (TList *) mess->ReadObject(TList::Class());
out->SetOwner();
if (fPlayer)
fPlayer->StoreFeedback(sl, out);
else
rc = 1;
}
break;
case kPROOF_AUTOBIN:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_AUTOBIN: enter");
TString name;
Double_t xmin, xmax, ymin, ymax, zmin, zmax;
(*mess) >> name >> xmin >> xmax >> ymin >> ymax >> zmin >> zmax;
if (fPlayer) fPlayer->UpdateAutoBin(name,xmin,xmax,ymin,ymax,zmin,zmax);
TMessage answ(kPROOF_AUTOBIN);
answ << name << xmin << xmax << ymin << ymax << zmin << zmax;
s->Send(answ);
}
break;
case kPROOF_PROGRESS:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_PROGRESS: enter");
if (GetRemoteProtocol() > 25) {
TProofProgressInfo *pi = 0;
(*mess) >> pi;
fPlayer->Progress(sl,pi);
} else if (GetRemoteProtocol() > 11) {
Long64_t total, processed, bytesread;
Float_t initTime, procTime, evtrti, mbrti;
(*mess) >> total >> processed >> bytesread
>> initTime >> procTime
>> evtrti >> mbrti;
if (fPlayer)
fPlayer->Progress(sl, total, processed, bytesread,
initTime, procTime, evtrti, mbrti);
} else {
Long64_t total, processed;
(*mess) >> total >> processed;
if (fPlayer)
fPlayer->Progress(sl, total, processed);
}
}
break;
case kPROOF_STOPPROCESS:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_STOPPROCESS: enter");
Long64_t events = 0;
Bool_t abort = kFALSE;
TProofProgressStatus *status = 0;
if ((mess->BufferSize() > mess->Length()) && (fProtocol > 18)) {
(*mess) >> status >> abort;
} else if ((mess->BufferSize() > mess->Length()) && (fProtocol > 8)) {
(*mess) >> events >> abort;
} else {
(*mess) >> events;
}
if (fPlayer) {
if (fProtocol > 18) {
TList *listOfMissingFiles = 0;
if (!(listOfMissingFiles = (TList *)GetOutput("MissingFiles"))) {
listOfMissingFiles = new TList();
listOfMissingFiles->SetName("MissingFiles");
if (fPlayer)
fPlayer->AddOutputObject(listOfMissingFiles);
}
if (fPlayer->GetPacketizer()) {
Int_t ret =
fPlayer->GetPacketizer()->AddProcessed(sl, status, 0, &listOfMissingFiles);
if (ret > 0)
fPlayer->GetPacketizer()->MarkBad(sl, status, &listOfMissingFiles);
status = 0;
}
if (status) fPlayer->AddEventsProcessed(status->GetEntries());
} else {
fPlayer->AddEventsProcessed(events);
}
}
SafeDelete(status);
if (!TestBit(TProof::kIsMaster))
Emit("StopProcess(Bool_t)", abort);
break;
}
case kPROOF_SUBMERGER:
{
PDB(kGlobal,2) Info("HandleInputMessage", "kPROOF_SUBMERGER: enter");
HandleSubmerger(mess, sl);
}
break;
case kPROOF_GETSLAVEINFO:
{
PDB(kGlobal,2) Info("HandleInputMessage", "kPROOF_GETSLAVEINFO: enter");
Bool_t active = (GetListOfActiveSlaves()->FindObject(sl) != 0);
Bool_t bad = (GetListOfBadSlaves()->FindObject(sl) != 0);
TList* tmpinfo = 0;
(*mess) >> tmpinfo;
if (tmpinfo == 0) {
Error("HandleInputMessage", "kPROOF_GETSLAVEINFO: no list received!");
} else {
tmpinfo->SetOwner(kFALSE);
Int_t nentries = tmpinfo->GetSize();
for (Int_t i=0; i<nentries; i++) {
TSlaveInfo* slinfo =
dynamic_cast<TSlaveInfo*>(tmpinfo->At(i));
if (slinfo) {
if (IsLite()) slinfo->fHostName = gSystem->HostName();
TIter nxw(fSlaveInfo);
TSlaveInfo *ourwi = 0;
while ((ourwi = (TSlaveInfo *)nxw())) {
if (!strcmp(ourwi->GetOrdinal(), slinfo->GetOrdinal())) {
ourwi->SetSysInfo(slinfo->GetSysInfo());
ourwi->fHostName = slinfo->GetName();
if (slinfo->GetDataDir() && (strlen(slinfo->GetDataDir()) > 0))
ourwi->fDataDir = slinfo->GetDataDir();
break;
}
}
if (!ourwi) {
fSlaveInfo->Add(slinfo);
} else {
slinfo = ourwi;
}
if (slinfo->fStatus != TSlaveInfo::kBad) {
if (!active) slinfo->SetStatus(TSlaveInfo::kNotActive);
if (bad) slinfo->SetStatus(TSlaveInfo::kBad);
}
if (sl->GetMsd() && (strlen(sl->GetMsd()) > 0))
slinfo->fMsd = sl->GetMsd();
}
}
delete tmpinfo;
rc = 1;
}
}
break;
case kPROOF_VALIDATE_DSET:
{
PDB(kGlobal,2)
Info("HandleInputMessage", "kPROOF_VALIDATE_DSET: enter");
TDSet* dset = 0;
(*mess) >> dset;
if (!fDSet)
Error("HandleInputMessage", "kPROOF_VALIDATE_DSET: fDSet not set");
else
fDSet->Validate(dset);
delete dset;
}
break;
case kPROOF_DATA_READY:
{
PDB(kGlobal,2) Info("HandleInputMessage", "kPROOF_DATA_READY: enter");
Bool_t dataready = kFALSE;
Long64_t totalbytes, bytesready;
(*mess) >> dataready >> totalbytes >> bytesready;
fTotalBytes += totalbytes;
fBytesReady += bytesready;
if (dataready == kFALSE) fDataReady = dataready;
}
break;
case kPROOF_PING:
break;
case kPROOF_MESSAGE:
{
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_MESSAGE: enter");
TString msg;
(*mess) >> msg;
Bool_t lfeed = kTRUE;
if ((mess->BufferSize() > mess->Length()))
(*mess) >> lfeed;
if (TestBit(TProof::kIsClient)) {
if (fSync) {
fprintf(stderr,"%s%c", msg.Data(), (lfeed ? '\n' : '\r'));
} else {
NotifyLogMsg(msg, (lfeed ? "\n" : "\r"));
}
} else {
fprintf(stderr,"%s%c", msg.Data(), (lfeed ? '\n' : '\r'));
if (gProofServ) {
gProofServ->FlushLogFile();
gProofServ->SendAsynMessage(msg, lfeed);
}
}
}
break;
case kPROOF_VERSARCHCOMP:
{
TString vac;
(*mess) >> vac;
PDB(kGlobal,2) Info("HandleInputMessage","kPROOF_VERSARCHCOMP: %s", vac.Data());
Int_t from = 0;
TString vers, archcomp;
if (vac.Tokenize(vers, from, "|"))
vac.Tokenize(archcomp, from, "|");
sl->SetArchCompiler(archcomp);
vers.ReplaceAll(":","|");
sl->SetROOTVersion(vers);
}
break;
default:
{
Error("HandleInputMessage", "unknown command received from '%s' (what = %d)",
sl->GetOrdinal(), what);
}
break;
}
if (delete_mess)
delete mess;
return rc;
}
void TProof::HandleSubmerger(TMessage *mess, TSlave *sl)
{
Int_t type = 0;
(*mess) >> type;
TSocket *s = sl->GetSocket();
switch (type) {
case kOutputSent:
{
if (IsEndMaster()) {
Int_t merger_id = -1;
(*mess) >> merger_id;
PDB(kSubmerger, 2)
Info("HandleSubmerger", "kOutputSent: Worker %s:%d:%s had sent its output to merger #%d",
sl->GetName(), sl->GetPort(), sl->GetOrdinal(), merger_id);
if (!fMergers || fMergers->GetSize() <= merger_id) {
Error("HandleSubmerger", "kOutputSize: #%d not in list ", merger_id);
break;
}
TMergerInfo * mi = (TMergerInfo *) fMergers->At(merger_id);
mi->SetMergedWorker();
if (mi->AreAllWorkersMerged()) {
mi->Deactivate();
if (GetActiveMergersCount() == 0) {
fMergers->Clear();
delete fMergers;
fMergersSet = kFALSE;
fMergersCount = -1;
fLastAssignedMerger = 0;
PDB(kSubmerger, 2) Info("HandleSubmerger", "all mergers removed ... ");
}
}
} else {
PDB(kSubmerger, 2) Error("HandleSubmerger","kOutputSent: received not on endmaster!");
}
}
break;
case kMergerDown:
{
Int_t merger_id = -1;
(*mess) >> merger_id;
PDB(kSubmerger, 2) Info("HandleSubmerger", "kMergerDown: #%d ", merger_id);
if (!fMergers || fMergers->GetSize() <= merger_id) {
Error("HandleSubmerger", "kMergerDown: #%d not in list ", merger_id);
break;
}
TMergerInfo * mi = (TMergerInfo *) fMergers->At(merger_id);
if (!mi->IsActive()) {
break;
} else {
mi->Deactivate();
}
TMessage stop(kPROOF_SUBMERGER);
stop << Int_t(kStopMerging);
stop << 0;
s->Send(stop);
AskForOutput(mi->GetMerger());
TIter nxo(mi->GetWorkers());
TObject * o = 0;
while ((o = nxo())) {
AskForOutput((TSlave *)o);
}
PDB(kSubmerger, 2) Info("HandleSubmerger", "kMergerDown:%d: exit", merger_id);
}
break;
case kOutputSize:
{
if (IsEndMaster()) {
PDB(kSubmerger, 2)
Info("HandleSubmerger", "worker %s reported as finished ", sl->GetOrdinal());
const char *prefix = gProofServ ? gProofServ->GetPrefix() : "Lite-0";
if (!fFinalizationRunning) {
Info("HandleSubmerger", "finalization on %s started ...", prefix);
fFinalizationRunning = kTRUE;
}
Int_t output_size = 0;
Int_t merging_port = 0;
(*mess) >> output_size >> merging_port;
PDB(kSubmerger, 2) Info("HandleSubmerger",
"kOutputSize: Worker %s:%d:%s reports %d output objects (+ available port %d)",
sl->GetName(), sl->GetPort(), sl->GetOrdinal(), output_size, merging_port);
TString msg;
if (!fMergersSet) {
Int_t activeWorkers = fCurrentMonitor ? fCurrentMonitor->GetActive() : GetNumberOfActiveSlaves();
fMergersCount = -1;
TParameter<Int_t> *mc = dynamic_cast<TParameter<Int_t> *>(GetParameter("PROOF_UseMergers"));
if (mc) fMergersCount = mc->GetVal();
TParameter<Int_t> *mh = dynamic_cast<TParameter<Int_t> *>(GetParameter("PROOF_MergersByHost"));
if (mh) fMergersByHost = (mh->GetVal() != 0) ? kTRUE : kFALSE;
if (fMergersCount < 0 || (fMergersCount > (activeWorkers/2) )) {
msg.Form("%s: Invalid request: cannot start %d mergers for %d workers",
prefix, fMergersCount, activeWorkers);
if (gProofServ)
gProofServ->SendAsynMessage(msg);
else
Printf("%s",msg.Data());
fMergersCount = 0;
}
if ((fMergersCount == 0) && (!fMergersByHost)) {
if (activeWorkers > 1) {
fMergersCount = TMath::Nint(TMath::Sqrt(activeWorkers));
if (activeWorkers / fMergersCount < 2)
fMergersCount = (Int_t) TMath::Sqrt(activeWorkers);
}
if (fMergersCount > 1)
msg.Form("%s: Number of mergers set dynamically to %d (for %d workers)",
prefix, fMergersCount, activeWorkers);
else {
msg.Form("%s: No mergers will be used for %d workers",
prefix, activeWorkers);
fMergersCount = -1;
}
if (gProofServ)
gProofServ->SendAsynMessage(msg);
else
Printf("%s",msg.Data());
} else if (fMergersByHost) {
if (activeWorkers > 1) {
fMergersCount = 0;
THashList hosts;
TIter nxwk(fSlaves);
TObject *wrk = 0;
while ((wrk = nxwk())) {
if (!hosts.FindObject(wrk->GetName())) {
hosts.Add(new TObjString(wrk->GetName()));
fMergersCount++;
}
}
}
if (fMergersCount > 1)
msg.Form("%s: Number of mergers set to %d (for %d workers), one for each slave host",
prefix, fMergersCount, activeWorkers);
else {
msg.Form("%s: No mergers will be used for %d workers",
prefix, activeWorkers);
fMergersCount = -1;
}
if (gProofServ)
gProofServ->SendAsynMessage(msg);
else
Printf("%s",msg.Data());
} else {
msg.Form("%s: Number of mergers set by user to %d (for %d workers)",
prefix, fMergersCount, activeWorkers);
if (gProofServ)
gProofServ->SendAsynMessage(msg);
else
Printf("%s",msg.Data());
}
if (fMergersCount > 0) {
fMergers = new TList();
fLastAssignedMerger = 0;
fWorkersToMerge = (activeWorkers - fMergersCount);
if (!CreateMerger(sl, merging_port)) {
AskForOutput(sl);
fWorkersToMerge--;
fMergersCount--;
}
if (IsLite()) fMergePrg.SetNWrks(fMergersCount);
} else {
AskForOutput(sl);
}
fMergersSet = kTRUE;
} else {
if (fMergersCount == -1) {
AskForOutput(sl);
} else {
if ((fRedirectNext > 0 ) && (!fMergersByHost)) {
RedirectWorker(s, sl, output_size);
fRedirectNext--;
} else {
Bool_t newMerger = kTRUE;
if (fMergersByHost) {
TIter nxmg(fMergers);
TMergerInfo *mgi = 0;
while ((mgi = (TMergerInfo *) nxmg())) {
if (!strcmp(sl->GetName(), mgi->GetMerger()->GetName())) {
newMerger = kFALSE;
break;
}
}
}
if ((fMergersCount > fMergers->GetSize()) && newMerger) {
if (!CreateMerger(sl, merging_port)) {
AskForOutput(sl);
fWorkersToMerge--;
fMergersCount--;
}
} else
RedirectWorker(s, sl, output_size);
}
}
}
} else {
Error("HandleSubMerger","kOutputSize received not on endmaster!");
}
}
break;
}
}
void TProof::RedirectWorker(TSocket *s, TSlave * sl, Int_t output_size)
{
Int_t merger_id = -1;
if (fMergersByHost) {
for (Int_t i = 0; i < fMergers->GetSize(); i++) {
TMergerInfo *mgi = (TMergerInfo *)fMergers->At(i);
if (!strcmp(sl->GetName(), mgi->GetMerger()->GetName())) {
merger_id = i;
break;
}
}
} else {
merger_id = FindNextFreeMerger();
}
if (merger_id == -1) {
AskForOutput(sl);
} else {
TMessage sendoutput(kPROOF_SUBMERGER);
sendoutput << Int_t(kSendOutput);
PDB(kSubmerger, 2)
Info("RedirectWorker", "redirecting worker %s to merger %d", sl->GetOrdinal(), merger_id);
PDB(kSubmerger, 2) Info("RedirectWorker", "redirecting output to merger #%d", merger_id);
if (!fMergers || fMergers->GetSize() <= merger_id) {
Error("RedirectWorker", "#%d not in list ", merger_id);
return;
}
TMergerInfo * mi = (TMergerInfo *) fMergers->At(merger_id);
TString hname = (IsLite()) ? "localhost" : mi->GetMerger()->GetName();
sendoutput << merger_id;
sendoutput << hname;
sendoutput << mi->GetPort();
s->Send(sendoutput);
mi->AddMergedObjects(output_size);
mi->AddWorker(sl);
}
}
Int_t TProof::FindNextFreeMerger()
{
while (fLastAssignedMerger < fMergers->GetSize() &&
(!((TMergerInfo*)fMergers->At(fLastAssignedMerger))->IsActive() ||
((TMergerInfo*)fMergers->At(fLastAssignedMerger))->AreAllWorkersAssigned())) {
fLastAssignedMerger++;
}
if (fLastAssignedMerger == fMergers->GetSize()) {
fLastAssignedMerger = 0;
} else {
return fLastAssignedMerger++;
}
while (fLastAssignedMerger < fMergers->GetSize() &&
(!((TMergerInfo*)fMergers->At(fLastAssignedMerger))->IsActive() ||
((TMergerInfo*)fMergers->At(fLastAssignedMerger))->AreAllWorkersAssigned())) {
fLastAssignedMerger++;
}
if (fLastAssignedMerger == fMergers->GetSize()) {
return -1;
} else {
return fLastAssignedMerger++;
}
}
void TProof::AskForOutput(TSlave *sl)
{
TMessage sendoutput(kPROOF_SUBMERGER);
sendoutput << Int_t(kSendOutput);
PDB(kSubmerger, 2) Info("AskForOutput",
"worker %s was asked to send its output to master",
sl->GetOrdinal());
sendoutput << -1;
sendoutput << TString("master");
sendoutput << -1;
sl->GetSocket()->Send(sendoutput);
if (IsLite()) fMergePrg.IncreaseNWrks();
}
void TProof::UpdateDialog()
{
if (!fPlayer) return;
if (fPlayer->GetExitStatus() == TVirtualProofPlayer::kAborted) {
if (fSync)
Info("UpdateDialog",
"processing was aborted - %lld events processed",
fPlayer->GetEventsProcessed());
if (GetRemoteProtocol() > 11) {
Progress(-1, fPlayer->GetEventsProcessed(), -1, -1., -1., -1., -1.);
} else {
Progress(-1, fPlayer->GetEventsProcessed());
}
Emit("StopProcess(Bool_t)", kTRUE);
}
if (fPlayer->GetExitStatus() == TVirtualProofPlayer::kStopped) {
if (fSync)
Info("UpdateDialog",
"processing was stopped - %lld events processed",
fPlayer->GetEventsProcessed());
if (GetRemoteProtocol() > 25) {
Progress(-1, fPlayer->GetEventsProcessed(), -1, -1., -1., -1., -1., -1, -1, -1.);
} else if (GetRemoteProtocol() > 11) {
Progress(-1, fPlayer->GetEventsProcessed(), -1, -1., -1., -1., -1.);
} else {
Progress(-1, fPlayer->GetEventsProcessed());
}
Emit("StopProcess(Bool_t)", kFALSE);
}
if (GetRemoteProtocol() > 25) {
EmitVA("Progress(Long64_t,Long64_t,Long64_t,Float_t,Float_t,Float_t,Float_t,Int_t,Int_t,Float_t)",
10, (Long64_t)(-1), (Long64_t)(-1), (Long64_t)(-1),(Float_t)(-1.),(Float_t)(-1.),
(Float_t)(-1.),(Float_t)(-1.),(Int_t)(-1),(Int_t)(-1),(Float_t)(-1.));
} else if (GetRemoteProtocol() > 11) {
EmitVA("Progress(Long64_t,Long64_t,Long64_t,Float_t,Float_t,Float_t,Float_t)",
7, (Long64_t)(-1), (Long64_t)(-1), (Long64_t)(-1),
(Float_t)(-1.),(Float_t)(-1.),(Float_t)(-1.),(Float_t)(-1.));
} else {
EmitVA("Progress(Long64_t,Long64_t)", 2, (Long64_t)(-1), (Long64_t)(-1));
}
}
void TProof::ActivateAsyncInput()
{
TIter next(fSlaves);
TSlave *sl;
while ((sl = (TSlave*) next()))
if (sl->GetInputHandler())
sl->GetInputHandler()->Add();
}
void TProof::DeActivateAsyncInput()
{
TIter next(fSlaves);
TSlave *sl;
while ((sl = (TSlave*) next()))
if (sl->GetInputHandler())
sl->GetInputHandler()->Remove();
}
Int_t TProof::GetActiveMergersCount()
{
if (!fMergers) return 0;
Int_t active_mergers = 0;
TIter mergers(fMergers);
TMergerInfo *mi = 0;
while ((mi = (TMergerInfo *)mergers())) {
if (mi->IsActive()) active_mergers++;
}
return active_mergers;
}
Bool_t TProof::CreateMerger(TSlave *sl, Int_t port)
{
PDB(kSubmerger, 2)
Info("CreateMerger", "worker %s will be merger ", sl->GetOrdinal());
PDB(kSubmerger, 2) Info("CreateMerger","Begin");
if (port <= 0) {
PDB(kSubmerger,2)
Info("CreateMerger", "cannot create merger on port %d - exit", port);
return kFALSE;
}
Int_t workers = -1;
if (!fMergersByHost) {
Int_t mergersToCreate = fMergersCount - fMergers->GetSize();
Int_t rest = fWorkersToMerge % mergersToCreate;
if (rest > 0 && fMergers->GetSize() < rest) {
rest = 1;
} else {
rest = 0;
}
workers = (fWorkersToMerge / mergersToCreate) + rest;
} else {
Int_t workersOnHost = 0;
for (Int_t i = 0; i < fActiveSlaves->GetSize(); i++) {
if(!strcmp(sl->GetName(), fActiveSlaves->At(i)->GetName())) workersOnHost++;
}
workers = workersOnHost - 1;
}
TString msg;
msg.Form("worker %s on host %s will be merger for %d additional workers", sl->GetOrdinal(), sl->GetName(), workers);
if (gProofServ) {
gProofServ->SendAsynMessage(msg);
} else {
Printf("%s",msg.Data());
}
TMergerInfo * merger = new TMergerInfo(sl, port, workers);
TMessage bemerger(kPROOF_SUBMERGER);
bemerger << Int_t(kBeMerger);
bemerger << fMergers->GetSize();
bemerger << workers;
sl->GetSocket()->Send(bemerger);
PDB(kSubmerger,2) Info("CreateMerger",
"merger #%d (port: %d) for %d workers started",
fMergers->GetSize(), port, workers);
fMergers->Add(merger);
fWorkersToMerge = fWorkersToMerge - workers;
fRedirectNext = workers / 2;
PDB(kSubmerger, 2) Info("CreateMerger", "exit");
return kTRUE;
}
void TProof::MarkBad(TSlave *wrk, const char *reason)
{
R__LOCKGUARD2(fCloseMutex);
if (!IsValid()) return;
if (!wrk) {
Error("MarkBad", "worker instance undefined: protocol error? ");
return;
}
static TString thisurl;
if (thisurl.IsNull()) {
if (IsMaster()) {
Int_t port = gEnv->GetValue("ProofServ.XpdPort",-1);
thisurl = TUrl(gSystem->HostName()).GetHostFQDN();
if (port > 0) thisurl += TString::Format(":%d", port);
} else {
thisurl.Form("%s@%s:%d", fUrl.GetUser(), fUrl.GetHost(), fUrl.GetPort());
}
}
if (!reason || (strcmp(reason, kPROOF_TerminateWorker) && strcmp(reason, kPROOF_WorkerIdleTO))) {
const char *mastertype = (gProofServ && gProofServ->IsTopMaster()) ? "top master" : "master";
TString src = IsMaster() ? Form("%s at %s", mastertype, thisurl.Data()) : "local session";
TString msg;
msg.Form("\n +++ Message from %s : marking %s:%d (%s) as bad\n +++ Reason: %s",
src.Data(), wrk->GetName(), wrk->GetPort(), wrk->GetOrdinal(),
(reason && strlen(reason)) ? reason : "unknown");
Info("MarkBad", "%s", msg.Data());
if (gProofServ) {
msg += TString::Format("\n\n +++ Most likely your code crashed on worker %s at %s:%d.\n",
wrk->GetOrdinal(), wrk->GetName(), wrk->GetPort());
} else {
msg += TString::Format("\n\n +++ Most likely your code crashed\n");
}
msg += TString::Format(" +++ Please check the session logs for error messages either using\n");
msg += TString::Format(" +++ the 'Show logs' button or executing\n");
msg += TString::Format(" +++\n");
if (gProofServ) {
msg += TString::Format(" +++ root [] TProof::Mgr(\"%s\")->GetSessionLogs()->"
"Display(\"%s\",0)\n\n", thisurl.Data(), wrk->GetOrdinal());
gProofServ->SendAsynMessage(msg, kTRUE);
} else {
msg += TString::Format(" +++ root [] TProof::Mgr(\"%s\")->GetSessionLogs()->"
"Display(\"*\")\n\n", thisurl.Data());
Printf("%s", msg.Data());
}
} else if (reason) {
if (gDebug > 0 && strcmp(reason, kPROOF_WorkerIdleTO)) {
Info("MarkBad", "worker %s at %s:%d asked to terminate",
wrk->GetOrdinal(), wrk->GetName(), wrk->GetPort());
}
}
if (IsMaster() && reason) {
if (strcmp(reason, kPROOF_TerminateWorker)) {
TList *listOfMissingFiles = 0;
if (!(listOfMissingFiles = (TList *)GetOutput("MissingFiles"))) {
listOfMissingFiles = new TList();
listOfMissingFiles->SetName("MissingFiles");
if (fPlayer)
fPlayer->AddOutputObject(listOfMissingFiles);
}
TVirtualPacketizer *packetizer = fPlayer ? fPlayer->GetPacketizer() : 0;
if (packetizer) {
packetizer->MarkBad(wrk, 0, &listOfMissingFiles);
}
} else {
if (gProofServ) {
TString ord(wrk->GetOrdinal());
Int_t id = ord.Last('.');
if (id != kNPOS) ord.Remove(0, id+1);
gProofServ->ReleaseWorker(ord.Data());
}
}
} else if (TestBit(TProof::kIsClient) && reason && !strcmp(reason, kPROOF_WorkerIdleTO)) {
fValid = kFALSE;
}
fActiveSlaves->Remove(wrk);
FindUniqueSlaves();
fAllMonitor->Remove(wrk->GetSocket());
fActiveMonitor->Remove(wrk->GetSocket());
fSendGroupView = kTRUE;
if (IsMaster()) {
if (reason && !strcmp(reason, kPROOF_TerminateWorker)) {
fSlaves->Remove(wrk);
fBadSlaves->Remove(wrk);
fActiveSlaves->Remove(wrk);
fInactiveSlaves->Remove(wrk);
fUniqueSlaves->Remove(wrk);
fAllUniqueSlaves->Remove(wrk);
fNonUniqueMasters->Remove(wrk);
TSlaveInfo *si = new TSlaveInfo(
wrk->GetOrdinal(),
Form("%s@%s:%d", wrk->GetUser(), wrk->GetName(), wrk->GetPort()),
0, "", wrk->GetWorkDir());
if (!fTerminatedSlaveInfos->Contains(si)) fTerminatedSlaveInfos->Add(si);
else delete si;
delete wrk;
} else {
fBadSlaves->Add(wrk);
fActiveSlaves->Remove(wrk);
fUniqueSlaves->Remove(wrk);
fAllUniqueSlaves->Remove(wrk);
fNonUniqueMasters->Remove(wrk);
if (fCurrentMonitor) fCurrentMonitor->DeActivate(wrk->GetSocket());
wrk->Close();
if (fMergersSet) {
Int_t mergersCount = -1;
TParameter<Int_t> *mc = dynamic_cast<TParameter<Int_t> *>(GetParameter("PROOF_UseMergers"));
if (mc) mergersCount = mc->GetVal();
if (mergersCount == 0) {
Int_t activeWorkers = fCurrentMonitor ? fCurrentMonitor->GetActive() : GetNumberOfActiveSlaves();
if (activeWorkers > 1) {
fMergersCount = TMath::Nint(TMath::Sqrt(activeWorkers));
if (activeWorkers / fMergersCount < 2)
fMergersCount = (Int_t) TMath::Sqrt(activeWorkers);
}
}
}
}
SaveWorkerInfo();
} else {
fSlaves->Remove(wrk);
if (fManager)
fManager->DiscardSession(this);
}
}
void TProof::MarkBad(TSocket *s, const char *reason)
{
R__LOCKGUARD2(fCloseMutex);
if (!IsValid()) return;
TSlave *wrk = FindSlave(s);
MarkBad(wrk, reason);
}
void TProof::TerminateWorker(TSlave *wrk)
{
if (!wrk) {
Warning("TerminateWorker", "worker instance undefined: protocol error? ");
return;
}
if (wrk->GetSocket() && wrk->GetSocket()->IsValid()) {
TMessage mess(kPROOF_STOP);
wrk->GetSocket()->Send(mess);
} else {
if (gDebug > 0)
Info("TerminateWorker", "connection to worker is already down: cannot"
" send termination message");
}
MarkBad(wrk, kPROOF_TerminateWorker);
}
void TProof::TerminateWorker(const char *ord)
{
if (ord && strlen(ord) > 0) {
Bool_t all = (ord[0] == '*') ? kTRUE : kFALSE;
if (IsMaster()) {
TIter nxw(fSlaves);
TSlave *wrk = 0;
while ((wrk = (TSlave *)nxw())) {
if (all || !strcmp(wrk->GetOrdinal(), ord)) {
TerminateWorker(wrk);
if (!all) break;
}
}
} else {
TMessage mess(kPROOF_STOP);
mess << TString(ord);
Broadcast(mess);
}
}
}
Int_t TProof::Ping()
{
return Ping(kActive);
}
Int_t TProof::Ping(ESlaves list)
{
TList *slaves = 0;
if (list == kAll) slaves = fSlaves;
if (list == kActive) slaves = fActiveSlaves;
if (list == kUnique) slaves = fUniqueSlaves;
if (list == kAllUnique) slaves = fAllUniqueSlaves;
if (slaves->GetSize() == 0) return 0;
int nsent = 0;
TIter next(slaves);
TSlave *sl;
while ((sl = (TSlave *)next())) {
if (sl->IsValid()) {
if (sl->Ping() == -1) {
MarkBad(sl, "ping unsuccessful");
} else {
nsent++;
}
}
}
return nsent;
}
void TProof::Touch()
{
TList *slaves = fSlaves;
if (slaves->GetSize() == 0) return;
TIter next(slaves);
TSlave *sl;
while ((sl = (TSlave *)next())) {
if (sl->IsValid()) {
sl->Touch();
}
}
return;
}
void TProof::Print(Option_t *option) const
{
TString secCont;
if (TestBit(TProof::kIsClient)) {
Printf("Connected to: %s (%s)", GetMaster(),
IsValid() ? "valid" : "invalid");
Printf("Port number: %d", GetPort());
Printf("User: %s", GetUser());
Printf("ROOT version|rev: %s|%s", gROOT->GetVersion(), gROOT->GetGitCommit());
Printf("Architecture-Compiler: %s-%s", gSystem->GetBuildArch(),
gSystem->GetBuildCompilerVersion());
TSlave *sl = (TSlave *)fActiveSlaves->First();
if (sl) {
TString sc;
if (sl->GetSocket()->GetSecContext())
Printf("Security context: %s",
sl->GetSocket()->GetSecContext()->AsString(sc));
Printf("Proofd protocol version: %d", sl->GetSocket()->GetRemoteProtocol());
} else {
Printf("Security context: Error - No connection");
Printf("Proofd protocol version: Error - No connection");
}
Printf("Client protocol version: %d", GetClientProtocol());
Printf("Remote protocol version: %d", GetRemoteProtocol());
Printf("Log level: %d", GetLogLevel());
Printf("Session unique tag: %s", IsValid() ? GetSessionTag() : "");
Printf("Default data pool: %s", IsValid() ? GetDataPoolUrl() : "");
if (IsValid())
const_cast<TProof*>(this)->SendPrint(option);
} else {
const_cast<TProof*>(this)->AskStatistics();
if (IsParallel())
Printf("*** Master server %s (parallel mode, %d workers):",
gProofServ->GetOrdinal(), GetParallel());
else
Printf("*** Master server %s (sequential mode):",
gProofServ->GetOrdinal());
Printf("Master host name: %s", gSystem->HostName());
Printf("Port number: %d", GetPort());
if (strlen(gProofServ->GetGroup()) > 0) {
Printf("User/Group: %s/%s", GetUser(), gProofServ->GetGroup());
} else {
Printf("User: %s", GetUser());
}
TString ver;
ver.Form("%s|%s", gROOT->GetVersion(), gROOT->GetGitCommit());
if (gSystem->Getenv("ROOTVERSIONTAG"))
ver.Form("%s|%s", gROOT->GetVersion(), gSystem->Getenv("ROOTVERSIONTAG"));
Printf("ROOT version|rev|tag: %s", ver.Data());
Printf("Architecture-Compiler: %s-%s", gSystem->GetBuildArch(),
gSystem->GetBuildCompilerVersion());
Printf("Protocol version: %d", GetClientProtocol());
Printf("Image name: %s", GetImage());
Printf("Working directory: %s", gSystem->WorkingDirectory());
Printf("Config directory: %s", GetConfDir());
Printf("Config file: %s", GetConfFile());
Printf("Log level: %d", GetLogLevel());
Printf("Number of workers: %d", GetNumberOfSlaves());
Printf("Number of active workers: %d", GetNumberOfActiveSlaves());
Printf("Number of unique workers: %d", GetNumberOfUniqueSlaves());
Printf("Number of inactive workers: %d", GetNumberOfInactiveSlaves());
Printf("Number of bad workers: %d", GetNumberOfBadSlaves());
Printf("Total MB's processed: %.2f", float(GetBytesRead())/(1024*1024));
Printf("Total real time used (s): %.3f", GetRealTime());
Printf("Total CPU time used (s): %.3f", GetCpuTime());
if (TString(option).Contains("a", TString::kIgnoreCase) && GetNumberOfSlaves()) {
Printf("List of workers:");
TList masters;
TIter nextslave(fSlaves);
while (TSlave* sl = dynamic_cast<TSlave*>(nextslave())) {
if (!sl->IsValid()) continue;
if (sl->GetSlaveType() == TSlave::kSlave) {
sl->Print(option);
} else if (sl->GetSlaveType() == TSlave::kMaster) {
TMessage mess(kPROOF_PRINT);
mess.WriteString(option);
if (sl->GetSocket()->Send(mess) == -1)
const_cast<TProof*>(this)->MarkBad(sl, "could not send kPROOF_PRINT request");
else
masters.Add(sl);
} else {
Error("Print", "TSlave is neither Master nor Worker");
R__ASSERT(0);
}
}
const_cast<TProof*>(this)->Collect(&masters, fCollectTimeout);
}
}
}
Int_t TProof::HandleOutputOptions(TString &opt, TString &target, Int_t action)
{
TString outfile, dsname, stfopt;
if (action == 0) {
TString tagf, tagd, tags, oo;
Ssiz_t from = 0, iof = kNPOS, iod = kNPOS, ios = kNPOS;
while (opt.Tokenize(oo, from, "[; ]")) {
if (oo.BeginsWith("of=")) {
tagf = "of=";
iof = opt.Index(tagf);
} else if (oo.BeginsWith("outfile=")) {
tagf = "outfile=";
iof = opt.Index(tagf);
} else if (oo.BeginsWith("ds")) {
tagd = "ds";
iod = opt.Index(tagd);
} else if (oo.BeginsWith("dataset")) {
tagd = "dataset";
iod = opt.Index(tagd);
} else if (oo.BeginsWith("stf")) {
tags = "stf";
ios = opt.Index(tags);
} else if (oo.BeginsWith("savetofile")) {
tags = "savetofile";
ios = opt.Index(tags);
}
}
if (iof != kNPOS && iod != kNPOS) {
Error("HandleOutputOptions", "options 'of'/'outfile' and 'ds'/'dataset' are incompatible!");
return -1;
}
if (iof != kNPOS) {
from = iof + tagf.Length();
if (!opt.Tokenize(outfile, from, "[; ]") || outfile.IsNull()) {
Error("HandleOutputOptions", "could not extract output file settings string! (%s)", opt.Data());
return -1;
}
tagf += outfile;
}
if (iod != kNPOS) {
from = iod + tagd.Length();
if (!opt.Tokenize(dsname, from, "[; ]"))
if (gDebug > 0) Info("HandleOutputOptions", "no dataset name found: use default");
tagd += dsname;
if (dsname.BeginsWith("=")) dsname.Replace(0, 1, "");
if (dsname.Contains("|V")) {
target = "ds|V";
dsname.ReplaceAll("|V", "");
}
if (dsname.IsNull()) dsname = "dataset_<qtag>";
}
if (ios != kNPOS) {
from = ios + tags.Length();
if (!opt.Tokenize(stfopt, from, "[; ]"))
if (gDebug > 0) Info("HandleOutputOptions", "save-to-file not found: use defualt");
tags += stfopt;
if (!stfopt.IsNull()) {
if (stfopt.BeginsWith("=")) stfopt.Replace(0,1,"");
if (!stfopt.IsNull()) {
if (!stfopt.IsDigit()) {
Error("HandleOutputOptions", "save-to-file option must be a digit! (%s)", stfopt.Data());
return -1;
}
} else {
stfopt = "1";
}
} else {
stfopt = "1";
}
}
opt.ReplaceAll(tagf, "");
opt.ReplaceAll(tagd, "");
opt.ReplaceAll(tags, "");
}
if (action == 0) {
if (!outfile.IsNull()) {
if (!outfile.BeginsWith("master:")) {
if (gSystem->AccessPathName(gSystem->DirName(outfile.Data()), kWritePermission)) {
Warning("HandleOutputOptions",
"directory '%s' for the output file does not exists or is not writable:"
" saving to master", gSystem->DirName(outfile.Data()));
outfile.Form("master:%s", gSystem->BaseName(outfile.Data()));
} else {
if (!IsLite()) {
target = outfile;
if (!stfopt.IsNull()) {
outfile.Form("master:%s", gSystem->BaseName(target.Data()));
} else {
outfile = "";
}
}
}
}
if (outfile.BeginsWith("master:")) {
outfile.ReplaceAll("master:", "");
if (outfile.IsNull() || !gSystem->IsAbsoluteFileName(outfile)) {
TString ddir, emsg;
if (!IsLite()) {
if (Exec("gProofServ->GetDataDir()", "0", kTRUE) == 0) {
TObjString *os = fMacroLog.GetLineWith("const char");
if (os) {
Ssiz_t fst = os->GetString().First('\"');
Ssiz_t lst = os->GetString().Last('\"');
ddir = os->GetString()(fst+1, lst-fst-1);
} else {
emsg = "could not find 'const char *' string in macro log! cannot continue";
}
} else {
emsg = "could not retrieve master data directory info! cannot continue";
}
if (!emsg.IsNull()) {
Error("HandleOutputOptions", "%s", emsg.Data());
return -1;
}
}
if (!ddir.IsNull()) ddir += "/";
if (outfile.IsNull()) {
outfile.Form("%s<file>", ddir.Data());
} else {
outfile.Insert(0, TString::Format("%s", ddir.Data()));
}
}
}
if (!outfile.IsNull()) {
if (!outfile.BeginsWith("of:")) outfile.Insert(0, "of:");
SetParameter("PROOF_DefaultOutputOption", outfile.Data());
}
}
if (!dsname.IsNull()) {
dsname.Insert(0, "ds:");
SetParameter("PROOF_DefaultOutputOption", dsname.Data());
if (!stfopt.IsNull()) {
Int_t ostf = (Int_t) stfopt.Atoi();
if (ostf%10 <= 0) {
Warning("HandleOutputOptions", "Dataset required bu Save-To-File disabled: enabling!");
stfopt.Form("%d", ostf+1);
}
} else {
stfopt = "1";
}
}
if (!stfopt.IsNull()) {
SetParameter("PROOF_SavePartialResults", (Int_t) stfopt.Atoi());
}
} else {
if (GetOutputList()) {
if (target == "ds|V") {
dsname = "";
TIter nxo(GetOutputList());
TObject *o = 0;
while ((o = nxo())) {
if (o->InheritsFrom(TFileCollection::Class())) {
VerifyDataSet(o->GetName());
dsname = o->GetName();
break;
}
}
if (!dsname.IsNull()) {
TFileCollection *fc = GetDataSet(dsname);
if (fc) {
fc->Print();
} else {
Warning("HandleOutputOptions", "could not retrieve TFileCollection for dataset '%s'", dsname.Data());
}
} else {
Warning("HandleOutputOptions", "dataset not found!");
}
} else {
Bool_t targetcopied = kFALSE;
TProofOutputFile *pf = 0;
if (!target.IsNull())
pf = (TProofOutputFile *) GetOutputList()->FindObject(gSystem->BaseName(target.Data()));
if (pf) {
if (strcmp(TUrl(pf->GetOutputFileName(), kTRUE).GetUrl(),
TUrl(target, kTRUE).GetUrl())) {
if (TFile::Cp(pf->GetOutputFileName(), target)) {
Printf(" Output successfully copied to %s", target.Data());
targetcopied = kTRUE;
} else {
Warning("HandleOutputOptions", "problems copying output to %s", target.Data());
}
}
}
TFile *fout = 0;
TObject *o = 0;
TIter nxo(GetOutputList());
Bool_t swapcopied = kFALSE;
while ((o = nxo())) {
TProofOutputFile *pof = dynamic_cast<TProofOutputFile *>(o);
if (pof) {
if (pof->TestBit(TProofOutputFile::kSwapFile) && !target.IsNull()) {
if (pof == pf && targetcopied) continue;
if (strcmp(TUrl(pf->GetOutputFileName(), kTRUE).GetUrl(),
TUrl(target, kTRUE).GetUrl())) {
if (TFile::Cp(pof->GetOutputFileName(), target)) {
Printf(" Output successfully copied to %s", target.Data());
swapcopied = kTRUE;
} else {
Warning("HandleOutputOptions", "problems copying output to %s", target.Data());
}
}
} else if (pof->IsRetrieve()) {
if (strcmp(TUrl(pf->GetOutputFileName(), kTRUE).GetUrl(),
TUrl(pof->GetTitle(), kTRUE).GetUrl())) {
if (TFile::Cp(pof->GetOutputFileName(), pof->GetTitle())) {
Printf(" Output successfully copied to %s", pof->GetTitle());
} else {
Warning("HandleOutputOptions",
"problems copying %s to %s", pof->GetOutputFileName(), pof->GetTitle());
}
}
}
}
}
if (!target.IsNull() && !swapcopied) {
if (!fout && !pf) {
fout = TFile::Open(target, "RECREATE");
if (!fout || (fout && fout->IsZombie())) {
SafeDelete(fout);
Warning("HandleOutputOptions", "problems opening output file %s", target.Data());
}
}
if (fout) {
nxo.Reset();
while ((o = nxo())) {
TProofOutputFile *pof = dynamic_cast<TProofOutputFile *>(o);
if (!pof) {
o->Write();
}
}
}
}
if (fout) {
fout->Close();
SafeDelete(fout);
Printf(" Output saved to %s", target.Data());
}
}
}
DeleteParameters("PROOF_DefaultOutputOption");
DeleteParameters("PROOF_SavePartialResults");
}
return 0;
}
void TProof::SetFeedback(TString &opt, TString &optfb, Int_t action)
{
Ssiz_t from = 0;
if (action == 0 || (action == 1 && optfb.IsNull())) {
TString tag("fb=");
Ssiz_t ifb = opt.Index(tag);
if (ifb == kNPOS) {
tag = "feedback=";
ifb = opt.Index(tag);
}
if (ifb == kNPOS) return;
from = ifb + tag.Length();
if (!opt.Tokenize(optfb, from, "[; ]") || optfb.IsNull()) {
Warning("SetFeedback", "could not extract feedback string! Ignoring ...");
return;
}
tag += optfb;
opt.ReplaceAll(tag, "");
}
TString nm, startdraw, stopdraw;
from = 0;
while (optfb.Tokenize(nm, from, ",")) {
if (nm == "stats") {
if (action == 0) {
startdraw.Form("gDirectory->Add(new TStatsFeedback((TProof *)%p))", this);
gROOT->ProcessLine(startdraw.Data());
SetParameter("PROOF_StatsHist", "");
AddFeedback("PROOF_EventsHist");
AddFeedback("PROOF_PacketsHist");
AddFeedback("PROOF_ProcPcktHist");
} else {
stopdraw.Form("TObject *o = gDirectory->FindObject(\"%s\"); "
" if (o && strcmp(o->ClassName(), \"TStatsFeedback\")) "
" { gDirectory->Remove(o); delete o; }", GetSessionTag());
gROOT->ProcessLine(stopdraw.Data());
DeleteParameters("PROOF_StatsHist");
RemoveFeedback("PROOF_EventsHist");
RemoveFeedback("PROOF_PacketsHist");
RemoveFeedback("PROOF_ProcPcktHist");
}
} else {
if (action == 0) {
AddFeedback(nm);
startdraw.Form("gDirectory->Add(new TDrawFeedback((TProof *)%p))", this);
gROOT->ProcessLine(startdraw.Data());
} else {
RemoveFeedback(nm);
stopdraw.Form("TObject *o = gDirectory->FindObject(\"%s\"); "
" if (o && strcmp(o->ClassName(), \"TDrawFeedback\")) "
" { gDirectory->Remove(o); delete o; }", GetSessionTag());
gROOT->ProcessLine(stopdraw.Data());
}
}
}
}
Long64_t TProof::Process(TDSet *dset, const char *selector, Option_t *option,
Long64_t nentries, Long64_t first)
{
if (!IsValid() || !fPlayer) return -1;
SetRunStatus(TProof::kRunning);
TString opt(option), optfb, outfile;
if (opt.Contains("fb=") || opt.Contains("feedback=")) SetFeedback(opt, optfb, 0);
if (HandleOutputOptions(opt, outfile, 0) != 0) return -1;
fSync = (GetQueryMode(opt) == kSync);
if (fSync && (!IsIdle() || IsWaiting())) {
Info("Process", "session is in waiting or processing status: switch to asynchronous mode");
fSync = kFALSE;
opt.ReplaceAll("SYNC","");
opt += "ASYN";
}
if ((IsIdle() && !IsWaiting()) && fRunningDSets && fRunningDSets->GetSize() > 0) {
fRunningDSets->SetOwner(kTRUE);
fRunningDSets->Delete();
}
TSignalHandler *sh = 0;
if (fSync) {
if (gApplication)
sh = gSystem->RemoveSignalHandler(gApplication->GetSignalHandler());
}
fOutputList.Clear();
if (fWrksOutputReady) {
fWrksOutputReady->SetOwner(kFALSE);
fWrksOutputReady->Clear();
}
Long64_t rv = -1;
if (selector && strlen(selector)) {
rv = fPlayer->Process(dset, selector, opt.Data(), nentries, first);
} else if (fSelector) {
rv = fPlayer->Process(dset, fSelector, opt.Data(), nentries, first);
} else {
Error("Process", "neither a selecrot file nor a selector object have"
" been specified: cannot process!");
}
if (!optfb.IsNull()) SetFeedback(opt, optfb, 1);
if (HandleOutputOptions(opt, outfile, 1) != 0) return -1;
if (rv >= 0) {
TParameter<Long64_t> *sst =
(TParameter<Long64_t> *) fOutputList.FindObject("PROOF_SelectorStatus");
if (sst) rv = sst->GetVal();
}
if (fSync) {
if (sh)
gSystem->AddSignalHandler(sh);
if (!fPerfTree.IsNull()) {
if (SavePerfTree() != 0) Error("Process", "saving performance info ...");
SetPerfTree(0);
}
}
return rv;
}
Long64_t TProof::Process(TFileCollection *fc, const char *selector,
Option_t *option, Long64_t nentries, Long64_t first)
{
if (!IsValid() || !fPlayer) return -1;
if (fProtocol < 17) {
Info("Process", "server version < 5.18/00:"
" processing of TFileCollection not supported");
return -1;
}
TDSet *dset = new TDSet(TString::Format("TFileCollection:%s", fc->GetName()), 0, 0, "");
fPlayer->AddInput(fc);
Long64_t retval = -1;
if (selector && strlen(selector)) {
retval = Process(dset, selector, option, nentries, first);
} else if (fSelector) {
retval = Process(dset, fSelector, option, nentries, first);
} else {
Error("Process", "neither a selecrot file nor a selector object have"
" been specified: cannot process!");
}
fPlayer->GetInputList()->Remove(fc);
if (IsLite() && !fSync) {
if (!fRunningDSets) fRunningDSets = new TList;
fRunningDSets->Add(dset);
} else {
delete dset;
}
return retval;
}
Long64_t TProof::Process(const char *dsetname, const char *selector,
Option_t *option, Long64_t nentries,
Long64_t first, TObject *elist)
{
if (fProtocol < 13) {
Info("Process", "processing 'by name' not supported by the server");
return -1;
}
TString dsname, fname(dsetname);
const char *separator = (fname.EndsWith(",")) ? "," : "|";
if (!strcmp(separator, ",") || fname.EndsWith("|")) fname.Remove(fname.Length()-1, 1);
if (!(gSystem->AccessPathName(fname, kReadPermission))) {
TUrl uf(fname, kTRUE);
uf.SetOptions(TString::Format("%sfiletype=raw", uf.GetOptions()));
TFile *f = TFile::Open(uf.GetUrl());
if (f && !(f->IsZombie())) {
const Int_t blen = 8192;
char buf[blen];
Long64_t rest = f->GetSize();
while (rest > 0) {
Long64_t len = (rest > blen - 1) ? blen - 1 : rest;
if (f->ReadBuffer(buf, len)) {
Error("Process", "problems reading from file '%s'", fname.Data());
dsname = "";
break;
}
buf[len] = '\0';
dsname += buf;
rest -= len;
}
f->Close();
SafeDelete(f);
if (rest > 0) return -1;
} else {
Error("Process", "could not open file '%s'", fname.Data());
return -1;
}
}
if (dsname.IsNull()) {
dsname = dsetname;
} else {
if (dsname.EndsWith("\n")) dsname.Remove(dsname.Length()-1, 1);
dsname.ReplaceAll("\n", separator);
if (gDebug > 0) {
Info("Process", "processing multi-dataset read from file '%s':", fname.Data());
Info("Process", " '%s'", dsname.Data());
}
}
TString names(dsname), name, enl, newname;
if (fProtocol < 28 && names.Index(TRegexp("[, |]")) != kNPOS) {
Info("Process", "multi-dataset processing not supported by the server");
return -1;
}
TEntryList *el = 0;
TString dsobj, dsdir;
Int_t from = 0;
while (names.Tokenize(name, from, "[, |]")) {
newname = name;
enl = "";
Int_t ienl = name.Index("?enl=");
if (ienl == kNPOS) {
ienl = name.Index("<<");
if (ienl != kNPOS) {
newname.Remove(ienl);
ienl += strlen("<<");
}
} else {
newname.Remove(ienl);
ienl += strlen("?enl=");
}
TString obj, dir("/");
Int_t idxc = newname.Index("#");
if (idxc != kNPOS) {
Int_t idxs = newname.Index("/", 1, idxc, TString::kExact);
if (idxs != kNPOS) {
obj = newname(idxs+1, newname.Length());
dir = newname(idxc+1, newname.Length());
dir.Remove(dir.Index("/") + 1);
newname.Remove(idxc);
} else {
obj = newname(idxc+1, newname.Length());
newname.Remove(idxc);
}
} else if (newname.Index(":") != kNPOS && newname.Index("://") == kNPOS) {
Error("Process", "bad name syntax (%s): please use"
" a '#' after the dataset name", name.Data());
dsname.ReplaceAll(name, "");
continue;
}
if (dsobj.IsNull() && dsdir.IsNull()) {
dsobj = obj;
dsdir = dir;
} else if (obj != dsobj || dir != dsdir) {
Warning("Process", "'obj' or 'dir' specification not consistent w/ the first given: ignore");
}
if (ienl != kNPOS) {
enl = name(ienl, name.Length());
el = 0;
TObject *oel = 0;
TList *inpl = GetInputList();
if (inpl && (oel = inpl->FindObject(enl))) el = dynamic_cast<TEntryList *>(oel);
if (!el && gDirectory && (oel = gDirectory->FindObject(enl))) {
if ((el = dynamic_cast<TEntryList *>(oel))) {
if (fProtocol >= 28)
if (!(inpl->FindObject(el->GetName()))) AddInput(el);
}
}
if (!el) {
if (!gSystem->AccessPathName(enl)) {
TFile *f = TFile::Open(enl);
if (f && !(f->IsZombie()) && f->GetListOfKeys()) {
TIter nxk(f->GetListOfKeys());
TKey *k = 0;
while ((k = (TKey *) nxk())) {
if (!strcmp(k->GetClassName(), "TEntryList")) {
if (!el) {
if ((el = dynamic_cast<TEntryList *>(f->Get(k->GetName())))) {
if (fProtocol >= 28) {
if (!(inpl->FindObject(el->GetName()))) {
el = (TEntryList *) el->Clone();
AddInput(el);
}
} else {
el = (TEntryList *) el->Clone();
}
}
} else if (strcmp(el->GetName(), k->GetName())) {
Warning("Process", "multiple entry lists found in file '%s': the first one is taken;\n"
"if this is not what you want, load first the content in memory"
"and select it by name ", enl.Data());
}
}
}
} else {
Warning("Process","file '%s' cannot be open or is empty - ignoring", enl.Data());
}
}
}
if (fProtocol >= 28) {
newname += "?enl=";
if (el) {
newname += el->GetName();
} else {
newname += enl;
}
}
}
dsname.ReplaceAll(name, newname);
}
TDSet *dset = new TDSet(dsname, dsobj, dsdir);
if (el && fProtocol < 28) {
dset->SetEntryList(el);
} else {
dset->SetEntryList(elist);
}
Long64_t retval = -1;
if (selector && strlen(selector)) {
retval = Process(dset, selector, option, nentries, first);
} else if (fSelector) {
retval = Process(dset, fSelector, option, nentries, first);
} else {
Error("Process", "neither a selector file nor a selector object have"
" been specified: cannot process!");
}
if (IsLite() && !fSync) {
if (!fRunningDSets) fRunningDSets = new TList;
fRunningDSets->Add(dset);
} else {
delete dset;
}
return retval;
}
Long64_t TProof::Process(const char *selector, Long64_t n, Option_t *option)
{
if (!IsValid()) return -1;
if (fProtocol < 16) {
Info("Process", "server version < 5.17/04: generic processing not supported");
return -1;
}
TDSet *dset = new TDSet;
dset->SetBit(TDSet::kEmpty);
Long64_t retval = -1;
if (selector && strlen(selector)) {
retval = Process(dset, selector, option, n);
} else if (fSelector) {
retval = Process(dset, fSelector, option, n);
} else {
Error("Process", "neither a selector file nor a selector object have"
" been specified: cannot process!");
}
if (IsLite() && !fSync) {
if (!fRunningDSets) fRunningDSets = new TList;
fRunningDSets->Add(dset);
} else {
delete dset;
}
return retval;
}
Long64_t TProof::Process(TDSet *dset, TSelector *selector, Option_t *option,
Long64_t nentries, Long64_t first)
{
if (fProtocol < 34) {
Error("Process", "server version < 5.33/02:"
"processing by object not supported");
return -1;
}
if (!selector) {
Error("Process", "selector object undefined!");
return -1;
}
fSelector = selector;
Long64_t rc = Process(dset, (const char*)0, option, nentries, first);
fSelector = 0;
return rc;
}
Long64_t TProof::Process(TFileCollection *fc, TSelector *selector,
Option_t *option, Long64_t nentries, Long64_t first)
{
if (fProtocol < 34) {
Error("Process", "server version < 5.33/02:"
"processing by object not supported");
return -1;
}
if (!selector) {
Error("Process", "selector object undefined!");
return -1;
}
fSelector = selector;
Long64_t rc = Process(fc, (const char*)0, option, nentries, first);
fSelector = 0;
return rc;
}
Long64_t TProof::Process(const char *dsetname, TSelector *selector,
Option_t *option, Long64_t nentries,
Long64_t first, TObject *elist)
{
if (fProtocol < 34) {
Error("Process", "server version < 5.33/02:"
"processing by object not supported");
return -1;
}
if (!selector) {
Error("Process", "selector object undefined!");
return -1;
}
fSelector = selector;
Long64_t rc = Process(dsetname, (const char*)0, option, nentries, first, elist);
fSelector = 0;
return rc;
}
Long64_t TProof::Process(TSelector *selector, Long64_t n, Option_t *option)
{
if (fProtocol < 34) {
Error("Process", "server version < 5.33/02:"
"processing by object not supported");
return -1;
}
if (!selector) {
Error("Process", "selector object undefined!");
return -1;
}
fSelector = selector;
Long64_t rc = Process((const char*)0, n, option);
fSelector = 0;
return rc;
}
Int_t TProof::GetQueryReference(Int_t qry, TString &ref)
{
ref = "";
if (qry > 0) {
if (!fQueries)
GetListOfQueries();
if (fQueries) {
TIter nxq(fQueries);
TQueryResult *qr = 0;
while ((qr = (TQueryResult *) nxq()))
if (qr->GetSeqNum() == qry) {
ref.Form("%s:%s", qr->GetTitle(), qr->GetName());
return 0;
}
}
}
return -1;
}
Long64_t TProof::Finalize(Int_t qry, Bool_t force)
{
if (fPlayer) {
if (qry > 0) {
TString ref;
if (GetQueryReference(qry, ref) == 0) {
return Finalize(ref, force);
} else {
Info("Finalize", "query #%d not found", qry);
}
} else {
return Finalize("", force);
}
}
return -1;
}
Long64_t TProof::Finalize(const char *ref, Bool_t force)
{
if (fPlayer) {
TQueryResult *qr = (ref && strlen(ref) > 0) ? fPlayer->GetQueryResult(ref)
: GetQueryResult();
Bool_t retrieve = kFALSE;
TString xref(ref);
if (!qr) {
if (!xref.IsNull()) {
retrieve = kTRUE;
}
} else {
if (qr->IsFinalized()) {
if (force) {
retrieve = kTRUE;
} else {
Info("Finalize","query already finalized:"
" use Finalize(<qry>,kTRUE) to force new retrieval");
qr = 0;
}
} else {
retrieve = kTRUE;
xref.Form("%s:%s", qr->GetTitle(), qr->GetName());
}
}
if (retrieve) {
Retrieve(xref.Data());
qr = fPlayer->GetQueryResult(xref.Data());
}
if (qr)
return fPlayer->Finalize(qr);
}
return -1;
}
Int_t TProof::Retrieve(Int_t qry, const char *path)
{
if (qry > 0) {
TString ref;
if (GetQueryReference(qry, ref) == 0)
return Retrieve(ref, path);
else
Info("Retrieve", "query #%d not found", qry);
} else {
Info("Retrieve","positive argument required - do nothing");
}
return -1;
}
Int_t TProof::Retrieve(const char *ref, const char *path)
{
if (ref) {
TMessage m(kPROOF_RETRIEVE);
m << TString(ref);
Broadcast(m, kActive);
Collect(kActive, fCollectTimeout);
if (path) {
TQueryResult *qr = fPlayer ? fPlayer->GetQueryResult(ref) : 0;
if (qr) {
TFile *farc = TFile::Open(path,"UPDATE");
if (!farc || (farc && !(farc->IsOpen()))) {
Info("Retrieve", "archive file cannot be open (%s)", path);
return 0;
}
farc->cd();
qr->SetArchived(path);
qr->Write();
farc->Close();
SafeDelete(farc);
} else {
Info("Retrieve", "query not found after retrieve");
return -1;
}
}
return 0;
}
return -1;
}
Int_t TProof::Remove(Int_t qry, Bool_t all)
{
if (qry > 0) {
TString ref;
if (GetQueryReference(qry, ref) == 0)
return Remove(ref, all);
else
Info("Remove", "query #%d not found", qry);
} else {
Info("Remove","positive argument required - do nothing");
}
return -1;
}
Int_t TProof::Remove(const char *ref, Bool_t all)
{
if (all) {
if (fPlayer)
fPlayer->RemoveQueryResult(ref);
}
if (IsLite()) return 0;
if (ref) {
TMessage m(kPROOF_REMOVE);
m << TString(ref);
Broadcast(m, kActive);
Collect(kActive, fCollectTimeout);
return 0;
}
return -1;
}
Int_t TProof::Archive(Int_t qry, const char *path)
{
if (qry > 0) {
TString ref;
if (GetQueryReference(qry, ref) == 0)
return Archive(ref, path);
else
Info("Archive", "query #%d not found", qry);
} else {
Info("Archive","positive argument required - do nothing");
}
return -1;
}
Int_t TProof::Archive(const char *ref, const char *path)
{
if (ref) {
TMessage m(kPROOF_ARCHIVE);
m << TString(ref) << TString(path);
Broadcast(m, kActive);
Collect(kActive, fCollectTimeout);
return 0;
}
return -1;
}
Int_t TProof::CleanupSession(const char *sessiontag)
{
if (sessiontag) {
TMessage m(kPROOF_CLEANUPSESSION);
m << TString(sessiontag);
Broadcast(m, kActive);
Collect(kActive, fCollectTimeout);
return 0;
}
return -1;
}
void TProof::SetQueryMode(EQueryMode mode)
{
fQueryMode = mode;
if (gDebug > 0)
Info("SetQueryMode","query mode is set to: %s", fQueryMode == kSync ?
"Sync" : "Async");
}
TProof::EQueryMode TProof::GetQueryMode(Option_t *mode) const
{
EQueryMode qmode = fQueryMode;
if (mode && (strlen(mode) > 0)) {
TString m(mode);
m.ToUpper();
if (m.Contains("ASYN")) {
qmode = kAsync;
} else if (m.Contains("SYNC")) {
qmode = kSync;
}
}
if (gDebug > 0)
Info("GetQueryMode","query mode is set to: %s", qmode == kSync ?
"Sync" : "Async");
return qmode;
}
Long64_t TProof::DrawSelect(TDSet *dset, const char *varexp,
const char *selection, Option_t *option,
Long64_t nentries, Long64_t first)
{
if (!IsValid() || !fPlayer) return -1;
if (!IsIdle()) {
Info("DrawSelect","not idle, asynchronous Draw not supported");
return -1;
}
TString opt(option);
Int_t idx = opt.Index("ASYN", 0, TString::kIgnoreCase);
if (idx != kNPOS)
opt.Replace(idx,4,"");
return fPlayer->DrawSelect(dset, varexp, selection, opt, nentries, first);
}
Long64_t TProof::DrawSelect(const char *dsetname, const char *varexp,
const char *selection, Option_t *option,
Long64_t nentries, Long64_t first, TObject *enl)
{
if (fProtocol < 13) {
Info("Process", "processing 'by name' not supported by the server");
return -1;
}
TString name(dsetname);
TString obj;
TString dir = "/";
Int_t idxc = name.Index("#");
if (idxc != kNPOS) {
Int_t idxs = name.Index("/", 1, idxc, TString::kExact);
if (idxs != kNPOS) {
obj = name(idxs+1, name.Length());
dir = name(idxc+1, name.Length());
dir.Remove(dir.Index("/") + 1);
name.Remove(idxc);
} else {
obj = name(idxc+1, name.Length());
name.Remove(idxc);
}
} else if (name.Index(":") != kNPOS && name.Index("://") == kNPOS) {
Error("DrawSelect", "bad name syntax (%s): please use"
" a '#' after the dataset name", dsetname);
return -1;
}
TDSet *dset = new TDSet(name, obj, dir);
dset->SetEntryList(enl);
Long64_t retval = DrawSelect(dset, varexp, selection, option, nentries, first);
delete dset;
return retval;
}
void TProof::StopProcess(Bool_t abort, Int_t timeout)
{
PDB(kGlobal,2)
Info("StopProcess","enter %d", abort);
if (!IsValid())
return;
ERunStatus rst = abort ? TProof::kAborted : TProof::kStopped;
SetRunStatus(rst);
if (fPlayer)
fPlayer->StopProcess(abort, timeout);
if (TestBit(TProof::kIsClient) || abort)
InterruptCurrentMonitor();
if (fSlaves->GetSize() == 0)
return;
TSlave *sl;
TIter next(fSlaves);
while ((sl = (TSlave *)next()))
if (sl->IsValid())
sl->StopProcess(abort, timeout);
}
void TProof::DisableGoAsyn()
{
Emit("DisableGoAsyn()");
}
void TProof::GoAsynchronous()
{
if (!IsValid()) return;
if (GetRemoteProtocol() < 22) {
Info("GoAsynchronous", "functionality not supported by the server - ignoring");
return;
}
if (fSync && !IsIdle()) {
TMessage m(kPROOF_GOASYNC);
Broadcast(m);
} else {
Info("GoAsynchronous", "either idle or already in asynchronous mode - ignoring");
}
}
void TProof::RecvLogFile(TSocket *s, Int_t size)
{
const Int_t kMAXBUF = 16384;
char buf[kMAXBUF];
if (fSaveLogToMacro && fMacroLog.GetListOfLines()) {
fMacroLog.GetListOfLines()->SetOwner(kTRUE);
fMacroLog.GetListOfLines()->Clear();
}
Int_t fdout = -1;
if (!fLogToWindowOnly) {
fdout = (fRedirLog) ? fileno(fLogFileW) : fileno(stdout);
if (fdout < 0) {
Warning("RecvLogFile", "file descriptor for outputs undefined (%d):"
" will not log msgs", fdout);
return;
}
lseek(fdout, (off_t) 0, SEEK_END);
}
Int_t left, rec, r;
Long_t filesize = 0;
while (filesize < size) {
left = Int_t(size - filesize);
if (left >= kMAXBUF)
left = kMAXBUF-1;
rec = s->RecvRaw(&buf, left);
filesize = (rec > 0) ? (filesize + rec) : filesize;
if (!fLogToWindowOnly && !fSaveLogToMacro) {
if (rec > 0) {
char *p = buf;
r = rec;
while (r) {
Int_t w;
w = write(fdout, p, r);
if (w < 0) {
SysError("RecvLogFile", "error writing to unit: %d", fdout);
break;
}
r -= w;
p += w;
}
} else if (rec < 0) {
Error("RecvLogFile", "error during receiving log file");
break;
}
}
if (rec > 0) {
buf[rec] = 0;
EmitVA("LogMessage(const char*,Bool_t)", 2, buf, kFALSE);
if (fSaveLogToMacro) fMacroLog.AddLine(buf);
}
}
if (fRedirLog && IsIdle() && !TestBit(TProof::kIsMaster))
fRedirLog = kFALSE;
}
void TProof::NotifyLogMsg(const char *msg, const char *sfx)
{
Int_t len = 0;
if (!msg || (len = strlen(msg)) <= 0)
return;
Int_t lsfx = (sfx) ? strlen(sfx) : 0;
Int_t fdout = -1;
if (!fLogToWindowOnly) {
fdout = (fRedirLog) ? fileno(fLogFileW) : fileno(stdout);
if (fdout < 0) {
Warning("NotifyLogMsg", "file descriptor for outputs undefined (%d):"
" will not notify msgs", fdout);
return;
}
lseek(fdout, (off_t) 0, SEEK_END);
}
if (!fLogToWindowOnly) {
if (len > 0) {
char *p = (char *)msg;
Int_t r = len;
while (r) {
Int_t w = write(fdout, p, r);
if (w < 0) {
SysError("NotifyLogMsg", "error writing to unit: %d", fdout);
break;
}
r -= w;
p += w;
}
if (lsfx > 0)
if (write(fdout, sfx, lsfx) != lsfx)
SysError("NotifyLogMsg", "error writing to unit: %d", fdout);
}
}
if (len > 0) {
EmitVA("LogMessage(const char*,Bool_t)", 2, msg, kFALSE);
}
if (fRedirLog && IsIdle())
fRedirLog = kFALSE;
}
void TProof::LogMessage(const char *msg, Bool_t all)
{
PDB(kGlobal,1)
Info("LogMessage","Enter ... %s, 'all: %s", msg ? msg : "",
all ? "true" : "false");
if (gROOT->IsBatch()) {
PDB(kGlobal,1) Info("LogMessage","GUI not started - use TProof::ShowLog()");
return;
}
if (msg)
EmitVA("LogMessage(const char*,Bool_t)", 2, msg, all);
if (all)
lseek(fileno(fLogFileR), (off_t) 0, SEEK_SET);
const Int_t kMAXBUF = 32768;
char buf[kMAXBUF];
Int_t len;
do {
while ((len = read(fileno(fLogFileR), buf, kMAXBUF-1)) < 0 &&
TSystem::GetErrno() == EINTR)
TSystem::ResetErrno();
if (len < 0) {
Error("LogMessage", "error reading log file");
break;
}
if (len > 0) {
buf[len] = 0;
EmitVA("LogMessage(const char*,Bool_t)", 2, buf, kFALSE);
}
} while (len > 0);
}
Int_t TProof::SendGroupView()
{
if (!IsValid()) return -1;
if (TestBit(TProof::kIsClient)) return 0;
if (!fSendGroupView) return 0;
fSendGroupView = kFALSE;
TIter next(fActiveSlaves);
TSlave *sl;
int bad = 0, cnt = 0, size = GetNumberOfActiveSlaves();
char str[32];
while ((sl = (TSlave *)next())) {
snprintf(str, 32, "%d %d", cnt, size);
if (sl->GetSocket()->Send(str, kPROOF_GROUPVIEW) == -1) {
MarkBad(sl, "could not send kPROOF_GROUPVIEW message");
bad++;
} else
cnt++;
}
if (bad) SendGroupView();
return GetNumberOfActiveSlaves();
}
Bool_t TProof::GetFileInCmd(const char *cmd, TString &fn)
{
TString s = cmd;
s = s.Strip(TString::kBoth);
if (s.Length() > 0 &&
(s.BeginsWith(".L") || s.BeginsWith(".x") || s.BeginsWith(".X"))) {
TString file = s(2, s.Length());
TString acm, arg, io;
fn = gSystem->SplitAclicMode(file, acm, arg, io);
if (!fn.IsNull())
return kTRUE;
}
return kFALSE;
}
Int_t TProof::Exec(const char *cmd, Bool_t plusMaster)
{
return Exec(cmd, kActive, plusMaster);
}
Int_t TProof::Exec(const char *cmd, ESlaves list, Bool_t plusMaster)
{
if (!IsValid()) return -1;
TString s = cmd;
s = s.Strip(TString::kBoth);
if (!s.Length()) return 0;
TString filename;
if (TProof::GetFileInCmd(s.Data(), filename)) {
char *fn = gSystem->Which(TROOT::GetMacroPath(), filename, kReadPermission);
if (fn) {
if (GetNumberOfUniqueSlaves() > 0) {
if (SendFile(fn, kAscii | kForward | kCpBin) < 0) {
Error("Exec", "file %s could not be transfered", fn);
delete [] fn;
return -1;
}
} else {
TString scmd = s(0,3) + fn;
Int_t n = SendCommand(scmd, list);
delete [] fn;
return n;
}
} else {
Error("Exec", "macro %s not found", filename.Data());
return -1;
}
delete [] fn;
}
if (plusMaster) {
if (IsLite()) {
gROOT->ProcessLine(cmd);
} else {
DeactivateWorker("*");
Int_t res = SendCommand(cmd, list);
ActivateWorker("restore");
if (res < 0)
return res;
}
}
return SendCommand(cmd, list);
}
Int_t TProof::Exec(const char *cmd, const char *ord, Bool_t logtomacro)
{
if (!IsValid()) return -1;
TString s = cmd;
s = s.Strip(TString::kBoth);
if (!s.Length()) return 0;
Int_t res = 0;
if (IsLite()) {
gROOT->ProcessLine(cmd);
} else {
Bool_t oldRedirLog = fRedirLog;
fRedirLog = kTRUE;
DeactivateWorker("*");
fRedirLog = kFALSE;
if (strcmp(ord, "master") && strcmp(ord, "0")) ActivateWorker(ord);
Bool_t oldSaveLog = fSaveLogToMacro;
fSaveLogToMacro = logtomacro;
res = SendCommand(cmd, kActive);
fSaveLogToMacro = oldSaveLog;
fRedirLog = kTRUE;
ActivateWorker("restore");
fRedirLog = oldRedirLog;
}
return res;
}
Int_t TProof::SendCommand(const char *cmd, ESlaves list)
{
if (!IsValid()) return -1;
Broadcast(cmd, kMESS_CINT, list);
Collect(list);
return fStatus;
}
TString TProof::Getenv(const char *env, const char *ord)
{
TString cmd = TString::Format("gSystem->Getenv(\"%s\")", env);
if (Exec(cmd.Data(), ord, kTRUE) != 0) return TString("");
TObjString *os = fMacroLog.GetLineWith("const char");
if (os) {
TString info;
Ssiz_t from = 0;
os->GetString().Tokenize(info, from, "\"");
os->GetString().Tokenize(info, from, "\"");
if (gDebug > 0) Printf("%s: '%s'", env, info.Data());
return info;
}
return TString("");
}
Int_t TProof::GetRC(const char *rcenv, Int_t &env, const char *ord)
{
TString cmd = TString::Format("if (gEnv->Lookup(\"%s\")) { gEnv->GetValue(\"%s\",\"\"); }", rcenv, rcenv);
if (Exec(cmd.Data(), ord, kTRUE) != 0) return -1;
TObjString *os = fMacroLog.GetLineWith("const char");
Int_t rc = -1;
if (os) {
Ssiz_t fst = os->GetString().First('\"');
Ssiz_t lst = os->GetString().Last('\"');
TString info = os->GetString()(fst+1, lst-fst-1);
if (info.IsDigit()) {
env = info.Atoi();
rc = 0;
if (gDebug > 0)
Printf("%s: %d", rcenv, env);
}
}
return rc;
}
Int_t TProof::GetRC(const char *rcenv, Double_t &env, const char *ord)
{
TString cmd = TString::Format("if (gEnv->Lookup(\"%s\")) { gEnv->GetValue(\"%s\",\"\"); }", rcenv, rcenv);
if (Exec(cmd.Data(), ord, kTRUE) != 0) return -1;
TObjString *os = fMacroLog.GetLineWith("const char");
Int_t rc = -1;
if (os) {
Ssiz_t fst = os->GetString().First('\"');
Ssiz_t lst = os->GetString().Last('\"');
TString info = os->GetString()(fst+1, lst-fst-1);
if (info.IsFloat()) {
env = info.Atof();
rc = 0;
if (gDebug > 0)
Printf("%s: %f", rcenv, env);
}
}
return rc;
}
Int_t TProof::GetRC(const char *rcenv, TString &env, const char *ord)
{
TString cmd = TString::Format("if (gEnv->Lookup(\"%s\")) { gEnv->GetValue(\"%s\",\"\"); }", rcenv, rcenv);
if (Exec(cmd.Data(), ord, kTRUE) != 0) return -1;
TObjString *os = fMacroLog.GetLineWith("const char");
Int_t rc = -1;
if (os) {
Ssiz_t fst = os->GetString().First('\"');
Ssiz_t lst = os->GetString().Last('\"');
env = os->GetString()(fst+1, lst-fst-1);
rc = 0;
if (gDebug > 0)
Printf("%s: %s", rcenv, env.Data());
}
return rc;
}
Int_t TProof::SendCurrentState(ESlaves list)
{
if (!IsValid()) return -1;
Broadcast(gDirectory->GetPath(), kPROOF_RESET, list);
return GetParallel();
}
Int_t TProof::SendInitialState()
{
if (!IsValid()) return -1;
SetLogLevel(fLogLevel, gProofDebugMask);
return GetNumberOfActiveSlaves();
}
Bool_t TProof::CheckFile(const char *file, TSlave *slave, Long_t modtime, Int_t cpopt)
{
Bool_t sendto = kFALSE;
TString sn = slave->GetName();
sn += ":";
sn += slave->GetOrdinal();
sn += ":";
sn += gSystem->BaseName(file);
FileMap_t::const_iterator it;
if ((it = fFileMap.find(sn)) != fFileMap.end()) {
MD5Mod_t md = (*it).second;
if (md.fModtime != modtime) {
TMD5 *md5 = TMD5::FileChecksum(file);
if (md5) {
if ((*md5) != md.fMD5) {
sendto = kTRUE;
md.fMD5 = *md5;
md.fModtime = modtime;
fFileMap[sn] = md;
if (TestBit(TProof::kIsMaster)) {
sendto = kFALSE;
TMessage mess(kPROOF_CHECKFILE);
mess << TString(gSystem->BaseName(file)) << md.fMD5 << cpopt;
slave->GetSocket()->Send(mess);
fCheckFileStatus = 0;
Collect(slave, fCollectTimeout, kPROOF_CHECKFILE);
sendto = (fCheckFileStatus == 0) ? kTRUE : kFALSE;
}
}
delete md5;
} else {
Error("CheckFile", "could not calculate local MD5 check sum - dont send");
return kFALSE;
}
}
} else {
TMD5 *md5 = TMD5::FileChecksum(file);
MD5Mod_t md;
if (md5) {
md.fMD5 = *md5;
md.fModtime = modtime;
fFileMap[sn] = md;
delete md5;
} else {
Error("CheckFile", "could not calculate local MD5 check sum - dont send");
return kFALSE;
}
TMessage mess(kPROOF_CHECKFILE);
mess << TString(gSystem->BaseName(file)) << md.fMD5 << cpopt;
slave->GetSocket()->Send(mess);
fCheckFileStatus = 0;
Collect(slave, fCollectTimeout, kPROOF_CHECKFILE);
sendto = (fCheckFileStatus == 0) ? kTRUE : kFALSE;
}
return sendto;
}
Int_t TProof::SendFile(const char *file, Int_t opt, const char *rfile, TSlave *wrk)
{
if (!IsValid()) return -1;
TList *slaves = (rfile && !strcmp(rfile, "cache")) ? fUniqueSlaves : fActiveSlaves;
if (wrk) {
slaves = new TList();
slaves->Add(wrk);
}
if (slaves->GetSize() == 0) return 0;
#ifndef R__WIN32
Int_t fd = open(file, O_RDONLY);
#else
Int_t fd = open(file, O_RDONLY | O_BINARY);
#endif
if (fd < 0) {
SysError("SendFile", "cannot open file %s", file);
return -1;
}
Long64_t size = -1;
Long_t id, flags, modtime = 0;
if (gSystem->GetPathInfo(file, &id, &size, &flags, &modtime) == 1) {
Error("SendFile", "cannot stat file %s", file);
close(fd);
return -1;
}
if (size == 0) {
Error("SendFile", "empty file %s", file);
close(fd);
return -1;
}
Bool_t bin = (opt & kBinary) ? kTRUE : kFALSE;
Bool_t force = (opt & kForce) ? kTRUE : kFALSE;
Bool_t fw = (opt & kForward) ? kTRUE : kFALSE;
Int_t cpopt = 0;
if ((opt & kCp)) cpopt |= kCp;
if ((opt & kCpBin)) cpopt |= (kCp | kCpBin);
const Int_t kMAXBUF = 32768;
char buf[kMAXBUF];
Int_t nsl = 0;
TIter next(slaves);
TSlave *sl;
TString fnam(rfile);
if (fnam == "cache") {
fnam += TString::Format(":%s", gSystem->BaseName(file));
} else if (fnam.IsNull()) {
fnam = gSystem->BaseName(file);
}
fStatus = 0;
while ((sl = (TSlave *)next())) {
if (!sl->IsValid())
continue;
Bool_t sendto = force ? kTRUE : CheckFile(file, sl, modtime, cpopt);
PDB(kPackage,2) {
const char *snd = (sl->fSlaveType == TSlave::kSlave && sendto) ? "" : "not";
Info("SendFile", "%s sending file %s to: %s:%s (%d)", snd,
file, sl->GetName(), sl->GetOrdinal(), sendto);
}
if (sl->fSlaveType == TSlave::kSlave && !sendto)
continue;
Long64_t siz = sendto ? size : 0;
snprintf(buf, kMAXBUF, "%s %d %lld %d", fnam.Data(), bin, siz, fw);
if (sl->GetSocket()->Send(buf, kPROOF_SENDFILE) == -1) {
MarkBad(sl, "could not send kPROOF_SENDFILE request");
continue;
}
if (sendto) {
lseek(fd, 0, SEEK_SET);
Int_t len;
do {
while ((len = read(fd, buf, kMAXBUF)) < 0 && TSystem::GetErrno() == EINTR)
TSystem::ResetErrno();
if (len < 0) {
SysError("SendFile", "error reading from file %s", file);
Interrupt(kSoftInterrupt, kActive);
close(fd);
return -1;
}
if (len > 0 && sl->GetSocket()->SendRaw(buf, len) == -1) {
SysError("SendFile", "error writing to slave %s:%s (now offline)",
sl->GetName(), sl->GetOrdinal());
MarkBad(sl, "sendraw failure");
sl = 0;
break;
}
} while (len > 0);
nsl++;
}
if (sl)
Collect(sl, fCollectTimeout, kPROOF_SENDFILE);
}
close(fd);
if (slaves != fActiveSlaves && slaves != fUniqueSlaves)
SafeDelete(slaves);
return (fStatus != 0) ? -1 : nsl;
}
Int_t TProof::Echo(const TObject *obj)
{
if (!IsValid() || !obj) return -1;
TMessage mess(kPROOF_ECHO);
mess.WriteObject(obj);
return Broadcast(mess);
}
Int_t TProof::Echo(const char *str)
{
TObjString *os = new TObjString(str);
Int_t rv = Echo(os);
delete os;
return rv;
}
Int_t TProof::SendObject(const TObject *obj, ESlaves list)
{
if (!IsValid() || !obj) return -1;
TMessage mess(kMESS_OBJECT);
mess.WriteObject(obj);
return Broadcast(mess, list);
}
Int_t TProof::SendPrint(Option_t *option)
{
if (!IsValid()) return -1;
Broadcast(option, kPROOF_PRINT, kActive);
return Collect(kActive, fCollectTimeout);
}
void TProof::SetLogLevel(Int_t level, UInt_t mask)
{
char str[32];
fLogLevel = level;
gProofDebugLevel = level;
gProofDebugMask = (TProofDebug::EProofDebugMask) mask;
snprintf(str, 32, "%d %u", level, mask);
Broadcast(str, kPROOF_LOGLEVEL, kAll);
}
void TProof::SetRealTimeLog(Bool_t on)
{
if (IsValid()) {
TMessage mess(kPROOF_REALTIMELOG);
mess << on;
Broadcast(mess);
} else {
Warning("SetRealTimeLog","session is invalid - do nothing");
}
}
Int_t TProof::SetParallelSilent(Int_t nodes, Bool_t random)
{
if (!IsValid()) return -1;
if (TestBit(TProof::kIsMaster)) {
if (!fDynamicStartup) GoParallel(nodes, kFALSE, random);
return SendCurrentState();
} else {
if (nodes < 0) {
PDB(kGlobal,1) Info("SetParallelSilent", "request all nodes");
} else {
PDB(kGlobal,1) Info("SetParallelSilent", "request %d node%s", nodes,
nodes == 1 ? "" : "s");
}
TMessage mess(kPROOF_PARALLEL);
mess << nodes << random;
Broadcast(mess);
Collect(kActive, fCollectTimeout);
Int_t n = GetParallel();
PDB(kGlobal,1) Info("SetParallelSilent", "got %d node%s", n, n == 1 ? "" : "s");
return n;
}
}
Int_t TProof::SetParallel(Int_t nodes, Bool_t random)
{
if (fDynamicStartup && nodes < 0) {
if (gSystem->Getenv("PROOF_NWORKERS")) gSystem->Unsetenv("PROOF_NWORKERS");
}
Int_t n = SetParallelSilent(nodes, random);
if (TestBit(TProof::kIsClient)) {
if (n < 1) {
Printf("PROOF set to sequential mode");
} else {
TString subfix = (n == 1) ? "" : "s";
if (random)
subfix += ", randomly selected";
Printf("PROOF set to parallel mode (%d worker%s)", n, subfix.Data());
}
} else if (fDynamicStartup && nodes >= 0) {
if (gSystem->Getenv("PROOF_NWORKERS")) gSystem->Unsetenv("PROOF_NWORKERS");
gSystem->Setenv("PROOF_NWORKERS", TString::Format("%d", nodes));
}
return n;
}
Int_t TProof::GoMoreParallel(Int_t nWorkersToAdd)
{
if (!IsValid() || !IsMaster() || IsIdle()) {
Error("GoMoreParallel", "Can't invoke here -- should not happen!");
return -1;
}
if (!gProofServ) {
Error("GoMoreParallel", "No ProofServ available -- should not happen!");
return -1;
}
TSlave *sl = 0x0;
TIter next( fSlaves );
Int_t nAddedWorkers = 0;
while (((nAddedWorkers < nWorkersToAdd) || (nWorkersToAdd == -1)) &&
(( sl = dynamic_cast<TSlave *>( next() ) ))) {
if ((sl->GetSlaveType() != TSlave::kSlave) &&
(sl->GetSlaveType() != TSlave::kMaster)) {
Error("GoMoreParallel", "TSlave is neither a Master nor a Slave: %s:%s",
sl->GetName(), sl->GetOrdinal());
R__ASSERT(0);
}
if ((!sl->IsValid()) || (fBadSlaves->FindObject(sl)) ||
(strcmp("IGNORE", sl->GetImage()) == 0)) {
PDB(kGlobal, 2)
Info("GoMoreParallel", "Worker %s:%s won't be considered",
sl->GetName(), sl->GetOrdinal());
continue;
}
if (fActiveSlaves->FindObject(sl)) {
Info("GoMoreParallel", "Worker %s:%s is already active: skipping",
sl->GetName(), sl->GetOrdinal());
continue;
}
if (sl->GetSlaveType() == TSlave::kSlave) {
sl->SetStatus(TSlave::kActive);
fActiveSlaves->Add(sl);
fInactiveSlaves->Remove(sl);
fActiveMonitor->Add(sl->GetSocket());
nAddedWorkers++;
PDB(kGlobal, 2)
Info("GoMoreParallel", "Worker %s:%s marked as active!",
sl->GetName(), sl->GetOrdinal());
}
else {
Error("GoMoreParallel", "Dynamic addition of master is not supported");
R__ASSERT(0);
}
}
PDB(kGlobal, 3)
Info("GoMoreParallel", "Will invoke AskStatistics() -- implies a Collect()");
AskStatistics();
PDB(kGlobal, 3)
Info("GoMoreParallel", "Will invoke FindUniqueSlaves()");
FindUniqueSlaves();
PDB(kGlobal, 3)
Info("GoMoreParallel", "Will invoke SendGroupView()");
SendGroupView();
PDB(kGlobal, 3)
Info("GoMoreParallel", "Will invoke GetParallel()");
Int_t nTotalWorkers = GetParallel();
TString s;
s.Form("PROOF just went more parallel (%d additional worker%s, %d worker%s total)",
nAddedWorkers, (nAddedWorkers == 1) ? "" : "s",
nTotalWorkers, (nTotalWorkers == 1) ? "" : "s");
gProofServ->SendAsynMessage(s);
Info("GoMoreParallel", "%s", s.Data());
return nTotalWorkers;
}
Int_t TProof::GoParallel(Int_t nodes, Bool_t attach, Bool_t random)
{
if (!IsValid()) return -1;
fActiveSlaves->Clear();
fActiveMonitor->RemoveAll();
TSlave *sl = 0;
TList *wlst = new TList;
TIter nxt(fSlaves);
fInactiveSlaves->Clear();
while ((sl = (TSlave *)nxt())) {
if (sl->IsValid() && !fBadSlaves->FindObject(sl)) {
if (strcmp("IGNORE", sl->GetImage()) == 0) continue;
if ((sl->GetSlaveType() != TSlave::kSlave) &&
(sl->GetSlaveType() != TSlave::kMaster)) {
Error("GoParallel", "TSlave is neither Master nor Slave");
R__ASSERT(0);
}
wlst->Add(sl);
fInactiveSlaves->Add(sl);
sl->SetStatus(TSlave::kInactive);
}
}
Int_t nwrks = (nodes < 0 || nodes > wlst->GetSize()) ? wlst->GetSize() : nodes;
int cnt = 0;
fEndMaster = TestBit(TProof::kIsMaster) ? kTRUE : kFALSE;
while (cnt < nwrks) {
if (random) {
Int_t iwrk = (Int_t) (gRandom->Rndm() * wlst->GetSize());
sl = (TSlave *) wlst->At(iwrk);
} else {
sl = (TSlave *) wlst->First();
}
if (!sl) {
Error("GoParallel", "attaching to candidate!");
break;
}
wlst->Remove(sl);
Int_t slavenodes = 0;
if (sl->GetSlaveType() == TSlave::kSlave) {
sl->SetStatus(TSlave::kActive);
fActiveSlaves->Add(sl);
fInactiveSlaves->Remove(sl);
fActiveMonitor->Add(sl->GetSocket());
slavenodes = 1;
} else if (sl->GetSlaveType() == TSlave::kMaster) {
fEndMaster = kFALSE;
TMessage mess(kPROOF_PARALLEL);
if (!attach) {
Int_t nn = (nodes < 0) ? -1 : nodes-cnt;
mess << nn;
} else {
mess.SetWhat(kPROOF_LOGFILE);
mess << -1 << -1;
}
if (sl->GetSocket()->Send(mess) == -1) {
MarkBad(sl, "could not send kPROOF_PARALLEL or kPROOF_LOGFILE request");
slavenodes = 0;
} else {
Collect(sl, fCollectTimeout);
if (sl->IsValid()) {
sl->SetStatus(TSlave::kActive);
fActiveSlaves->Add(sl);
fInactiveSlaves->Remove(sl);
fActiveMonitor->Add(sl->GetSocket());
if (sl->GetParallel() > 0) {
slavenodes = sl->GetParallel();
} else {
slavenodes = 1;
}
} else {
MarkBad(sl, "collect failed after kPROOF_PARALLEL or kPROOF_LOGFILE request");
slavenodes = 0;
}
}
}
cnt += slavenodes;
}
wlst->SetOwner(0);
SafeDelete(wlst);
AskStatistics();
FindUniqueSlaves();
if (!attach)
SendGroupView();
Int_t n = GetParallel();
if (TestBit(TProof::kIsClient)) {
if (n < 1)
printf("PROOF set to sequential mode\n");
else
printf("PROOF set to parallel mode (%d worker%s)\n",
n, n == 1 ? "" : "s");
}
PDB(kGlobal,1) Info("GoParallel", "got %d node%s", n, n == 1 ? "" : "s");
return n;
}
void TProof::ShowData()
{
if (!IsValid() || !fManager) return;
fManager->Find("~/data", "-type f", "all");
}
void TProof::ClearData(UInt_t what, const char *dsname)
{
if (!IsValid() || !fManager) return;
TString prompt, a("Y");
Bool_t force = (what & kForceClear) ? kTRUE : kFALSE;
Bool_t doask = (!force && IsTty()) ? kTRUE : kFALSE;
if ((what & TProof::kPurge)) {
if (doask && !Prompt("Do you really want to remove all data files")) return;
if (fManager->Rm("~/data/*", "-rf", "all") < 0)
Warning("ClearData", "problems purging data directory");
return;
} else if ((what & TProof::kDataset)) {
if (!dsname || strlen(dsname) <= 0) {
Error("ClearData", "dataset name mandatory when removing a full dataset");
return;
}
if (!ExistsDataSet(dsname)) {
Error("ClearData", "dataset '%s' does not exists", dsname);
return;
}
TFileCollection *fc = GetDataSet(dsname);
if (!fc) {
Error("ClearData", "could not retrieve info about dataset '%s'", dsname);
return;
}
TString pmpt = TString::Format("Do you really want to remove all data files"
" of dataset '%s'", dsname);
if (doask && !Prompt(pmpt.Data())) return;
Bool_t rmds = kTRUE;
TIter nxf(fc->GetList());
TFileInfo *fi = 0;
Int_t rfiles = 0, nfiles = fc->GetList()->GetSize();
while ((fi = (TFileInfo *) nxf())) {
TString host, file;
if (!(fi->GetFirstUrl())) {
Error("ClearData", "GetFirstUrl() returns NULL for '%s' - skipping",
fi->GetName());
continue;
}
TUrl uf(*(fi->GetFirstUrl()));
file = uf.GetFile();
host = uf.GetHost();
Int_t nurl = fi->GetNUrls();
fi->ResetUrl();
TUrl *up = 0;
while (nurl-- && fi->NextUrl()) {
up = fi->GetCurrentUrl();
if (!strcmp(up->GetProtocol(), "file")) {
TString opt(up->GetOptions());
if (opt.BeginsWith("node=")) {
host=opt;
host.ReplaceAll("node=","");
file = up->GetFile();
break;
}
}
}
if (fManager->Rm(file.Data(), "-f", host.Data()) != 0) {
Error("ClearData", "problems removing '%s'", file.Data());
rmds = kFALSE;
}
rfiles++;
ClearDataProgress(rfiles, nfiles);
}
fprintf(stderr, "\n");
if (rmds) {
RemoveDataSet(dsname);
}
} else if (what & TProof::kUnregistered) {
TString outtmp("ProofClearData_");
FILE *ftmp = gSystem->TempFileName(outtmp);
if (!ftmp) {
Error("ClearData", "cannot create temp file for logs");
return;
}
fclose(ftmp);
RedirectHandle_t h;
gSystem->RedirectOutput(outtmp.Data(), "w", &h);
ShowData();
gSystem->RedirectOutput(0, 0, &h);
std::ifstream in;
in.open(outtmp.Data());
if (!in.is_open()) {
Error("ClearData", "could not open temp file for logs: %s", outtmp.Data());
gSystem->Unlink(outtmp);
return;
}
Int_t nfiles = 0;
TMap *afmap = new TMap;
TString line, host, file;
Int_t from = 0;
while (in.good()) {
line.ReadLine(in);
if (line.IsNull()) continue;
while (line.EndsWith("\n")) { line.Strip(TString::kTrailing, '\n'); }
from = 0;
host = "";
if (!line.Tokenize(host, from, "| ")) continue;
file = "";
if (!line.Tokenize(file, from, "| ")) continue;
if (!host.IsNull() && !file.IsNull()) {
TList *fl = (TList *) afmap->GetValue(host.Data());
if (!fl) {
fl = new TList();
fl->SetName(host);
afmap->Add(new TObjString(host), fl);
}
fl->Add(new TObjString(file));
nfiles++;
PDB(kDataset,2)
Info("ClearData", "added info for: h:%s, f:%s", host.Data(), file.Data());
} else {
Warning("ClearData", "found incomplete line: '%s'", line.Data());
}
}
in.close();
gSystem->Unlink(outtmp);
TString sel = TString::Format("/%s/%s/", GetGroup(), GetUser());
TMap *fcmap = GetDataSets(sel);
if (!fcmap || (fcmap && fcmap->GetSize() <= 0)) {
PDB(kDataset,1)
Warning("ClearData", "no dataset beloning to '%s'", sel.Data());
SafeDelete(fcmap);
}
TString opt;
TObjString *os = 0;
if (fcmap) {
TIter nxfc(fcmap);
while ((os = (TObjString *) nxfc())) {
TFileCollection *fc = 0;
if ((fc = (TFileCollection *) fcmap->GetValue(os))) {
TFileInfo *fi = 0;
TIter nxfi(fc->GetList());
while ((fi = (TFileInfo *) nxfi())) {
fi->ResetUrl();
Int_t nurl = fi->GetNUrls();
TUrl *up = 0;
while (nurl-- && fi->NextUrl()) {
up = fi->GetCurrentUrl();
if (!strcmp(up->GetProtocol(), "file")) {
opt = up->GetOptions();
if (opt.BeginsWith("node=")) {
host=opt;
host.ReplaceAll("node=","");
file = up->GetFile();
PDB(kDataset,2)
Info("ClearData", "found: host: %s, file: %s", host.Data(), file.Data());
TList *fl = (TList *) afmap->GetValue(host.Data());
if (fl) {
TObjString *fn = (TObjString *) fl->FindObject(file.Data());
if (fn) {
fl->Remove(fn);
SafeDelete(fn);
nfiles--;
} else {
Warning("ClearData",
"registered file '%s' not found in the full list!",
file.Data());
}
}
break;
}
}
}
}
}
}
if (fcmap) fcmap->SetOwner(kTRUE);
SafeDelete(fcmap);
}
Info("ClearData", "%d unregistered files to be removed:", nfiles);
afmap->Print();
TString pmpt = TString::Format("Do you really want to remove all %d"
" unregistered data files", nfiles);
if (doask && !Prompt(pmpt.Data())) return;
Int_t rfiles = 0;
TIter nxls(afmap);
while ((os = (TObjString *) nxls())) {
TList *fl = 0;
if ((fl = (TList *) afmap->GetValue(os))) {
TIter nxf(fl);
TObjString *fn = 0;
while ((fn = (TObjString *) nxf())) {
if (fManager->Rm(fn->GetName(), "-f", os->GetName()) != 0) {
Error("ClearData", "problems removing '%s' on host '%s'",
fn->GetName(), os->GetName());
}
rfiles++;
ClearDataProgress(rfiles, nfiles);
}
}
}
fprintf(stderr, "\n");
afmap->SetOwner(kTRUE);
SafeDelete(afmap);
}
}
Bool_t TProof::Prompt(const char *p)
{
TString pp(p);
if (!pp.Contains("?")) pp += "?";
if (!pp.Contains("[y/N]")) pp += " [y/N]";
TString a = Getline(pp.Data());
if (a != "\n" && a[0] != 'y' && a[0] != 'Y' && a[0] != 'n' && a[0] != 'N') {
Printf("Please answer y, Y, n or N");
return kFALSE;
} else if (a == "\n" || a[0] == 'n' || a[0] == 'N') {
return kFALSE;
}
return kTRUE;
}
void TProof::ClearDataProgress(Int_t r, Int_t t)
{
fprintf(stderr, "[TProof::ClearData] Total %5d files\t|", t);
for (Int_t l = 0; l < 20; l++) {
if (r > 0 && t > 0) {
if (l < 20*r/t)
fprintf(stderr, "=");
else if (l == 20*r/t)
fprintf(stderr, ">");
else if (l > 20*r/t)
fprintf(stderr, ".");
} else
fprintf(stderr, "=");
}
fprintf(stderr, "| %.02f %% \r", 100.0*(t ? (r/t) : 1));
}
void TProof::ShowCache(Bool_t all)
{
if (!IsValid()) return;
TMessage mess(kPROOF_CACHE);
mess << Int_t(kShowCache) << all;
Broadcast(mess, kUnique);
if (all) {
TMessage mess2(kPROOF_CACHE);
mess2 << Int_t(kShowSubCache) << all;
Broadcast(mess2, fNonUniqueMasters);
Collect(kAllUnique, fCollectTimeout);
} else {
Collect(kUnique, fCollectTimeout);
}
}
void TProof::ClearCache(const char *file)
{
if (!IsValid()) return;
TMessage mess(kPROOF_CACHE);
mess << Int_t(kClearCache) << TString(file);
Broadcast(mess, kUnique);
TMessage mess2(kPROOF_CACHE);
mess2 << Int_t(kClearSubCache) << TString(file);
Broadcast(mess2, fNonUniqueMasters);
Collect(kAllUnique);
fFileMap.clear();
}
void TProof::SystemCmd(const char *cmd, Int_t fdout)
{
if (fdout < 0) {
gSystem->Exec(cmd);
} else {
FILE *fin = gSystem->OpenPipe(cmd, "r");
if (fin) {
char line[2048];
while (fgets(line, 2048, fin)) {
Int_t r = strlen(line);
if (r > 0) {
if (write(fdout, line, r) < 0) {
::Warning("TProof::SystemCmd",
"errno %d writing to file descriptor %d",
TSystem::GetErrno(), fdout);
}
} else {
break;
}
}
gSystem->ClosePipe(fin);
}
}
}
void TProof::ShowPackages(Bool_t all, Bool_t redirlog)
{
if (!IsValid()) return;
Bool_t oldredir = fRedirLog;
if (redirlog) fRedirLog = kTRUE;
FILE *fout = (fRedirLog) ? fLogFileW : stdout;
if (!fout) {
Warning("ShowPackages", "file descriptor for outputs undefined (%p):"
" will not log msgs", fout);
return;
}
lseek(fileno(fout), (off_t) 0, SEEK_END);
if (TestBit(TProof::kIsClient)) {
if (fGlobalPackageDirList && fGlobalPackageDirList->GetSize() > 0) {
TIter nxd(fGlobalPackageDirList);
TNamed *nm = 0;
while ((nm = (TNamed *)nxd())) {
fprintf(fout, "*** Global Package cache %s client:%s ***\n",
nm->GetName(), nm->GetTitle());
fflush(fout);
SystemCmd(TString::Format("%s %s", kLS, nm->GetTitle()), fileno(fout));
fprintf(fout, "\n");
fflush(fout);
}
}
fprintf(fout, "*** Package cache client:%s ***\n", fPackageDir.Data());
fflush(fout);
SystemCmd(TString::Format("%s %s", kLS, fPackageDir.Data()), fileno(fout));
fprintf(fout, "\n");
}
if (IsLite()) {
fRedirLog = oldredir;
return;
}
TMessage mess(kPROOF_CACHE);
mess << Int_t(kShowPackages) << all;
Broadcast(mess, kUnique);
if (all) {
TMessage mess2(kPROOF_CACHE);
mess2 << Int_t(kShowSubPackages) << all;
Broadcast(mess2, fNonUniqueMasters);
Collect(kAllUnique, fCollectTimeout);
} else {
Collect(kUnique, fCollectTimeout);
}
fRedirLog = oldredir;
}
void TProof::ShowEnabledPackages(Bool_t all)
{
if (!IsValid()) return;
if (TestBit(TProof::kIsClient)) {
printf("*** Enabled packages on client on %s\n", gSystem->HostName());
TIter next(fEnabledPackagesOnClient);
while (TObjString *str = (TObjString*) next())
printf("%s\n", str->GetName());
}
if (IsLite()) return;
TMessage mess(kPROOF_CACHE);
mess << Int_t(kShowEnabledPackages) << all;
Broadcast(mess);
Collect(kActive, fCollectTimeout);
}
Int_t TProof::ClearPackages()
{
if (!IsValid()) return -1;
if (UnloadPackages() == -1)
return -1;
if (DisablePackages() == -1)
return -1;
return fStatus;
}
Int_t TProof::ClearPackage(const char *package)
{
if (!IsValid()) return -1;
if (!package || !package[0]) {
Error("ClearPackage", "need to specify a package name");
return -1;
}
TString pac = package;
if (pac.EndsWith(".par"))
pac.Remove(pac.Length()-4);
pac = gSystem->BaseName(pac);
if (UnloadPackage(pac) == -1)
return -1;
if (DisablePackage(pac) == -1)
return -1;
return fStatus;
}
Int_t TProof::DisablePackage(const char *package)
{
if (!IsValid()) return -1;
if (!package || !package[0]) {
Error("DisablePackage", "need to specify a package name");
return -1;
}
TString pac = package;
if (pac.EndsWith(".par"))
pac.Remove(pac.Length()-4);
pac = gSystem->BaseName(pac);
if (DisablePackageOnClient(pac) == -1)
return -1;
if (IsLite()) return 0;
Int_t st = -1;
Bool_t done = kFALSE;
if (fManager) {
TString path;
path.Form("~/packages/%s", package);
if (fManager->Rm(path, "-rf", "all") != -1) {
path.Append(".par");
if (fManager->Rm(path, "-f", "all") != -1) {
done = kTRUE;
st = 0;
}
}
}
if (!done) {
TMessage mess(kPROOF_CACHE);
mess << Int_t(kDisablePackage) << pac;
Broadcast(mess, kUnique);
TMessage mess2(kPROOF_CACHE);
mess2 << Int_t(kDisableSubPackage) << pac;
Broadcast(mess2, fNonUniqueMasters);
Collect(kAllUnique);
st = fStatus;
}
return st;
}
Int_t TProof::DisablePackageOnClient(const char *pack)
{
TString s;
if (TestBit(TProof::kIsClient)) {
fPackageLock->Lock();
s.Form("%s %s/%s", kRM, fPackageDir.Data(), pack);
gSystem->Exec(s.Data());
s.Form("%s %s/%s.par", kRM, fPackageDir.Data(), pack);
gSystem->Exec(s.Data());
s.Form("%s %s/%s/%s.par", kRM, fPackageDir.Data(), kPROOF_PackDownloadDir, pack);
gSystem->Exec(s.Data());
fPackageLock->Unlock();
s.Form("%s/%s/%s.par", fPackageDir.Data(), kPROOF_PackDownloadDir, pack);
if (!gSystem->AccessPathName(s.Data()))
Warning("DisablePackageOnClient",
"unable to remove cached package PAR file for %s (%s)", pack, s.Data());
s.Form("%s/%s.par", fPackageDir.Data(), pack);
if (!gSystem->AccessPathName(s.Data()))
Warning("DisablePackageOnClient",
"unable to remove package PAR file for %s (%s)", pack, s.Data());
s.Form("%s/%s", fPackageDir.Data(), pack);
if (!gSystem->AccessPathName(s.Data()))
Warning("DisablePackageOnClient",
"unable to remove package directory for %s (%s)", pack, s.Data());
}
return 0;
}
Int_t TProof::DisablePackages()
{
if (!IsValid()) return -1;
if (TestBit(TProof::kIsClient)) {
fPackageLock->Lock();
gSystem->Exec(TString::Format("%s %s/*", kRM, fPackageDir.Data()));
fPackageLock->Unlock();
}
if (IsLite()) return 0;
Int_t st = -1;
Bool_t done = kFALSE;
if (fManager) {
if (fManager->Rm("~/packages/*", "-rf", "all") != -1) {
done = kTRUE;
st = 0;
}
}
if (!done) {
TMessage mess(kPROOF_CACHE);
mess << Int_t(kDisablePackages);
Broadcast(mess, kUnique);
TMessage mess2(kPROOF_CACHE);
mess2 << Int_t(kDisableSubPackages);
Broadcast(mess2, fNonUniqueMasters);
Collect(kAllUnique);
st = fStatus;
}
return st;
}
Int_t TProof::BuildPackage(const char *package, EBuildPackageOpt opt, Int_t chkveropt)
{
if (!IsValid()) return -1;
if (!package || !package[0]) {
Error("BuildPackage", "need to specify a package name");
return -1;
}
TString pac = package;
if (pac.EndsWith(".par"))
pac.Remove(pac.Length()-4);
pac = gSystem->BaseName(pac);
Bool_t buildOnClient = kTRUE;
if (opt == kDontBuildOnClient) {
buildOnClient = kFALSE;
opt = kBuildAll;
}
TString pdir;
Int_t st = 0;
if (buildOnClient) {
if (TestBit(TProof::kIsClient) && fPackageLock) fPackageLock->Lock();
if ((st = BuildPackageOnClient(pac, 1, &pdir, chkveropt) != 0)) {
if (TestBit(TProof::kIsClient) && fPackageLock) fPackageLock->Unlock();
return -1;
}
}
if (opt <= kBuildAll && (!IsLite() || !buildOnClient)) {
TMessage mess(kPROOF_CACHE);
mess << Int_t(kBuildPackage) << pac << chkveropt;
Broadcast(mess, kUnique);
TMessage mess2(kPROOF_CACHE);
mess2 << Int_t(kBuildSubPackage) << pac << chkveropt;
Broadcast(mess2, fNonUniqueMasters);
}
if (opt >= kBuildAll) {
if (buildOnClient) {
st = BuildPackageOnClient(pac, 2, &pdir, chkveropt);
if (TestBit(TProof::kIsClient) && fPackageLock) fPackageLock->Unlock();
}
fStatus = 0;
if (!IsLite() || !buildOnClient)
Collect(kAllUnique);
if (fStatus < 0 || st < 0)
return -1;
}
return 0;
}
Int_t TProof::BuildPackageOnClient(const char *pack, Int_t opt, TString *path, Int_t chkveropt)
{
TString downloaddir;
downloaddir.Form("%s/%s", fPackageDir.Data(), kPROOF_PackDownloadDir);
if (opt != 0 && !path) {
Error("BuildPackageOnClient", "for opt=%d != 0 'patyh' must be defined", opt);
return -1;
}
if (TestBit(TProof::kIsClient)) {
Int_t status = 0;
TString pdir, ocwd;
if (opt == 0 || opt == 1) {
pdir.Form("%s/%s", fPackageDir.Data(), pack);
if (gSystem->AccessPathName(pdir, kReadPermission) ||
gSystem->AccessPathName(pdir + "/PROOF-INF", kReadPermission)) {
pdir = "";
if (fGlobalPackageDirList && fGlobalPackageDirList->GetSize() > 0) {
TIter nxd(fGlobalPackageDirList);
TNamed *nm = 0;
while ((nm = (TNamed *)nxd())) {
pdir = Form("%s/%s", nm->GetTitle(), pack);
if (!gSystem->AccessPathName(pdir, kReadPermission) &&
!gSystem->AccessPathName(pdir + "/PROOF-INF", kReadPermission)) {
break;
}
pdir = "";
}
}
} else {
TString tpar(pdir);
if (!tpar.EndsWith(".par")) tpar += ".par";
Bool_t badPAR = kTRUE;
FileStat_t stpar;
if (gSystem->GetPathInfo(tpar, stpar) == 0) {
#ifndef WIN32
char ctmp[1024];
if (!R_ISLNK(stpar.fMode) || readlink(tpar.Data(), ctmp, 1024) > 0) {
badPAR = kFALSE;
}
#else
badPAR = kFALSE;
#endif
}
if (badPAR) {
gSystem->Exec(TString::Format("%s %s", kRM, pdir.Data()));
gSystem->Exec(TString::Format("%s %s", kRM, tpar.Data()));
pdir = "";
}
}
Bool_t wasDownloaded = kFALSE;
TString dlpar;
dlpar.Form("%s/%s", downloaddir.Data(), gSystem->BaseName(pack));
if (!dlpar.EndsWith(".par")) dlpar += ".par";
if (!pdir.IsNull()) {
if (!gSystem->AccessPathName(dlpar, kFileExists))
wasDownloaded = kTRUE;
}
if (pdir.IsNull() || wasDownloaded) {
if (DownloadPackage(pack, downloaddir) != 0) {
Error("BuildPackageOnClient",
"PAR file '%s.par' not found and could not be downloaded", pack);
return -1;
} else {
TMD5 *md5 = TMD5::FileChecksum(dlpar);
if (UploadPackageOnClient(dlpar, kUntar, md5) == -1) {
Error("BuildPackageOnClient",
"PAR file '%s.par' not found and could not be unpacked locally", pack);
delete md5;
return -1;
}
delete md5;
pdir.Form("%s/%s", fPackageDir.Data(), pack);
}
} else if (pdir.IsNull()) {
Error("BuildPackageOnClient", "PAR file '%s.par' not found", pack);
return -1;
}
PDB(kPackage, 1)
Info("BuildPackageOnClient", "package %s exists and has PROOF-INF directory", pack);
if (opt == 1) {
*path = pdir;
return 0;
}
}
if (opt == 0 || opt == 2) {
if (opt == 2) pdir = path->Data();
ocwd = gSystem->WorkingDirectory();
gSystem->ChangeDirectory(pdir);
if (!gSystem->AccessPathName("PROOF-INF/BUILD.sh")) {
Bool_t goodver = kTRUE;
Bool_t savever = kFALSE;
TString v, r;
FILE *f = fopen("PROOF-INF/proofvers.txt", "r");
if (f) {
v.Gets(f);
r.Gets(f);
fclose(f);
if (chkveropt == kCheckROOT || chkveropt == kCheckSVN) {
if (v != gROOT->GetVersion()) goodver = kFALSE;
if (goodver && chkveropt == kCheckSVN)
if (r != gROOT->GetGitCommit()) goodver = kFALSE;
}
}
if (!f || !goodver) {
savever = kTRUE;
Info("BuildPackageOnClient",
"%s: version change (current: %s:%s, build: %s:%s): cleaning ... ",
pack, gROOT->GetVersion(), gROOT->GetGitCommit(), v.Data(), r.Data());
gSystem->ChangeDirectory(fPackageDir);
gSystem->Exec(TString::Format("%s %s", kRM, pdir.Data()));
char *gunzip = gSystem->Which(gSystem->Getenv("PATH"), kGUNZIP, kExecutePermission);
if (gunzip) {
TString par = TString::Format("%s.par", pdir.Data());
TString cmd(TString::Format(kUNTAR3, gunzip, par.Data()));
status = gSystem->Exec(cmd);
if ((status = gSystem->Exec(cmd))) {
Error("BuildPackageOnClient", "failure executing: %s", cmd.Data());
} else {
gSystem->ChangeDirectory(pdir);
}
delete [] gunzip;
} else {
Error("BuildPackageOnClient", "%s not found", kGUNZIP);
status = -1;
}
}
if (gSystem->Exec("export ROOTPROOFCLIENT=\"1\" ; PROOF-INF/BUILD.sh")) {
Error("BuildPackageOnClient", "building package %s on the client failed", pack);
status = -1;
}
if (savever && !status) {
f = fopen("PROOF-INF/proofvers.txt", "w");
if (f) {
fputs(gROOT->GetVersion(), f);
fputs(TString::Format("\n%s", gROOT->GetGitCommit()), f);
fclose(f);
}
}
} else {
PDB(kPackage, 1)
Info("BuildPackageOnClient",
"package %s exists but has no PROOF-INF/BUILD.sh script", pack);
}
gSystem->ChangeDirectory(ocwd);
return status;
}
}
return 0;
}
Int_t TProof::LoadPackage(const char *package, Bool_t notOnClient,
TList *loadopts, TList *workers)
{
if (!IsValid()) return -1;
if (!package || !package[0]) {
Error("LoadPackage", "need to specify a package name");
return -1;
}
TString pac = package;
if (pac.EndsWith(".par"))
pac.Remove(pac.Length()-4);
pac = gSystem->BaseName(pac);
if (!notOnClient)
if (LoadPackageOnClient(pac, loadopts) == -1)
return -1;
TMessage mess(kPROOF_CACHE);
mess << Int_t(kLoadPackage) << pac;
if (loadopts) mess << loadopts;
Bool_t deactivateOnFailure = (IsMaster()) ? kTRUE : kFALSE;
if (workers) {
PDB(kPackage, 3)
Info("LoadPackage", "Sending load message to selected workers only");
Broadcast(mess, workers);
Collect(workers, -1, -1, deactivateOnFailure);
}
else {
Broadcast(mess);
Collect(kActive, -1, -1, deactivateOnFailure);
}
return fStatus;
}
Int_t TProof::LoadPackageOnClient(const char *pack, TList *loadopts)
{
if (TestBit(TProof::kIsClient)) {
Int_t status = 0;
TString pdir, ocwd;
if (fEnabledPackagesOnClient->FindObject(pack)) {
Info("LoadPackageOnClient", "package %s already loaded", pack);
return 0;
}
pdir.Form("%s/%s", fPackageDir.Data(), pack);
if (gSystem->AccessPathName(pdir, kReadPermission)) {
if (fGlobalPackageDirList && fGlobalPackageDirList->GetSize() > 0) {
TIter nxd(fGlobalPackageDirList);
TNamed *nm = 0;
while ((nm = (TNamed *)nxd())) {
pdir.Form("%s/%s", nm->GetTitle(), pack);
if (!gSystem->AccessPathName(pdir, kReadPermission)) {
break;
}
pdir = "";
}
if (pdir.Length() <= 0) {
Error("LoadPackageOnClient", "failure locating %s ...", pack);
return -1;
}
}
}
ocwd = gSystem->WorkingDirectory();
gSystem->ChangeDirectory(pdir);
if (!gSystem->AccessPathName("PROOF-INF/SETUP.C")) {
TString setup, setupfn;
setup.Form("SETUP_%d_%x", gSystem->GetPid(), TString(pack).Hash());
setupfn.Form("%s/%s.C", gSystem->TempDirectory(), setup.Data());
TMacro setupmc("PROOF-INF/SETUP.C");
TObjString *setupline = setupmc.GetLineWith("SETUP(");
if (setupline) {
TString setupstring(setupline->GetString());
setupstring.ReplaceAll("SETUP(", TString::Format("%s(", setup.Data()));
setupline->SetString(setupstring);
} else {
Warning("LoadPackageOnClient", "macro '%s/PROOF-INF/SETUP.C' does not contain a SETUP()"
" function", pack);
}
setupmc.SaveSource(setupfn.Data());
if (gROOT->LoadMacro(setupfn.Data()) != 0) {
Error("LoadPackageOnClient", "macro '%s/PROOF-INF/SETUP.C' could not be loaded:"
" cannot continue", pack);
status = -1;
} else {
TFunction *fun = (TFunction *) gROOT->GetListOfGlobalFunctions()->FindObject(setup);
if (!fun) {
Error("LoadPackageOnClient", "function SETUP() not found in macro '%s/PROOF-INF/SETUP.C':"
" cannot continue", pack);
status = -1;
} else {
TMethodCall callEnv;
if (fun->GetNargs() == 0) {
callEnv.Init(fun);
if (loadopts)
Warning("LoadPackageOnClient", "loaded SETUP() does not take any argument:"
" the specified TList object will be ignored");
} else if (fun->GetNargs() == 1) {
TMethodArg *arg = (TMethodArg *) fun->GetListOfMethodArgs()->First();
if (arg) {
callEnv.Init(fun);
TString argsig(arg->GetTitle());
if (argsig.BeginsWith("TList")) {
callEnv.ResetParam();
callEnv.SetParam((Long_t) loadopts);
} else if (argsig.BeginsWith("const char")) {
callEnv.ResetParam();
TObjString *os = loadopts ? dynamic_cast<TObjString *>(loadopts->First()) : 0;
if (os) {
callEnv.SetParam((Long_t) os->GetName());
} else {
if (loadopts && loadopts->First()) {
Warning("LoadPackageOnClient", "found object argument of type %s:"
" SETUP expects 'const char *': ignoring",
loadopts->First()->ClassName());
}
callEnv.SetParam((Long_t) 0);
}
} else {
Error("LoadPackageOnClient", "unsupported SETUP signature: SETUP(%s)"
" cannot continue", arg->GetTitle());
status = -1;
}
} else {
Error("LoadPackageOnClient", "cannot get information about the SETUP() argument:"
" cannot continue");
status = -1;
}
} else if (fun->GetNargs() > 1) {
Error("LoadPackageOnClient", "function SETUP() can have at most a 'TList *' argument:"
" cannot continue");
status = -1;
}
Long_t setuprc = (status == 0) ? 0 : -1;
if (status == 0) {
callEnv.Execute(setuprc);
if (setuprc < 0) status = -1;
}
}
}
if (!gSystem->AccessPathName(setupfn.Data())) gSystem->Unlink(setupfn.Data());
} else {
PDB(kPackage, 1)
Info("LoadPackageOnClient",
"package %s exists but has no PROOF-INF/SETUP.C script", pack);
}
gSystem->ChangeDirectory(ocwd);
if (status == 0) {
gSystem->AddIncludePath(TString("-I") + pdir);
gROOT->ProcessLine(TString(".I ") + pdir);
fEnabledPackagesOnClient->Add(new TObjString(pack));
PDB(kPackage, 1)
Info("LoadPackageOnClient", "package %s successfully loaded", pack);
} else
Error("LoadPackageOnClient", "loading package %s on client failed", pack);
return status;
}
return 0;
}
Int_t TProof::UnloadPackage(const char *package)
{
if (!IsValid()) return -1;
if (!package || !package[0]) {
Error("UnloadPackage", "need to specify a package name");
return -1;
}
TString pac = package;
if (pac.EndsWith(".par"))
pac.Remove(pac.Length()-4);
pac = gSystem->BaseName(pac);
if (UnloadPackageOnClient(pac) == -1)
return -1;
if (IsLite()) return 0;
TMessage mess(kPROOF_CACHE);
mess << Int_t(kUnloadPackage) << pac;
Broadcast(mess);
Collect();
return fStatus;
}
Int_t TProof::UnloadPackageOnClient(const char *package)
{
if (TestBit(TProof::kIsClient)) {
TObjString *pack = (TObjString *) fEnabledPackagesOnClient->FindObject(package);
if (pack) {
TString aclicincpath = gSystem->GetIncludePath();
TString cintincpath = gInterpreter->GetIncludePath();
aclicincpath.Remove(aclicincpath.Length() - cintincpath.Length() - 1);
aclicincpath.ReplaceAll(TString(" -I") + package, "");
gSystem->SetIncludePath(aclicincpath);
fEnabledPackagesOnClient->Remove(pack);
}
if (!gSystem->AccessPathName(package))
if (gSystem->Unlink(package) != 0)
Warning("UnloadPackageOnClient", "unable to remove symlink to %s", package);
delete pack;
}
return 0;
}
Int_t TProof::UnloadPackages()
{
if (!IsValid()) return -1;
if (TestBit(TProof::kIsClient)) {
TIter nextpackage(fEnabledPackagesOnClient);
while (TObjString *objstr = dynamic_cast<TObjString*>(nextpackage()))
if (UnloadPackageOnClient(objstr->String()) == -1 )
return -1;
}
if (IsLite()) return 0;
TMessage mess(kPROOF_CACHE);
mess << Int_t(kUnloadPackages);
Broadcast(mess);
Collect();
return fStatus;
}
Int_t TProof::EnablePackage(const char *package, Bool_t notOnClient,
TList *workers)
{
return EnablePackage(package, (TList *)0, notOnClient, workers);
}
Int_t TProof::EnablePackage(const char *package, const char *loadopts,
Bool_t notOnClient, TList *workers)
{
TList *optls = 0;
if (loadopts && strlen(loadopts)) {
if (fProtocol > 28) {
TObjString *os = new TObjString(loadopts);
os->String().ReplaceAll("checkversion=", "chkv=");
Ssiz_t fcv = kNPOS, lcv = kNPOS;
if ((fcv = os->String().Index("chkv=")) != kNPOS) {
TRegexp re("[; |]");
if ((lcv = os->String().Index(re, fcv)) == kNPOS) {
lcv = os->String().Length();
}
TString ocv = os->String()(fcv, lcv - fcv);
Int_t cvopt = -1;
if (ocv.EndsWith("=off") || ocv.EndsWith("=0"))
cvopt = (Int_t) kDontCheck;
else if (ocv.EndsWith("=on") || ocv.EndsWith("=1"))
cvopt = (Int_t) kCheckROOT;
else if (ocv.EndsWith("=svn") || ocv.EndsWith("=2"))
cvopt = (Int_t) kCheckSVN;
else
Warning("EnablePackage", "'checkversion' option unknown from argument: '%s' - ignored", ocv.Data());
if (cvopt > -1) {
if (gDebug > 0)
Info("EnablePackage", "setting check version option from argument: %d", cvopt);
optls = new TList;
optls->Add(new TParameter<Int_t>("PROOF_Package_CheckVersion", (Int_t) cvopt));
if (lcv != kNPOS && fcv == 0) ocv += os->String()[lcv];
if (fcv > 0 && os->String().Index(re, fcv - 1) == fcv - 1) os->String().Remove(fcv - 1, 1);
os->String().ReplaceAll(ocv.Data(), "");
}
}
if (!os->String().IsNull()) {
if (!optls) optls = new TList;
optls->Add(new TObjString(os->String().Data()));
}
if (optls) optls->SetOwner(kTRUE);
} else {
Warning("EnablePackage", "remote server does not support options: ignoring the option string");
}
}
Int_t rc = EnablePackage(package, optls, notOnClient, workers);
SafeDelete(optls);
return rc;
}
Int_t TProof::EnablePackage(const char *package, TList *loadopts,
Bool_t notOnClient, TList *workers)
{
if (!IsValid()) return -1;
if (!package || !package[0]) {
Error("EnablePackage", "need to specify a package name");
return -1;
}
TString pac = package;
if (pac.EndsWith(".par"))
pac.Remove(pac.Length()-4);
pac = gSystem->BaseName(pac);
EBuildPackageOpt opt = kBuildAll;
if (notOnClient)
opt = kDontBuildOnClient;
Int_t chkveropt = kCheckROOT;
TString ocv = gEnv->GetValue("Proof.Package.CheckVersion", "");
if (!ocv.IsNull()) {
if (ocv == "off" || ocv == "0")
chkveropt = (Int_t) kDontCheck;
else if (ocv == "on" || ocv == "1")
chkveropt = (Int_t) kCheckROOT;
else if (ocv == "svn" || ocv == "2")
chkveropt = (Int_t) kCheckSVN;
else
Warning("EnablePackage", "'checkversion' option unknown from rootrc: '%s' - ignored", ocv.Data());
}
if (loadopts) {
TParameter<Int_t> *pcv = (TParameter<Int_t> *) loadopts->FindObject("PROOF_Package_CheckVersion");
if (pcv) {
chkveropt = pcv->GetVal();
loadopts->Remove(pcv);
delete pcv;
}
}
if (gDebug > 0)
Info("EnablePackage", "using check version option: %d", chkveropt);
if (BuildPackage(pac, opt, chkveropt) == -1)
return -1;
TList *optls = (loadopts && loadopts->GetSize() > 0) ? loadopts : 0;
if (optls && fProtocol <= 28) {
Warning("EnablePackage", "remote server does not support options: ignoring the option list");
optls = 0;
}
if (LoadPackage(pac, notOnClient, optls, workers) == -1)
return -1;
return 0;
}
Int_t TProof::DownloadPackage(const char *pack, const char *dstdir)
{
if (!fManager || !(fManager->IsValid())) {
Error("DownloadPackage", "the manager is undefined!");
return -1;
}
TString parname(gSystem->BaseName(pack)), src, dst;
if (!parname.EndsWith(".par")) parname += ".par";
src.Form("packages/%s", parname.Data());
if (!dstdir || strlen(dstdir) <= 0) {
dst.Form("./%s", parname.Data());
} else {
FileStat_t st;
if (gSystem->GetPathInfo(dstdir, st) != 0) {
if (gSystem->mkdir(dstdir, kTRUE) != 0) {
Error("DownloadPackage",
"could not create the destination directory '%s' (errno: %d)",
dstdir, TSystem::GetErrno());
return -1;
}
} else if (!R_ISDIR(st.fMode) && !R_ISLNK(st.fMode)) {
Error("DownloadPackage",
"destination path '%s' exist but is not a directory!", dstdir);
return -1;
}
dst.Form("%s/%s", dstdir, parname.Data());
}
FileStat_t stsrc;
RedirectHandle_t rh;
if (gSystem->RedirectOutput(fLogFileName, "a", &rh) != 0)
Warning("DownloadPackage", "problems redirecting output to '%s'", fLogFileName.Data());
Int_t rc = fManager->Stat(src, stsrc);
if (gSystem->RedirectOutput(0, 0, &rh) != 0)
Warning("DownloadPackage", "problems restoring output");
if (rc != 0) {
ShowPackages(kFALSE, kTRUE);
TMacro *mp = GetLastLog();
if (mp) {
Bool_t isGlobal = kFALSE;
TIter nxl(mp->GetListOfLines());
TObjString *os = 0;
TString globaldir;
while ((os = (TObjString *) nxl())) {
TString s(os->GetName());
if (s.Contains("*** Global Package cache")) {
s.Remove(0, s.Last(':') + 1);
s.Remove(s.Last(' '));
globaldir = s;
isGlobal = kTRUE;
} else if (s.Contains("*** Package cache")) {
isGlobal = kFALSE;
globaldir = "";
}
if (isGlobal && s.Contains(parname)) {
src.Form("%s/%s", globaldir.Data(), parname.Data());
break;
}
}
delete mp;
}
}
if (fManager->GetFile(src, dst, "silent") != 0) {
Error("DownloadPackage", "problems downloading '%s' (src:%s, dst:%s)",
pack, src.Data(), dst.Data());
return -1;
} else {
Info("DownloadPackage", "'%s' cross-checked against master repository (local path: %s)",
pack, dst.Data());
}
return 0;
}
Int_t TProof::UploadPackage(const char *pack, EUploadPackageOpt opt,
TList *workers)
{
if (!IsValid()) return -1;
TString par(pack), base, name;
if (par.EndsWith(".par")) {
base = gSystem->BaseName(par);
name = base(0, base.Length() - strlen(".par"));
} else {
name = gSystem->BaseName(par);
base.Form("%s.par", name.Data());
par += ".par";
}
gSystem->ExpandPathName(par);
if (gSystem->AccessPathName(par, kReadPermission)) {
TString tried = par;
par.Form("%s/%s", fPackageDir.Data(), base.Data());
if (gSystem->AccessPathName(par, kReadPermission)) {
if (fGlobalPackageDirList && fGlobalPackageDirList->GetSize() > 0) {
TIter nxd(fGlobalPackageDirList);
TNamed *nm = 0;
TString pdir;
while ((nm = (TNamed *)nxd())) {
pdir.Form("%s/%s", nm->GetTitle(), name.Data());
if (!gSystem->AccessPathName(pdir, kReadPermission)) {
break;
}
pdir = "";
}
if (pdir.Length() > 0) {
if (gDebug > 0)
Info("UploadPackage", "global package found (%s): no upload needed",
pdir.Data());
return 0;
}
}
Error("UploadPackage", "PAR file '%s' not found; paths tried: %s, %s",
gSystem->BaseName(par), tried.Data(), par.Data());
return -1;
}
}
TMD5 *md5 = TMD5::FileChecksum(par);
if (TestBit(TProof::kIsClient)) {
if (!md5 || (md5 && UploadPackageOnClient(par, opt, md5) == -1)) {
if (md5) delete md5;
return -1;
}
}
if (IsLite()) {
delete md5;
return 0;
}
TString smsg;
smsg.Form("+%s", base.Data());
TMessage mess(kPROOF_CHECKFILE);
mess << smsg << (*md5);
TMessage mess2(kPROOF_CHECKFILE);
smsg.Replace(0, 1, "-");
mess2 << smsg << (*md5);
TMessage mess3(kPROOF_CHECKFILE);
smsg.Replace(0, 1, "=");
mess3 << smsg << (*md5);
delete md5;
if (fProtocol > 8) {
mess << (UInt_t) opt;
mess2 << (UInt_t) opt;
mess3 << (UInt_t) opt;
}
if (!workers)
workers = fUniqueSlaves;
TIter next(workers);
TSlave *sl = 0;
while ((sl = (TSlave *) next())) {
if (!sl->IsValid())
continue;
sl->GetSocket()->Send(mess);
fCheckFileStatus = 0;
Collect(sl, fCollectTimeout, kPROOF_CHECKFILE);
if (fCheckFileStatus == 0) {
if (fProtocol > 5) {
smsg.Form("%s/%s/%s", sl->GetProofWorkDir(), kPROOF_PackDir, base.Data());
if (SendFile(par, (kBinary | kForce | kCpBin | kForward), smsg.Data(), sl) < 0) {
Error("UploadPackage", "%s: problems uploading file %s",
sl->GetOrdinal(), par.Data());
return -1;
}
} else {
TFTP ftp(TString("root://")+sl->GetName(), 1);
if (!ftp.IsZombie()) {
smsg.Form("%s/%s", sl->GetProofWorkDir(), kPROOF_PackDir);
ftp.cd(smsg.Data());
ftp.put(par, base.Data());
}
}
sl->GetSocket()->Send(mess2);
fCheckFileStatus = 0;
Collect(sl, fCollectTimeout, kPROOF_CHECKFILE);
if (fCheckFileStatus == 0) {
Error("UploadPackage", "%s: unpacking of package %s failed",
sl->GetOrdinal(), base.Data());
return -1;
}
}
}
TIter nextmaster(fNonUniqueMasters);
TSlave *ma;
while ((ma = (TSlave *) nextmaster())) {
if (!ma->IsValid())
continue;
ma->GetSocket()->Send(mess3);
fCheckFileStatus = 0;
Collect(ma, fCollectTimeout, kPROOF_CHECKFILE);
if (fCheckFileStatus == 0) {
Error("UploadPackage", "package %s did not exist on submaster %s",
base.Data(), ma->GetOrdinal());
return -1;
}
}
return 0;
}
Int_t TProof::UploadPackageOnClient(const char *parpack, EUploadPackageOpt opt, TMD5 *md5)
{
Int_t status = 0;
if (TestBit(TProof::kIsClient)) {
TString par(parpack);
#ifndef WIN32
char ctmp[4096];
ssize_t sz = readlink(par.Data(), ctmp, 4096);
if (sz >= 4096) sz = 4095;
if (sz > 0) {
ctmp[sz] = '\0';
par = ctmp;
} else if (TSystem::GetErrno() != EINVAL) {
Warning("UploadPackageOnClient",
"could not resolve the symbolik link '%s'", par.Data());
}
#endif
fPackageLock->Lock();
TString downloadpath;
downloadpath.Form("%s/%s/%s", fPackageDir.Data(),
kPROOF_PackDownloadDir, gSystem->BaseName(par));
if (!gSystem->AccessPathName(downloadpath, kFileExists) && downloadpath != par) {
if (gSystem->Unlink(downloadpath) != 0) {
Warning("UploadPackageOnClient",
"problems removing downloaded version of '%s' (%s):\n"
"may imply inconsistencies in subsequent updates",
gSystem->BaseName(par), downloadpath.Data());
}
}
TString lpar;
lpar.Form("%s/%s", fPackageDir.Data(), gSystem->BaseName(par));
FileStat_t stat;
Int_t st = gSystem->GetPathInfo(lpar, stat);
if (stat.fIsLink)
gSystem->Unlink(lpar);
else if (st == 0) {
Error("UploadPackageOnClient", "cannot create symlink %s on client, "
"another item with same name already exists",
lpar.Data());
fPackageLock->Unlock();
return -1;
}
if (!gSystem->IsAbsoluteFileName(par)) {
TString fpar = par;
gSystem->Symlink(gSystem->PrependPathName(gSystem->WorkingDirectory(), fpar), lpar);
} else
gSystem->Symlink(par, lpar);
TString cmd;
TString packnam = par(0, par.Length() - 4);
packnam = gSystem->BaseName(packnam);
TString md5f = fPackageDir + "/" + packnam + "/PROOF-INF/md5.txt";
TMD5 *md5local = TMD5::ReadChecksum(md5f);
if (!md5local || (*md5) != (*md5local)) {
if ((opt & TProof::kRemoveOld)) {
cmd.Form("%s %s/%s", kRM, fPackageDir.Data(), packnam.Data());
if (gSystem->Exec(cmd.Data()))
Error("UploadPackageOnClient", "failure executing: %s", cmd.Data());
}
char *gunzip = gSystem->Which(gSystem->Getenv("PATH"), kGUNZIP,
kExecutePermission);
if (gunzip) {
cmd.Form(kUNTAR2, gunzip, par.Data(), fPackageDir.Data());
if (gSystem->Exec(cmd.Data()))
Error("Uploadpackage", "failure executing: %s", cmd.Data());
delete [] gunzip;
} else
Error("UploadPackageOnClient", "%s not found", kGUNZIP);
if (gSystem->AccessPathName(fPackageDir + "/" + packnam, kWritePermission)) {
Error("UploadPackageOnClient",
"package %s did not unpack into %s/%s", par.Data(), fPackageDir.Data(),
packnam.Data());
status = -1;
} else {
TMD5::WriteChecksum(md5f, md5);
}
}
fPackageLock->Unlock();
delete md5local;
}
return status;
}
Int_t TProof::Load(const char *macro, Bool_t notOnClient, Bool_t uniqueWorkers,
TList *wrks)
{
if (!IsValid()) return -1;
if (!macro || !macro[0]) {
Error("Load", "need to specify a macro name");
return -1;
}
if (TestBit(TProof::kIsClient)) {
if (wrks) {
Error("Load", "the 'wrks' arg can be used only on the master");
return -1;
}
TString addsname, implname = macro;
Ssiz_t icom = implname.Index(",");
if (icom != kNPOS) {
addsname = implname(icom + 1, implname.Length());
implname.Remove(icom);
}
TString basemacro = gSystem->BaseName(implname), mainmacro(implname);
TString bmsg(basemacro), acmode, args, io;
implname = gSystem->SplitAclicMode(implname, acmode, args, io);
Int_t dot = implname.Last('.');
if (dot == kNPOS) {
Info("Load", "macro '%s' does not contain a '.': do nothing", macro);
return -1;
}
Bool_t hasHeader = kTRUE;
TString headname = implname;
headname.Remove(dot);
headname += ".h";
if (gSystem->AccessPathName(headname, kReadPermission)) {
TString h = headname;
headname.Remove(dot);
headname += ".hh";
if (gSystem->AccessPathName(headname, kReadPermission)) {
hasHeader = kFALSE;
if (gDebug > 0)
Info("Load", "no associated header file found: tried: %s %s",
h.Data(), headname.Data());
}
}
TString addincs;
TList addfiles;
if (!addsname.IsNull()) {
TString fn;
Int_t from = 0;
while (addsname.Tokenize(fn, from, ",")) {
if (gSystem->AccessPathName(fn, kReadPermission)) {
Error("Load", "additional file '%s' not found", fn.Data());
return -1;
}
if (!notOnClient) {
TString dirn(gSystem->DirName(fn));
if (addincs.IsNull()) {
addincs.Form("-I%s", dirn.Data());
} else if (!addincs.Contains(dirn)) {
addincs += TString::Format(" -I%s", dirn.Data());
}
}
addfiles.Add(new TObjString(fn));
}
}
if (SendFile(implname, kAscii | kForward , "cache") == -1) {
Error("Load", "problems sending implementation file %s", implname.Data());
return -1;
}
if (hasHeader)
if (SendFile(headname, kAscii | kForward , "cache") == -1) {
Error("Load", "problems sending header file %s", headname.Data());
return -1;
}
if (addfiles.GetSize() > 0) {
TIter nxfn(&addfiles);
TObjString *os = 0;
while ((os = (TObjString *) nxfn())) {
if (SendFile(os->GetName(), kAscii | kForward, "cache") == -1) {
Error("Load", "problems sending additional file %s", os->GetName());
return -1;
}
bmsg += TString::Format(",%s", gSystem->BaseName(os->GetName()));
}
addfiles.SetOwner(kTRUE);
}
TMessage mess(kPROOF_CACHE);
if (GetRemoteProtocol() < 34) {
mess << Int_t(kLoadMacro) << basemacro;
AddIncludePath("../../cache");
} else {
mess << Int_t(kLoadMacro) << bmsg;
}
Broadcast(mess, kActive);
if (!notOnClient) {
TString oldincs = gSystem->GetIncludePath();
if (!addincs.IsNull()) gSystem->AddIncludePath(addincs);
gROOT->ProcessLine(TString::Format(".L %s", mainmacro.Data()));
if (!addincs.IsNull()) gSystem->SetIncludePath(oldincs);
TString mp(TROOT::GetMacroPath());
TString np(gSystem->DirName(macro));
if (!np.IsNull()) {
np += ":";
if (!mp.BeginsWith(np) && !mp.Contains(":"+np)) {
Int_t ip = (mp.BeginsWith(".:")) ? 2 : 0;
mp.Insert(ip, np);
TROOT::SetMacroPath(mp);
if (gDebug > 0)
Info("Load", "macro path set to '%s'", TROOT::GetMacroPath());
}
}
}
Collect(kActive);
} else {
TString basemacro = gSystem->BaseName(macro);
TMessage mess(kPROOF_CACHE);
if (uniqueWorkers) {
mess << Int_t(kLoadMacro) << basemacro;
if (wrks)
Broadcast(mess, wrks);
else
Broadcast(mess, kUnique);
} else {
Collect(kUnique);
TList others;
TSlave *wrk = 0;
TIter nxw(fActiveSlaves);
while ((wrk = (TSlave *)nxw())) {
if (!fUniqueSlaves->FindObject(wrk)) {
others.Add(wrk);
}
}
Int_t ld = basemacro.Last('.');
if (ld != kNPOS) {
Int_t lpp = basemacro.Index("++", ld);
if (lpp != kNPOS) basemacro.Replace(lpp, 2, "+");
}
mess << Int_t(kLoadMacro) << basemacro;
Broadcast(mess, &others);
Collect(&others);
}
PDB(kGlobal, 1) Info("Load", "adding loaded macro: %s", macro);
if (!fLoadedMacros) {
fLoadedMacros = new TList();
fLoadedMacros->SetOwner();
}
if (!wrks)
fLoadedMacros->Add(new TObjString(macro));
}
return 0;
}
Int_t TProof::AddDynamicPath(const char *libpath, Bool_t onClient, TList *wrks,
Bool_t doCollect)
{
if ((!libpath || !libpath[0])) {
if (gDebug > 0)
Info("AddDynamicPath", "list is empty - nothing to do");
return 0;
}
if (onClient)
HandleLibIncPath("lib", kTRUE, libpath);
TMessage m(kPROOF_LIB_INC_PATH);
m << TString("lib") << (Bool_t)kTRUE;
if (libpath && strlen(libpath))
m << TString(libpath);
else
m << TString("-");
if (wrks) {
Broadcast(m, wrks);
if (doCollect)
Collect(wrks, fCollectTimeout);
}
else {
Broadcast(m);
Collect(kActive, fCollectTimeout);
}
return 0;
}
Int_t TProof::AddIncludePath(const char *incpath, Bool_t onClient, TList *wrks,
Bool_t doCollect)
{
if ((!incpath || !incpath[0])) {
if (gDebug > 0)
Info("AddIncludePath", "list is empty - nothing to do");
return 0;
}
if (onClient)
HandleLibIncPath("inc", kTRUE, incpath);
TMessage m(kPROOF_LIB_INC_PATH);
m << TString("inc") << (Bool_t)kTRUE;
if (incpath && strlen(incpath))
m << TString(incpath);
else
m << TString("-");
if (wrks) {
Broadcast(m, wrks);
if (doCollect)
Collect(wrks, fCollectTimeout);
}
else {
Broadcast(m);
Collect(kActive, fCollectTimeout);
}
return 0;
}
Int_t TProof::RemoveDynamicPath(const char *libpath, Bool_t onClient)
{
if ((!libpath || !libpath[0])) {
if (gDebug > 0)
Info("RemoveDynamicPath", "list is empty - nothing to do");
return 0;
}
if (onClient)
HandleLibIncPath("lib", kFALSE, libpath);
TMessage m(kPROOF_LIB_INC_PATH);
m << TString("lib") <<(Bool_t)kFALSE;
if (libpath && strlen(libpath))
m << TString(libpath);
else
m << TString("-");
Broadcast(m);
Collect(kActive, fCollectTimeout);
return 0;
}
Int_t TProof::RemoveIncludePath(const char *incpath, Bool_t onClient)
{
if ((!incpath || !incpath[0])) {
if (gDebug > 0)
Info("RemoveIncludePath", "list is empty - nothing to do");
return 0;
}
if (onClient)
HandleLibIncPath("in", kFALSE, incpath);
TMessage m(kPROOF_LIB_INC_PATH);
m << TString("inc") << (Bool_t)kFALSE;
if (incpath && strlen(incpath))
m << TString(incpath);
else
m << TString("-");
Broadcast(m);
Collect(kActive, fCollectTimeout);
return 0;
}
void TProof::HandleLibIncPath(const char *what, Bool_t add, const char *dirs)
{
TString type(what);
TString path(dirs);
if ((type != "lib") && (type != "inc")) {
Error("HandleLibIncPath","unknown action type: %s - protocol error?", type.Data());
return;
}
path.ReplaceAll(","," ");
TObjArray *op = 0;
if (path.Length() > 0 && path != "-") {
if (!(op = path.Tokenize(" "))) {
Warning("HandleLibIncPath","decomposing path %s", path.Data());
return;
}
}
if (add) {
if (type == "lib") {
TIter nxl(op, kIterBackward);
TObjString *lib = 0;
while ((lib = (TObjString *) nxl())) {
TString xlib = lib->GetName();
gSystem->ExpandPathName(xlib);
if (!gSystem->AccessPathName(xlib, kReadPermission)) {
TString newlibpath = gSystem->GetDynamicPath();
Int_t pos = 0;
if (newlibpath.BeginsWith(".:"))
pos = 2;
if (newlibpath.Index(xlib) == kNPOS) {
newlibpath.Insert(pos,TString::Format("%s:", xlib.Data()));
gSystem->SetDynamicPath(newlibpath);
}
} else {
if (gDebug > 0)
Info("HandleLibIncPath",
"libpath %s does not exist or cannot be read - not added", xlib.Data());
}
}
} else {
TIter nxi(op);
TObjString *inc = 0;
while ((inc = (TObjString *) nxi())) {
TString xinc = inc->GetName();
gSystem->ExpandPathName(xinc);
if (!gSystem->AccessPathName(xinc, kReadPermission)) {
TString curincpath = gSystem->GetIncludePath();
if (curincpath.Index(xinc) == kNPOS)
gSystem->AddIncludePath(TString::Format("-I%s", xinc.Data()));
} else
if (gDebug > 0)
Info("HandleLibIncPath",
"incpath %s does not exist or cannot be read - not added", xinc.Data());
}
}
} else {
if (type == "lib") {
TIter nxl(op);
TObjString *lib = 0;
while ((lib = (TObjString *) nxl())) {
TString xlib = lib->GetName();
gSystem->ExpandPathName(xlib);
TString newlibpath = gSystem->GetDynamicPath();
newlibpath.ReplaceAll(TString::Format("%s:", xlib.Data()),"");
gSystem->SetDynamicPath(newlibpath);
}
} else {
TIter nxi(op);
TObjString *inc = 0;
while ((inc = (TObjString *) nxi())) {
TString newincpath = gSystem->GetIncludePath();
newincpath.ReplaceAll(TString::Format("-I%s", inc->GetName()),"");
newincpath.ReplaceAll(gInterpreter->GetIncludePath(),"");
gSystem->SetIncludePath(newincpath);
}
}
}
}
TList *TProof::GetListOfPackages()
{
if (!IsValid())
return (TList *)0;
TMessage mess(kPROOF_CACHE);
mess << Int_t(kListPackages);
Broadcast(mess);
Collect(kActive, fCollectTimeout);
return fAvailablePackages;
}
TList *TProof::GetListOfEnabledPackages()
{
if (!IsValid())
return (TList *)0;
TMessage mess(kPROOF_CACHE);
mess << Int_t(kListEnabledPackages);
Broadcast(mess);
Collect(kActive, fCollectTimeout);
return fEnabledPackages;
}
void TProof::PrintProgress(Long64_t total, Long64_t processed,
Float_t procTime, Long64_t bytesread)
{
if (fPrintProgress) {
Bool_t redirlog = fRedirLog;
fRedirLog = kFALSE;
(*fPrintProgress)(total, processed, procTime, bytesread);
fRedirLog = redirlog;
return;
}
fprintf(stderr, "[TProof::Progress] Total %lld events\t|", total);
for (int l = 0; l < 20; l++) {
if (total > 0) {
if (l < 20*processed/total)
fprintf(stderr, "=");
else if (l == 20*processed/total)
fprintf(stderr, ">");
else if (l > 20*processed/total)
fprintf(stderr, ".");
} else
fprintf(stderr, "=");
}
Float_t evtrti = (procTime > 0. && processed > 0) ? processed / procTime : -1.;
Float_t mbsrti = (procTime > 0. && bytesread > 0) ? bytesread / procTime : -1.;
TString sunit("B/s");
if (evtrti > 0.) {
Float_t remainingTime = (total >= processed) ? (total - processed) / evtrti : -1;
if (mbsrti > 0.) {
const Float_t toK = 1024., toM = 1048576., toG = 1073741824.;
if (mbsrti >= toG) {
mbsrti /= toG;
sunit = "GB/s";
} else if (mbsrti >= toM) {
mbsrti /= toM;
sunit = "MB/s";
} else if (mbsrti >= toK) {
mbsrti /= toK;
sunit = "kB/s";
}
fprintf(stderr, "| %.02f %% [%.1f evts/s, %.1f %s, time left: %.1f s]\r",
(total ? ((100.0*processed)/total) : 100.0), evtrti, mbsrti, sunit.Data(), remainingTime);
} else {
fprintf(stderr, "| %.02f %% [%.1f evts/s, time left: %.1f s]\r",
(total ? ((100.0*processed)/total) : 100.0), evtrti, remainingTime);
}
} else {
fprintf(stderr, "| %.02f %%\r",
(total ? ((100.0*processed)/total) : 100.0));
}
if (processed >= total) {
fprintf(stderr, "\n Query processing time: %.1f s\n", procTime);
}
}
void TProof::Progress(Long64_t total, Long64_t processed)
{
if (fPrintProgress) {
return (*fPrintProgress)(total, processed, -1., -1);
}
PDB(kGlobal,1)
Info("Progress","%2f (%lld/%lld)", 100.*processed/total, processed, total);
if (gROOT->IsBatch()) {
if (total > 0)
PrintProgress(total, processed);
} else {
EmitVA("Progress(Long64_t,Long64_t)", 2, total, processed);
}
}
void TProof::Progress(Long64_t total, Long64_t processed, Long64_t bytesread,
Float_t initTime, Float_t procTime,
Float_t evtrti, Float_t mbrti)
{
PDB(kGlobal,1)
Info("Progress","%lld %lld %lld %f %f %f %f", total, processed, bytesread,
initTime, procTime, evtrti, mbrti);
if (gROOT->IsBatch()) {
if (total > 0)
PrintProgress(total, processed, procTime, bytesread);
} else {
EmitVA("Progress(Long64_t,Long64_t,Long64_t,Float_t,Float_t,Float_t,Float_t)",
7, total, processed, bytesread, initTime, procTime, evtrti, mbrti);
}
}
void TProof::Progress(Long64_t total, Long64_t processed, Long64_t bytesread,
Float_t initTime, Float_t procTime,
Float_t evtrti, Float_t mbrti, Int_t actw, Int_t tses, Float_t eses)
{
PDB(kGlobal,1)
Info("Progress","%lld %lld %lld %f %f %f %f %d %f", total, processed, bytesread,
initTime, procTime, evtrti, mbrti, actw, eses);
if (gROOT->IsBatch()) {
if (total > 0)
PrintProgress(total, processed, procTime, bytesread);
} else {
EmitVA("Progress(Long64_t,Long64_t,Long64_t,Float_t,Float_t,Float_t,Float_t,Int_t,Int_t,Float_t)",
10, total, processed, bytesread, initTime, procTime, evtrti, mbrti, actw, tses, eses);
}
}
void TProof::Feedback(TList *objs)
{
PDB(kGlobal,1)
Info("Feedback","%d objects", objs->GetSize());
PDB(kFeedback,1) {
Info("Feedback","%d objects", objs->GetSize());
objs->ls();
}
Emit("Feedback(TList *objs)", (Long_t) objs);
}
void TProof::CloseProgressDialog()
{
PDB(kGlobal,1)
Info("CloseProgressDialog",
"called: have progress dialog: %d", fProgressDialogStarted);
if (!fProgressDialogStarted)
return;
Emit("CloseProgressDialog()");
}
void TProof::ResetProgressDialog(const char *sel, Int_t sz, Long64_t fst,
Long64_t ent)
{
PDB(kGlobal,1)
Info("ResetProgressDialog","(%s,%d,%lld,%lld)", sel, sz, fst, ent);
EmitVA("ResetProgressDialog(const char*,Int_t,Long64_t,Long64_t)",
4, sel, sz, fst, ent);
}
void TProof::StartupMessage(const char *msg, Bool_t st, Int_t done, Int_t total)
{
PDB(kGlobal,1)
Info("StartupMessage","(%s,%d,%d,%d)", msg, st, done, total);
EmitVA("StartupMessage(const char*,Bool_t,Int_t,Int_t)",
4, msg, st, done, total);
}
void TProof::DataSetStatus(const char *msg, Bool_t st, Int_t done, Int_t total)
{
PDB(kGlobal,1)
Info("DataSetStatus","(%s,%d,%d,%d)", msg, st, done, total);
EmitVA("DataSetStatus(const char*,Bool_t,Int_t,Int_t)",
4, msg, st, done, total);
}
void TProof::SendDataSetStatus(const char *action, UInt_t done,
UInt_t tot, Bool_t st)
{
if (IsLite()) {
if (tot) {
TString type = "files";
Int_t frac = (Int_t) (done*100.)/tot;
char msg[512] = {0};
if (frac >= 100) {
snprintf(msg, 512, "%s: OK (%d %s) \n",
action,tot, type.Data());
} else {
snprintf(msg, 512, "%s: %d out of %d (%d %%)\r",
action, done, tot, frac);
}
if (fSync)
fprintf(stderr,"%s", msg);
else
NotifyLogMsg(msg, 0);
}
return;
}
if (TestBit(TProof::kIsMaster)) {
TMessage mess(kPROOF_DATASET_STATUS);
mess << TString(action) << tot << done << st;
gProofServ->GetSocket()->Send(mess);
}
}
void TProof::QueryResultReady(const char *ref)
{
PDB(kGlobal,1)
Info("QueryResultReady","ref: %s", ref);
Emit("QueryResultReady(const char*)",ref);
}
void TProof::ValidateDSet(TDSet *dset)
{
if (dset->ElementsValid()) return;
TList nodes;
nodes.SetOwner();
TList slholder;
slholder.SetOwner();
TList elemholder;
elemholder.SetOwner();
TIter nextSlave(GetListOfActiveSlaves());
while (TSlave *sl = dynamic_cast<TSlave*>(nextSlave())) {
TList *sllist = 0;
TPair *p = dynamic_cast<TPair*>(nodes.FindObject(sl->GetName()));
if (!p) {
sllist = new TList;
sllist->SetName(sl->GetName());
slholder.Add(sllist);
TList *elemlist = new TList;
elemlist->SetName(TString(sl->GetName())+"_elem");
elemholder.Add(elemlist);
nodes.Add(new TPair(sllist, elemlist));
} else {
sllist = dynamic_cast<TList*>(p->Key());
}
if (sllist) sllist->Add(sl);
}
TList nonLocal;
for (Int_t i = 0; i < 2; i++) {
Bool_t local = i>0?kFALSE:kTRUE;
TIter nextElem(local ? dset->GetListOfElements() : &nonLocal);
while (TDSetElement *elem = dynamic_cast<TDSetElement*>(nextElem())) {
if (elem->GetValid()) continue;
TPair *p = dynamic_cast<TPair*>(local?nodes.FindObject(TUrl(elem->GetFileName()).GetHost()):nodes.At(0));
if (p) {
TList *eli = dynamic_cast<TList*>(p->Value());
TList *sli = dynamic_cast<TList*>(p->Key());
if (eli && sli) {
eli->Add(elem);
TPair *p2 = p;
Bool_t stop = kFALSE;
while (!stop) {
TPair *p3 = dynamic_cast<TPair*>(nodes.After(p2->Key()));
if (p3) {
TList *p3v = dynamic_cast<TList*>(p3->Value());
TList *p3k = dynamic_cast<TList*>(p3->Key());
if (p3v && p3k) {
Int_t nelem = p3v->GetSize();
Int_t nsl = p3k->GetSize();
if (nelem*sli->GetSize() < eli->GetSize()*nsl) p2 = p3;
else stop = kTRUE;
}
} else {
stop = kTRUE;
}
}
if (p2!=p) {
nodes.Remove(p->Key());
nodes.AddAfter(p2->Key(), p);
}
} else {
Warning("ValidateDSet", "invalid values from TPair! Protocol error?");
continue;
}
} else {
if (local) {
nonLocal.Add(elem);
} else {
Warning("ValidateDSet", "no node to allocate TDSetElement to - ignoring");
}
}
}
}
TList usedslaves;
TIter nextNode(&nodes);
SetDSet(dset);
while (TPair *node = dynamic_cast<TPair*>(nextNode())) {
TList *slaves = dynamic_cast<TList*>(node->Key());
TList *setelements = dynamic_cast<TList*>(node->Value());
if (!slaves || !setelements) continue;
Int_t nslaves = slaves->GetSize();
Int_t nelements = setelements->GetSize();
for (Int_t i=0; i<nslaves; i++) {
TDSet copyset(dset->GetType(), dset->GetObjName(),
dset->GetDirectory());
for (Int_t j = (i*nelements)/nslaves;
j < ((i+1)*nelements)/nslaves;
j++) {
TDSetElement *elem =
dynamic_cast<TDSetElement*>(setelements->At(j));
if (elem) {
copyset.Add(elem->GetFileName(), elem->GetObjName(),
elem->GetDirectory(), elem->GetFirst(),
elem->GetNum(), elem->GetMsd());
}
}
if (copyset.GetListOfElements()->GetSize()>0) {
TMessage mesg(kPROOF_VALIDATE_DSET);
mesg << ©set;
TSlave *sl = dynamic_cast<TSlave*>(slaves->At(i));
if (sl) {
PDB(kGlobal,1) Info("ValidateDSet",
"Sending TDSet with %d elements to slave %s"
" to be validated",
copyset.GetListOfElements()->GetSize(),
sl->GetOrdinal());
sl->GetSocket()->Send(mesg);
usedslaves.Add(sl);
}
}
}
}
PDB(kGlobal,1)
Info("ValidateDSet","Calling Collect");
Collect(&usedslaves);
SetDSet(0);
}
void TProof::AddInputData(TObject *obj, Bool_t push)
{
if (obj) {
if (!fInputData) fInputData = new TList;
if (!fInputData->FindObject(obj)) {
fInputData->Add(obj);
SetBit(TProof::kNewInputData);
}
}
if (push) SetBit(TProof::kNewInputData);
}
void TProof::ClearInputData(TObject *obj)
{
if (!obj) {
if (fInputData) {
fInputData->SetOwner(kTRUE);
SafeDelete(fInputData);
}
ResetBit(TProof::kNewInputData);
TObject *o = 0;
TList *in = GetInputList();
while ((o = GetInputList()->FindObject("PROOF_InputDataFile")))
in->Remove(o);
while ((o = GetInputList()->FindObject("PROOF_InputData")))
in->Remove(o);
fInputDataFile = "";
gSystem->Unlink(kPROOF_InputDataFile);
} else if (fInputData) {
Int_t sz = fInputData->GetSize();
while (fInputData->FindObject(obj))
fInputData->Remove(obj);
if (sz != fInputData->GetSize())
SetBit(TProof::kNewInputData);
}
}
void TProof::ClearInputData(const char *name)
{
TObject *obj = (fInputData && name) ? fInputData->FindObject(name) : 0;
if (obj) ClearInputData(obj);
}
void TProof::SetInputDataFile(const char *datafile)
{
if (datafile && strlen(datafile) > 0) {
if (fInputDataFile != datafile && strcmp(datafile, kPROOF_InputDataFile))
SetBit(TProof::kNewInputData);
fInputDataFile = datafile;
} else {
if (!fInputDataFile.IsNull())
SetBit(TProof::kNewInputData);
fInputDataFile = "";
}
if (fInputDataFile != kPROOF_InputDataFile && !fInputDataFile.IsNull() &&
gSystem->AccessPathName(fInputDataFile, kReadPermission)) {
fInputDataFile = "";
}
}
void TProof::SendInputDataFile()
{
TString dataFile;
PrepareInputDataFile(dataFile);
if (dataFile.Length() > 0) {
Info("SendInputDataFile", "broadcasting %s", dataFile.Data());
BroadcastFile(dataFile.Data(), kBinary, "cache", kActive);
TString t = TString::Format("cache:%s", gSystem->BaseName(dataFile));
AddInput(new TNamed("PROOF_InputDataFile", t.Data()));
}
}
void TProof::PrepareInputDataFile(TString &dataFile)
{
Bool_t newdata = TestBit(TProof::kNewInputData) ? kTRUE : kFALSE;
ResetBit(TProof::kNewInputData);
Bool_t list_ok = (fInputData && fInputData->GetSize() > 0) ? kTRUE : kFALSE;
Bool_t file_ok = kFALSE;
if (fInputDataFile != kPROOF_InputDataFile && !fInputDataFile.IsNull() &&
!gSystem->AccessPathName(fInputDataFile, kReadPermission)) {
TFile *f = TFile::Open(fInputDataFile);
if (f && f->GetListOfKeys() && f->GetListOfKeys()->GetSize() > 0)
file_ok = kTRUE;
}
TObject *o = 0;
TList *in = GetInputList();
while ((o = GetInputList()->FindObject("PROOF_InputDataFile")))
in->Remove(o);
while ((o = GetInputList()->FindObject("PROOF_InputData")))
in->Remove(o);
dataFile = "";
if (!list_ok && !file_ok) return;
if (file_ok && !list_ok) {
dataFile = fInputDataFile;
} else if (!file_ok && list_ok) {
fInputDataFile = kPROOF_InputDataFile;
if (!newdata && !gSystem->AccessPathName(fInputDataFile)) return;
TFile *f = TFile::Open(fInputDataFile, "RECREATE");
if (f) {
f->cd();
TIter next(fInputData);
TObject *obj;
while ((obj = next())) {
obj->Write(0, TObject::kSingleKey, 0);
}
f->Close();
SafeDelete(f);
} else {
Error("PrepareInputDataFile", "could not (re-)create %s", fInputDataFile.Data());
return;
}
dataFile = fInputDataFile;
} else if (file_ok && list_ok) {
dataFile = kPROOF_InputDataFile;
if (newdata || gSystem->AccessPathName(dataFile)) {
if (!gSystem->AccessPathName(dataFile))
gSystem->Unlink(dataFile);
if (dataFile != fInputDataFile) {
if (gSystem->CopyFile(fInputDataFile, dataFile, kTRUE) != 0) {
Error("PrepareInputDataFile", "could not make local copy of %s", fInputDataFile.Data());
return;
}
}
TFile *f = TFile::Open(dataFile, "UPDATE");
if (f) {
f->cd();
TIter next(fInputData);
TObject *obj = 0;
while ((obj = next())) {
obj->Write(0, TObject::kSingleKey, 0);
}
f->Close();
SafeDelete(f);
} else {
Error("PrepareInputDataFile", "could not open %s for updating", dataFile.Data());
return;
}
}
}
return;
}
void TProof::AddInput(TObject *obj)
{
if (fPlayer) fPlayer->AddInput(obj);
}
void TProof::ClearInput()
{
if (fPlayer) fPlayer->ClearInput();
AddInput(fFeedback);
}
TList *TProof::GetInputList()
{
return (fPlayer ? fPlayer->GetInputList() : (TList *)0);
}
TObject *TProof::GetOutput(const char *name)
{
if (TestBit(TProof::kIsMaster))
return (fPlayer) ? fPlayer->GetOutput(name) : (TObject *)0;
return (GetOutputList()) ? GetOutputList()->FindObject(name) : (TObject *)0;
}
TObject *TProof::GetOutput(const char *name, TList *out)
{
TObject *o = 0;
if (!name || (name && strlen(name) <= 0) ||
!out || (out && out->GetSize() <= 0)) return o;
if ((o = out->FindObject(name))) return o;
TProofOutputFile *pf = 0;
TIter nxo(out);
while ((o = nxo())) {
if ((pf = dynamic_cast<TProofOutputFile *> (o))) {
TFile *f = 0;
if (!(f = (TFile *) gROOT->GetListOfFiles()->FindObject(pf->GetOutputFileName()))) {
TString fn = TString::Format("%s/%s", pf->GetDir(), pf->GetFileName());
f = TFile::Open(fn.Data());
if (!f || (f && f->IsZombie())) {
::Warning("TProof::GetOutput", "problems opening file %s", fn.Data());
}
}
if (f && (o = f->Get(name))) return o;
}
}
return o;
}
TList *TProof::GetOutputList()
{
if (fOutputList.GetSize() > 0) return &fOutputList;
if (fPlayer) {
fOutputList.AttachList(fPlayer->GetOutputList());
return &fOutputList;
}
return (TList *)0;
}
void TProof::SetParameter(const char *par, const char *value)
{
if (!fPlayer) {
Warning("SetParameter", "player undefined! Ignoring");
return;
}
TList *il = fPlayer->GetInputList();
TObject *item = il->FindObject(par);
if (item) {
il->Remove(item);
delete item;
}
il->Add(new TNamed(par, value));
}
void TProof::SetParameter(const char *par, Int_t value)
{
if (!fPlayer) {
Warning("SetParameter", "player undefined! Ignoring");
return;
}
TList *il = fPlayer->GetInputList();
TObject *item = il->FindObject(par);
if (item) {
il->Remove(item);
delete item;
}
il->Add(new TParameter<Int_t>(par, value));
}
void TProof::SetParameter(const char *par, Long_t value)
{
if (!fPlayer) {
Warning("SetParameter", "player undefined! Ignoring");
return;
}
TList *il = fPlayer->GetInputList();
TObject *item = il->FindObject(par);
if (item) {
il->Remove(item);
delete item;
}
il->Add(new TParameter<Long_t>(par, value));
}
void TProof::SetParameter(const char *par, Long64_t value)
{
if (!fPlayer) {
Warning("SetParameter", "player undefined! Ignoring");
return;
}
TList *il = fPlayer->GetInputList();
TObject *item = il->FindObject(par);
if (item) {
il->Remove(item);
delete item;
}
il->Add(new TParameter<Long64_t>(par, value));
}
void TProof::SetParameter(const char *par, Double_t value)
{
if (!fPlayer) {
Warning("SetParameter", "player undefined! Ignoring");
return;
}
TList *il = fPlayer->GetInputList();
TObject *item = il->FindObject(par);
if (item) {
il->Remove(item);
delete item;
}
il->Add(new TParameter<Double_t>(par, value));
}
TObject *TProof::GetParameter(const char *par) const
{
if (!fPlayer) {
Warning("GetParameter", "player undefined! Ignoring");
return (TObject *)0;
}
TList *il = fPlayer->GetInputList();
return il->FindObject(par);
}
void TProof::DeleteParameters(const char *wildcard)
{
if (!fPlayer) return;
if (!wildcard) wildcard = "";
TRegexp re(wildcard, kTRUE);
Int_t nch = strlen(wildcard);
TList *il = fPlayer->GetInputList();
if (il) {
TObject *p = 0;
TIter next(il);
while ((p = next())) {
TString s = p->GetName();
if (nch && s != wildcard && s.Index(re) == kNPOS) continue;
il->Remove(p);
delete p;
}
}
}
void TProof::ShowParameters(const char *wildcard) const
{
if (!fPlayer) return;
if (!wildcard) wildcard = "";
TRegexp re(wildcard, kTRUE);
Int_t nch = strlen(wildcard);
TList *il = fPlayer->GetInputList();
TObject *p;
TIter next(il);
while ((p = next())) {
TString s = p->GetName();
if (nch && s != wildcard && s.Index(re) == kNPOS) continue;
if (p->IsA() == TNamed::Class()) {
Printf("%s\t\t\t%s", s.Data(), p->GetTitle());
} else if (p->IsA() == TParameter<Long_t>::Class()) {
Printf("%s\t\t\t%ld", s.Data(), dynamic_cast<TParameter<Long_t>*>(p)->GetVal());
} else if (p->IsA() == TParameter<Long64_t>::Class()) {
Printf("%s\t\t\t%lld", s.Data(), dynamic_cast<TParameter<Long64_t>*>(p)->GetVal());
} else if (p->IsA() == TParameter<Double_t>::Class()) {
Printf("%s\t\t\t%f", s.Data(), dynamic_cast<TParameter<Double_t>*>(p)->GetVal());
} else {
Printf("%s\t\t\t%s", s.Data(), p->GetTitle());
}
}
}
void TProof::AddFeedback(const char *name)
{
PDB(kFeedback, 3)
Info("AddFeedback", "Adding object \"%s\" to feedback", name);
if (fFeedback->FindObject(name) == 0)
fFeedback->Add(new TObjString(name));
}
void TProof::RemoveFeedback(const char *name)
{
TObject *obj = fFeedback->FindObject(name);
if (obj != 0) {
fFeedback->Remove(obj);
delete obj;
}
}
void TProof::ClearFeedback()
{
fFeedback->Delete();
}
void TProof::ShowFeedback() const
{
if (fFeedback->GetSize() == 0) {
Info("","no feedback requested");
return;
}
fFeedback->Print();
}
TList *TProof::GetFeedbackList() const
{
return fFeedback;
}
TTree *TProof::GetTreeHeader(TDSet *dset)
{
TList *l = GetListOfActiveSlaves();
TSlave *sl = (TSlave*) l->First();
if (sl == 0) {
Error("GetTreeHeader", "No connection");
return 0;
}
TSocket *soc = sl->GetSocket();
TMessage msg(kPROOF_GETTREEHEADER);
msg << dset;
soc->Send(msg);
TMessage *reply;
Int_t d = -1;
if (fProtocol >= 20) {
Collect(sl, fCollectTimeout, kPROOF_GETTREEHEADER);
reply = (TMessage *) fRecvMessages->First();
} else {
d = soc->Recv(reply);
}
if (!reply) {
Error("GetTreeHeader", "Error getting a replay from the master.Result %d", (int) d);
return 0;
}
TString s1;
TTree *t = 0;
(*reply) >> s1;
if (s1 == "Success")
(*reply) >> t;
PDB(kGlobal, 1) {
if (t) {
Info("GetTreeHeader", "%s, message size: %d, entries: %d",
s1.Data(), reply->BufferSize(), (int) t->GetMaxEntryLoop());
} else {
Info("GetTreeHeader", "tree header retrieval failed");
}
}
delete reply;
return t;
}
TDrawFeedback *TProof::CreateDrawFeedback()
{
return (fPlayer ? fPlayer->CreateDrawFeedback(this) : (TDrawFeedback *)0);
}
void TProof::SetDrawFeedbackOption(TDrawFeedback *f, Option_t *opt)
{
if (fPlayer) fPlayer->SetDrawFeedbackOption(f, opt);
}
void TProof::DeleteDrawFeedback(TDrawFeedback *f)
{
if (fPlayer) fPlayer->DeleteDrawFeedback(f);
}
TList *TProof::GetOutputNames()
{
return 0;
}
void TProof::Browse(TBrowser *b)
{
b->Add(fActiveSlaves, fActiveSlaves->Class(), "fActiveSlaves");
b->Add(&fMaster, fMaster.Class(), "fMaster");
b->Add(fFeedback, fFeedback->Class(), "fFeedback");
b->Add(fChains, fChains->Class(), "fChains");
if (fPlayer) {
b->Add(fPlayer->GetInputList(), fPlayer->GetInputList()->Class(), "InputList");
if (fPlayer->GetOutputList())
b->Add(fPlayer->GetOutputList(), fPlayer->GetOutputList()->Class(), "OutputList");
if (fPlayer->GetListOfResults())
b->Add(fPlayer->GetListOfResults(),
fPlayer->GetListOfResults()->Class(), "ListOfResults");
}
}
void TProof::SetPlayer(TVirtualProofPlayer *player)
{
if (fPlayer)
delete fPlayer;
fPlayer = player;
};
TVirtualProofPlayer *TProof::MakePlayer(const char *player, TSocket *s)
{
if (!player)
player = "remote";
SetPlayer(TVirtualProofPlayer::Create(player, this, s));
return GetPlayer();
}
void TProof::AddChain(TChain *chain)
{
fChains->Add(chain);
}
void TProof::RemoveChain(TChain *chain)
{
fChains->Remove(chain);
}
void TProof::GetLog(Int_t start, Int_t end)
{
if (!IsValid() || TestBit(TProof::kIsMaster)) return;
TMessage msg(kPROOF_LOGFILE);
msg << start << end;
Broadcast(msg, kActive);
Collect(kActive, fCollectTimeout);
}
TMacro *TProof::GetLastLog()
{
TMacro *maclog = 0;
off_t nowlog = lseek(fileno(fLogFileR), (off_t) 0, SEEK_CUR);
if (nowlog < 0) {
SysError("GetLastLog",
"problem lseeking log file to current position (errno: %d)", TSystem::GetErrno());
return maclog;
}
off_t startlog = nowlog;
off_t endlog = lseek(fileno(fLogFileR), (off_t) 0, SEEK_END);
if (endlog < 0) {
SysError("GetLastLog",
"problem lseeking log file to end position (errno: %d)", TSystem::GetErrno());
return maclog;
}
UInt_t tolog = (UInt_t)(endlog - startlog);
if (tolog <= 0) return maclog;
if (lseek(fileno(fLogFileR), startlog, SEEK_SET) < 0) {
SysError("GetLastLog",
"problem lseeking log file to start position (errno: %d)", TSystem::GetErrno());
return maclog;
}
maclog = new TMacro;
char line[2048];
Int_t wanted = (tolog > sizeof(line)) ? sizeof(line) : tolog;
while (fgets(line, wanted, fLogFileR)) {
Int_t r = strlen(line);
if (r > 0) {
if (line[r-1] == '\n') line[r-1] = '\0';
maclog->AddLine(line);
} else {
break;
}
tolog -= r;
wanted = (tolog > sizeof(line)) ? sizeof(line) : tolog;
}
if (lseek(fileno(fLogFileR), nowlog, SEEK_SET) < 0) {
Warning("GetLastLog",
"problem lseeking log file to original position (errno: %d)", TSystem::GetErrno());
}
return maclog;
}
void TProof::PutLog(TQueryResult *pq)
{
if (!pq) return;
TList *lines = pq->GetLogFile()->GetListOfLines();
if (lines) {
TIter nxl(lines);
TObjString *l = 0;
while ((l = (TObjString *)nxl()))
EmitVA("LogMessage(const char*,Bool_t)", 2, l->GetName(), kFALSE);
}
}
void TProof::ShowLog(const char *queryref)
{
Retrieve(queryref);
if (fPlayer) {
if (queryref) {
if (fPlayer->GetListOfResults()) {
TIter nxq(fPlayer->GetListOfResults());
TQueryResult *qr = 0;
while ((qr = (TQueryResult *) nxq()))
if (strstr(queryref, qr->GetTitle()) &&
strstr(queryref, qr->GetName()))
break;
if (qr) {
PutLog(qr);
return;
}
}
}
}
}
void TProof::ShowLog(Int_t qry)
{
off_t nowlog = lseek(fileno(fLogFileR), (off_t) 0, SEEK_CUR);
if (nowlog < 0) {
SysError("ShowLog", "problem lseeking log file (errno: %d)", TSystem::GetErrno());
return;
}
off_t startlog = nowlog;
off_t endlog = lseek(fileno(fLogFileR), (off_t) 0, SEEK_END);
if (endlog < 0) {
SysError("ShowLog", "problem lseeking log file (errno: %d)", TSystem::GetErrno());
return;
}
lseek(fileno(fLogFileR), nowlog, SEEK_SET);
if (qry == 0) {
startlog = 0;
lseek(fileno(fLogFileR), (off_t) 0, SEEK_SET);
} else if (qry != -1) {
TQueryResult *pq = 0;
if (qry == -2) {
pq = (GetQueryResults()) ? ((TQueryResult *)(GetQueryResults()->Last())) : 0;
if (!pq) {
GetListOfQueries();
if (fQueries)
pq = (TQueryResult *)(fQueries->Last());
}
} else if (qry > 0) {
TList *queries = GetQueryResults();
if (queries) {
TIter nxq(queries);
while ((pq = (TQueryResult *)nxq()))
if (qry == pq->GetSeqNum())
break;
}
if (!pq) {
queries = GetListOfQueries();
TIter nxq(queries);
while ((pq = (TQueryResult *)nxq()))
if (qry == pq->GetSeqNum())
break;
}
}
if (pq) {
PutLog(pq);
return;
} else {
if (gDebug > 0)
Info("ShowLog","query %d not found in list", qry);
qry = -1;
}
}
UInt_t tolog = (UInt_t)(endlog - startlog);
if (tolog <= 0)
lseek(fileno(fLogFileR), startlog, SEEK_SET);
Int_t np = 0;
char line[2048];
Int_t wanted = (tolog > sizeof(line)) ? sizeof(line) : tolog;
while (fgets(line, wanted, fLogFileR)) {
Int_t r = strlen(line);
if (!SendingLogToWindow()) {
if (line[r-1] != '\n') line[r-1] = '\n';
if (r > 0) {
char *p = line;
while (r) {
Int_t w = write(fileno(stdout), p, r);
if (w < 0) {
SysError("ShowLog", "error writing to stdout");
break;
}
r -= w;
p += w;
}
}
tolog -= strlen(line);
np++;
if (!(np%10)) {
const char *opt = Getline("More (y/n)? [y]");
if (opt[0] == 'n')
break;
}
if (tolog <= 0)
break;
wanted = (tolog > sizeof(line)) ? sizeof(line) : tolog;
} else {
if (line[r-1] == '\n') line[r-1] = 0;
LogMessage(line, kFALSE);
}
}
if (!SendingLogToWindow()) {
if (write(fileno(stdout), "\n", 1) != 1)
SysError("ShowLog", "error writing to stdout");
}
if (qry > -1)
lseek(fileno(fLogFileR), nowlog, SEEK_SET);
}
void TProof::cd(Int_t id)
{
if (GetManager()) {
TProofDesc *d = GetManager()->GetProofDesc(id);
if (d) {
if (d->GetProof()) {
gProof = d->GetProof();
return;
}
}
gProof = this;
}
return;
}
void TProof::Detach(Option_t *opt)
{
if (!IsValid()) return;
TSlave *sl = (TSlave *) fActiveSlaves->First();
TSocket *s = 0;
if (!sl || !(sl->IsValid()) || !(s = sl->GetSocket())) {
Error("Detach","corrupted worker instance: wrk:%p, sock:%p", sl, s);
return;
}
Bool_t shutdown = (strchr(opt,'s') || strchr(opt,'S')) ? kTRUE : kFALSE;
if (shutdown && !IsIdle()) {
Remove("cleanupqueue");
Long_t timeout = gEnv->GetValue("Proof.ShutdownTimeout", 60);
timeout = (timeout > 20) ? timeout : 20;
StopProcess(kFALSE, (Long_t) (timeout / 2));
Collect(kActive, timeout);
}
DeActivateAsyncInput();
sl->FlushSocket();
Close(opt);
if (fProgressDialogStarted)
CloseProgressDialog();
if (GetManager() && GetManager()->QuerySessions("L")) {
TIter nxd(GetManager()->QuerySessions("L"));
TProofDesc *d = 0;
while ((d = (TProofDesc *)nxd())) {
if (d->GetProof() == this) {
d->SetProof(0);
GetManager()->QuerySessions("L")->Remove(d);
break;
}
}
}
fValid = kFALSE;
return;
}
void TProof::SetAlias(const char *alias)
{
TNamed::SetTitle(alias);
if (TestBit(TProof::kIsMaster))
TNamed::SetName(alias);
if (!IsValid()) return;
if (!IsProofd() && TestBit(TProof::kIsClient)) {
TSlave *sl = (TSlave *) fActiveSlaves->First();
if (sl)
sl->SetAlias(alias);
}
return;
}
Int_t TProof::UploadDataSet(const char *, TList *, const char *, Int_t, TList *)
{
Printf(" *** WARNING: this function is obsolete: it has been replaced by TProofMgr::UploadFiles ***");
return -1;
}
Int_t TProof::UploadDataSet(const char *, const char *, const char *, Int_t, TList *)
{
Printf(" *** WARNING: this function is obsolete: it has been replaced by TProofMgr::UploadFiles ***");
return -1;
}
Int_t TProof::UploadDataSetFromFile(const char *, const char *, const char *, Int_t, TList *)
{
Printf(" *** WARNING: this function is obsolete: it has been replaced by TProofMgr::UploadFiles ***");
return -1;
}
Bool_t TProof::RegisterDataSet(const char *dataSetName,
TFileCollection *dataSet, const char *optStr)
{
if (fProtocol < 17) {
Info("RegisterDataSet",
"functionality not available: the server does not have dataset support");
return kFALSE;
}
if (!dataSetName || strlen(dataSetName) <= 0) {
Info("RegisterDataSet", "specifying a dataset name is mandatory");
return kFALSE;
}
Bool_t parallelverify = kFALSE;
TString sopt(optStr);
if (sopt.Contains("V") && fProtocol >= 34 && !sopt.Contains("S")) {
parallelverify = kTRUE;
sopt.ReplaceAll("V", "");
}
sopt.ReplaceAll("S", "");
TMessage mess(kPROOF_DATASETS);
mess << Int_t(kRegisterDataSet);
mess << TString(dataSetName);
mess << sopt;
mess.WriteObject(dataSet);
Broadcast(mess);
Bool_t result = kTRUE;
Collect();
if (fStatus != 0) {
Error("RegisterDataSet", "dataset was not saved");
result = kFALSE;
return result;
}
if (!parallelverify) return result;
sopt += "V";
if (VerifyDataSet(dataSetName, sopt) < 0){
Error("RegisterDataSet", "problems verifying dataset '%s'", dataSetName);
return kFALSE;
}
return kTRUE;
}
Int_t TProof::SetDataSetTreeName(const char *dataset, const char *treename)
{
if (fProtocol < 23) {
Info("SetDataSetTreeName", "functionality not supported by the server");
return -1;
}
if (!dataset || strlen(dataset) <= 0) {
Info("SetDataSetTreeName", "specifying a dataset name is mandatory");
return -1;
}
if (!treename || strlen(treename) <= 0) {
Info("SetDataSetTreeName", "specifying a tree name is mandatory");
return -1;
}
TUri uri(dataset);
TString fragment(treename);
if (!fragment.BeginsWith("/")) fragment.Insert(0, "/");
uri.SetFragment(fragment);
TMessage mess(kPROOF_DATASETS);
mess << Int_t(kSetDefaultTreeName);
mess << uri.GetUri();
Broadcast(mess);
Collect();
if (fStatus != 0) {
Error("SetDataSetTreeName", "some error occured: default tree name not changed");
return -1;
}
return 0;
}
TMap *TProof::GetDataSets(const char *uri, const char *optStr)
{
if (fProtocol < 15) {
Info("GetDataSets",
"functionality not available: the server does not have dataset support");
return 0;
}
if (fProtocol < 31 && strstr(optStr, ":lite:"))
Warning("GetDataSets", "'lite' option not supported by the server");
TMessage mess(kPROOF_DATASETS);
mess << Int_t(kGetDataSets);
mess << TString(uri ? uri : "");
mess << TString(optStr ? optStr : "");
Broadcast(mess);
Collect(kActive, fCollectTimeout);
TMap *dataSetMap = 0;
if (fStatus != 0) {
Error("GetDataSets", "error receiving datasets information");
} else {
TMessage *retMess = (TMessage *) fRecvMessages->First();
if (retMess && retMess->What() == kMESS_OK) {
if (!(dataSetMap = (TMap *)(retMess->ReadObject(TMap::Class()))))
Error("GetDataSets", "error receiving datasets");
} else
Error("GetDataSets", "message not found or wrong type (%p)", retMess);
}
return dataSetMap;
}
void TProof::ShowDataSets(const char *uri, const char* optStr)
{
if (fProtocol < 15) {
Info("ShowDataSets",
"functionality not available: the server does not have dataset support");
return;
}
TMessage mess(kPROOF_DATASETS);
mess << Int_t(kShowDataSets);
mess << TString(uri ? uri : "");
mess << TString(optStr ? optStr : "");
Broadcast(mess);
Collect(kActive, fCollectTimeout);
if (fStatus != 0)
Error("ShowDataSets", "error receiving datasets information");
}
Bool_t TProof::ExistsDataSet(const char *dataset)
{
if (fProtocol < 15) {
Info("ExistsDataSet", "functionality not available: the server has an"
" incompatible version of TFileInfo");
return kFALSE;
}
if (!dataset || strlen(dataset) <= 0) {
Error("ExistsDataSet", "dataset name missing");
return kFALSE;
}
TMessage msg(kPROOF_DATASETS);
msg << Int_t(kCheckDataSetName) << TString(dataset);
Broadcast(msg);
Collect(kActive, fCollectTimeout);
if (fStatus == -1) {
return kTRUE;
}
return kFALSE;
}
void TProof::ClearDataSetCache(const char *dataset)
{
if (fProtocol < 28) {
Info("ClearDataSetCache", "functionality not available on server");
return;
}
TMessage msg(kPROOF_DATASETS);
msg << Int_t(kCache) << TString(dataset) << TString("clear");
Broadcast(msg);
Collect(kActive, fCollectTimeout);
return;
}
void TProof::ShowDataSetCache(const char *dataset)
{
if (fProtocol < 28) {
Info("ShowDataSetCache", "functionality not available on server");
return;
}
TMessage msg(kPROOF_DATASETS);
msg << Int_t(kCache) << TString(dataset) << TString("show");
Broadcast(msg);
Collect(kActive, fCollectTimeout);
return;
}
TFileCollection *TProof::GetDataSet(const char *uri, const char *optStr)
{
if (fProtocol < 15) {
Info("GetDataSet", "functionality not available: the server has an"
" incompatible version of TFileInfo");
return 0;
}
if (!uri || strlen(uri) <= 0) {
Info("GetDataSet", "specifying a dataset name is mandatory");
return 0;
}
TMessage nameMess(kPROOF_DATASETS);
nameMess << Int_t(kGetDataSet);
nameMess << TString(uri);
nameMess << TString(optStr ? optStr: "");
if (Broadcast(nameMess) < 0)
Error("GetDataSet", "sending request failed");
Collect(kActive, fCollectTimeout);
TFileCollection *fileList = 0;
if (fStatus != 0) {
Error("GetDataSet", "error receiving datasets information");
} else {
TMessage *retMess = (TMessage *) fRecvMessages->First();
if (retMess && retMess->What() == kMESS_OK) {
if (!(fileList = (TFileCollection*)(retMess->ReadObject(TFileCollection::Class()))))
Error("GetDataSet", "error reading list of files");
} else
Error("GetDataSet", "message not found or wrong type (%p)", retMess);
}
return fileList;
}
void TProof::ShowDataSet(const char *uri, const char* opt)
{
TFileCollection *fileList = 0;
if ((fileList = GetDataSet(uri))) {
fileList->Print(opt);
delete fileList;
} else
Warning("ShowDataSet","no such dataset: %s", uri);
}
Int_t TProof::RemoveDataSet(const char *uri, const char* optStr)
{
TMessage nameMess(kPROOF_DATASETS);
nameMess << Int_t(kRemoveDataSet);
nameMess << TString(uri?uri:"");
nameMess << TString(optStr?optStr:"");
if (Broadcast(nameMess) < 0)
Error("RemoveDataSet", "sending request failed");
Collect(kActive, fCollectTimeout);
if (fStatus != 0)
return -1;
else
return 0;
}
TList* TProof::FindDataSets(const char* , const char* )
{
Error ("FindDataSets", "not yet implemented");
return (TList *) 0;
}
Bool_t TProof::RequestStagingDataSet(const char *dataset)
{
if (fProtocol < 35) {
Error("RequestStagingDataSet",
"functionality not supported by the server");
return kFALSE;
}
TMessage mess(kPROOF_DATASETS);
mess << Int_t(kRequestStaging);
mess << TString(dataset);
Broadcast(mess);
Collect();
if (fStatus != 0) {
Error("RequestStagingDataSet", "staging request was unsuccessful");
return kFALSE;
}
return kTRUE;
}
Bool_t TProof::CancelStagingDataSet(const char *dataset)
{
if (fProtocol < 36) {
Error("CancelStagingDataSet",
"functionality not supported by the server");
return kFALSE;
}
TMessage mess(kPROOF_DATASETS);
mess << Int_t(kCancelStaging);
mess << TString(dataset);
Broadcast(mess);
Collect();
if (fStatus != 0) {
Error("CancelStagingDataSet", "cancel staging request was unsuccessful");
return kFALSE;
}
return kTRUE;
}
TFileCollection *TProof::GetStagingStatusDataSet(const char *dataset)
{
if (fProtocol < 35) {
Error("GetStagingStatusDataSet",
"functionality not supported by the server");
return NULL;
}
TMessage nameMess(kPROOF_DATASETS);
nameMess << Int_t(kStagingStatus);
nameMess << TString(dataset);
if (Broadcast(nameMess) < 0) {
Error("GetStagingStatusDataSet", "sending request failed");
return NULL;
}
Collect(kActive, fCollectTimeout);
TFileCollection *fc = NULL;
if (fStatus < 0) {
Error("GetStagingStatusDataSet", "problem processing the request");
}
else if (fStatus == 0) {
TMessage *retMess = (TMessage *)fRecvMessages->First();
if (retMess && (retMess->What() == kMESS_OK)) {
fc = (TFileCollection *)(
retMess->ReadObject(TFileCollection::Class()) );
if (!fc)
Error("GetStagingStatusDataSet", "error reading list of files");
}
else {
Error("GetStagingStatusDataSet",
"response message not found or wrong type (%p)", retMess);
}
}
return fc;
}
void TProof::ShowStagingStatusDataSet(const char *dataset, const char *opt)
{
TFileCollection *fc = GetStagingStatusDataSet(dataset);
if (fc) {
fc->Print(opt);
delete fc;
}
}
Int_t TProof::VerifyDataSet(const char *uri, const char *optStr)
{
if (fProtocol < 15) {
Info("VerifyDataSet", "functionality not available: the server has an"
" incompatible version of TFileInfo");
return -1;
}
if (!uri || (uri && strlen(uri) <= 0)) {
Error("VerifyDataSet", "dataset name is is mandatory");
return -1;
}
Int_t nmissingfiles = 0;
TString sopt(optStr);
if (fProtocol < 34 || sopt.Contains("S")) {
sopt.ReplaceAll("S", "");
Info("VerifyDataSet", "Master-only verification");
TMessage nameMess(kPROOF_DATASETS);
nameMess << Int_t(kVerifyDataSet);
nameMess << TString(uri ? uri : "");
nameMess << sopt;
Broadcast(nameMess);
Collect(kActive, fCollectTimeout);
if (fStatus < 0) {
Info("VerifyDataSet", "no such dataset %s", uri);
return -1;
} else
nmissingfiles = fStatus;
return nmissingfiles;
}
if (!IsParallel() && !fDynamicStartup) {
Error("VerifyDataSet", "PROOF is in sequential mode (no workers): cannot do parallel verification.");
Error("VerifyDataSet", "Either start PROOF with some workers or force sequential adding 'S' as option.");
return -1;
}
return VerifyDataSetParallel(uri, optStr);
}
Int_t TProof::VerifyDataSetParallel(const char *uri, const char *optStr)
{
Int_t nmissingfiles = 0;
SetParameter("PROOF_FilesToProcess", Form("dataset:%s", uri));
TString oldpack;
if (TProof::GetParameter(GetInputList(), "PROOF_Packetizer", oldpack) != 0) oldpack = "";
SetParameter("PROOF_Packetizer", "TPacketizerFile");
SetParameter("PROOF_VerifyDataSet", uri);
SetParameter("PROOF_VerifyDataSetOption", optStr);
SetParameter("PROOF_SavePartialResults", (Int_t)0);
Int_t oldifiip = -1;
if (TProof::GetParameter(GetInputList(), "PROOF_IncludeFileInfoInPacket", oldifiip) != 0) oldifiip = -1;
SetParameter("PROOF_IncludeFileInfoInPacket", (Int_t)1);
const char* mss="";
SetParameter("PROOF_MSS", mss);
const char* stageoption="";
SetParameter("PROOF_StageOption", stageoption);
Process("TSelVerifyDataSet", (Long64_t) 1);
if (!oldpack.IsNull())
SetParameter("PROOF_Packetizer", oldpack);
else
DeleteParameters("PROOF_Packetizer");
DeleteParameters("PROOF_FilesToProcess");
DeleteParameters("PROOF_VerifyDataSet");
DeleteParameters("PROOF_VerifyDataSetOption");
DeleteParameters("PROOF_MSS");
DeleteParameters("PROOF_StageOption");
if (oldifiip > -1) {
SetParameter("PROOF_IncludeFileInfoInPacket", oldifiip);
} else {
DeleteParameters("PROOF_IncludeFileInfoInPacket");
}
DeleteParameters("PROOF_SavePartialResults");
Int_t nopened = 0;
Int_t ntouched = 0;
Bool_t changed_ds = kFALSE;
TIter nxtout(GetOutputList());
TObject* obj;
TList *lfiindout = new TList;
while ((obj = nxtout())) {
TList *l = dynamic_cast<TList *>(obj);
if (l && TString(l->GetName()).BeginsWith("PROOF_ListFileInfos_")) {
TIter nxt(l);
TFileInfo *fiindout = 0;
while ((fiindout = (TFileInfo*) nxt())) {
lfiindout->Add(fiindout);
}
}
TParameter<Int_t>* pdisappeared = dynamic_cast<TParameter<Int_t>*>(obj);
if ( pdisappeared && TString(pdisappeared->GetName()).BeginsWith("PROOF_NoFilesDisppeared_")) {
nmissingfiles += pdisappeared->GetVal();
}
TParameter<Int_t>* pnopened = dynamic_cast<TParameter<Int_t>*>(obj);
if (pnopened && TString(pnopened->GetName()).BeginsWith("PROOF_NoFilesOpened_")) {
nopened += pnopened->GetVal();
}
TParameter<Int_t>* pntouched = dynamic_cast<TParameter<Int_t>*>(obj);
if (pntouched && TString(pntouched->GetName()).BeginsWith("PROOF_NoFilesTouched_")) {
ntouched += pntouched->GetVal();
}
TParameter<Bool_t>* pchanged_ds = dynamic_cast<TParameter<Bool_t>*>(obj);
if (pchanged_ds && TString(pchanged_ds->GetName()).BeginsWith("PROOF_DataSetChanged_")) {
if (pchanged_ds->GetVal() == kTRUE) changed_ds = kTRUE;
}
}
Info("VerifyDataSetParallel", "%s: changed? %d (# files opened = %d, # files touched = %d,"
" # missing files = %d)",
uri, changed_ds, nopened, ntouched, nmissingfiles);
return nmissingfiles;
}
TMap *TProof::GetDataSetQuota(const char* optStr)
{
if (IsLite()) {
Info("UploadDataSet", "Lite-session: functionality not implemented");
return (TMap *)0;
}
TMessage mess(kPROOF_DATASETS);
mess << Int_t(kGetQuota);
mess << TString(optStr?optStr:"");
Broadcast(mess);
Collect(kActive, fCollectTimeout);
TMap *groupQuotaMap = 0;
if (fStatus < 0) {
Info("GetDataSetQuota", "could not receive quota");
} else {
TMessage *retMess = (TMessage *) fRecvMessages->First();
if (retMess && retMess->What() == kMESS_OK) {
if (!(groupQuotaMap = (TMap*)(retMess->ReadObject(TMap::Class()))))
Error("GetDataSetQuota", "error getting quotas");
} else
Error("GetDataSetQuota", "message not found or wrong type (%p)", retMess);
}
return groupQuotaMap;
}
void TProof::ShowDataSetQuota(Option_t* opt)
{
if (fProtocol < 15) {
Info("ShowDataSetQuota",
"functionality not available: the server does not have dataset support");
return;
}
if (IsLite()) {
Info("UploadDataSet", "Lite-session: functionality not implemented");
return;
}
TMessage mess(kPROOF_DATASETS);
mess << Int_t(kShowQuota);
mess << TString(opt?opt:"");
Broadcast(mess);
Collect();
if (fStatus != 0)
Error("ShowDataSetQuota", "error receiving quota information");
}
void TProof::InterruptCurrentMonitor()
{
if (fCurrentMonitor)
fCurrentMonitor->Interrupt();
}
Int_t TProof::ActivateWorker(const char *ord, Bool_t save)
{
return ModifyWorkerLists(ord, kTRUE, save);
}
Int_t TProof::DeactivateWorker(const char *ord, Bool_t save)
{
return ModifyWorkerLists(ord, kFALSE, save);
}
Int_t TProof::ModifyWorkerLists(const char *ord, Bool_t add, Bool_t save)
{
if (!ord || strlen(ord) <= 0) {
Info("ModifyWorkerLists",
"an ordinal number - e.g. \"0.4\" or \"*\" for all - is required as input");
return -1;
}
if (gDebug > 0)
Info("ModifyWorkerLists", "ord: '%s' (add: %d, save: %d)", ord, add, save);
if (IsEndMaster()) {
if (!strcmp(ord, "restore")) {
RestoreActiveList();
} else {
if (save) SaveActiveList();
}
}
Bool_t allord = strcmp(ord, "*") ? kFALSE : kTRUE;
if (TestBit(TProof::kIsMaster) && gProofServ) {
if (!allord &&
strncmp(ord, gProofServ->GetOrdinal(), strlen(gProofServ->GetOrdinal())))
return 0;
}
Bool_t fw = kTRUE;
Bool_t rs = kFALSE;
TList *in = (add) ? fInactiveSlaves : fActiveSlaves;
TList *out = (add) ? fActiveSlaves : fInactiveSlaves;
Int_t nwc = 0;
if (IsEndMaster()) {
THashList *ords = 0;
if (!allord) {
ords = new THashList();
TString oo(ord), o;
Int_t from = 0;
while(oo.Tokenize(o, from, ","))
if (o.BeginsWith(gProofServ->GetOrdinal())) ords->Add(new TObjString(o));
}
fw = kFALSE;
TObject *os = 0;
TSlave *wrk = 0;
if (in->GetSize() > 0) {
TIter nxw(in);
while ((wrk = (TSlave *) nxw())) {
os = 0;
if (allord || (ords && (os = ords->FindObject(wrk->GetOrdinal())))) {
if (!out->FindObject(wrk)) {
out->Add(wrk);
if (add)
fActiveMonitor->Add(wrk->GetSocket());
}
in->Remove(wrk);
if (!add) {
fActiveMonitor->Remove(wrk->GetSocket());
wrk->SetStatus(TSlave::kInactive);
} else
wrk->SetStatus(TSlave::kActive);
nwc++;
fw = kFALSE;
rs = kTRUE;
if (!allord && ords) {
if (os) ords->Remove(os);
if (ords->GetSize() == 0) break;
SafeDelete(os);
}
}
}
}
if (!fw && ords && ords->GetSize() > 0) {
TString oo;
TIter nxo(ords);
while ((os = nxo())) {
TIter nxw(out);
while ((wrk = (TSlave *) nxw()))
if (!strcmp(os->GetName(), wrk->GetOrdinal())) break;
if (!wrk) {
if (!oo.IsNull()) oo += ",";
oo += os->GetName();
}
}
if (!oo.IsNull()) {
Warning("ModifyWorkerLists", "worker(s) '%s' not found!", oo.Data());
nwc = -2;
}
}
if (ords) {
ords->Delete();
SafeDelete(ords);
}
}
if (rs)
FindUniqueSlaves();
Int_t action = (add) ? (Int_t) kActivateWorker : (Int_t) kDeactivateWorker;
if (fw) {
if (fProtocol > 32) {
TMessage mess(kPROOF_WORKERLISTS);
mess << action << TString(ord);
Broadcast(mess);
Collect(kActive, fCollectTimeout);
if (fStatus != 0) {
nwc = (fStatus < nwc) ? fStatus : nwc;
if (fStatus == -2) {
if (gDebug > 0)
Warning("ModifyWorkerLists", "request not completely full filled");
} else {
Error("ModifyWorkerLists", "request failed");
}
}
} else {
TString oo(ord), o;
if (oo.Contains(","))
Warning("ModifyWorkerLists", "block request not supported by server: splitting into pieces ...");
Int_t from = 0;
while(oo.Tokenize(o, from, ",")) {
TMessage mess(kPROOF_WORKERLISTS);
mess << action << o;
Broadcast(mess);
Collect(kActive, fCollectTimeout);
}
}
}
return nwc;
}
void TProof::SaveActiveList()
{
if (!fActiveSlavesSaved.IsNull()) fActiveSlavesSaved = "";
if (fInactiveSlaves->GetSize() == 0) {
fActiveSlavesSaved = "*";
} else {
TIter nxw(fActiveSlaves);
TSlave *wk = 0;
while ((wk = (TSlave *)nxw())) { fActiveSlavesSaved += TString::Format("%s,", wk->GetOrdinal()); }
}
}
void TProof::RestoreActiveList()
{
DeactivateWorker("*", kFALSE);
if (!fActiveSlavesSaved.IsNull())
ActivateWorker(fActiveSlavesSaved, kFALSE);
}
TProof *TProof::Open(const char *cluster, const char *conffile,
const char *confdir, Int_t loglevel)
{
const char *pn = "TProof::Open";
if (!cluster) {
TPluginManager *pm = gROOT->GetPluginManager();
if (!pm) {
::Error(pn, "plugin manager not found");
return 0;
}
if (gROOT->IsBatch()) {
::Error(pn, "we are in batch mode, cannot show PROOF Session Viewer");
return 0;
}
TPluginHandler *sv = pm->FindHandler("TSessionViewer", "");
if (!sv) {
::Error(pn, "no plugin found for TSessionViewer");
return 0;
}
if (sv->LoadPlugin() == -1) {
::Error(pn, "plugin for TSessionViewer could not be loaded");
return 0;
}
sv->ExecPlugin(0);
return 0;
} else {
TString clst(cluster);
if (PoDCheckUrl( &clst ) < 0) return 0;
if (clst.BeginsWith("workers=")) clst.Insert(0, "lite:///?");
if (clst.BeginsWith("tunnel=")) clst.Insert(0, "/?");
TUrl u(clst);
TString opts(u.GetOptions());
if (!opts.IsNull()) {
Int_t it = opts.Index("tunnel=");
if (it != kNPOS) {
TString sport = opts(it + strlen("tunnel="), opts.Length());
TString host("127.0.0.1");
Int_t port = -1;
Int_t ic = sport.Index(":");
if (ic != kNPOS) {
host = sport(0, ic);
sport.Remove(0, ic + 1);
}
if (!sport.IsDigit()) {
TRegexp re("[^0-9]");
Int_t ind = sport.Index(re);
if (ind != kNPOS)
sport.Remove(ind);
}
if (sport.IsDigit())
port = sport.Atoi();
if (port > 0) {
::Info("TProof::Open","using tunnel at %s:%d", host.Data(), port);
gEnv->SetValue("XNet.SOCKS4Host", host);
gEnv->SetValue("XNet.SOCKS4Port", port);
} else {
::Warning("TProof::Open",
"problems parsing tunnelling info from options: %s", opts.Data());
}
}
}
Int_t locid = -1;
Bool_t create = kFALSE;
if (opts.Length() > 0) {
if (opts.BeginsWith("N",TString::kIgnoreCase)) {
create = kTRUE;
opts.Remove(0,1);
u.SetOptions(opts);
} else if (opts.IsDigit()) {
locid = opts.Atoi();
}
}
TProofMgr *mgr = TProofMgr::Create(u.GetUrl());
TProof *proof = 0;
if (mgr && mgr->IsValid()) {
Bool_t attach = (create || mgr->IsProofd() || mgr->IsLite()) ? kFALSE : kTRUE;
if (attach) {
TProofDesc *d = 0;
if (locid < 0)
d = (TProofDesc *) mgr->QuerySessions("")->First();
else
d = (TProofDesc *) mgr->GetProofDesc(locid);
if (d) {
proof = (TProof*) mgr->AttachSession(d);
if (!proof || !proof->IsValid()) {
if (locid)
::Error(pn, "new session could not be attached");
SafeDelete(proof);
}
}
}
if (!proof) {
proof = (TProof*) mgr->CreateSession(conffile, confdir, loglevel);
if (!proof || !proof->IsValid()) {
::Error(pn, "new session could not be created");
SafeDelete(proof);
}
}
}
return proof;
}
}
TProofMgr *TProof::Mgr(const char *url)
{
if (!url)
return (TProofMgr *)0;
return TProofMgr::Create(url);
}
void TProof::Reset(const char *url, Bool_t hard)
{
if (url) {
TProofMgr *mgr = TProof::Mgr(url);
if (mgr && mgr->IsValid())
mgr->Reset(hard);
else
::Error("TProof::Reset",
"unable to initialize a valid manager instance");
}
}
const TList *TProof::GetEnvVars()
{
return fgProofEnvList;
}
void TProof::AddEnvVar(const char *name, const char *value)
{
if (gDebug > 0) ::Info("TProof::AddEnvVar","%s=%s", name, value);
if (fgProofEnvList == 0) {
fgProofEnvList = new TList;
fgProofEnvList->SetOwner();
} else {
TObject *o = fgProofEnvList->FindObject(name);
if (o != 0) {
fgProofEnvList->Remove(o);
}
}
fgProofEnvList->Add(new TNamed(name, value));
}
void TProof::DelEnvVar(const char *name)
{
if (fgProofEnvList == 0) return;
TObject *o = fgProofEnvList->FindObject(name);
if (o != 0) {
fgProofEnvList->Remove(o);
}
}
void TProof::ResetEnvVars()
{
if (fgProofEnvList == 0) return;
SafeDelete(fgProofEnvList);
}
void TProof::SaveWorkerInfo()
{
if (TestBit(TProof::kIsClient))
return;
if (!gProofServ) {
Error("SaveWorkerInfo","gProofServ undefined");
return;
}
if (!fSlaves && !fBadSlaves) {
Warning("SaveWorkerInfo","all relevant worker lists is undefined");
return;
}
TString fnwrk = TString::Format("%s/.workers",
gSystem->DirName(gProofServ->GetSessionDir()));
FILE *fwrk = fopen(fnwrk.Data(),"w");
if (!fwrk) {
Error("SaveWorkerInfo",
"cannot open %s for writing (errno: %d)", fnwrk.Data(), errno);
return;
}
TString addlogext;
TString addLogTag;
if (gSystem->Getenv("PROOF_ADDITIONALLOG")) {
addlogext = gSystem->Getenv("PROOF_ADDITIONALLOG");
TPMERegexp reLogTag("^__(.*)__\\.log");
if (reLogTag.Match(addlogext) == 2) {
addLogTag = reLogTag[1];
}
else {
addLogTag = "+++";
}
if (gDebug > 0)
Info("SaveWorkerInfo", "request for additional line with ext: '%s'", addlogext.Data());
}
TPMERegexp re("(.*?)-[0-9]+-[0-9]+$");
TIter nxa(fSlaves);
TSlave *wrk = 0;
TString logfile;
while ((wrk = (TSlave *) nxa())) {
Int_t status = (fBadSlaves && fBadSlaves->FindObject(wrk)) ? 0 : 1;
logfile = wrk->GetWorkDir();
if (re.Match(logfile) == 2) logfile = re[1];
else continue;
fprintf(fwrk,"%s@%s:%d %d %s %s.log\n",
wrk->GetUser(), wrk->GetName(), wrk->GetPort(), status,
wrk->GetOrdinal(), logfile.Data());
if (addlogext.Length() > 0) {
fprintf(fwrk,"%s@%s:%d %d %s(%s) %s.%s\n",
wrk->GetUser(), wrk->GetName(), wrk->GetPort(), status,
wrk->GetOrdinal(), addLogTag.Data(), logfile.Data(), addlogext.Data());
}
}
TIter nxb(fBadSlaves);
while ((wrk = (TSlave *) nxb())) {
logfile = wrk->GetWorkDir();
if (re.Match(logfile) == 2) logfile = re[1];
else continue;
if (!fSlaves->FindObject(wrk)) {
fprintf(fwrk,"%s@%s:%d 0 %s %s.log\n",
wrk->GetUser(), wrk->GetName(), wrk->GetPort(),
wrk->GetOrdinal(), logfile.Data());
}
}
TIter nxt(fTerminatedSlaveInfos);
TSlaveInfo *sli;
while (( sli = (TSlaveInfo *)nxt() )) {
logfile = sli->GetDataDir();
if (re.Match(logfile) == 2) logfile = re[1];
else continue;
fprintf(fwrk, "%s 2 %s %s.log\n",
sli->GetName(), sli->GetOrdinal(), logfile.Data());
if (addlogext.Length() > 0) {
fprintf(fwrk, "%s 2 %s(%s) %s.%s\n",
sli->GetName(), sli->GetOrdinal(), addLogTag.Data(),
logfile.Data(), addlogext.Data());
}
}
fclose(fwrk);
return;
}
Int_t TProof::GetParameter(TCollection *c, const char *par, TString &value)
{
TObject *obj = c ? c->FindObject(par) : (TObject *)0;
if (obj) {
TNamed *p = dynamic_cast<TNamed*>(obj);
if (p) {
value = p->GetTitle();
return 0;
}
}
return -1;
}
Int_t TProof::GetParameter(TCollection *c, const char *par, Int_t &value)
{
TObject *obj = c ? c->FindObject(par) : (TObject *)0;
if (obj) {
TParameter<Int_t> *p = dynamic_cast<TParameter<Int_t>*>(obj);
if (p) {
value = p->GetVal();
return 0;
}
}
return -1;
}
Int_t TProof::GetParameter(TCollection *c, const char *par, Long_t &value)
{
TObject *obj = c ? c->FindObject(par) : (TObject *)0;
if (obj) {
TParameter<Long_t> *p = dynamic_cast<TParameter<Long_t>*>(obj);
if (p) {
value = p->GetVal();
return 0;
}
}
return -1;
}
Int_t TProof::GetParameter(TCollection *c, const char *par, Long64_t &value)
{
TObject *obj = c ? c->FindObject(par) : (TObject *)0;
if (obj) {
TParameter<Long64_t> *p = dynamic_cast<TParameter<Long64_t>*>(obj);
if (p) {
value = p->GetVal();
return 0;
}
}
return -1;
}
Int_t TProof::GetParameter(TCollection *c, const char *par, Double_t &value)
{
TObject *obj = c ? c->FindObject(par) : (TObject *)0;
if (obj) {
TParameter<Double_t> *p = dynamic_cast<TParameter<Double_t>*>(obj);
if (p) {
value = p->GetVal();
return 0;
}
}
return -1;
}
Int_t TProof::AssertDataSet(TDSet *dset, TList *input,
TDataSetManager *mgr, TString &emsg)
{
emsg = "";
if (!dset || !input || !mgr) {
emsg.Form("invalid inputs (%p, %p, %p)", dset, input, mgr);
return -1;
}
TList *datasets = new TList;
TFileCollection *dataset = 0;
TString lookupopt;
TString dsname(dset->GetName());
if (dsname.BeginsWith("TFileCollection:")) {
dsname.ReplaceAll("TFileCollection:", "");
dataset = (TFileCollection *) input->FindObject(dsname);
if (!dataset) {
emsg.Form("TFileCollection %s not found in input list", dset->GetName());
return -1;
}
input->RecursiveRemove(dataset);
datasets->Add(new TPair(dataset, new TObjString("")));
if (TProof::GetParameter(input, "PROOF_LookupOpt", lookupopt) != 0) {
lookupopt = gEnv->GetValue("Proof.LookupOpt", "all");
input->Add(new TNamed("PROOF_LookupOpt", lookupopt.Data()));
}
}
TString dsnparse;
if (!dataset) {
TString dsns( dsname.Data() ), enl;
Ssiz_t eli = dsns.Index("?enl=");
TFileCollection *fc;
if (eli != kNPOS) {
enl = dsns(eli+5, dsns.Length());
dsns.Remove(eli, dsns.Length()-eli);
}
Bool_t validEnl = ((enl.Index("|") == kNPOS) &&
(enl.Index(",") == kNPOS) && (enl.Index(" ") == kNPOS));
if (validEnl && (( fc = mgr->GetDataSet(dsns) ))) {
TIter nxfi(fc->GetList());
TFileInfo *fi;
while (( fi = (TFileInfo *)nxfi() ))
fi->SetTitle(dsns.Data());
dataset = fc;
dsnparse = dsns;
datasets->Add( new TPair(dataset, new TObjString( enl.Data() )) );
}
else {
dsns = dsname.Data();
TString dsn1;
Int_t from1 = 0;
while (dsns.Tokenize(dsn1, from1, "[, ]")) {
TString dsn2;
Int_t from2 = 0;
while (dsn1.Tokenize(dsn2, from2, "|")) {
enl = "";
Int_t ienl = dsn2.Index("?enl=");
if (ienl != kNPOS) {
enl = dsn2(ienl + 5, dsn2.Length());
dsn2.Remove(ienl);
}
if ((fc = mgr->GetDataSet(dsn2.Data()))) {
TIter nxfi(fc->GetList());
TFileInfo *fi;
while ((fi = (TFileInfo *) nxfi())) { fi->SetTitle(dsn2.Data()); }
dsnparse = dsn2;
if (!dataset) {
dataset = fc;
} else {
dataset->Add(fc);
SafeDelete(fc);
}
}
}
if (dataset) {
if (dataset->GetList()->First())
((TFileInfo *)(dataset->GetList()->First()))->SetTitle(dsn1.Data());
datasets->Add(new TPair(dataset, new TObjString(enl.Data())));
}
dataset = 0;
}
}
if (!datasets || datasets->GetSize() <= 0) {
emsg.Form("no dataset(s) found on the master corresponding to: %s", dsname.Data());
return -1;
} else {
if (!(dataset = (TFileCollection *) ((TPair *)(datasets->First()))->Key())) {
emsg.Form("dataset pointer is null: corruption? - aborting");
return -1;
}
}
if (TProof::GetParameter(input, "PROOF_LookupOpt", lookupopt) != 0) {
lookupopt = gEnv->GetValue("Proof.LookupOpt", "stagedOnly");
input->Add(new TNamed("PROOF_LookupOpt", lookupopt.Data()));
}
} else {
dsnparse = dsname;
}
TString dsTree;
mgr->ParseUri(dsnparse.Data(), 0, 0, 0, &dsTree);
if (dsTree.IsNull()) {
dsTree += dset->GetDirectory();
dsTree += dset->GetObjName();
}
if (!dsTree.IsNull() && dsTree != "/") {
TString tree(dsTree);
Int_t idx = tree.Index("/");
if (idx != kNPOS) {
TString dir = tree(0, idx+1);
tree.Remove(0, idx);
dset->SetDirectory(dir);
}
dset->SetObjName(tree);
} else {
dsTree = dataset->GetDefaultTreeName();
}
TList *srvmapsref = TDataSetManager::GetDataSetSrvMaps();
TList *srvmapslist = srvmapsref;
TString srvmaps;
if (TProof::GetParameter(input, "PROOF_DataSetSrvMaps", srvmaps) == 0) {
srvmapslist = TDataSetManager::ParseDataSetSrvMaps(srvmaps);
if (gProofServ) {
TString msg;
if (srvmapsref && !srvmapslist) {
msg.Form("+++ Info: dataset server mapping(s) DISABLED by user");
} else if (srvmapsref && srvmapslist && srvmapslist != srvmapsref) {
msg.Form("+++ Info: dataset server mapping(s) modified by user");
} else if (!srvmapsref && srvmapslist) {
msg.Form("+++ Info: dataset server mapping(s) added by user");
}
gProofServ->SendAsynMessage(msg.Data());
}
}
if (datasets->GetSize() > 1) dset->SetBit(TDSet::kMultiDSet);
TList *listOfMissingFiles = new TList;
TEntryList *entrylist = 0;
TPair *pair = 0;
TIter nxds(datasets);
while ((pair = (TPair *) nxds())) {
dataset = (TFileCollection *) pair->Key();
TEntryList *enl = 0;
TObjString *os = (TObjString *) pair->Value();
if (strlen(os->GetName())) {
if (!(enl = dynamic_cast<TEntryList *>(input->FindObject(os->GetName())))) {
if (gProofServ)
gProofServ->SendAsynMessage(TString::Format("+++ Warning:"
" entry list %s not found", os->GetName()));
}
if (enl && (!(enl->GetLists()) || enl->GetLists()->GetSize() <= 0)) {
if (gProofServ)
gProofServ->SendAsynMessage(TString::Format("+++ Warning:"
" no sub-lists in entry-list!"));
}
}
TList *missingFiles = new TList;
TSeqCollection* files = dataset->GetList();
if (gDebug > 0) files->Print();
Bool_t availableOnly = (lookupopt != "all") ? kTRUE : kFALSE;
if (dset->TestBit(TDSet::kMultiDSet)) {
TDSet *ds = new TDSet(dataset->GetName(), dset->GetObjName(), dset->GetDirectory());
ds->SetSrvMaps(srvmapslist);
if (!ds->Add(files, dsTree, availableOnly, missingFiles)) {
emsg.Form("error integrating dataset %s", dataset->GetName());
continue;
}
dset->Add(ds);
if (enl) ds->SetEntryList(enl);
} else {
dset->SetSrvMaps(srvmapslist);
if (!dset->Add(files, dsTree, availableOnly, missingFiles)) {
emsg.Form("error integrating dataset %s", dataset->GetName());
continue;
}
if (enl) entrylist = enl;
}
if (missingFiles) {
TIter next(missingFiles);
TObject *file;
while ((file = next())) {
dataset->GetList()->Remove(file);
listOfMissingFiles->Add(file);
}
missingFiles->SetOwner(kFALSE);
missingFiles->Clear();
}
SafeDelete(missingFiles);
}
nxds.Reset();
while ((pair = (TPair *) nxds())) {
if (pair->Key()) delete pair->Key();
if (pair->Value()) delete pair->Value();
}
datasets->SetOwner(kTRUE);
SafeDelete(datasets);
if (srvmapslist && srvmapslist != srvmapsref) {
srvmapslist->SetOwner(kTRUE);
SafeDelete(srvmapslist);
}
if (entrylist) dset->SetEntryList(entrylist);
if (listOfMissingFiles && listOfMissingFiles->GetSize() > 0) {
listOfMissingFiles->SetName("MissingFiles");
input->Add(listOfMissingFiles);
}
return 0;
}
Int_t TProof::SaveInputData(TQueryResult *qr, const char *cachedir, TString &emsg)
{
TList *input = 0;
if (!qr || !(input = qr->GetInputList()) ||
!cachedir || strlen(cachedir) <= 0) return 0;
TNamed *data = (TNamed *) input->FindObject("PROOF_InputDataFile");
TList *inputdata = (TList *) input->FindObject("PROOF_InputData");
if (!data && !inputdata) return 0;
if (!data)
input->Add((data = new TNamed("PROOF_InputDataFile", kPROOF_InputDataFile)));
TString dstname(data->GetTitle()), srcname;
Bool_t fromcache = kFALSE;
if (dstname.BeginsWith("cache:")) {
fromcache = kTRUE;
dstname.ReplaceAll("cache:", "");
srcname.Form("%s/%s", cachedir, dstname.Data());
if (gSystem->AccessPathName(srcname)) {
emsg.Form("input data file not found in cache (%s)", srcname.Data());
return -1;
}
}
if (fromcache) {
if (gSystem->CopyFile(srcname, dstname, kTRUE) != 0) {
emsg.Form("problems copying %s to %s", srcname.Data(), dstname.Data());
return -1;
}
} else {
if (inputdata && inputdata->GetSize() > 0) {
TFile *f = TFile::Open(dstname.Data(), "RECREATE");
if (f) {
f->cd();
inputdata->Write();
f->Close();
delete f;
} else {
emsg.Form("could not create %s", dstname.Data());
return -1;
}
} else {
emsg.Form("no input data!");
return -1;
}
}
::Info("TProof::SaveInputData", "input data saved to %s", dstname.Data());
data->SetTitle(dstname);
if (inputdata) {
input->Remove(inputdata);
inputdata->SetOwner();
delete inputdata;
}
return 0;
}
Int_t TProof::SendInputData(TQueryResult *qr, TProof *p, TString &emsg)
{
TList *input = 0;
if (!qr || !(input = qr->GetInputList())) return 0;
TNamed *inputdata = (TNamed *) input->FindObject("PROOF_InputDataFile");
if (!inputdata) return 0;
TString fname(inputdata->GetTitle());
if (gSystem->AccessPathName(fname)) {
emsg.Form("input data file not found in sandbox (%s)", fname.Data());
return -1;
}
if (!p || !p->IsValid()) {
emsg.Form("TProof object undefined or invalid: protocol error!");
return -1;
}
p->BroadcastFile(fname, TProof::kBinary, "cache");
return 0;
}
Int_t TProof::GetInputData(TList *input, const char *cachedir, TString &emsg)
{
if (!input || !cachedir || strlen(cachedir) <= 0) return 0;
TNamed *inputdata = (TNamed *) input->FindObject("PROOF_InputDataFile");
if (!inputdata) return 0;
TString fname;
fname.Form("%s/%s", cachedir, inputdata->GetTitle());
if (gSystem->AccessPathName(fname)) {
emsg.Form("input data file not found in cache (%s)", fname.Data());
return -1;
}
TList *added = new TList;
added->SetName("PROOF_InputObjsFromFile");
TFile *f = TFile::Open(fname.Data());
if (f) {
TList *keys = (TList *) f->GetListOfKeys();
if (!keys) {
emsg.Form("could not get list of object keys from file");
return -1;
}
TIter nxk(keys);
TKey *k = 0;
while ((k = (TKey *)nxk())) {
TObject *o = f->Get(k->GetName());
if (o) {
input->Add(o);
added->Add(o);
}
}
if (added->GetSize() > 0) {
added->Add(f);
input->Add(added);
} else {
f->Close();
delete f;
}
} else {
emsg.Form("could not open %s", fname.Data());
return -1;
}
return 0;
}
void TProof::LogViewer(const char *url, Int_t idx)
{
if (!gROOT->IsBatch()) {
if (!fgLogViewer) {
if ((fgLogViewer =
gROOT->GetPluginManager()->FindHandler("TProofProgressLog"))) {
if (fgLogViewer->LoadPlugin() == -1) {
fgLogViewer = 0;
::Error("TProof::LogViewer", "cannot load the relevant plug-in");
return;
}
}
}
if (fgLogViewer) {
TString u = (url && strlen(url) <= 0) ? "lite" : url;
fgLogViewer->ExecPlugin(2, u.Data(), idx);
}
} else {
if (url && strlen(url) > 0) {
::Info("TProof::LogViewer",
"batch mode: use TProofLog *pl = TProof::Mgr(\"%s\")->GetSessionLogs(%d)", url, idx);
} else if (url && strlen(url) <= 0) {
::Info("TProof::LogViewer",
"batch mode: use TProofLog *pl = TProof::Mgr(\"lite\")->GetSessionLogs(%d)", idx);
} else {
::Info("TProof::LogViewer",
"batch mode: use TProofLog *pl = TProof::Mgr(\"<master>\")->GetSessionLogs(%d)", idx);
}
}
return;
}
void TProof::SetProgressDialog(Bool_t on)
{
if (on)
SetBit(kUseProgressDialog);
else
ResetBit(kUseProgressDialog);
}
void TProof::ShowMissingFiles(TQueryResult *qr)
{
TQueryResult *xqr = (qr) ? qr : GetQueryResult();
if (!xqr) {
Warning("ShowMissingFiles", "no (last) query found: do nothing");
return;
}
TList *missing = (xqr->GetOutputList()) ? (TList *) xqr->GetOutputList()->FindObject("MissingFiles") : 0;
if (!missing) {
Info("ShowMissingFiles", "no files missing in query %s:%s", xqr->GetTitle(), xqr->GetName());
return;
}
Int_t nmf = 0, ncf = 0;
Long64_t msz = 0, mszzip = 0, mev = 0;
TFileInfo *fi = 0;
TIter nxf(missing);
while ((fi = (TFileInfo *) nxf())) {
char status = 'M';
if (fi->TestBit(TFileInfo::kCorrupted)) {
ncf++;
status = 'C';
} else {
nmf++;
}
TFileInfoMeta *im = fi->GetMetaData();
if (im) {
if (im->GetTotBytes() > 0) msz += im->GetTotBytes();
if (im->GetZipBytes() > 0) mszzip += im->GetZipBytes();
mev += im->GetEntries();
Printf(" %d. (%c) %s %s %lld", ncf+nmf, status, fi->GetCurrentUrl()->GetUrl(), im->GetName(), im->GetEntries());
} else {
Printf(" %d. (%c) %s '' -1", ncf+nmf, status, fi->GetCurrentUrl()->GetUrl());
}
}
if (msz <= 0) msz = -1;
if (mszzip <= 0) mszzip = -1;
Double_t xf = (Double_t)mev / (mev + xqr->GetEntries()) ;
if (msz > 0. || mszzip > 0.) {
Printf(" +++ %d file(s) missing, %d corrupted, i.e. %lld unprocessed events -->"
" about %.2f%% of the total (%lld bytes, %lld zipped)",
nmf, ncf, mev, xf * 100., msz, mszzip);
} else {
Printf(" +++ %d file(s) missing, %d corrupted, i.e. %lld unprocessed events -->"
" about %.2f%% of the total", nmf, ncf, mev, xf * 100.);
}
}
TFileCollection *TProof::GetMissingFiles(TQueryResult *qr)
{
TFileCollection *fc = 0;
TQueryResult *xqr = (qr) ? qr : GetQueryResult();
if (!xqr) {
Warning("GetMissingFiles", "no (last) query found: do nothing");
return fc;
}
TList *missing = (xqr->GetOutputList()) ? (TList *) xqr->GetOutputList()->FindObject("MissingFiles") : 0;
if (!missing) {
if (gDebug > 0)
Info("ShowMissingFiles", "no files missing in query %s:%s", xqr->GetTitle(), xqr->GetName());
return fc;
}
TString fcname("unknown");
TDSet *ds = (TDSet *) xqr->GetInputObject("TDSet");
if (ds) {
fcname.Form("%s.m0", ds->GetName());
Int_t j = 1;
while (gDirectory->FindObject(fcname) && j < 1000)
fcname.Form("%s.m%d", ds->GetName(), j++);
}
fc = new TFileCollection(fcname, "Missing Files");
if (ds) fc->SetDefaultTreeName(ds->GetObjName());
TFileInfo *fi = 0;
TIter nxf(missing);
while ((fi = (TFileInfo *) nxf())) {
fc->Add((TFileInfo *) fi->Clone());
}
fc->Update();
return fc;
}
void TProof::SetPerfTree(const char *pf, Bool_t withWrks)
{
if (pf && strlen(pf) > 0) {
fPerfTree = pf;
SetParameter("PROOF_StatsHist", "");
SetParameter("PROOF_StatsTrace", "");
if (withWrks) SetParameter("PROOF_SlaveStatsTrace", "");
Info("SetPerfTree", "saving of the performance tree enabled (%s)", fPerfTree.Data());
} else {
fPerfTree = "";
DeleteParameters("PROOF_StatsHist");
DeleteParameters("PROOF_StatsTrace");
DeleteParameters("PROOF_SlaveStatsTrace");
Info("SetPerfTree", "saving of the performance tree disabled");
}
}
Int_t TProof::SavePerfTree(const char *pf, const char *ref)
{
if (!IsValid()) {
Error("SafePerfTree", "this TProof instance is invalid!");
return -1;
}
TList *outls = GetOutputList();
TString sref;
if (ref && strlen(ref) > 0) {
if (!fPlayer) {
Error("SafePerfTree", "requested to use query '%s' but player instance undefined!", ref);
return -1;
}
TQueryResult *qr = fPlayer->GetQueryResult(ref);
if (!qr) {
Error("SafePerfTree", "TQueryResult instance for query '%s' could not be retrieved", ref);
return -1;
}
outls = qr->GetOutputList();
sref.Form(" for requested query '%s'", ref);
}
if (!outls || (outls && outls->GetSize() <= 0)) {
Error("SafePerfTree", "outputlist%s undefined or empty", sref.Data());
return -1;
}
TString fn = fPerfTree;
if (pf && strlen(pf)) fn = pf;
if (fn.IsNull()) fn = "perftree.root";
TFile f(fn, "RECREATE");
if (f.IsZombie()) {
Error("SavePerfTree", "could not open file '%s' for writing", fn.Data());
} else {
f.cd();
TIter nxo(outls);
TObject* obj = 0;
while ((obj = nxo())) {
TString objname(obj->GetName());
if (objname.BeginsWith("PROOF_")) {
if (objname == "PROOF_PerfStats" ||
objname == "PROOF_PacketsHist" ||
objname == "PROOF_EventsHist" ||
objname == "PROOF_NodeHist" ||
objname == "PROOF_LatencyHist" ||
objname == "PROOF_ProcTimeHist" ||
objname == "PROOF_CpuTimeHist")
obj->Write();
}
}
f.Close();
}
Info("SavePerfTree", "performance information%s saved in %s ...", sref.Data(), fn.Data());
return 0;
}