]> git.uio.no Git - u/mrichter/AliRoot.git/blobdiff - SHUTTLE/AliShuttleTrigger.cxx
dcs timeout and number of retrievals set in the configuration instead of in AliShuttl...
[u/mrichter/AliRoot.git] / SHUTTLE / AliShuttleTrigger.cxx
index 9f8f778cfd84f431595622668037993d780210c4..d53ae7207e9906510999b371dccb890dfdfaaf9e 100644 (file)
 
 /*
  $Log$
+ Revision 1.15  2007/12/10 18:29:23  acolla
+ Some log added to the listen mode
+
+ Revision 1.14  2007/12/07 19:14:36  acolla
+ in AliShuttleTrigger:
+
+ Added automatic collection of new runs on a regular time basis (settable from the configuration)
+
+ in AliShuttleConfig: new members
+
+ - triggerWait: time to wait for DIM trigger (s) before starting automatic collection of new runs
+ - mode: run mode (test, prod) -> used to build log folder (logs or logs_PROD)
+
+ in AliShuttle:
+
+ - logs now stored in logs/#RUN/DET_#RUN.log
+
+ Revision 1.13  2006/11/16 16:16:48  jgrosseo
+ introducing strict run ordering flag
+ removed giving preprocessor name to preprocessor, they have to know their name themselves ;-)
+
+ Revision 1.12  2006/10/20 15:22:59  jgrosseo
+ o) Adding time out to the execution of the preprocessors: The Shuttle forks and the parent process monitors the child
+ o) Merging Collect, CollectAll, CollectNew function
+ o) Removing implementation of empty copy constructors (declaration still there!)
+
+ Revision 1.11  2006/10/02 16:38:39  jgrosseo
+ update (alberto):
+ fixed memory leaks
+ storing of objects that failed to be stored to the grid before
+ interfacing of shuttle status table in daq system
+
+ Revision 1.10  2006/08/15 10:50:00  jgrosseo
+ effc++ corrections (alberto)
+
+ Revision 1.9  2006/08/08 14:19:29  jgrosseo
+ Update to shuttle classes (Alberto)
+
+ - Possibility to set the full object's path in the Preprocessor's and
+ Shuttle's  Store functions
+ - Possibility to extend the object's run validity in the same classes
+ ("startValidity" and "validityInfinite" parameters)
+ - Implementation of the StoreReferenceData function to store reference
+ data in a dedicated CDB storage.
+
+ Revision 1.8  2006/07/21 07:37:20  jgrosseo
+ last run is stored after each run
+
+ Revision 1.7  2006/07/20 09:54:40  jgrosseo
+ introducing status management: The processing per subdetector is divided into several steps,
+ after each step the status is stored on disk. If the system crashes in any of the steps the Shuttle
+ can keep track of the number of failures and skips further processing after a certain threshold is
+ exceeded. These thresholds can be configured in LDAP.
+
+ Revision 1.6  2006/07/19 10:09:55  jgrosseo
+ new configuration, accesst to DAQ FES (Alberto)
+
+ Revision 1.5  2006/07/10 13:01:41  jgrosseo
+ enhanced storing of last sucessfully processed run (alberto)
+
  Revision 1.4  2006/07/04 14:59:57  jgrosseo
  revision of AliDCSValue: Removed wrapper classes, reduced storage size per value by factor 2
 
 // 
 // This class is to deal with DAQ LogBook and DAQ "end of run" notification.
 // It has two modes:
-//     1) syncrhnized - Collect(), CollectNew() and CollectAll methods
+//     1) synchronized - Collect()
 //     2) asynchronized - Run() - starts listening for DAQ "end of run"
 //             notification by DIM service.
 //
 
 #include "AliShuttleTrigger.h"
 
-#include <TSQLServer.h>
-#include <TSQLResult.h>
-#include <TSQLRow.h>
-#include <TObjArray.h>
 #include <TSystem.h>
 
 #include "AliLog.h"
-#include "AliCDBManager.h"
-#include "AliCDBStorage.h"
-#include "AliCDBEntry.h"
-
-#include "AliDCSValue.h"
 #include "AliShuttleConfig.h"
 #include "AliShuttle.h"
 #include "DATENotifier.h"
 
 ClassImp(TerminateSignalHandler)
-
-//______________________________________________________________________
-TerminateSignalHandler::TerminateSignalHandler(const TerminateSignalHandler& /*other*/):
-TSignalHandler()
-{
-// copy constructor (not implemented)
-
-}
-
-//______________________________________________________________________
-TerminateSignalHandler &TerminateSignalHandler::operator=(const TerminateSignalHandler& /*other*/)
-{
-// assignment operator (not implemented)
-
-return *this;
-}
+ClassImp(AliShuttleTrigger)
 
 //______________________________________________________________________________________________
-Bool_t TerminateSignalHandler::Notify() 
+Bool_t TerminateSignalHandler::Notify()
 {
 // Send terminate command to the Shuttle trigger
 
@@ -93,17 +129,12 @@ Bool_t TerminateSignalHandler::Notify()
 }
 
 //______________________________________________________________________________________________
-//______________________________________________________________________________________________
-
-ClassImp(AliShuttleTrigger)
-
-//______________________________________________________________________________________________
-AliShuttleTrigger::AliShuttleTrigger(const AliShuttleConfig* config,
-               UInt_t timeout, Int_t retries):
+AliShuttleTrigger::AliShuttleTrigger(const AliShuttleConfig* config):
        fConfig(config), fShuttle(NULL),
-       fNotified(kFALSE), fTerminate(kFALSE), fCondition(&fMutex),
-       fQuitSignalHandler(this, kSigQuit), 
-       fInterruptSignalHandler(this, kSigInterrupt)
+       fNotified(kFALSE), fTerminate(kFALSE),
+       fMutex(), fCondition(&fMutex),
+       fQuitSignalHandler(0),
+       fInterruptSignalHandler(0)
 {
        //
        // config - pointer to the AliShuttleConfig object which represents
@@ -112,49 +143,40 @@ AliShuttleTrigger::AliShuttleTrigger(const AliShuttleConfig* config,
        // localStorage (local) CDB storage to be used if mainStorage is unavailable
        //
 
+       if (!fConfig->IsValid()) AliFatal("********** !!!!! Invalid configuration !!!!! **********");
+       UInt_t timeout = fConfig->GetDCSTimeOut();
+       Int_t retries = fConfig->GetDCSRetries();
        fShuttle = new AliShuttle(config, timeout, retries);
 
-       gSystem->AddSignalHandler(&fQuitSignalHandler);
-       gSystem->AddSignalHandler(&fInterruptSignalHandler);
-}
-
+       // Assign the member pointers instead of declaring same-named locals:
+       // the destructor unregisters and deletes the handlers through the members,
+       // so shadowing them here would leave the members at 0 and leak the handlers.
+       fQuitSignalHandler = new TerminateSignalHandler(this, kSigQuit);
+       fInterruptSignalHandler = new TerminateSignalHandler(this, kSigInterrupt);
 
-
-//______________________________________________________________________
-AliShuttleTrigger::AliShuttleTrigger(const AliShuttleTrigger& /*other*/):
-TObject()
-{
-// copy constructor (not implemented)
+       gSystem->AddSignalHandler(fQuitSignalHandler);
+       gSystem->AddSignalHandler(fInterruptSignalHandler);
 
 }
 
-//______________________________________________________________________
-AliShuttleTrigger &AliShuttleTrigger::operator=(const AliShuttleTrigger& /*other*/)
-{
-// assignment operator (not implemented)
-
-return *this;
-}
-
-
-
-
-
 //______________________________________________________________________________________________
 AliShuttleTrigger::~AliShuttleTrigger() 
 {
-// destructor
+  // Destructor: unregisters both signal handlers from gSystem, then deletes the shuttle and the two handlers.
 
-       gSystem->RemoveSignalHandler(&fQuitSignalHandler);
-       gSystem->RemoveSignalHandler(&fInterruptSignalHandler);
+       gSystem->RemoveSignalHandler(fQuitSignalHandler);
+       gSystem->RemoveSignalHandler(fInterruptSignalHandler);
 
        delete fShuttle;
+
+  delete fQuitSignalHandler;
+  fQuitSignalHandler = 0;
+
+  delete fInterruptSignalHandler;
+  fInterruptSignalHandler = 0;
 }
 
 //______________________________________________________________________________________________
 Bool_t AliShuttleTrigger::Notify() {
        //
-       // Trigger CollectNew() methods in asynchronized (listen) mode.
+       // Trigger Collect() methods in asynchronized (listen) mode.
        // Usually called automatically by DATENotifier on "end of run" 
        // notification event.
        //
@@ -185,19 +207,26 @@ void AliShuttleTrigger::Run() {
        //
        // AliShuttleTrigger main loop for asynchronized (listen) mode.
        // It spawns DIM service listener and waits for DAQ "end of run"
-       // notification. Calls CollectNew() on notification.
+       // notification. Calls Collect() on notification.
        //
 
        fTerminate = kFALSE;
 
        DATENotifier* notifier = new DATENotifier(this, "/DATE/LOGBOOK/UPDATE");
 
+       Int_t nTry=0; 
+       Int_t nMaxTry = fConfig->GetMaxRetries()+1;
+       Int_t received=0;
+       
+       AliInfo("Listening for ECS trigger");
+       
        while (1) {
        
                fMutex.Lock();
 
                while (!(fNotified || fTerminate)) {
-                       fCondition.Wait();
+                       received=fCondition.TimedWaitRelative(1000*fConfig->GetTriggerWait());
+                       if (received==1) break; // 1 = timeout
                }
 
                fNotified = kFALSE;
@@ -208,247 +237,45 @@ void AliShuttleTrigger::Run() {
                        AliInfo("Terminated.");
                        break;          
                }
-       
-               CollectNew();
-       }
-
-       delete notifier;
-}
-
-//______________________________________________________________________________________________
-Bool_t AliShuttleTrigger::RetrieveDATEEntries(const char* whereClause,
-               TObjArray& entries)
-{
-// Retrieve start time and end time for all runs in the DAQ logbook
-// that aren't processed yet
-
-       TString sqlQuery;
-       sqlQuery += "select run, time_start, time_end from logbook ";
-       sqlQuery += whereClause;
-       sqlQuery += " order by run";
-
-       TSQLServer* aServer;
-       TString logbookHost="mysql://";
-       logbookHost+=fConfig->GetDAQLogBookHost();
-       
-       aServer = TSQLServer::Connect(logbookHost,
-                       fConfig->GetDAQLogBookUser(),
-                       fConfig->GetDAQLogBookPassword());
-       if (!aServer) {
-               AliError("Can't establish connection to DAQ log book DB!");
-               return kFALSE;
-       }
-       
-       aServer->GetTables("REFSYSLOG");
-
-       TSQLResult* aResult;
-       aResult = aServer->Query(sqlQuery);
-       if (!aResult) {
-               AliError(Form("Can't execute query <%s>!", sqlQuery.Data()));
-               delete aServer;
-               return kFALSE;
-       }
-
-       if (aResult->GetFieldCount() != 3) {
-               AliError("Invalid SQL result field number!");
-               delete aResult;
-               delete aServer;
-               return kFALSE;
-       }
-
-       TSQLRow* aRow;
-       while ((aRow = aResult->Next())) {
-               TString runString(aRow->GetField(0), aRow->GetFieldLength(0));
-               Int_t run = runString.Atoi();
-
-               TString startTimeString(aRow->GetField(1),
-                               aRow->GetFieldLength(1));
-               Int_t startTime = startTimeString.Atoi();
-               if (!startTime) {
-                       AliWarning(Form("Zero StartTime for run <%d>!", run));
-                       AliWarning("Going to skip this run!");
-                       continue;
-               }
-
-               TString endTimeString(aRow->GetField(2),
-                               aRow->GetFieldLength(2));
-               Int_t endTime = endTimeString.Atoi();
-               if (!endTime) {
-                       AliWarning(Form("Zero EndTime for run <%d>!", run));
-                       AliWarning("Going to skip this run!");
-                       continue;
+               
+               if (received == 0)
+               {
+                       AliInfo("Trigger from ECS received!");
+               } else if (received == 1) {
+                       AliInfo(Form("Timeout (%d s) waiting for trigger. "
+                               "Starting collection of new runs!", 
+                                       fConfig->GetTriggerWait()));
+               } else {
+                       AliInfo("Error receiving trigger from ECS!");
+                       break;
                }
-
-               if (startTime > endTime) {
-                       AliWarning(Form("StartTime bigger than EndTime for run <%d>", run));
-                       AliWarning("Going to skip this run!");
-                       continue;
+               
+               nTry++;
+               AliInfo(Form("Received %d triggers so far", nTry));
+               
+               if (fConfig->GetRunMode() == AliShuttleConfig::kTest)
+               {
+                       if(nTry>=nMaxTry)
+                       {
+                               AliInfo(Form("Collect() ran more than %d times -> Exiting!", 
+                                               nMaxTry));
+                               break;
+                       }
                }
-
-               entries.AddLast(new AliShuttleTriggerDATEEntry(run, startTime, endTime));
-               delete aRow;
-       }
-
-       delete aResult;
        
-       aServer->Close();
-       delete aServer;
-
-       entries.SetOwner(1);
-
-       return kTRUE;
-}
-
-//______________________________________________________________________________________________
-Bool_t AliShuttleTrigger::RetrieveConditionsData(const TObjArray& dateEntries, Int_t &lastRun)
-{
-// Retrieve conditions data for all runs that aren't processed yet
-
-       Bool_t hasError = kFALSE;
-
-       TIter iter(&dateEntries);
-       AliShuttleTriggerDATEEntry* anEntry;
-       lastRun=-1;
-       while ((anEntry = (AliShuttleTriggerDATEEntry*) iter.Next())) {
-               Bool_t processError = kFALSE;
-               if(lastRun == -1) lastRun = anEntry->GetRun();
-               if(!fShuttle->Process(anEntry->GetRun(),
-                               anEntry->GetStartTime(),
-                               anEntry->GetEndTime())) {
-                                       processError = kTRUE;
-                                       hasError = kTRUE;
-               }
-               if(!processError) lastRun = anEntry->GetRun();
+               Collect();
        }
 
-       return hasError == kFALSE;
+       delete notifier;
 }
 
 //______________________________________________________________________________________________
 Bool_t AliShuttleTrigger::Collect(Int_t run)
 {
        //
-       // Collects conditions date for the given run.
-       //
-
-       AliInfo(Form("Collecting conditions data for run <%d> ...", run));
-
-       TString whereClause("where run = ");
-       whereClause += run;
-
-       TObjArray dateEntries;
-       if (!RetrieveDATEEntries(whereClause, dateEntries)) {
-               AliError("Can't retrieve entries from DAQ log book.");
-               return kFALSE;
-        }
-
-       if (!dateEntries.GetEntriesFast()) {
-               AliError(Form("There isn't entry for run <%d> in DAQ log book!",
-                       run));
-               return kFALSE;
-       }
-
-       if (dateEntries.GetEntriesFast() > 1) {
-               AliError(Form("There is more than one entry for run <%d> in DAQ log book", run));
-               return kFALSE;
-       }
-
-       Int_t lastRun;
-       if (!RetrieveConditionsData(dateEntries, lastRun)) {
-               AliError("An error occured during conditions data retrieval!");
-               return kFALSE;
-       }
-
-       return kTRUE;
-}
-
-//______________________________________________________________________________________________
-Bool_t AliShuttleTrigger::CollectNew() 
-{
-       //
-       // Collects conditions data for all new run written to DAQ LogBook.
+       // this function creates a thread that runs the shuttle
+       // then it checks if the shuttle is still running by checking the monitoring functions of the shuttle
        //
 
-  // TODO revise this! last run number is ONLY allowed to be written when run was processed successfully!!!
-
-       AliInfo("Collecting conditions data for new runs ...");
-
-       Int_t lastRun;
-
-       AliCDBEntry* cdbEntry = AliCDBManager::Instance()->GetStorage(AliShuttle::GetLocalURI())
-                               ->Get("/SHUTTLE/SYSTEM/LASTRUN", 0);
-       if (cdbEntry) {
-               TObject* anObject = cdbEntry->GetObject();
-               if (anObject == NULL ||
-                       anObject->IsA() != AliDCSValue::Class()) {
-                       AliError("Invalid last run object stored to CDB!");
-                       return kFALSE;
-               }
-               AliDCSValue* simpleValue = (AliDCSValue*) anObject;
-               lastRun = simpleValue->GetInt();
-               AliInfo(Form("Last run successfully stored: %d",lastRun));
-               delete cdbEntry;
-       } else {
-               AliWarning("There isn't last run stored! Starting from run 21240");
-               lastRun = 21240; // TODO maybe exit here
-       }
-
-       AliInfo(Form("Last run number <%d>", lastRun));
-
-       TString whereClause("where run > ");
-       whereClause += lastRun;
-
-       Int_t newLastRun;
-       TObjArray dateEntries;
-       if (!RetrieveDATEEntries(whereClause, dateEntries)) {
-               AliError("Can't retrieve entries from DAQ log book.");
-               return kFALSE;
-       }
-
-       if (!RetrieveConditionsData(dateEntries, newLastRun)) {
-               AliError("Process of at least one run failed!");
-               // return kFALSE;
-       }
-       
-       if (newLastRun > lastRun) {
-               AliDCSValue lastRunObj(newLastRun, 0);
-               AliCDBMetaData metaData;
-               AliCDBId cdbID(AliCDBPath("SHUTTLE", "SYSTEM", "LASTRUN"), 0, 0);
-
-               UInt_t result = AliCDBManager::Instance()->GetStorage(AliShuttle::GetLocalURI())
-                               ->Put(&lastRunObj, cdbID, &metaData);
-
-               if (!result) {
-                       AliError("Can't store last run to CDB!");
-                       return kFALSE;
-               }
-       }
-
-       
-       return kTRUE;
-}
-
-//______________________________________________________________________________________________
-Bool_t AliShuttleTrigger::CollectAll() 
-{
-       //
-       // Collects conditions data for all run written in DAQ LogBook.
-       //
-
-       AliInfo("Collecting conditions data for all runs ...");
-
-       Int_t lastRun;
-       TObjArray dateEntries;
-       if (!RetrieveDATEEntries("", dateEntries)) {
-               AliError("Can't retrieve entries from DAQ log book.");
-               return kFALSE;
-       }
-
-       if (!RetrieveConditionsData(dateEntries, lastRun)) {
-               AliError("An error occured during conditions data retrieval!");
-               return kFALSE;
-       }
-
-       return kTRUE;
+  return fShuttle->Collect(run);
 }
-