df/d49/_avalanche_scheduler_svc_8cpp_source.html

 /***********************************************************************************\
 * (c) Copyright 1998-2019 CERN for the benefit of the LHCb and ATLAS collaborations *
 *                                                                                   *
 * This software is distributed under the terms of the Apache version 2 licence,     *
 * copied verbatim in the file "LICENSE".                                            *
 *                                                                                   *
 * In applying this licence, CERN does not waive the privileges and immunities       *
 * granted to it by virtue of its status as an Intergovernmental Organization        *
 * or submit itself to any jurisdiction.                                             *
 \***********************************************************************************/
 #include "AvalancheSchedulerSvc.h"

 #include "AlgoExecutionTask.h"
 #include "IOBoundAlgTask.h"

 // Framework includes
 #include "GaudiKernel/ConcurrencyFlags.h"
 #include "GaudiKernel/DataHandleHolderVisitor.h"
 #include "GaudiKernel/IAlgorithm.h"
 #include "GaudiKernel/IDataManagerSvc.h"
 #include "GaudiKernel/ThreadLocalContext.h"
 #include <Gaudi/Algorithm.h> // can be removed ASA dynamic casts to Algorithm are removed

 // C++
 #include <algorithm>
 #include <map>
 #include <queue>
 #include <sstream>
 #include <thread>
 #include <unordered_set>

 // External libs
 #include "boost/algorithm/string.hpp"
 #include "boost/thread.hpp"
 #include "boost/tokenizer.hpp"
 // DP waiting for the TBB service
 #include "tbb/tbb_stddef.h"
 #if TBB_INTERFACE_VERSION_MAJOR < 12
 #  include "tbb/task_scheduler_init.h"
 #endif // TBB_INTERFACE_VERSION_MAJOR < 12

 // Instantiation of a static factory class used by clients to create instances of this service
 DECLARE_COMPONENT( AvalancheSchedulerSvc )

 #define ON_DEBUG if ( msgLevel( MSG::DEBUG ) )
 #define ON_VERBOSE if ( msgLevel( MSG::VERBOSE ) )

 namespace {
   /// Strict weak ordering on DataObjID pointers, comparing the full keys of the pointees.
   struct DataObjIDSorter {
     // const-qualified so the comparator can also be invoked through a const object
     bool operator()( const DataObjID* a, const DataObjID* b ) const { return a->fullKey() < b->fullKey(); }
   };

   /// Sort a DataObjIDColl in a well-defined, reproducible manner.
   /// Used for making debugging dumps.
   ///
   /// @param coll collection whose elements are to be listed
   /// @return pointers to the elements of @p coll, ordered by full key. The
   ///         pointers refer to the elements stored in @p coll itself, so they
   ///         must not be used after @p coll is modified or destroyed.
   std::vector<const DataObjID*> sortedDataObjIDColl( const DataObjIDColl& coll ) {
     std::vector<const DataObjID*> v;
     v.reserve( coll.size() );
     for ( const DataObjID& id : coll ) v.push_back( &id );
     std::sort( v.begin(), v.end(), DataObjIDSorter() );
     return v;
   }

   /// Tell whether any sub-slot of @p slot has at least one algorithm in one of @p testStates.
   ///
   /// @param slot       event slot whose sub-slots are inspected
   /// @param testStates states to look for
   /// @return true if at least one sub-slot reports containsAny( testStates ); false otherwise
   ///         (in particular when there are no sub-slots)
   bool subSlotAlgsInStates( const EventSlot& slot, std::initializer_list<AlgsExecutionStates::State> testStates ) {
     return std::any_of( slot.allSubSlots.begin(), slot.allSubSlots.end(),
                         [testStates]( const EventSlot& ss ) { return ss.algsStates.containsAny( testStates ); } );
   }
 } // namespace

 //---------------------------------------------------------------------------

 /// Initialise the scheduler.
 ///
 /// Steps, in order:
 ///  - initialise the base Service and retrieve the ThreadPoolSvc;
 ///  - start the scheduler thread (running activate()) and wait until it reports ACTIVE;
 ///  - retrieve CondSvc (optional), AlgResourcePool, AlgExecStateSvc, the whiteboard and,
 ///    if requested, the scheduler for I/O-bound algorithms;
 ///  - collect the data dependencies of all algorithms, resolve ':'-separated input
 ///    alternatives against the global output list and, if m_checkDeps is set, check for
 ///    unmet inputs (optionally attributing them to the DataLoader algorithm);
 ///  - retrieve the PrecedenceSvc, fill the name<->index lookup containers and create
 ///    one event slot per whiteboard store;
 ///  - optionally dump the control/data flow and simulate the execution flow.
 ///
 /// @return StatusCode::FAILURE as soon as a mandatory service or algorithm cannot be
 ///         obtained, or when unmet input dependencies cannot be healed; otherwise the
 ///         status of the base class initialisation (or of the simulation, if it was run).
 StatusCode AvalancheSchedulerSvc::initialize() {

   // Initialise mother class (read properties, ...)
   StatusCode sc( Service::initialize() );
   if ( sc.isFailure() ) warning() << "Base class could not be initialized" << endmsg;

   // Get hold of the ThreadPoolSvc. This should initialize the thread pool
   m_threadPoolSvc = serviceLocator()->service( "ThreadPoolSvc" );
   if ( !m_threadPoolSvc.isValid() ) {
     fatal() << "Error retrieving ThreadPoolSvc" << endmsg;
     return StatusCode::FAILURE;
   }

   // Activate the scheduler in another thread.
   info() << "Activating scheduler in a separate thread" << endmsg;
   m_thread = std::thread( [this]() { this->activate(); } );

   // Poll until the scheduler thread has either become active or reported a failure
   while ( m_isActive != ACTIVE ) {
     if ( m_isActive == FAILURE ) {
       fatal() << "Terminating initialization" << endmsg;
       return StatusCode::FAILURE;
     } else {
       ON_DEBUG debug() << "Waiting for AvalancheSchedulerSvc to activate" << endmsg;
       sleep( 1 );
     }
   }

   if ( m_enableCondSvc ) {
     // Get hold of the CondSvc
     m_condSvc = serviceLocator()->service( "CondSvc" );
     if ( !m_condSvc.isValid() ) {
       warning() << "No CondSvc found, or not enabled. "
                 << "Will not manage CondAlgorithms" << endmsg;
       m_enableCondSvc = false;
     }
   }

   // Get the algo resource pool
   m_algResourcePool = serviceLocator()->service( "AlgResourcePool" );
   if ( !m_algResourcePool.isValid() ) {
     fatal() << "Error retrieving AlgoResourcePool" << endmsg;
     return StatusCode::FAILURE;
   }

   m_algExecStateSvc = serviceLocator()->service( "AlgExecStateSvc" );
   if ( !m_algExecStateSvc.isValid() ) {
     fatal() << "Error retrieving AlgExecStateSvc" << endmsg;
     return StatusCode::FAILURE;
   }

   // Get Whiteboard
   m_whiteboard = serviceLocator()->service( m_whiteboardSvcName );
   if ( !m_whiteboard.isValid() ) {
     fatal() << "Error retrieving EventDataSvc interface IHiveWhiteBoard." << endmsg;
     return StatusCode::FAILURE;
   }

   // Get dedicated scheduler for I/O-bound algorithms
   if ( m_useIOBoundAlgScheduler ) {
     m_IOBoundAlgScheduler = serviceLocator()->service( m_IOBoundAlgSchedulerSvcName );
     if ( !m_IOBoundAlgScheduler.isValid() ) {
       fatal() << "Error retrieving IOBoundSchedulerAlgSvc interface IAccelerator." << endmsg;
       // Do not carry on with an invalid handle: the scheduler was explicitly requested
       return StatusCode::FAILURE;
     }
   }

   // Set the MaxEventsInFlight parameters from the number of WB stores
   m_maxEventsInFlight = m_whiteboard->getNumberOfStores();

   // Set the number of free slots
   m_freeSlots = m_maxEventsInFlight;

   // Get the list of algorithms
   const std::list<IAlgorithm*>& algos      = m_algResourcePool->getFlatAlgList();
   const unsigned int            algsNumber = algos.size();
   if ( algsNumber != 0 ) {
     info() << "Found " << algsNumber << " algorithms" << endmsg;
   } else {
     error() << "No algorithms found" << endmsg;
     return StatusCode::FAILURE;
   }

   /* Dependencies
    1) Look for handles in algo, if none
    2) Assume none are required
   */

   DataObjIDColl globalInp, globalOutp;

   // figure out all outputs
   for ( IAlgorithm* ialgoPtr : algos ) {
     Gaudi::Algorithm* algoPtr = dynamic_cast<Gaudi::Algorithm*>( ialgoPtr );
     if ( !algoPtr ) {
       fatal() << "Could not convert IAlgorithm into Gaudi::Algorithm: this will result in a crash." << endmsg;
       return StatusCode::FAILURE;
     }
     for ( const auto& id : algoPtr->outputDataObjs() ) globalOutp.insert( id );
   }

   // Human-readable dependency report, printed only if m_showDataDeps ends up being set
   std::ostringstream ostdd;
   ostdd << "Data Dependencies for Algorithms:";

   std::map<std::string, DataObjIDColl> algosDependenciesMap;
   for ( IAlgorithm* ialgoPtr : algos ) {
     Gaudi::Algorithm* algoPtr = dynamic_cast<Gaudi::Algorithm*>( ialgoPtr );
     if ( nullptr == algoPtr ) {
       fatal() << "Could not convert IAlgorithm into Gaudi::Algorithm for " << ialgoPtr->name()
               << ": this will result in a crash." << endmsg;
       return StatusCode::FAILURE;
     }

     ostdd << "\n  " << algoPtr->name();

     DataObjIDColl algoDependencies;
     if ( !algoPtr->inputDataObjs().empty() || !algoPtr->outputDataObjs().empty() ) {
       for ( const DataObjID* idp : sortedDataObjIDColl( algoPtr->inputDataObjs() ) ) {
         // Work on a copy: the key may be rewritten when alternatives are resolved
         DataObjID id = *idp;
         ostdd << "\n    o INPUT  " << id;
         if ( id.key().find( ":" ) != std::string::npos ) {
           ostdd << " contains alternatives which require resolution...\n";
           // Pick the first ':'-separated alternative that some algorithm produces
           auto tokens = boost::tokenizer<boost::char_separator<char>>{id.key(), boost::char_separator<char>{":"}};
           auto itok   = std::find_if( tokens.begin(), tokens.end(), [&]( const std::string& t ) {
             return globalOutp.find( DataObjID{t} ) != globalOutp.end();
           } );
           if ( itok != tokens.end() ) {
             ostdd << "found matching output for " << *itok << " -- updating scheduler info\n";
             id.updateKey( *itok );
           } else {
             error() << "failed to find alternate in global output list"
                     << " for id: " << id << " in Alg " << algoPtr->name() << endmsg;
             m_showDataDeps = true;
           }
         }
         algoDependencies.insert( id );
         globalInp.insert( id );
       }
       for ( const DataObjID* id : sortedDataObjIDColl( algoPtr->outputDataObjs() ) ) {
         ostdd << "\n    o OUTPUT " << *id;
         if ( id->key().find( ":" ) != std::string::npos ) {
           error() << " in Alg " << algoPtr->name() << " alternatives are NOT allowed for outputs! id: " << *id
                   << endmsg;
           m_showDataDeps = true;
         }
       }
     } else {
       ostdd << "\n      none";
     }
     algosDependenciesMap[algoPtr->name()] = algoDependencies;
   }

   if ( m_showDataDeps ) { info() << ostdd.str() << endmsg; }

   // Check if we have unmet global input dependencies, and, optionally, heal them
   // WARNING: this step must be done BEFORE the Precedence Service is initialized
   if ( m_checkDeps ) {
     DataObjIDColl unmetDep;
     for ( const auto& o : globalInp )
       if ( globalOutp.find( o ) == globalOutp.end() ) unmetDep.insert( o );

     if ( !unmetDep.empty() ) {

       // List every unmet input together with the algorithms that require it
       std::ostringstream ost;
       for ( const DataObjID* o : sortedDataObjIDColl( unmetDep ) ) {
         ost << "\n   o " << *o << "    required by Algorithm: ";

         for ( const auto& p : algosDependenciesMap )
           if ( p.second.find( *o ) != p.second.end() ) ost << "\n       * " << p.first;
       }

       if ( !m_useDataLoader.empty() ) {

         // Find the DataLoader Alg
         IAlgorithm* dataLoaderAlg( nullptr );
         for ( IAlgorithm* algo : algos )
           if ( algo->name() == m_useDataLoader ) {
             dataLoaderAlg = algo;
             break;
           }

         if ( dataLoaderAlg == nullptr ) {
           fatal() << "No DataLoader Algorithm \"" << m_useDataLoader.value()
                   << "\" found, and unmet INPUT dependencies "
                   << "detected:\n"
                   << ost.str() << endmsg;
           return StatusCode::FAILURE;
         }

         info() << "Will attribute the following unmet INPUT dependencies to \"" << dataLoaderAlg->type() << "/"
                << dataLoaderAlg->name() << "\" Algorithm" << ost.str() << endmsg;

         // Set the property Load of DataLoader Alg
         Gaudi::Algorithm* dataAlg = dynamic_cast<Gaudi::Algorithm*>( dataLoaderAlg );
         if ( !dataAlg ) {
           fatal() << "Unable to dcast DataLoader \"" << m_useDataLoader.value() << "\" IAlg to Gaudi::Algorithm"
                   << endmsg;
           return StatusCode::FAILURE;
         }

         for ( auto& id : unmetDep ) {
           ON_DEBUG debug() << "adding OUTPUT dep \"" << id << "\" to " << dataLoaderAlg->type() << "/"
                            << dataLoaderAlg->name() << endmsg;
           dataAlg->addDependency( id, Gaudi::DataHandle::Writer );
         }

       } else {
         fatal() << "Auto DataLoading not requested, "
                 << "and the following unmet INPUT dependencies were found:" << ost.str() << endmsg;
         return StatusCode::FAILURE;
       }

     } else {
       info() << "No unmet INPUT data dependencies were found" << endmsg;
     }
   }

   // Get the precedence service
   m_precSvc = serviceLocator()->service( "PrecedenceSvc" );
   if ( !m_precSvc.isValid() ) {
     fatal() << "Error retrieving PrecedenceSvc" << endmsg;
     return StatusCode::FAILURE;
   }
   const PrecedenceSvc* precSvc = dynamic_cast<const PrecedenceSvc*>( m_precSvc.get() );
   if ( !precSvc ) {
     fatal() << "Unable to dcast PrecedenceSvc" << endmsg;
     return StatusCode::FAILURE;
   }

   // Fill the containers to convert algo names to index
   m_algname_vect.resize( algsNumber );
   for ( IAlgorithm* algo : algos ) {
     const std::string& name    = algo->name();
     auto               index   = precSvc->getRules()->getAlgorithmNode( name )->getAlgoIndex();
     m_algname_index_map[name]  = index;
     m_algname_vect.at( index ) = name;
   }

   // Shortcut for the message service
   SmartIF<IMessageSvc> messageSvc( serviceLocator() );
   if ( !messageSvc.isValid() ) error() << "Error retrieving MessageSvc interface IMessageSvc." << endmsg;

   // One event slot per whiteboard store; a fresh slot is flagged complete so it can accept an event
   m_eventSlots.reserve( m_maxEventsInFlight );
   for ( size_t i = 0; i < m_maxEventsInFlight; ++i ) {
     m_eventSlots.emplace_back( algsNumber, precSvc->getRules()->getControlFlowNodeCounter(), messageSvc );
     m_eventSlots.back().complete = true;
   }

   if ( m_threadPoolSize > 1 ) { m_maxAlgosInFlight = static_cast<size_t>( m_threadPoolSize ); }

   // Clearly inform about the level of concurrency
   info() << "Concurrency level information:" << endmsg;
   info() << " o Number of events in flight: " << m_maxEventsInFlight << endmsg;
   info() << " o TBB thread pool size: " << m_threadPoolSize << endmsg;

   if ( m_showControlFlow ) m_precSvc->dumpControlFlow();

   if ( m_showDataFlow ) m_precSvc->dumpDataFlow();

   // Simulate execution flow
   if ( m_simulateExecution ) sc = m_precSvc->simulate( m_eventSlots[0] );

   return sc;
 }
 //---------------------------------------------------------------------------

 /// Finalise the scheduler: finalise the base Service, ask the scheduler loop to
 /// stop (deactivate()) and wait for the scheduler thread to terminate.
 ///
 /// @return StatusCode::FAILURE if the scheduler thread ended in the FAILURE state,
 ///         otherwise the status returned by deactivate().
 StatusCode AvalancheSchedulerSvc::finalize() {

   StatusCode sc( Service::finalize() );
   if ( sc.isFailure() ) warning() << "Base class could not be finalized" << endmsg;

   sc = deactivate();
   if ( sc.isFailure() ) warning() << "Scheduler could not be deactivated" << endmsg;

   // std::thread::join() throws std::system_error on a thread that is not joinable
   // (e.g. the scheduler thread was never started), so only join when there is one.
   if ( m_thread.joinable() ) {
     info() << "Joining Scheduler thread" << endmsg;
     m_thread.join();
   }

   // Final error check after thread pool termination
   if ( m_isActive == FAILURE ) {
     error() << "problems in scheduler thread" << endmsg;
     return StatusCode::FAILURE;
   }

   return sc;
 }
 //---------------------------------------------------------------------------

 void AvalancheSchedulerSvc::activate() {

   ON_DEBUG debug() << "AvalancheSchedulerSvc::activate()" << endmsg;

   if ( m_threadPoolSvc->initPool( m_threadPoolSize ).isFailure() ) {
     error() << "problems initializing ThreadPoolSvc" << endmsg;
     m_isActive = FAILURE;
     return;
   }

   // Wait for actions pushed into the queue by finishing tasks.
   action     thisAction;
   StatusCode sc( StatusCode::SUCCESS );

   m_isActive = ACTIVE;

   // Continue to wait if the scheduler is running or there is something to do
   ON_DEBUG debug() << "Start checking the actionsQueue" << endmsg;
   while ( m_isActive == ACTIVE || m_actionsQueue.size() != 0 ) {
     m_actionsQueue.pop( thisAction );
     sc = thisAction();
     ON_VERBOSE {
       if ( sc.isFailure() )
         verbose() << "Action did not succeed (which is not bad per se)." << endmsg;
       else
         verbose() << "Action succeeded." << endmsg;
     }
     else sc.ignore();

     // If all queued actions have been processed, update the slot states
     if ( m_needsUpdate.load() && m_actionsQueue.empty() ) {
       sc = updateStates();
       ON_VERBOSE {
         if ( sc.isFailure() )
           verbose() << "updateStates did not succeed (which is not bad per se)." << endmsg;
         else
           verbose() << "updateStates succeeded." << endmsg;
       }
       else sc.ignore();
     }
   }

   ON_DEBUG debug() << "Terminating thread-pool resources" << endmsg;
   if ( m_threadPoolSvc->terminatePool().isFailure() ) {
     error() << "Problems terminating thread pool" << endmsg;
     m_isActive = FAILURE;
   }
 }

 //---------------------------------------------------------------------------

 /// Request the scheduler loop to stop. If the scheduler is ACTIVE, the pending
 /// actions are discarded and a final action setting m_isActive to INACTIVE is queued.
 ///
 /// @return always StatusCode::SUCCESS
 StatusCode AvalancheSchedulerSvc::deactivate() {

   // Nothing to do unless the scheduler is currently active
   if ( m_isActive != ACTIVE ) return StatusCode::SUCCESS;

   // Advertise that no slot is available any more
   m_freeSlots.store( 0 );

   // Throw away whatever is still waiting in the queue
   action discarded;
   while ( m_actionsQueue.try_pop( discarded ) ) {}

   // The very last action switches the scheduler off
   m_actionsQueue.push( [this]() -> StatusCode {
     ON_VERBOSE verbose() << "Deactivating scheduler" << endmsg;
     m_isActive = INACTIVE;
     return StatusCode::SUCCESS;
   } );

   return StatusCode::SUCCESS;
 }

 //---------------------------------------------------------------------------

 // EventSlot management
 /// Hand a new event over to the scheduler.
 ///
 /// A free slot is reserved and an action is queued for the scheduler thread which
 /// resets the event slot matching the context's slot number, runs the first
 /// precedence iteration and updates the states.
 ///
 /// @param eventContext context of the event to process (must not be null)
 /// @return StatusCode::FAILURE if the context is null or no slot is free,
 ///         StatusCode::SUCCESS once the action has been queued
 StatusCode AvalancheSchedulerSvc::pushNewEvent( EventContext* eventContext ) {

   if ( eventContext == nullptr ) {
     fatal() << "Event context is nullptr" << endmsg;
     return StatusCode::FAILURE;
   }

   if ( m_freeSlots.load() == 0 ) {
     ON_DEBUG debug() << "A free processing slot could not be found." << endmsg;
     return StatusCode::FAILURE;
   }

   // Check-then-decrement is fine: only the event loop manager thread calls this method
   --m_freeSlots;

   // Work to be carried out later by the scheduler thread
   auto startEvent = [this, eventContext]() -> StatusCode {
     // The processing slot is forced to be the whiteboard slot
     const unsigned int slotNumber = eventContext->slot();
     EventSlot&         slot       = m_eventSlots[slotNumber];
     if ( !slot.complete ) {
       fatal() << "The slot " << slotNumber << " is supposed to be a finished event but it's not" << endmsg;
       return StatusCode::FAILURE;
     }

     ON_DEBUG debug() << "Executing event " << eventContext->evt() << " on slot " << slotNumber << endmsg;
     slot.reset( eventContext );

     // Promote the initial set of algorithms to CR and DR
     Cause      rootCause     = {Cause::source::Root, "RootDecisionHub"};
     const bool iterateFailed = m_precSvc->iterate( slot, rootCause ).isFailure();
     if ( iterateFailed )
       error() << "Failed to call IPrecedenceSvc::iterate for slot " << slotNumber << endmsg;

     // The states are updated even if the iteration failed
     const bool updateFailed = this->updateStates().isFailure();
     if ( updateFailed )
       error() << "Failed to call AvalancheSchedulerSvc::updateStates for slot " << slotNumber << endmsg;

     if ( iterateFailed || updateFailed ) return StatusCode::FAILURE;
     return StatusCode::SUCCESS;
   };

   // Kick off the scheduling!
   ON_VERBOSE {
     verbose() << "Pushing the action to update the scheduler for slot " << eventContext->slot() << endmsg;
     verbose() << "Free slots available " << m_freeSlots.load() << endmsg;
   }

   m_actionsQueue.push( startEvent );

   return StatusCode::SUCCESS;
 }

 //---------------------------------------------------------------------------

 /// Push several events, in order, stopping at the first one that cannot be accepted.
 ///
 /// @param eventContexts contexts of the events to push
 /// @return the status of the last pushNewEvent() call performed, or a
 ///         default-constructed StatusCode if @p eventContexts is empty
 StatusCode AvalancheSchedulerSvc::pushNewEvents( std::vector<EventContext*>& eventContexts ) {
   StatusCode lastStatus;
   for ( EventContext* ctx : eventContexts ) {
     lastStatus = pushNewEvent( ctx );
     if ( lastStatus != StatusCode::SUCCESS ) break;
   }
   return lastStatus;
 }

 //---------------------------------------------------------------------------

 /// @return the current number of free slots, with negative counter values reported as 0
 unsigned int AvalancheSchedulerSvc::freeSlots() {
   const int available = m_freeSlots.load();
   return available < 0 ? 0 : available;
 }

 //---------------------------------------------------------------------------
 /// Pop a finished event from m_finishedEvents and give its slot back.
 ///
 /// @param[out] eventContext receives the context of the finished event
 /// @return StatusCode::FAILURE (leaving @p eventContext untouched) if all slots
 ///         are free or the scheduler is INACTIVE, StatusCode::SUCCESS otherwise
 StatusCode AvalancheSchedulerSvc::popFinishedEvent( EventContext*& eventContext ) {

   // No event is in flight when every slot is free
   const bool allSlotsFree = ( m_freeSlots.load() == static_cast<int>( m_maxEventsInFlight ) );
   if ( allSlotsFree || m_isActive == INACTIVE ) return StatusCode::FAILURE;

   m_finishedEvents.pop( eventContext );
   ++m_freeSlots;
   ON_DEBUG debug() << "Popped slot " << eventContext->slot() << " (event " << eventContext->evt() << ")" << endmsg;
   return StatusCode::SUCCESS;
 }

 //---------------------------------------------------------------------------
 /// Variant of popFinishedEvent() based on try_pop of the finished-events queue.
 ///
 /// @param[out] eventContext receives the context of the finished event, if any
 /// @return StatusCode::SUCCESS if an event was popped (its slot is then counted
 ///         as free again), StatusCode::FAILURE if try_pop did not deliver one
 StatusCode AvalancheSchedulerSvc::tryPopFinishedEvent( EventContext*& eventContext ) {

   if ( !m_finishedEvents.try_pop( eventContext ) ) return StatusCode::FAILURE;

   ON_DEBUG debug() << "Try Pop successful slot " << eventContext->slot() << "(event " << eventContext->evt() << ")"
                    << endmsg;
   ++m_freeSlots;
   return StatusCode::SUCCESS;
 }

 //--------------------------------------------------------------------------
 // States Management

 /// Drive the per-slot algorithm state machine.
 ///
 /// First re-enqueues the algorithms waiting in m_retryQueue, then, for every
 /// event slot holding a context:
 ///  - enqueues (or hands to promoteToAsyncScheduled) all DATAREADY algorithms
 ///    of the slot and of its sub-slots;
 ///  - optionally appends a line to the intra-event occupancy CSV file;
 ///  - marks the slot complete when the control flow is resolved and nothing is
 ///    CONTROLREADY/DATAREADY/SCHEDULED/RESOURCELESS any more, or flags the event
 ///    as failed when isStalled() reports a stall.
 /// Finally clears m_needsUpdate.
 ///
 /// @return the status of the last retry enqueue() performed, or
 ///         StatusCode::SUCCESS if the retry queue was empty. The results of the
 ///         per-slot transitions are not propagated.
 StatusCode AvalancheSchedulerSvc::updateStates() {

   StatusCode global_sc( StatusCode::SUCCESS );

   // Retry algs
   // Only the entries present on entry are processed: the queue size is sampled once
   AlgQueueEntry queuePop;
   const size_t  retries = m_retryQueue.size();
   for ( unsigned int retryIndex = 0; retryIndex < retries; ++retryIndex ) {

     queuePop = m_retryQueue.front();
     m_retryQueue.pop();

     // NOTE: each iteration overwrites global_sc, so only the last result is kept
     global_sc = enqueue( queuePop.algIndex, queuePop.slotIndex, queuePop.contextPtr );
   }

   // Loop over all slots
   for ( EventSlot& thisSlot : m_eventSlots ) {

     // Ignore slots without a valid context (relevant when populating scheduler for first time)
     if ( !thisSlot.eventContext ) continue;

     int iSlot = thisSlot.eventContext->slot();

     // Cache the states of the algos to improve readability and performance
     AlgsExecutionStates& thisAlgsStates = thisSlot.algsStates;

     // Result of the latest transition attempted for this slot; it is only used for
     // the verbose message below and explicitly ignored at the end of the iteration.
     // NOTE(review): the second constructor argument presumably marks the code as
     // already checked - confirm against the StatusCode declaration.
     StatusCode partial_sc( StatusCode::FAILURE, true );

     // Perform DR->SCHEDULED
     for ( auto it = thisAlgsStates.begin( AState::DATAREADY ); it != thisAlgsStates.end( AState::DATAREADY ); ++it ) {
       uint algIndex = *it;

       // Algorithms reported as blocking go to the dedicated scheduler, if it is in use
       bool IOBound = false;
       if ( m_useIOBoundAlgScheduler ) IOBound = m_precSvc->isBlocking( index2algname( algIndex ) );

       if ( !IOBound )
         partial_sc = enqueue( algIndex, iSlot, thisSlot.eventContext.get() );
       else
         partial_sc = promoteToAsyncScheduled( algIndex, iSlot, thisSlot.eventContext.get() );

       ON_VERBOSE if ( partial_sc.isFailure() ) verbose()
           << "Could not apply transition from " << AState::DATAREADY << " for algorithm " << index2algname( algIndex )
           << " on processing slot " << iSlot << endmsg;
     }

     // Check for algorithms ready in sub-slots
     // They are enqueued with the parent slot index but with the sub-slot's own context
     for ( auto& subslot : thisSlot.allSubSlots ) {
       auto& subslotStates = subslot.algsStates;
       for ( auto it = subslotStates.begin( AState::DATAREADY ); it != subslotStates.end( AState::DATAREADY ); ++it ) {
         uint algIndex{*it};
         partial_sc = enqueue( algIndex, iSlot, subslot.eventContext.get() );
         // The following verbosity is expensive when the number of sub-slots is high
         /*ON_VERBOSE if ( partial_sc.isFailure() ) verbose()
             << "Could not apply transition from " << AState::DATAREADY << " for algorithm " << index2algname( algIndex )
             << " on processing subslot " << subslot.eventContext->slot() << endmsg;*/
       }
     }

     // Optional monitoring: append "START, <#CONTROLREADY>, <#DATAREADY>, <#SCHEDULED>, <clock count>"
     // to IntraEventFSMOccupancy_<threads>T.csv
     if ( m_dumpIntraEventDynamics ) {
       std::stringstream s;
       s << "START, " << thisAlgsStates.sizeOfSubset( AState::CONTROLREADY ) << ", "
         << thisAlgsStates.sizeOfSubset( AState::DATAREADY ) << ", " << thisAlgsStates.sizeOfSubset( AState::SCHEDULED )
         << ", " << std::chrono::high_resolution_clock::now().time_since_epoch().count() << "\n";
       // A pool size of -1 is replaced by a default thread count, whose source depends on the TBB version
       auto threads = ( m_threadPoolSize != -1 ) ? std::to_string( m_threadPoolSize )
 #if TBB_INTERFACE_VERSION_MAJOR < 12
                                                 : std::to_string( tbb::task_scheduler_init::default_num_threads() );
 #else
                                                 : std::to_string( std::thread::hardware_concurrency() );
 #endif // TBB_INTERFACE_VERSION_MAJOR < 12
       std::ofstream myfile;
       myfile.open( "IntraEventFSMOccupancy_" + threads + "T.csv", std::ios::app );
       myfile << s.str();
       myfile.close();
     }

     // Not complete because this would mean that the slot is already free!
     // The event is done when the control flow is resolved and no algorithm, in the
     // slot or in any of its sub-slots, is still waiting or running.
     if ( m_precSvc->CFRulesResolved( thisSlot ) &&
          !thisSlot.algsStates.containsAny(
              {AState::CONTROLREADY, AState::DATAREADY, AState::SCHEDULED, AState::RESOURCELESS} ) &&
          !subSlotAlgsInStates( thisSlot,
                                {AState::CONTROLREADY, AState::DATAREADY, AState::SCHEDULED, AState::RESOURCELESS} ) &&
          !thisSlot.complete ) {

       thisSlot.complete = true;
       // if the event did not fail, add it to the finished events
       // otherwise it is taken care of in the error handling
       if ( m_algExecStateSvc->eventStatus( *thisSlot.eventContext ) == EventStatus::Success ) {
         ON_DEBUG debug() << "Event " << thisSlot.eventContext->evt() << " finished (slot "
                          << thisSlot.eventContext->slot() << ")." << endmsg;
         // release(): the context is handed over to the finished-events queue
         m_finishedEvents.push( thisSlot.eventContext.release() );
       }

       // now let's return the fully evaluated result of the control flow
       ON_DEBUG debug() << m_precSvc->printState( thisSlot ) << endmsg;

       // Leave the slot without a context so that it is skipped until it is reused
       thisSlot.eventContext.reset( nullptr );

     } else if ( isStalled( thisSlot ) ) {
       // Nothing is ready, scheduled or waiting for resources: flag the event and fail it
       m_algExecStateSvc->setEventStatus( EventStatus::AlgStall, *thisSlot.eventContext );
       eventFailed( thisSlot.eventContext.get() ); // can't release yet
     }
     partial_sc.ignore();
   } // end loop on slots

   ON_VERBOSE verbose() << "States Updated." << endmsg;
   m_needsUpdate.store( false );
   return global_sc;
 }

 //---------------------------------------------------------------------------
 // Update states in the appropriate event slot
 /// Set the state of an algorithm in the event slot (or sub-slot) designated by
 /// the context and, on request, trigger a precedence iteration on that slot.
 ///
 /// @param iAlgo      index of the algorithm
 /// @param contextPtr context selecting the slot and, if it uses one, the sub-slot
 /// @param state      state to set
 /// @param iterate    if true and the state was set successfully, call
 ///                   IPrecedenceSvc::iterate on the affected (sub-)slot
 /// @return the status of the state change or, if performed, of the iteration
 StatusCode AvalancheSchedulerSvc::setAlgState( unsigned int iAlgo, EventContext* contextPtr, AState state,
                                                bool iterate ) {
   EventSlot& eventSlot = m_eventSlots[contextPtr->slot()];
   Cause      taskCause = {Cause::source::Task, index2algname( iAlgo )};

   // Pick the sub-slot when the context uses one, the event-level slot otherwise
   EventSlot& target = contextPtr->usesSubSlot() ? eventSlot.allSubSlots[contextPtr->subSlot()] : eventSlot;

   StatusCode updateSc = target.algsStates.set( iAlgo, state );
   if ( iterate && updateSc.isSuccess() ) updateSc = m_precSvc->iterate( target, taskCause );
   return updateSc;
 }

 //---------------------------------------------------------------------------

 /// Tell whether a slot is stalled, i.e. neither the slot nor any of its sub-slots
 /// has an algorithm in the DATAREADY, SCHEDULED or RESOURCELESS state.
 /// An error message is printed when a stall is detected.
 ///
 /// @param slot event slot to inspect
 /// @return true if the slot is stalled
 bool AvalancheSchedulerSvc::isStalled( const EventSlot& slot ) const {

   // Something can still make progress at event level
   if ( slot.algsStates.containsAny( {AState::DATAREADY, AState::SCHEDULED, AState::RESOURCELESS} ) ) return false;

   // Something can still make progress in a sub-slot
   if ( subSlotAlgsInStates( slot, {AState::DATAREADY, AState::SCHEDULED, AState::RESOURCELESS} ) ) return false;

   error() << "*** Stall detected in slot " << slot.eventContext->slot() << "! ***" << endmsg;
   return true;
 }

 //---------------------------------------------------------------------------

 /// Handle a failed event: report it, dump the scheduler state and the precedence
 /// rules, mark the slot as complete and hand the slot's context over to the
 /// finished-events queue.
 ///
 /// @param eventContext context of the failed event; only used to find the slot
 ///                     and for the printout
 void AvalancheSchedulerSvc::eventFailed( EventContext* eventContext ) {
   const uint slotIdx    = eventContext->slot();
   EventSlot& failedSlot = m_eventSlots[slotIdx];

   error() << "Event " << eventContext->evt() << " on slot " << slotIdx << " failed" << endmsg;

   // In VERBOSE mode all slots are dumped (-1), otherwise only the failing one
   dumpSchedulerState( msgLevel( MSG::VERBOSE ) ? -1 : slotIdx );

   // dump temporal and topological precedence analysis (if enabled in the PrecedenceSvc)
   m_precSvc->dumpPrecedenceRules( failedSlot );

   // The failed context ends up in the finished-events queue too
   failedSlot.complete = true;
   m_finishedEvents.push( failedSlot.eventContext.release() );
 }

 //---------------------------------------------------------------------------

 /// Print, as a single INFO message, a snapshot of the scheduler:
 ///  - the SCHEDULED algorithms of all slots with event/slot and, when the
 ///    TimelineSvc is available and enabled, the thread they were mapped to;
 ///  - the control-flow/FSM state of the incomplete slots;
 ///  - the algorithm execution states of the target slot.
 ///
 /// @param iSlot index of the slot to detail; a negative value means "all slots"
 ///              (in that case the algorithm execution states are not dumped)
 void AvalancheSchedulerSvc::dumpSchedulerState( int iSlot ) {

   // Collect everything first, so that the dump is emitted as one big message
   std::ostringstream dump;

   dump << "Dumping scheduler state\n"
        << "=========================================================================================\n"
        << "++++++++++++++++++++++++++++++++++++ SCHEDULER STATE ++++++++++++++++++++++++++++++++++++\n"
        << "=========================================================================================\n\n";

   //===========================================================================

   dump << "------------------ Last schedule: Task/Event/Slot/Thread/State Mapping "
        << "------------------\n\n";

   // The TimelineSvc, if available, is used below to find out the thread IDs
   auto       timelineSvc    = serviceLocator()->service<ITimelineSvc>( "TimelineSvc", false );
   const bool timelineUsable = timelineSvc.isValid() && timelineSvc->isEnabled();
   if ( !timelineUsable ) {
     dump << "WARNING Enable TimelineSvc in record mode (RecordTimeline = True) to trace the mapping\n";
   } else {

     // Width of the task column: the longest name among the scheduled algorithms
     size_t nameWidth( 0 );
     for ( auto& slot : m_eventSlots )
       for ( auto it = slot.algsStates.begin( AState::SCHEDULED ); it != slot.algsStates.end( AState::SCHEDULED ); ++it )
         nameWidth = std::max( nameWidth, index2algname( *it ).length() );

     // One line per scheduled algorithm, across all slots
     for ( auto& slot : m_eventSlots ) {
       for ( auto it = slot.algsStates.begin( AState::SCHEDULED ); it != slot.algsStates.end( AState::SCHEDULED );
             ++it ) {

         const std::string taskName{index2algname( *it )};

         dump << "  task: " << std::setw( nameWidth ) << taskName << " evt/slot: " << slot.eventContext->evt() << "/"
              << slot.eventContext->slot();

         // Try to get the POSIX thread ID the task has been scheduled to
         if ( timelineSvc.isValid() ) {
           TimelineEvent record{};
           record.algorithm = taskName;
           record.slot      = slot.eventContext->slot();
           record.event     = slot.eventContext->evt();

           if ( timelineSvc->getTimelineEvent( record ) ) {
             dump << " thread.id: 0x" << std::hex << record.thread << std::dec;
           } else {
             // the task has just been signed off as SCHEDULED, but it has not been
             // assigned to a thread yet (i.e., it is not running yet)
             dump << " thread.id: [unknown]";
           }
         }
         dump << " state: [" << m_algExecStateSvc->algExecState( taskName, *( slot.eventContext ) ) << "]\n";
       }
     }
   }

   //===========================================================================

   dump << "\n---------------------------- Task/CF/FSM Mapping "
        << ( iSlot < 0 ? "[all slots] --" : "[target slot] " ) << "--------------------------\n\n";

   const int nSlots = static_cast<int>( m_eventSlots.size() );
   for ( int slotIndex = 0; slotIndex < nSlots; ++slotIndex ) {
     auto& slot = m_eventSlots[slotIndex];
     if ( slot.complete ) continue;

     dump << "[ slot: "
          << ( slot.eventContext->valid() ? std::to_string( slot.eventContext->slot() ) : "[ctx invalid]" )
          << "  event: "
          << ( slot.eventContext->valid() ? std::to_string( slot.eventContext->evt() ) : "[ctx invalid]" )
          << " ]:\n\n";

     // Details are given for the target slot only, unless all slots were requested
     const bool detailed = ( iSlot < 0 || iSlot == slotIndex );
     if ( !detailed ) continue;

     // Snapshot of the Control Flow and FSM states
     dump << m_precSvc->printState( slot ) << "\n";

     // Mention sub slots (this is expensive if the number of sub-slots is high)
     if ( m_verboseSubSlots && !slot.allSubSlots.empty() ) {
       dump << "\nNumber of sub-slots: " << slot.allSubSlots.size() << "\n\n";
       auto parentID = slot.eventContext->valid() ? std::to_string( slot.eventContext->slot() ) : "[ctx invalid]";
       for ( auto& sub : slot.allSubSlots ) {
         dump << "[ slot: " << parentID << ", sub-slot: "
              << ( sub.eventContext->valid() ? std::to_string( sub.eventContext->subSlot() ) : "[ctx invalid]" )
              << ", entry: " << sub.entryPoint << ", event: "
              << ( sub.eventContext->valid() ? std::to_string( sub.eventContext->evt() ) : "[ctx invalid]" )
              << " ]:\n\n";
         dump << m_precSvc->printState( sub ) << "\n";
       }
     }
   }

   //===========================================================================

   if ( iSlot >= 0 ) {
     dump << "\n------------------------------ Algorithm Execution States -----------------------------\n\n";
     m_algExecStateSvc->dump( dump, *( m_eventSlots[iSlot].eventContext ) );
   }

   dump << "\n=========================================================================================\n"
        << "++++++++++++++++++++++++++++++++++++++ END OF DUMP ++++++++++++++++++++++++++++++++++++++\n"
        << "=========================================================================================\n\n";

   info() << dump.str() << endmsg;
 }

 //---------------------------------------------------------------------------

 /// Try to submit an algorithm for execution.
 ///
 /// An instance of the algorithm is requested from the algorithm resource pool. When one is
 /// obtained, the algorithm is pushed onto the scheduled queue, an AlgoExecutionTask is launched
 /// and the algorithm state becomes SCHEDULED. Otherwise the request is parked on the retry queue
 /// and the state becomes RESOURCELESS.
 ///
 /// @param iAlgo        index of the algorithm (translated to a name with index2algname)
 /// @param si           slot index, stored in the queue entry and used in log messages
 /// @param eventContext context of the event the algorithm is scheduled for
 /// @return the StatusCode returned by setAlgState for the new state
 StatusCode AvalancheSchedulerSvc::enqueue( unsigned int iAlgo, int si, EventContext* eventContext ) {

   const std::string& algName = index2algname( iAlgo );

   // The rank orders the scheduled queue; it stays 0 when no optimization mode is configured
   unsigned int rank = 0;
   if ( !m_optimizationMode.empty() ) rank = m_precSvc->getPriority( algName );

   // Ask the resource pool for an instance of the algorithm
   IAlgorithm* iAlgoPtr = nullptr;
   StatusCode  getAlgSC = m_algResourcePool->acquireAlgorithm( algName, iAlgoPtr );

   AState state;
   if ( !getAlgSC.isSuccess() ) {

     // No instance available: remember the request so that it can be retried
     m_retryQueue.push( {iAlgo, si, eventContext, rank, nullptr} );
     state = AState::RESOURCELESS;

   } else {

     // Instance acquired: queue the entry before launching the task
     m_scheduledQueue.push( {iAlgo, si, eventContext, rank, iAlgoPtr} );
     ++m_algosInFlight;

     // A thread pool size of -100 selects execution in the calling thread, bypassing tbb.
     // NOTE(review): the historical comment here said "if the pool size is 1" - confirm the sentinel.
     if ( -100 == m_threadPoolSize ) {
       AlgoExecutionTask theTask( this, serviceLocator(), m_algExecStateSvc );
       theTask.execute();
     } else {
       // Allocate the task that executes an Algorithm and hand it over to tbb
       tbb::task* algoTask =
           new ( tbb::task::allocate_root() ) AlgoExecutionTask( this, serviceLocator(), m_algExecStateSvc );
       tbb::task::enqueue( *algoTask );
     }

     ON_DEBUG debug() << "Algorithm " << algName << " was submitted on event " << eventContext->evt() << " in slot "
                      << si << ". Algorithms scheduled are " << m_algosInFlight << endmsg;

     state = AState::SCHEDULED;
   }

   // Record the new state of the algorithm
   StatusCode updateSc = setAlgState( iAlgo, eventContext, state );

   ON_VERBOSE {
     dumpSchedulerState( -1 );
     if ( updateSc.isSuccess() ) {
       verbose() << "Promoting " << algName << " to " << state << " on slot " << si << endmsg;
     }
   }

   return updateSc;
 }

 //---------------------------------------------------------------------------

 /// Try to submit an algorithm to the I/O-bound algorithm scheduler.
 ///
 /// The request is refused when the number of I/O-bound algorithms in flight has reached
 /// m_maxIOBoundAlgosInFlight, or when no algorithm instance can be acquired from the resource pool.
 /// On success an IOBoundAlgTask is pushed to m_IOBoundAlgScheduler and the algorithm state is set
 /// to SCHEDULED. If the push fails, the in-flight counter and the acquired instance are rolled back
 /// so that the request can be retried later.
 ///
 /// @param iAlgo        index of the algorithm (translated to a name with index2algname)
 /// @param si           slot index, used in log messages only
 /// @param eventContext context of the event the algorithm is scheduled for
 /// @return FAILURE when the in-flight cap is reached, the failing StatusCode of the acquisition
 ///         or of the push, otherwise the StatusCode returned by setAlgState
 StatusCode AvalancheSchedulerSvc::promoteToAsyncScheduled( unsigned int iAlgo, int si, EventContext* eventContext ) {

   // Respect the cap on concurrently scheduled I/O-bound algorithms
   if ( m_IOBoundAlgosInFlight == m_maxIOBoundAlgosInFlight ) return StatusCode::FAILURE;

   // bool IOBound = m_precSvc->isBlocking(algName);

   const std::string& algName( index2algname( iAlgo ) );
   IAlgorithm*        ialgoPtr = nullptr;
   StatusCode         sc( m_algResourcePool->acquireAlgorithm( algName, ialgoPtr ) );

   if ( !sc.isSuccess() ) {
     ON_DEBUG debug() << "[Asynchronous] Could not acquire instance for algorithm " << algName << " on slot " << si
                      << endmsg;
     return sc;
   }

   // We managed to get an algorithm instance: try to schedule it
   ++m_IOBoundAlgosInFlight;

   // Closure handed to the task: it queues an action calling promoteToAsyncExecuted.
   // Everything is captured by value because the closure outlives this call.
   auto promote2ExecutedClosure = [this, iAlgo, ialgoPtr, eventContext]() {
     this->m_actionsQueue.push( [this, iAlgo, ialgoPtr, eventContext]() {
       return this->AvalancheSchedulerSvc::promoteToAsyncExecuted( iAlgo, eventContext->slot(), ialgoPtr,
                                                                   eventContext );
     } );
     return StatusCode::SUCCESS;
   };
   // Can we use tbb-based overloaded new-operator for a "custom" task (an algorithm wrapper, not derived from
   // tbb::task)? it seems it works..

   // FIXME - The memory allocation here is causing memory leaks as detected by the gcc leak sanitizer
   //
   // clang-format off
   // Direct leak of 224 byte(s) in 7 object(s) allocated from:
   //   #0 0x7fc0cb524da8 in operator new(unsigned long) /afs/cern.ch/cms/CAF/CMSCOMM/COMM_ECAL/dkonst/GCC/build/contrib/gcc-8.2.0/src/gcc/8.2.0/libsanitizer/lsan/lsan_interceptors.cc:229
   //   #1 0x7fc0ba979f7b in function<AvalancheSchedulerSvc::promoteToAsyncScheduled(unsigned int, int, EventContext*)::<lambda()> > /cvmfs/lhcb.cern.ch/lib/lcg/releases/gcc/8.2.0-3fa06/x86_64-centos7/include/c++/8.2.0/bits/std_function.h:249
   //   #2 0x7fc0ba97d181 in AvalancheSchedulerSvc::promoteToAsyncScheduled(unsigned int, int, EventContext*) ../GaudiHive/src/AvalancheSchedulerSvc.cpp:969
   //   #3 0x7fc0ba98354d in AvalancheSchedulerSvc::updateStates(int, int, int, int) ../GaudiHive/src/AvalancheSchedulerSvc.cpp:660
   // clang-format on
   //
   // These leaks are currently suppressed in Gaudi/job/Gaudi-LSan.supp - remove entry there to reactivate
   //
   IOBoundAlgTask* theTask = new ( tbb::task::allocate_root() )
       IOBoundAlgTask( ialgoPtr, *eventContext, serviceLocator(), m_algExecStateSvc, promote2ExecutedClosure );
   if ( sc = m_IOBoundAlgScheduler->push( *theTask ); !sc ) {
     // The task was not accepted, so the completion closure is not expected to run for it
     // (NOTE(review): confirm against the IAccelerator::push contract). Undo the bookkeeping done
     // above, otherwise the in-flight counter drifts towards the cap and the instance is lost.
     --m_IOBoundAlgosInFlight;
     if ( m_algResourcePool->releaseAlgorithm( algName, ialgoPtr ).isFailure() ) {
       error() << "[Asynchronous] Instance of algorithm " << algName
               << " could not be properly put back after a failed submission." << endmsg;
     }
     return sc;
   }
   //
   // FIXME

   ON_DEBUG debug() << "[Asynchronous] Algorithm " << algName << " was submitted on event " << eventContext->evt()
                    << " in slot " << si << ". algorithms scheduled are " << m_IOBoundAlgosInFlight << endmsg;

   // Update alg state
   StatusCode updateSc = setAlgState( iAlgo, eventContext, AState::SCHEDULED );

   ON_VERBOSE if ( updateSc.isSuccess() ) verbose()
       << "[Asynchronous] Promoting " << algName << " to SCHEDULED on slot " << si << endmsg;
   return updateSc;
 }

 //---------------------------------------------------------------------------

 /// Handle the execution result of an algorithm.
 ///
 /// Decrements the number of algorithms in flight, translates the recorded execution state into
 /// EVTACCEPTED, EVTREJECTED or ERROR, stores it through setAlgState (with iteration enabled) and
 /// raises m_needsUpdate.
 ///
 /// @param iAlgo        index of the algorithm (translated to a name with index2algname)
 /// @param si           slot index, used in log messages only
 /// @param eventContext context of the event the algorithm ran on; becomes the current context
 /// @return the StatusCode returned by setAlgState
 StatusCode AvalancheSchedulerSvc::promoteToExecuted( unsigned int iAlgo, int si, EventContext* eventContext ) {

   const std::string& algName = index2algname( iAlgo );

   Gaudi::Hive::setCurrentContext( eventContext );

   --m_algosInFlight;

   ON_DEBUG debug() << "Trying to handle execution result of " << algName << " on slot " << si << endmsg;

   // Map the execution outcome onto the scheduler state: a failed execution is an ERROR,
   // otherwise the filter decision selects between accepted and rejected
   const AlgExecState& execState = m_algExecStateSvc->algExecState( algName, *eventContext );
   AState              newState  = AState::ERROR;
   if ( execState.execStatus().isSuccess() ) {
     newState = execState.filterPassed() ? AState::EVTACCEPTED : AState::EVTREJECTED;
   }

   // Store the new state and let the PrecedenceSvc iterate
   StatusCode updateSc = setAlgState( iAlgo, eventContext, newState, true );

   if ( updateSc.isSuccess() ) {
     ON_VERBOSE verbose() << "Promoting " << algName << " on slot " << si << " to " << newState << endmsg;
   }

   ON_DEBUG debug() << "Algorithm " << algName << " executed in slot " << si << ". Algorithms scheduled are "
                    << m_algosInFlight << endmsg;

   // Prompt a call to updateStates
   m_needsUpdate.store( true );

   return updateSc;
 }

 //---------------------------------------------------------------------------

 /// Handle the execution result of an asynchronously scheduled (I/O-bound) algorithm.
 ///
 /// The algorithm instance is handed back to the resource pool first; if that fails an error is
 /// reported and FAILURE is returned without touching the in-flight counter or the algorithm
 /// state. Otherwise the counter of I/O-bound algorithms in flight is decremented, the recorded
 /// execution state is translated into EVTACCEPTED, EVTREJECTED or ERROR, stored through
 /// setAlgState (with iteration enabled), and m_needsUpdate is raised.
 ///
 /// @param iAlgo        index of the algorithm
 /// @param si           slot index, used in log messages only
 /// @param algo         algorithm instance that was executed
 /// @param eventContext context of the event the algorithm ran on; becomes the current context
 /// @return FAILURE if the instance could not be released, else the StatusCode of setAlgState
 StatusCode AvalancheSchedulerSvc::promoteToAsyncExecuted( unsigned int iAlgo, int si, IAlgorithm* algo,
                                                           EventContext* eventContext ) {
   Gaudi::Hive::setCurrentContext( eventContext );

   // Give the instance back to the pool before anything else
   StatusCode releaseSc = m_algResourcePool->releaseAlgorithm( algo->name(), algo );
   if ( releaseSc.isFailure() ) {
     error() << "[Asynchronous]  [Event " << eventContext->evt() << ", Slot " << eventContext->slot() << "] "
             << "Instance of algorithm " << algo->name() << " could not be properly put back." << endmsg;
     return StatusCode::FAILURE;
   }

   --m_IOBoundAlgosInFlight;

   ON_DEBUG debug() << "[Asynchronous] Trying to handle execution result of " << algo->name() << " on slot " << si
                    << endmsg;

   // Map the execution outcome onto the scheduler state: a failed execution is an ERROR,
   // otherwise the filter decision selects between accepted and rejected
   const AlgExecState& execState = m_algExecStateSvc->algExecState( algo, *eventContext );
   AState              newState  = AState::ERROR;
   if ( execState.execStatus().isSuccess() ) {
     newState = execState.filterPassed() ? AState::EVTACCEPTED : AState::EVTREJECTED;
   }

   // Store the new state and let the PrecedenceSvc iterate
   StatusCode updateSc = setAlgState( iAlgo, eventContext, newState, true );

   if ( updateSc.isSuccess() ) {
     ON_VERBOSE verbose() << "[Asynchronous] Promoting " << algo->name() << " on slot " << si << " to " << newState
                          << endmsg;
   }

   ON_DEBUG debug() << "[Asynchronous] Algorithm " << algo->name() << " executed in slot " << si
                    << ". Algorithms scheduled are " << m_IOBoundAlgosInFlight << endmsg;

   // Prompt a call to updateStates
   m_needsUpdate.store( true );

   return updateSc;
 }

 //---------------------------------------------------------------------------

 // Method to inform the scheduler about event views

 /// Queue the registration of an event view (sub-slot) for a control-flow view node.
 ///
 /// Nothing is attached immediately: an action is pushed onto m_actionsQueue and performs the
 /// registration when it is executed. With a non-null view context the action adds a sub-slot to
 /// the event slot of the source context; with a null view context it disables sub-slots for the
 /// node instead.
 ///
 /// @param sourceContext context of the top-level event; must not itself use a sub-slot
 /// @param nodeName      name of the view node the view belongs to
 /// @param viewContext   context of the view (ownership is taken), or null if there are no views
 /// @return FAILURE when view nesting is attempted, SUCCESS once the action has been queued
 StatusCode AvalancheSchedulerSvc::scheduleEventView( const EventContext* sourceContext, const std::string& nodeName,
                                                      std::unique_ptr<EventContext> viewContext ) {
   //  Prevent view nesting
   if ( sourceContext->usesSubSlot() ) {
     fatal() << "Attempted to nest EventViews at node " << nodeName << ": this is not supported" << endmsg;
     return StatusCode::FAILURE;
   }

   ON_VERBOSE verbose() << "Queuing a view for [" << viewContext.get() << "]" << endmsg;

   // It's not possible to create an std::function from a move-capturing lambda
   // So, we have to release the unique pointer
   //
   // nodeName is captured by value: the action is executed after this function has returned,
   // when the caller's string may no longer exist, so a reference capture could dangle.
   auto action = [this, slotIndex = sourceContext->slot(), viewContextPtr = viewContext.release(),
                  nodeName]() -> StatusCode {
     // Attach the sub-slot to the top-level slot
     EventSlot& topSlot = this->m_eventSlots[slotIndex];

     if ( viewContextPtr ) {
       // Re-create the unique pointer
       auto viewContext = std::unique_ptr<EventContext>( viewContextPtr );
       topSlot.addSubSlot( std::move( viewContext ), nodeName );
       return StatusCode::SUCCESS;
     } else {
       // Disable the view node if there are no views
       topSlot.disableSubSlots( nodeName );
       return StatusCode::SUCCESS;
     }
   };

   m_actionsQueue.push( std::move( action ) );

   return StatusCode::SUCCESS;
 }
IThreadPoolSvc::initPool
virtual StatusCode initPool(const int &poolSize)=0
Initializes the thread pool.

AvalancheSchedulerSvc::m_showDataFlow
Gaudi::Property< bool > m_showDataFlow
Definition: AvalancheSchedulerSvc.h:180

ON_DEBUG
#define ON_DEBUG
Definition: AvalancheSchedulerSvc.cpp:45

AvalancheSchedulerSvc::isStalled
bool isStalled(const EventSlot &) const
Check if scheduling in a particular slot is in a stall.
Definition: AvalancheSchedulerSvc.cpp:717

IOBoundAlgTask
Wrapper around I/O-bound Gaudi-algorithms.
Definition: IOBoundAlgTask.h:33

AvalancheSchedulerSvc::AlgQueueEntry::contextPtr
EventContext * contextPtr
Definition: AvalancheSchedulerSvc.h:282

AvalancheSchedulerSvc::tryPopFinishedEvent
StatusCode tryPopFinishedEvent(EventContext *&eventContext) override
Try to fetch an event from the scheduler.
Definition: AvalancheSchedulerSvc.cpp:557

AvalancheSchedulerSvc::scheduleEventView
virtual StatusCode scheduleEventView(const EventContext *sourceContext, const std::string &nodeName, std::unique_ptr< EventContext > viewContext) override
Method to inform the scheduler about event views.
Definition: AvalancheSchedulerSvc.cpp:1058

Service::initialize
StatusCode initialize() override
Definition: Service.cpp:70

SmartIF< IMessageSvc >

Service::serviceLocator
SmartIF< ISvcLocator > & serviceLocator() const override
Retrieve pointer to service locator.
Definition: Service.cpp:287

EventSlot
Class representing an event slot.
Definition: EventSlot.h:24

IAlgResourcePool::acquireAlgorithm
virtual StatusCode acquireAlgorithm(const std::string &name, IAlgorithm *&algo, bool blocking=false)=0
Acquire a certain algorithm using its name.

Cause::source::Task

EventContext::slot
ContextID_t slot() const
Definition: EventContext.h:51

std::unordered_set::empty
T empty(T... args)

AvalancheSchedulerSvc::INACTIVE
Definition: AvalancheSchedulerSvc.h:151

AvalancheSchedulerSvc::m_whiteboardSvcName
Gaudi::Property< std::string > m_whiteboardSvcName
Definition: AvalancheSchedulerSvc.h:156

AvalancheSchedulerSvc::m_IOBoundAlgosInFlight
unsigned int m_IOBoundAlgosInFlight
Number of algorithms presently in flight.
Definition: AvalancheSchedulerSvc.h:242

std::ofstream::open
T open(T... args)

concurrency::PrecedenceRulesGraph::getAlgorithmNode
AlgorithmNode * getAlgorithmNode(const std::string &algoName) const
Get the AlgorithmNode by algorithm name using graph index.
Definition: PrecedenceRulesGraph.h:664

AvalancheSchedulerSvc::m_precSvc
SmartIF< IPrecedenceSvc > m_precSvc
A shortcut to the Precedence Service.
Definition: AvalancheSchedulerSvc.h:215

IPrecedenceSvc::iterate
virtual StatusCode iterate(EventSlot &, const Cause &)=0
Infer the precedence effect caused by an execution flow event.

AlgsExecutionStates::containsAny
bool containsAny(std::initializer_list< State > l) const
check if the collection contains at least one state of any listed types
Definition: AlgsExecutionStates.h:61

EventContext::evt
ContextEvt_t evt() const
Definition: EventContext.h:50

EventSlot::disableSubSlots
void disableSubSlots(const std::string &nodeName)
Disable event views for a given CF view node by registering an empty container Contact B.
Definition: EventSlot.h:78

Service::finalize
StatusCode finalize() override
Definition: Service.cpp:174

std::function< StatusCode()>

IAlgorithm::type
virtual const std::string & type() const =0
The type of the algorithm.

DataObjID
Definition: DataObjID.h:47

AvalancheSchedulerSvc::m_dumpIntraEventDynamics
Gaudi::Property< bool > m_dumpIntraEventDynamics
Definition: AvalancheSchedulerSvc.h:165

AvalancheSchedulerSvc::index2algname
const std::string & index2algname(unsigned int index)
Convert an integer to a name.
Definition: AvalancheSchedulerSvc.h:209

AvalancheSchedulerSvc::m_showDataDeps
Gaudi::Property< bool > m_showDataDeps
Definition: AvalancheSchedulerSvc.h:177

CommonMessagingBase::warning
MsgStream & warning() const
shortcut for the method msgStream(MSG::WARNING)
Definition: CommonMessaging.h:111

EventSlot::addSubSlot
void addSubSlot(std::unique_ptr< EventContext > viewContext, const std::string &nodeName)
Add a subslot to the slot (this constructs a new slot and registers it with the parent one)
Definition: EventSlot.h:61

AvalancheSchedulerSvc::m_needsUpdate
std::atomic< bool > m_needsUpdate
Definition: AvalancheSchedulerSvc.h:297

IAlgExecStateSvc::eventStatus
virtual const EventStatus::Status & eventStatus(const EventContext &ctx) const =0

AvalancheSchedulerSvc::initialize
StatusCode initialize() override
Initialise.
Definition: AvalancheSchedulerSvc.cpp:77

AvalancheSchedulerSvc::dumpSchedulerState
void dumpSchedulerState(int iSlot)
Dump the state of the scheduler.
Definition: AvalancheSchedulerSvc.cpp:756

IAlgorithm.h

AlgoExecutionTask
Definition: AlgoExecutionTask.h:26

ThreadLocalContext.h

PrecedenceSvc
A service to resolve the task execution precedence.
Definition: PrecedenceSvc.h:31

std::to_string
T to_string(T... args)

std::atomic::store
T store(T... args)

IOBoundAlgTask.h

SmartIF::isValid
bool isValid() const
Allow for check if smart pointer is valid.
Definition: SmartIF.h:72

StatusCode::SUCCESS
constexpr static const auto SUCCESS
Definition: StatusCode.h:100

TimelineEvent::algorithm
std::string algorithm
Definition: ITimelineSvc.h:31

AlgExecState::filterPassed
bool filterPassed() const
Definition: IAlgExecStateSvc.h:41

AvalancheSchedulerSvc::ACTIVE
Definition: AvalancheSchedulerSvc.h:151

AvalancheSchedulerSvc::activate
void activate()
Activate scheduler.
Definition: AvalancheSchedulerSvc.cpp:373

std::vector::end
T end(T... args)

AvalancheSchedulerSvc::m_useDataLoader
Gaudi::Property< std::string > m_useDataLoader
Definition: AvalancheSchedulerSvc.h:172

EventSlot::allSubSlots
std::vector< EventSlot > allSubSlots
Actual sub-slot instances.
Definition: EventSlot.h:100

AvalancheSchedulerSvc::m_optimizationMode
Gaudi::Property< std::string > m_optimizationMode
Definition: AvalancheSchedulerSvc.h:163

IPrecedenceSvc::simulate
virtual StatusCode simulate(EventSlot &) const =0
Simulate execution flow.

CommonMessagingBase::info
MsgStream & info() const
shortcut for the method msgStream(MSG::INFO)
Definition: CommonMessaging.h:114

AvalancheSchedulerSvc::AlgQueueEntry
Struct to hold entries in the alg queues.
Definition: AvalancheSchedulerSvc.h:279

IPrecedenceSvc::CFRulesResolved
virtual bool CFRulesResolved(EventSlot &) const =0
Check if control flow rules are resolved.

TimelineEvent
Definition: ITimelineSvc.h:23

IAlgResourcePool::getFlatAlgList
virtual std::list< IAlgorithm * > getFlatAlgList()=0
Get the flat list of algorithms.

MSG::VERBOSE
Definition: IMessageSvc.h:25

std::thread::hardware_concurrency
T hardware_concurrency(T... args)

SmartIF::get
TYPE * get() const
Get interface pointer.
Definition: SmartIF.h:86

EventContext
This class represents an entry point to all the event specific data.
Definition: EventContext.h:34

std::map
STL class.

AvalancheSchedulerSvc::AlgQueueEntry::algIndex
unsigned int algIndex
Definition: AvalancheSchedulerSvc.h:280

std::stringstream
STL class.

DataObjID::fullKey
std::string fullKey() const
Definition: DataObjID.cpp:99

AvalancheSchedulerSvc::AlgoExecutionTask
friend class AlgoExecutionTask
Definition: AvalancheSchedulerSvc.h:113

std::unique_ptr::release
T release(T... args)

AvalancheSchedulerSvc::m_isActive
std::atomic< ActivationState > m_isActive
Flag to track if the scheduler is active or not.
Definition: AvalancheSchedulerSvc.h:197

std::setw
T setw(T... args)

CommonMessaging< implements< IService, IProperty, IStateful > >::msgLevel
MSG::Level msgLevel() const
get the cached level (originally extracted from the embedded MsgStream)
Definition: CommonMessaging.h:148

AvalancheSchedulerSvc::m_algname_index_map
std::unordered_map< std::string, unsigned int > m_algname_index_map
Map to bookkeep the information necessary to the name2index conversion.
Definition: AvalancheSchedulerSvc.h:203

std::vector::resize
T resize(T... args)

AlgoExecutionTask::execute
tbb::task * execute() override
Definition: AlgoExecutionTask.cpp:31

AvalancheSchedulerSvc::m_checkDeps
Gaudi::Property< bool > m_checkDeps
Definition: AvalancheSchedulerSvc.h:170

std::string
STL class.

AvalancheSchedulerSvc::m_useIOBoundAlgScheduler
Gaudi::Property< bool > m_useIOBoundAlgScheduler
Definition: AvalancheSchedulerSvc.h:167

IAlgExecStateSvc::algExecState
virtual const AlgExecState & algExecState(const Gaudi::StringKey &algName, const EventContext &ctx) const =0

DECLARE_COMPONENT
#define DECLARE_COMPONENT(type)
Definition: PluginServiceV1.h:46

concurrency::AlgorithmNode::getAlgoIndex
const unsigned int & getAlgoIndex() const
Get algorithm index.
Definition: PrecedenceRulesGraph.h:523

AvalancheSchedulerSvc::m_freeSlots
std::atomic_int m_freeSlots
Atomic to account for asynchronous updates by the scheduler wrt the rest.
Definition: AvalancheSchedulerSvc.h:227

std::vector::at
T at(T... args)

IThreadPoolSvc::terminatePool
virtual StatusCode terminatePool()=0
Finalize the thread pool.

AvalancheSchedulerSvc::pushNewEvents
StatusCode pushNewEvents(std::vector< EventContext * > &eventContexts) override
Definition: AvalancheSchedulerSvc.cpp:519

ISvcLocator::service
StatusCode service(const Gaudi::Utils::TypeNameString &name, T *&svc, bool createIf=true)
Templated method to access a service by name.
Definition: ISvcLocator.h:86

Service::name
const std::string & name() const override
Retrieve name of the service.
Definition: Service.cpp:284

AvalancheSchedulerSvc::m_algosInFlight
unsigned int m_algosInFlight
Number of algorithms presently in flight.
Definition: AvalancheSchedulerSvc.h:239

std::vector::push_back
T push_back(T... args)

std::ofstream
STL class.

CommonMessagingBase::error
MsgStream & error() const
shortcut for the method msgStream(MSG::ERROR)
Definition: CommonMessaging.h:108

AvalancheSchedulerSvc::m_verboseSubSlots
Gaudi::Property< bool > m_verboseSubSlots
Definition: AvalancheSchedulerSvc.h:186

AvalancheSchedulerSvc::m_algResourcePool
SmartIF< IAlgResourcePool > m_algResourcePool
Cache for the algorithm resource pool.
Definition: AvalancheSchedulerSvc.h:271

IDataManagerSvc.h

AlgsExecutionStates
The AlgsExecutionStates encodes the state machine for the execution of algorithms within a single eve...
Definition: AlgsExecutionStates.h:36

IAlgExecStateSvc::dump
virtual void dump(std::ostringstream &ost, const EventContext &ctx) const =0

AvalancheSchedulerSvc::popFinishedEvent
StatusCode popFinishedEvent(EventContext *&eventContext) override
Blocks until an event is available.
Definition: AvalancheSchedulerSvc.cpp:536

std::thread::join
T join(T... args)

Cause
Definition: PrecedenceRulesGraph.h:397

IPrecedenceSvc::dumpPrecedenceRules
virtual void dumpPrecedenceRules(EventSlot &)=0
Dump precedence rules.

Algorithm.h

AvalancheSchedulerSvc::m_showControlFlow
Gaudi::Property< bool > m_showControlFlow
Definition: AvalancheSchedulerSvc.h:183

StatusCode
This class is used for returning status codes from appropriate routines.
Definition: StatusCode.h:61

AvalancheSchedulerSvc::m_whiteboard
SmartIF< IHiveWhiteBoard > m_whiteboard
A shortcut to the whiteboard.
Definition: AvalancheSchedulerSvc.h:218

std::ostringstream
STL class.

AvalancheSchedulerSvc::m_finishedEvents
tbb::concurrent_bounded_queue< EventContext * > m_finishedEvents
Queue of finished events.
Definition: AvalancheSchedulerSvc.h:230

AvalancheSchedulerSvc::m_algname_vect
std::vector< std::string > m_algname_vect
Vector to bookkeep the information necessary to the index2name conversion.
Definition: AvalancheSchedulerSvc.h:209

std::ofstream::close
T close(T... args)

AlgExecState::execStatus
const StatusCode & execStatus() const
Definition: IAlgExecStateSvc.h:43

AlgsExecutionStates::sizeOfSubset
size_t sizeOfSubset(State state) const
Definition: AlgsExecutionStates.h:75

AlgsExecutionStates::set
StatusCode set(unsigned int iAlgo, State newState)
Definition: AlgsExecutionStates.cpp:23

CommonMessagingBase::verbose
MsgStream & verbose() const
shortcut for the method msgStream(MSG::VERBOSE)
Definition: CommonMessaging.h:120

compareRootHistos.state
def state
Definition: compareRootHistos.py:468

EventStatus::AlgStall
Definition: IAlgExecStateSvc.h:73

AvalancheSchedulerSvc::m_IOBoundAlgSchedulerSvcName
Gaudi::Property< std::string > m_IOBoundAlgSchedulerSvcName
Definition: AvalancheSchedulerSvc.h:157

std::ostringstream::str
T str(T... args)

EventStatus::Success
Definition: IAlgExecStateSvc.h:73

IAlgExecStateSvc::setEventStatus
virtual void setEventStatus(const EventStatus::Status &sc, const EventContext &ctx)=0

Cause::source::Root

CommonMessagingBase::debug
MsgStream & debug() const
shortcut for the method msgStream(MSG::DEBUG)
Definition: CommonMessaging.h:117

concurrency::PrecedenceRulesGraph::getControlFlowNodeCounter
unsigned int getControlFlowNodeCounter() const
Get total number of control flow graph nodes.
Definition: PrecedenceRulesGraph.h:672

AvalancheSchedulerSvc::finalize
StatusCode finalize() override
Finalise.
Definition: AvalancheSchedulerSvc.cpp:342

std::unordered_set< DataObjID, DataObjID_Hasher >

IHiveWhiteBoard::getNumberOfStores
virtual size_t getNumberOfStores() const =0
Get the number of 'slots'.

DataHandleHolderVisitor.h

AvalancheSchedulerSvc::m_threadPoolSize
Gaudi::Property< int > m_threadPoolSize
Definition: AvalancheSchedulerSvc.h:153

IPrecedenceSvc::dumpDataFlow
virtual void dumpDataFlow() const =0

ITimelineSvc
Definition: ITimelineSvc.h:37

StatusCode::isSuccess
bool isSuccess() const
Definition: StatusCode.h:365

AvalancheSchedulerSvc::m_threadPoolSvc
SmartIF< IThreadPoolSvc > m_threadPoolSvc
Definition: AvalancheSchedulerSvc.h:302

std::list< IAlgorithm * >

AvalancheSchedulerSvc::m_IOBoundAlgScheduler
SmartIF< IAccelerator > m_IOBoundAlgScheduler
A shortcut to IO-bound algorithm scheduler.
Definition: AvalancheSchedulerSvc.h:221

std::max
T max(T... args)

IAlgorithm
The IAlgorithm is the interface implemented by the Algorithm base class.
Definition: IAlgorithm.h:38

AlgsExecutionStates::State
State
Execution states of the algorithms.
Definition: AlgsExecutionStates.h:39

Gaudi::Hive::setCurrentContext
GAUDI_API void setCurrentContext(const EventContext *ctx)
Definition: ThreadLocalContext.cpp:41

std::move
T move(T... args)

AvalancheSchedulerSvc
Definition: AvalancheSchedulerSvc.h:112

AvalancheSchedulerSvc::promoteToAsyncScheduled
StatusCode promoteToAsyncScheduled(unsigned int iAlgo, int si, EventContext *)
Definition: AvalancheSchedulerSvc.cpp:923

EventContext::subSlot
ContextID_t subSlot() const
Definition: EventContext.h:52

std::unique_ptr::get
T get(T... args)

std::unordered_set::insert
T insert(T... args)

DataHandleHolderBase::addDependency
void addDependency(const DataObjID &id, const Gaudi::DataHandle::Mode &mode) override
Definition: DataHandleHolderBase.h:68

DataHandleHolderBase::outputDataObjs
const DataObjIDColl & outputDataObjs() const override
Definition: DataHandleHolderBase.h:66

std::find_if
T find_if(T... args)

std::unordered_set::size
T size(T... args)

StatusCode::ignore
const StatusCode & ignore() const
Ignore/check StatusCode.
Definition: StatusCode.h:168

AvalancheSchedulerSvc::pushNewEvent
StatusCode pushNewEvent(EventContext *eventContext) override
Make an event available to the scheduler.
Definition: AvalancheSchedulerSvc.cpp:461

std::vector
STL class.

std::unique_ptr< EventContext >

AvalancheSchedulerSvc::m_simulateExecution
Gaudi::Property< bool > m_simulateExecution
Definition: AvalancheSchedulerSvc.h:160

AvalancheSchedulerSvc::setAlgState
StatusCode setAlgState(unsigned int iAlgo, EventContext *contextPtr, AState state, bool iterate=false)
Definition: AvalancheSchedulerSvc.cpp:691

AvalancheSchedulerSvc::updateStates
StatusCode updateStates()
Loop on algorithm in the slots and promote them to successive states.
Definition: AvalancheSchedulerSvc.cpp:580

std::vector::begin
T begin(T... args)

AvalancheSchedulerSvc::AlgQueueEntry::slotIndex
int slotIndex
Definition: AvalancheSchedulerSvc.h:281

AlgsExecutionStates::begin
Iterator begin(State kind)
Definition: AlgsExecutionStates.h:114

std::chrono::high_resolution_clock::now
T now(T... args)

std::any_of
T any_of(T... args)

AvalancheSchedulerSvc::m_enableCondSvc
Gaudi::Property< bool > m_enableCondSvc
Definition: AvalancheSchedulerSvc.h:175

ConcurrencyFlags.h

Gaudi::Algorithm
Base class from which all concrete algorithm classes should be derived.
Definition: Algorithm.h:89

AvalancheSchedulerSvc::m_maxAlgosInFlight
size_t m_maxAlgosInFlight
Definition: AvalancheSchedulerSvc.h:304

IPrecedenceSvc::getPriority
virtual uint getPriority(const std::string &) const =0
Get task priority.

std::vector::back
T back(T... args)

gaudirun.s
string s
Definition: gaudirun.py:328

AvalancheSchedulerSvc::enqueue
StatusCode enqueue(unsigned int iAlgo, int si, EventContext *)
Algorithm promotion.
Definition: AvalancheSchedulerSvc.cpp:866

StatusCode::FAILURE
constexpr static const auto FAILURE
Definition: StatusCode.h:101

Gaudi::DataHandle::Writer
Definition: DataHandle.h:39

std::hex
T hex(T... args)

MSG::ERROR
Definition: IMessageSvc.h:25

AvalancheSchedulerSvc::m_condSvc
SmartIF< ICondSvc > m_condSvc
A shortcut to service for Conditions handling.
Definition: AvalancheSchedulerSvc.h:236

AvalancheSchedulerSvc::eventFailed
void eventFailed(EventContext *eventContext)
Method to execute if an event failed.
Definition: AvalancheSchedulerSvc.cpp:735

AvalancheSchedulerSvc::freeSlots
unsigned int freeSlots() override
Get free slots number.
Definition: AvalancheSchedulerSvc.cpp:530

AvalancheSchedulerSvc::m_eventSlots
std::vector< EventSlot > m_eventSlots
Vector of events slots.
Definition: AvalancheSchedulerSvc.h:224

EventSlot::complete
bool complete
Flags completion of the event.
Definition: EventSlot.h:89

std::sort
T sort(T... args)

AvalancheSchedulerSvc::promoteToAsyncExecuted
StatusCode promoteToAsyncExecuted(unsigned int iAlgo, int si, IAlgorithm *algo, EventContext *)
The call to this method is triggered only from within the IOBoundAlgTask.
Definition: AvalancheSchedulerSvc.cpp:1019

AvalancheSchedulerSvc::deactivate
StatusCode deactivate()
Deactivate scheduler.
Definition: AvalancheSchedulerSvc.cpp:430

StatusCode::isFailure
bool isFailure() const
Definition: StatusCode.h:145

IAccelerator::push
virtual StatusCode push(IAlgTask &task)=0

AvalancheSchedulerSvc::m_scheduledQueue
tbb::concurrent_priority_queue< AlgQueueEntry, AlgQueueSort > m_scheduledQueue
Queues for scheduled algorithms.
Definition: AvalancheSchedulerSvc.h:293

AvalancheSchedulerSvc::FAILURE
Definition: AvalancheSchedulerSvc.h:151

DataHandleHolderBase::inputDataObjs
const DataObjIDColl & inputDataObjs() const override
Definition: DataHandleHolderBase.h:65

EventSlot::reset
void reset(EventContext *theeventContext)
Reset all resources in order to reuse the slot (thread-unsafe)
Definition: EventSlot.h:49

IPrecedenceSvc::dumpControlFlow
virtual void dumpControlFlow() const =0
Dump precedence rules.

IAlgResourcePool::releaseAlgorithm
virtual StatusCode releaseAlgorithm(const std::string &name, IAlgorithm *&algo)=0
Release a certain algorithm.

AlgExecState
Definition: IAlgExecStateSvc.h:37

IPrecedenceSvc::isBlocking
virtual bool isBlocking(const std::string &) const =0
Check if a task is CPU-blocking.

AvalancheSchedulerSvc::m_retryQueue
std::queue< AlgQueueEntry > m_retryQueue
Definition: AvalancheSchedulerSvc.h:294

std::thread
STL class.

AvalancheSchedulerSvc::m_algExecStateSvc
SmartIF< IAlgExecStateSvc > m_algExecStateSvc
Algorithm execution state manager.
Definition: AvalancheSchedulerSvc.h:233

AvalancheSchedulerSvc::m_maxIOBoundAlgosInFlight
Gaudi::Property< unsigned int > m_maxIOBoundAlgosInFlight
Definition: AvalancheSchedulerSvc.h:158

CommonMessagingBase::fatal
MsgStream & fatal() const
shortcut for the method msgStream(MSG::FATAL)
Definition: CommonMessaging.h:102

IPrecedenceSvc::printState
virtual const std::string printState(EventSlot &) const =0

AvalancheSchedulerSvc::m_maxEventsInFlight
size_t m_maxEventsInFlight
Definition: AvalancheSchedulerSvc.h:303

endmsg
MsgStream & endmsg(MsgStream &s)
MsgStream Modifier: endmsg. Calls the output method of the MsgStream.
Definition: MsgStream.h:202

std::initializer_list

AvalancheSchedulerSvc.h

AvalancheSchedulerErrorTest.threads
int threads
Definition: AvalancheSchedulerErrorTest.py:27

EventSlot::eventContext
std::unique_ptr< EventContext > eventContext
Cache for the eventContext.
Definition: EventSlot.h:83

AvalancheSchedulerSvc::m_actionsQueue
tbb::concurrent_bounded_queue< action > m_actionsQueue
Queue where closures are stored and picked for execution.
Definition: AvalancheSchedulerSvc.h:276

AlgoExecutionTask.h

std::atomic::load
T load(T... args)

PrecedenceSvc::getRules
const concurrency::PrecedenceRulesGraph * getRules() const
Precedence rules accessor.
Definition: PrecedenceSvc.h:73

Gaudi::Algorithm::name
const std::string & name() const override
The identifying name of the algorithm object.
Definition: Algorithm.cpp:549

EventSlot::algsStates
AlgsExecutionStates algsStates
Vector of algorithms states.
Definition: EventSlot.h:85

std::vector::reserve
T reserve(T... args)

AvalancheSchedulerSvc::promoteToExecuted
StatusCode promoteToExecuted(unsigned int iAlgo, int si, EventContext *)
The call to this method is triggered only from within the AlgoExecutionTask.
Definition: AvalancheSchedulerSvc.cpp:985

std::vector::emplace_back
T emplace_back(T... args)

AvalancheSchedulerSvc::m_thread
std::thread m_thread
The thread in which the activate function runs.
Definition: AvalancheSchedulerSvc.h:200

EventContext::usesSubSlot
bool usesSubSlot() const
Definition: EventContext.h:53

ON_VERBOSE
#define ON_VERBOSE
Definition: AvalancheSchedulerSvc.cpp:46

AlgsExecutionStates::end
Iterator end(State kind)
Definition: AlgsExecutionStates.h:115