GPU: Ensure that gpu-prepare-workflow and gpu-workflow process time frames in the same order via completion policy

davidrohr · davidrohr · commit e01747a967eb · 2023-09-24T00:58:46.000+02:00
diff --git a/GPU/Workflow/include/GPUWorkflow/GPUWorkflowSpec.h b/GPU/Workflow/include/GPUWorkflow/GPUWorkflowSpec.h
@@ -27,6 +27,7 @@
 #include <array>
 #include <vector>
 #include <mutex>
+#include <functional>
 
 class TStopwatch;
 namespace fair::mq
@@ -122,7 +123,7 @@ class GPURecoWorkflowSpec : public o2::framework::Task
     bool tpcTriggerHandling = false;
   };
 
-  GPURecoWorkflowSpec(CompletionPolicyData* policyData, Config const& specconfig, std::vector<int> const& tpcsectors, unsigned long tpcSectorMask, std::shared_ptr<o2::base::GRPGeomRequest>& ggr);
+  GPURecoWorkflowSpec(CompletionPolicyData* policyData, Config const& specconfig, std::vector<int> const& tpcsectors, unsigned long tpcSectorMask, std::shared_ptr<o2::base::GRPGeomRequest>& ggr, std::function<bool(o2::framework::DataProcessingHeader::StartTime)>** gPolicyOrder = nullptr);
   ~GPURecoWorkflowSpec() override;
   void init(o2::framework::InitContext& ic) final;
   void run(o2::framework::ProcessingContext& pc) final;
@@ -162,8 +163,10 @@ class GPURecoWorkflowSpec : public o2::framework::Task
   void RunReceiveThread();
   void TerminateReceiveThread();
   void handlePipelineEndOfStream(o2::framework::EndOfStreamContext& ec);
+  void initPipeline(o2::framework::InitContext& ic);
 
   CompletionPolicyData* mPolicyData;
+  std::function<bool(o2::framework::DataProcessingHeader::StartTime)> mPolicyOrder;
   std::unique_ptr<GPUO2Interface> mGPUReco;
   std::unique_ptr<GPUDisplayFrontendInterface> mDisplayFrontend;
   std::unique_ptr<TPCFastTransform> mFastTransform;
diff --git a/GPU/Workflow/src/GPUWorkflowInternal.h b/GPU/Workflow/src/GPUWorkflowInternal.h
@@ -47,13 +47,17 @@ struct GPURecoWorkflowSpec_PipelineInternals {
   fair::mq::Device* fmqDevice;
 
   std::thread receiveThread;
-  std::condition_variable notifyThread;
   std::mutex threadMutex;
   volatile bool shouldTerminate = false;
 
   std::queue<std::unique_ptr<GPURecoWorkflow_QueueObject>> pipelineQueue;
   std::mutex queueMutex;
   std::condition_variable queueNotify;
+
+  std::queue<o2::framework::DataProcessingHeader::StartTime> completionPolicyQueue;
+  bool pipelineSenderTerminating = false;
+  std::mutex completionPolicyMutex;
+  std::condition_variable completionPolicyNotify;
 };
 
 } // namespace gpurecoworkflow_internals
diff --git a/GPU/Workflow/src/GPUWorkflowPipeline.cxx b/GPU/Workflow/src/GPUWorkflowPipeline.cxx
@@ -56,6 +56,23 @@ struct pipelinePrepareMessage {
   bool flagEndOfStream;
 };
 
+/// Set up the receiving side of the double pipeline.
+///
+/// Only acts when mSpecConfig.enableDoublePipeline == 1: stores the FairMQ device obtained from
+/// the RawDeviceService, installs the mPolicyOrder callback, and starts the thread that runs
+/// RunReceiveThread().
+/// @param ic init context used to look up the RawDeviceService
+void GPURecoWorkflowSpec::initPipeline(o2::framework::InitContext& ic)
+{
+  if (mSpecConfig.enableDoublePipeline == 1) {
+    mPipeline->fmqDevice = ic.services().get<RawDeviceService>().device();
+    // Blocks until a time slice id has been queued or the receive thread has flagged termination,
+    // then reports whether `timeslice` is at the head of the queue (consuming the entry if so).
+    mPolicyOrder = [this](o2::framework::DataProcessingHeader::StartTime timeslice) {
+      std::unique_lock lk(mPipeline->completionPolicyMutex);
+      mPipeline->completionPolicyNotify.wait(lk, [pipeline = mPipeline.get()] { return pipeline->pipelineSenderTerminating || !pipeline->completionPolicyQueue.empty(); });
+      // The wait also ends on termination with nothing queued; calling front() on an empty
+      // std::queue is undefined behaviour, so treat that case as "not the next time slice".
+      if (!mPipeline->completionPolicyQueue.empty() && mPipeline->completionPolicyQueue.front() == timeslice) {
+        mPipeline->completionPolicyQueue.pop();
+        return true;
+      }
+      return false;
+    };
+    mPipeline->receiveThread = std::thread([this]() { RunReceiveThread(); });
+  }
+}
+
 int GPURecoWorkflowSpec::handlePipeline(ProcessingContext& pc, GPUTrackingInOutPointers& ptrs, GPURecoWorkflowSpec_TPCZSBuffers& tpcZSmeta, o2::gpu::GPUTrackingInOutZS& tpcZS)
 {
   auto* device = pc.services().get<RawDeviceService>().device();
@@ -184,8 +201,8 @@ void GPURecoWorkflowSpec::RunReceiveThread()
       LOG(fatal) << "Prepare message corrupted, invalid magic word";
     }
     if (m->flagEndOfStream) {
-      LOG(info) << "Received end-of-stream from out-of-band channel";
-      continue;
+      LOG(info) << "Received end-of-stream from out-of-band channel, terminating receive thread"; // TODO: Breaks START / STOP / START
+      break;
     }
 
     auto o = std::make_unique<GPURecoWorkflow_QueueObject>();
@@ -220,12 +237,22 @@ void GPURecoWorkflowSpec::RunReceiveThread()
       }
     }
     o->ptrs.tpcZS = &o->tpcZS;
+    {
+      std::lock_guard lk(mPipeline->completionPolicyMutex);
+      mPipeline->completionPolicyQueue.emplace(m->timeSliceId);
+    }
+    mPipeline->completionPolicyNotify.notify_one();
     {
       std::lock_guard lk(mPipeline->queueMutex);
       mPipeline->pipelineQueue.emplace(std::move(o));
     }
     mPipeline->queueNotify.notify_one();
   }
+  {
+    std::lock_guard lk(mPipeline->completionPolicyMutex);
+    mPipeline->pipelineSenderTerminating = true;
+  }
+  mPipeline->completionPolicyNotify.notify_one();
 }
 
 void GPURecoWorkflowSpec::TerminateReceiveThread()
diff --git a/GPU/Workflow/src/GPUWorkflowSpec.cxx b/GPU/Workflow/src/GPUWorkflowSpec.cxx
@@ -107,7 +107,7 @@ using namespace o2::gpu::gpurecoworkflow_internals;
 namespace o2::gpu
 {
 
-GPURecoWorkflowSpec::GPURecoWorkflowSpec(GPURecoWorkflowSpec::CompletionPolicyData* policyData, Config const& specconfig, std::vector<int> const& tpcsectors, unsigned long tpcSectorMask, std::shared_ptr<o2::base::GRPGeomRequest>& ggr) : o2::framework::Task(), mPolicyData(policyData), mTPCSectorMask(tpcSectorMask), mTPCSectors(tpcsectors), mSpecConfig(specconfig), mGGR(ggr)
+GPURecoWorkflowSpec::GPURecoWorkflowSpec(GPURecoWorkflowSpec::CompletionPolicyData* policyData, Config const& specconfig, std::vector<int> const& tpcsectors, unsigned long tpcSectorMask, std::shared_ptr<o2::base::GRPGeomRequest>& ggr, std::function<bool(o2::framework::DataProcessingHeader::StartTime)>** gPolicyOrder) : o2::framework::Task(), mPolicyData(policyData), mTPCSectorMask(tpcSectorMask), mTPCSectors(tpcsectors), mSpecConfig(specconfig), mGGR(ggr)
 {
   if (mSpecConfig.outputCAClusters && !mSpecConfig.caClusterer && !mSpecConfig.decompressTPC) {
     throw std::runtime_error("inconsistent configuration: cluster output is only possible if CA clusterer is activated");
@@ -118,6 +118,10 @@ GPURecoWorkflowSpec::GPURecoWorkflowSpec(GPURecoWorkflowSpec::CompletionPolicyDa
   mTFSettings.reset(new GPUSettingsTF);
   mTimer.reset(new TStopwatch);
   mPipeline.reset(new GPURecoWorkflowSpec_PipelineInternals);
+
+  if (mSpecConfig.enableDoublePipeline == 1 && gPolicyOrder) {
+    *gPolicyOrder = &mPolicyOrder;
+  }
 }
 
 GPURecoWorkflowSpec::~GPURecoWorkflowSpec() = default;
@@ -285,9 +289,8 @@ void GPURecoWorkflowSpec::init(InitContext& ic)
     }
   }
 
-  if (mSpecConfig.enableDoublePipeline == 1) {
-    mPipeline->fmqDevice = ic.services().get<RawDeviceService>().device();
-    mPipeline->receiveThread = std::thread([this]() { RunReceiveThread(); });
+  if (mSpecConfig.enableDoublePipeline) {
+    initPipeline(ic);
   }
 
   auto& callbacks = ic.services().get<CallbackService>();
diff --git a/GPU/Workflow/src/gpu-reco-workflow.cxx b/GPU/Workflow/src/gpu-reco-workflow.cxx
@@ -38,6 +38,7 @@ using namespace o2::gpu;
 using CompletionPolicyData = std::vector<InputSpec>;
 static CompletionPolicyData gPolicyData;
 static constexpr unsigned long gTpcSectorMask = 0xFFFFFFFFF;
+static std::function<bool(o2::framework::DataProcessingHeader::StartTime)>* gPolicyOrderCheck;
 static std::shared_ptr<GPURecoWorkflowSpec> gTask;
 
 void customize(std::vector<o2::framework::CallbacksPolicy>& policies)
@@ -71,7 +72,7 @@ void customize(std::vector<DispatchPolicy>& policies)
 
 void customize(std::vector<CompletionPolicy>& policies)
 {
-  policies.push_back(o2::tpc::TPCSectorCompletionPolicy("gpu-reconstruction.*", o2::tpc::TPCSectorCompletionPolicy::Config::RequireAll, &gPolicyData, &gTpcSectorMask)());
+  policies.push_back(o2::tpc::TPCSectorCompletionPolicy("gpu-reconstruction.*", o2::tpc::TPCSectorCompletionPolicy::Config::RequireAll, &gPolicyData, &gTpcSectorMask, &gPolicyOrderCheck)());
 }
 
 void customize(o2::framework::OnWorkflowTerminationHook& hook)

Original file line number	Diff line number	Diff line change
`@@ -107,7 +107,7 @@ using namespace o2::gpu::gpurecoworkflow_internals;`
`107`	`107`	`namespace o2::gpu`
`108`	`108`	`{`
`109`	`109`
`110`		`-GPURecoWorkflowSpec::GPURecoWorkflowSpec(GPURecoWorkflowSpec::CompletionPolicyData* policyData, Config const& specconfig, std::vector<int> const& tpcsectors, unsigned long tpcSectorMask, std::shared_ptr<o2::base::GRPGeomRequest>& ggr) : o2::framework::Task(), mPolicyData(policyData), mTPCSectorMask(tpcSectorMask), mTPCSectors(tpcsectors), mSpecConfig(specconfig), mGGR(ggr)`
	`110`	`+GPURecoWorkflowSpec::GPURecoWorkflowSpec(GPURecoWorkflowSpec::CompletionPolicyData* policyData, Config const& specconfig, std::vector<int> const& tpcsectors, unsigned long tpcSectorMask, std::shared_ptr<o2::base::GRPGeomRequest>& ggr, std::function<bool(o2::framework::DataProcessingHeader::StartTime)>** gPolicyOrder) : o2::framework::Task(), mPolicyData(policyData), mTPCSectorMask(tpcSectorMask), mTPCSectors(tpcsectors), mSpecConfig(specconfig), mGGR(ggr)`
`111`	`111`	`{`
`112`	`112`	`if (mSpecConfig.outputCAClusters && !mSpecConfig.caClusterer && !mSpecConfig.decompressTPC) {`
`113`	`113`	`throw std::runtime_error("inconsistent configuration: cluster output is only possible if CA clusterer is activated");`
`@@ -118,6 +118,10 @@ GPURecoWorkflowSpec::GPURecoWorkflowSpec(GPURecoWorkflowSpec::CompletionPolicyDa`
`118`	`118`	`mTFSettings.reset(new GPUSettingsTF);`
`119`	`119`	`mTimer.reset(new TStopwatch);`
`120`	`120`	`mPipeline.reset(new GPURecoWorkflowSpec_PipelineInternals);`
	`121`	`+`
	`122`	`+ if (mSpecConfig.enableDoublePipeline == 1 && gPolicyOrder) {`
	`123`	`+ *gPolicyOrder = &mPolicyOrder;`
	`124`	`+ }`
`121`	`125`	`}`
`122`	`126`
`123`	`127`	`GPURecoWorkflowSpec::~GPURecoWorkflowSpec() = default;`
`@@ -285,9 +289,8 @@ void GPURecoWorkflowSpec::init(InitContext& ic)`
`285`	`289`	`}`
`286`	`290`	`}`
`287`	`291`
`288`		`- if (mSpecConfig.enableDoublePipeline == 1) {`
`289`		`- mPipeline->fmqDevice = ic.services().get<RawDeviceService>().device();`
`290`		`- mPipeline->receiveThread = std::thread([this]() { RunReceiveThread(); });`
	`292`	`+ if (mSpecConfig.enableDoublePipeline) {`
	`293`	`+ initPipeline(ic);`
`291`	`294`	`}`
`292`	`295`
`293`	`296`	`auto& callbacks = ic.services().get<CallbackService>();`
Original file line number	Diff line number	Diff line change
`@@ -38,6 +38,7 @@ using namespace o2::gpu;`
`38`	`38`	`using CompletionPolicyData = std::vector<InputSpec>;`
`39`	`39`	`static CompletionPolicyData gPolicyData;`
`40`	`40`	`static constexpr unsigned long gTpcSectorMask = 0xFFFFFFFFF;`
	`41`	`+static std::function<bool(o2::framework::DataProcessingHeader::StartTime)>* gPolicyOrderCheck;`
`41`	`42`	`static std::shared_ptr<GPURecoWorkflowSpec> gTask;`
`42`	`43`
`43`	`44`	`void customize(std::vector<o2::framework::CallbacksPolicy>& policies)`
`@@ -71,7 +72,7 @@ void customize(std::vector<DispatchPolicy>& policies)`
`71`	`72`
`72`	`73`	`void customize(std::vector<CompletionPolicy>& policies)`
`73`	`74`	`{`
`74`		`- policies.push_back(o2::tpc::TPCSectorCompletionPolicy("gpu-reconstruction.*", o2::tpc::TPCSectorCompletionPolicy::Config::RequireAll, &gPolicyData, &gTpcSectorMask)());`
	`75`	`+ policies.push_back(o2::tpc::TPCSectorCompletionPolicy("gpu-reconstruction.*", o2::tpc::TPCSectorCompletionPolicy::Config::RequireAll, &gPolicyData, &gTpcSectorMask, &gPolicyOrderCheck)());`
`75`	`76`	`}`
`76`	`77`
`77`	`78`	`void customize(o2::framework::OnWorkflowTerminationHook& hook)`