linuxboot
diff --git a/‎pkg/cerrors/cerrors.go‎
Lines changed: 0 additions & 55 deletions b/‎pkg/cerrors/cerrors.go‎
Lines changed: 0 additions & 55 deletions
diff --git a/‎pkg/config/timeouts.go‎
Lines changed: 25 additions & 4 deletions b/‎pkg/config/timeouts.go‎
Lines changed: 25 additions & 4 deletions
diff --git a/‎pkg/event/testevent/test.go‎
Lines changed: 2 additions & 14 deletions b/‎pkg/event/testevent/test.go‎
Lines changed: 2 additions & 14 deletions
diff --git a/‎pkg/jobmanager/jobmanager.go‎
Lines changed: 1 addition & 1 deletion b/‎pkg/jobmanager/jobmanager.go‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎pkg/pluginregistry/bundles.go‎
Lines changed: 1 addition & 1 deletion b/‎pkg/pluginregistry/bundles.go‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎pkg/runner/job_runner.go‎
Lines changed: 3 additions & 10 deletions b/‎pkg/runner/job_runner.go‎
Lines changed: 3 additions & 10 deletions
@@ -43,17 +43,6 @@ func (e *ErrTestStepsNeverReturned) Error() string {
 	return fmt.Sprintf("test step [%s] did not return", strings.Join(e.StepNames, ", "))
 }
 
-// ErrTestTargetInjectionTimedOut indicates that test step did not ingest a target
-// within allotted time.
-type ErrTestTargetInjectionTimedOut struct {
-	StepName string
-}
-
-// Error returns the error string associated with the error
-func (e *ErrTestTargetInjectionTimedOut) Error() string {
-	return fmt.Sprintf("test step %v failed to ingest a target", e.StepName)
-}
-
 // ErrTestStepClosedChannels indicates that the test step returned after
 // closing its output channels, which constitutes an API violation
 type ErrTestStepClosedChannels struct {
@@ -64,47 +53,3 @@ type ErrTestStepClosedChannels struct {
 func (e *ErrTestStepClosedChannels) Error() string {
 	return fmt.Sprintf("test step %v closed output channels (api violation)", e.StepName)
 }
-
-// ErrTestStepPaniced indicates that a test step's method panicked.
-type ErrTestStepPaniced struct {
-	StepName   string
-	StackTrace string
-}
-
-// Error returns the error string associated with the error
-func (e *ErrTestStepPaniced) Error() string {
-	return fmt.Sprintf("test step %s paniced, trace: %q", e.StepName, e.StackTrace)
-}
-
-// ErrTestStepReturnedDuplicateResult indicates that a test step returned a duplicate result for a target.
-type ErrTestStepReturnedDuplicateResult struct {
-	StepName string
-	Target   string
-}
-
-// Error returns the error string associated with the error
-func (e *ErrTestStepReturnedDuplicateResult) Error() string {
-	return fmt.Sprintf("test step %s returned duplicate result for %s", e.StepName, e.Target)
-}
-
-// ErrTestStepReturnedUnexpectedResult indicates that a test step returned an unexpected result for a target.
-type ErrTestStepReturnedUnexpectedResult struct {
-	StepName string
-	Target   string
-}
-
-// Error returns the error string associated with the error
-func (e *ErrTestStepReturnedUnexpectedResult) Error() string {
-	return fmt.Sprintf("test step %s returned unexpected result for %s", e.StepName, e.Target)
-}
-
-// ErrTestStepLostTargets indicates that targets have been lost during test run.
-type ErrTestStepLostTargets struct {
-	StepName string
-	Target   string
-}
-
-// Error returns the error string associated with the error
-func (e *ErrTestStepLostTargets) Error() string {
-	return fmt.Sprintf("test step %s lost target %s", e.StepName, e.Target)
-}
@@ -16,14 +16,35 @@ var TargetManagerAcquireTimeout = 5 * time.Minute
 var TargetManagerReleaseTimeout = 5 * time.Minute
 
 // StepInjectTimeout represents the maximum time that TestRunner will wait for
-// a TestStep to accept a Target
+// the first TestStep of the pipeline to accept a Target
 var StepInjectTimeout = 30 * time.Second
 
-// TestRunnerShutdownTimeout represents the maximum time that the TestRunner
-// will wait for all TestSteps to complete after all Targets have reached the end
-// of the pipeline.
+// TestRunnerMsgTimeout represents the maximum time that any component of the
+// TestRunner will wait for the delivery of a message to any other subsystem
+// of the TestRunner
+var TestRunnerMsgTimeout = 5 * time.Second
+
+// TestRunnerShutdownTimeout represents the maximum time that the TestRunner will
+// wait for all the TestStep to complete after a cancellation signal has been
+// delivered
+//
+// TestRunnerShutdownTimeout controls a block of the TestRunner which works as a
+// watchdog, i.e. if there are multiple steps that need to return, the timeout is
+// reset every time a step returns. The timeout should be handled so that it
+// doesn't reset when a TestStep returns.
 var TestRunnerShutdownTimeout = 30 * time.Second
 
+// TestRunnerStepShutdownTimeout represents the maximum time that the TestRunner
+// will wait for all TestSteps to complete after all Targets have reached the end
+// of the pipeline. This timeout is only relevant if a cancellation signal is *not*
+// delivered.
+//
+// TestRunnerStepShutdownTimeout controls a block of the TestRunner which works as
+// a watchdog, i.e. if there are multiple steps that need to return, the timeout
+// is reset every time a step returns. The timeout should be handled so that it
+// doesn't reset when a TestStep returns.
+var TestRunnerStepShutdownTimeout = 5 * time.Second
+
 // LockRefreshTimeout is the amount of time by which a target lock is extended
 // periodically while a job is running.
 var LockRefreshTimeout = 1 * time.Minute
@@ -16,7 +16,7 @@ import (
 	"github.com/facebookincubator/contest/pkg/types"
 )
 
-// Header models the header of a test event, which consists in metadata that defines the
+// Header models the header of a test event, which consists in metadata that defines the
 // emitter of the events. The Header is under ConTest control and cannot be manipulated
 // by the TestStep
 type Header struct {
@@ -28,8 +28,8 @@ type Header struct {
 
 // Data models the data of a test event. It is populated by the TestStep
 type Data struct {
-	Target    *target.Target
 	EventName event.Name
+	Target    *target.Target
 	Payload   *json.RawMessage
 }
 
@@ -152,15 +152,3 @@ type EmitterFetcher interface {
 	Emitter
 	Fetcher
 }
-
-func (h *Header) String() string {
-	return fmt.Sprintf("[%d %d %s %s]", h.JobID, h.RunID, h.TestName, h.TestStepLabel)
-}
-
-func (d *Data) String() string {
-	ps := ""
-	if d.Payload != nil {
-		ps = fmt.Sprintf(" %q", d.Payload) //nolint SA5009 - works fine
-	}
-	return fmt.Sprintf("[%s %s%s]", d.Target, d.EventName, ps)
-}
@@ -161,7 +161,7 @@ func newPartialJobFromDescriptor(pr *pluginregistry.PluginRegistry, jd *job.JobD
 			}
 			// test step index is incremented by 1 so we can use 0 to signal an
 			// anomaly.
-			tsb, err := pr.NewTestStepBundle(*testStepDesc, tse)
+			tsb, err := pr.NewTestStepBundle(*testStepDesc, uint(idx)+1, tse)
 			if err != nil {
 				return nil, fmt.Errorf("NewTestStepBundle for test step '%s' with index %d failed: %w", testStepDesc.Name, idx, err)
 			}
 
@@ -15,7 +15,7 @@ import (
 )
 
 // NewTestStepBundle creates a TestStepBundle from a TestStepDescriptor
-func (r *PluginRegistry) NewTestStepBundle(testStepDescriptor test.TestStepDescriptor, allowedEvents map[event.Name]bool) (*test.TestStepBundle, error) {
+func (r *PluginRegistry) NewTestStepBundle(testStepDescriptor test.TestStepDescriptor, stepIndex uint, allowedEvents map[event.Name]bool) (*test.TestStepBundle, error) {
 	testStep, err := r.NewTestStep(testStepDescriptor.Name)
 	if err != nil {
 		return nil, fmt.Errorf("could not get the desired TestStep (%s): %v", testStepDescriptor.Name, err)
 
@@ -17,7 +17,6 @@ import (
 	"github.com/facebookincubator/contest/pkg/event/testevent"
 	"github.com/facebookincubator/contest/pkg/job"
 	"github.com/facebookincubator/contest/pkg/logging"
-	"github.com/facebookincubator/contest/pkg/statectx"
 	"github.com/facebookincubator/contest/pkg/storage"
 	"github.com/facebookincubator/contest/pkg/target"
 	"github.com/facebookincubator/contest/pkg/types"
@@ -158,8 +157,9 @@ func (jr *JobRunner) Run(j *job.Job) ([][]*job.Report, []*job.Report, error) {
 						if err := tl.Unlock(j.ID, targets); err != nil {
 							jobLog.Warningf("Failed to unlock targets (%v) for job ID %d: %v", targets, j.ID, err)
 						}
+					case <-j.StateCtx.Paused():
+						jobLog.Debugf("Received pause request, NOT releasing targets so the job can be resumed")
 						return
-					// Ignore the pause signal, continue to refresh targets.
 					case <-done:
 						if err := tl.Unlock(j.ID, targets); err != nil {
 							jobLog.Warningf("Failed to unlock %d target(s) (%v): %v", len(targets), targets, err)
@@ -183,14 +183,7 @@ func (jr *JobRunner) Run(j *job.Job) ([][]*job.Report, []*job.Report, error) {
 			if runErr = jr.emitAcquiredTargets(testEventEmitter, targets); runErr == nil {
 				jobLog.Infof("Run #%d: running test #%d for job '%s' (job ID: %d) on %d targets", run+1, idx, j.Name, j.ID, len(targets))
 				testRunner := NewTestRunner()
-				var resumeState []byte
-				resumeState, err := testRunner.Run(j.StateCtx, t, targets, j.ID, types.RunID(run+1), resumeState)
-				if err == statectx.ErrPaused {
-					jobLog.Debugf("Runner paused, state: %s", string(resumeState))
-					// TODO(rojer): Persist the state.
-				} else {
-					runErr = err
-				}
+				runErr = testRunner.Run(j.StateCtx, t, targets, j.ID, types.RunID(run+1))
 			}
 
 			// Job is done, release all the targets
Original file line number	Diff line number	Diff line change
`@@ -161,7 +161,7 @@ func newPartialJobFromDescriptor(pr *pluginregistry.PluginRegistry, jd *job.JobD`
`161`	`161`	`}`
`162`	`162`	`// test step index is incremented by 1 so we can use 0 to signal an`
`163`	`163`	`// anomaly.`
`164`		`- tsb, err := pr.NewTestStepBundle(*testStepDesc, tse)`
	`164`	`+ tsb, err := pr.NewTestStepBundle(*testStepDesc, uint(idx)+1, tse)`
`165`	`165`	`if err != nil {`
`166`	`166`	`return nil, fmt.Errorf("NewTestStepBundle for test step '%s' with index %d failed: %w", testStepDesc.Name, idx, err)`
`167`	`167`	`}`
Original file line number	Diff line number	Diff line change
`@@ -15,7 +15,7 @@ import (`
`15`	`15`	`)`
`16`	`16`
`17`	`17`	`// NewTestStepBundle creates a TestStepBundle from a TestStepDescriptor`
`18`		`-func (r *PluginRegistry) NewTestStepBundle(testStepDescriptor test.TestStepDescriptor, allowedEvents map[event.Name]bool) (*test.TestStepBundle, error) {`
	`18`	`+func (r *PluginRegistry) NewTestStepBundle(testStepDescriptor test.TestStepDescriptor, stepIndex uint, allowedEvents map[event.Name]bool) (*test.TestStepBundle, error) {`
`19`	`19`	`testStep, err := r.NewTestStep(testStepDescriptor.Name)`
`20`	`20`	`if err != nil {`
`21`	`21`	`return nil, fmt.Errorf("could not get the desired TestStep (%s): %v", testStepDescriptor.Name, err)`