cultureamp · liamstevens · Jan 30, 2025 · Jan 30, 2025 · Jan 30, 2025 · Jan 31, 2025
diff --git a/plugin.yml b/plugin.yml
@@ -9,3 +9,5 @@ configuration:
       type: string
     script:
       type: string
+    timeout:
+      type: integer
diff --git a/src/aws/ecs.go b/src/aws/ecs.go
@@ -59,11 +59,10 @@ func SubmitTask(ctx context.Context, ecsAPI EcsClientAPI, input *TaskRunnerConfi
 	return *response.Tasks[0].TaskArn, nil
 }
 
-func WaitForCompletion(ctx context.Context, waiter ecsWaiterAPI, taskArn string) (*ecs.DescribeTasksOutput, error) {
+func WaitForCompletion(ctx context.Context, waiter ecsWaiterAPI, taskArn string, timeOut int) (*ecs.DescribeTasksOutput, error) {
 	cluster := ClusterFromTaskArn(taskArn)
 
-	// TODO: This magic number will be resolved in a future piece of work, not going to refactor this right now
-	maxWaitDuration := 15 * time.Minute //nolint:mnd
+	maxWaitDuration := time.Duration(timeOut) * time.Second
 	result, err := waiter.WaitForOutput(ctx, &ecs.DescribeTasksInput{
 		Cluster: aws.String(cluster),
 		Tasks:   []string{taskArn},

diff --git a/src/aws/ecs_test.go b/src/aws/ecs_test.go
@@ -365,7 +365,7 @@ func TestWaitForCompletion(t *testing.T) {
 
 	for _, tc := range tests {
 		t.Run(tc.name, func(t *testing.T) {
-			result, err := WaitForCompletion(context.TODO(), tc.waiter, tc.input)
+			result, err := WaitForCompletion(context.TODO(), tc.waiter, tc.input, 15)
 			t.Logf("result: '%v'", err)
 			t.Logf("expected: detail: %v, reason: %v", *tc.expected.Failures[0].Detail, *tc.expected.Failures[0].Reason)
 

diff --git a/src/plugin/config.go b/src/plugin/config.go
@@ -7,6 +7,7 @@ import (
 type Config struct {
 	ParameterName string `required:"true" split_words:"true"`
 	Script        string `required:"true" split_words:"true"`
+	TimeOut       int    `default:"2700"  split_words:"true"` // max wait for task completion, in seconds. NOTE(review): read from ..._TIME_OUT, but plugin.yml names the key "timeout" — confirm the agent exports a matching variable.
 }
 
 type EnvironmentConfigFetcher struct {

diff --git a/src/plugin/config_test.go b/src/plugin/config_test.go
@@ -25,6 +25,7 @@ func TestFailOnMissingRequiredEnvironment(t *testing.T) {
 			disabledEnvVars: []string{
 				"BUILDKITE_PLUGIN_ECS_TASK_RUNNER_PARAMETER_NAME",
 				"BUILDKITE_PLUGIN_ECS_TASK_RUNNER_SCRIPT",
+				"BUILDKITE_PLUGIN_ECS_TASK_RUNNER_TIMEOUT",
 			},
 			enabledEnvVars: map[string]string{},
 			expectedErr:    "required key BUILDKITE_PLUGIN_ECS_TASK_RUNNER_PARAMETER_NAME missing value",
@@ -72,18 +73,27 @@ func TestFailOnMissingRequiredEnvironment(t *testing.T) {
 func TestFetchConfigFromEnvironment(t *testing.T) {
 	unsetEnv(t, "BUILDKITE_PLUGIN_ECS_TASK_RUNNER_PARAMETER_NAME")
 	unsetEnv(t, "BUILDKITE_PLUGIN_ECS_TASK_RUNNER_SCRIPT")
+	unsetEnv(t, "BUILDKITE_PLUGIN_ECS_TASK_RUNNER_TIME_OUT")
 
 	var config plugin.Config
 	fetcher := plugin.EnvironmentConfigFetcher{}
 
 	t.Setenv("BUILDKITE_PLUGIN_ECS_TASK_RUNNER_PARAMETER_NAME", "test-parameter")
 	t.Setenv("BUILDKITE_PLUGIN_ECS_TASK_RUNNER_SCRIPT", "hello-world")
+	t.Setenv("BUILDKITE_PLUGIN_ECS_TASK_RUNNER_TIME_OUT", "600")
 
 	err := fetcher.Fetch(&config)
 
 	require.NoError(t, err, "fetch should not error")
 	assert.Equal(t, "test-parameter", config.ParameterName, "fetched message should match environment")
 	assert.Equal(t, "hello-world", config.Script, "fetched message should match environment")
+	assert.Equal(t, 600, config.TimeOut, "fetched message should match environment")
+
+	// test default value
+	unsetEnv(t, "BUILDKITE_PLUGIN_ECS_TASK_RUNNER_TIME_OUT")
+	err = fetcher.Fetch(&config)
+	require.NoError(t, err, "fetch should not error")
+	assert.Equal(t, 2700, config.TimeOut, "fetched message should match environment")
 }
 
 func unsetEnv(t *testing.T, key string) {

diff --git a/src/plugin/task-runner.go b/src/plugin/task-runner.go
@@ -27,6 +27,7 @@ func (trp TaskRunnerPlugin) Run(ctx context.Context, fetcher ConfigFetcher) erro
 	if err != nil {
 		return fmt.Errorf("plugin configuration error: %w", err)
 	}
+	buildKiteAgent := buildkite.Agent{}
 
 	buildkite.Log("Executing task-runner plugin\n")
 
@@ -57,8 +58,9 @@ func (trp TaskRunnerPlugin) Run(ctx context.Context, fetcher ConfigFetcher) erro
 		// TODO: This is currently a magic number. If we want this to be configurable, remove the nolint directive and fix it up
 		o.MaxDelay = 10 * time.Second //nolint:mnd
 	})
-	result, err := awsinternal.WaitForCompletion(ctx, waiterClient, taskArn)
+	result, err := awsinternal.WaitForCompletion(ctx, waiterClient, taskArn, config.TimeOut)
 	if err != nil {
+		_ = buildKiteAgent.Annotate(ctx, fmt.Sprintf("Task did not complete successfully within timeout %v", result.Failures[0]), "error", "ecs-task-runner")
 		return fmt.Errorf("failed to wait for task completion: %w\nFailure information: %v", err, result.Failures[0])
 	}
 	// In a successful scenario for task completion, we would have a `tasks` slice with a single element