Add e2e internal package

DrJosh9000 · DrJosh9000 · commit 31d72739a8c7 · 2025-12-01T17:31:34.000+11:00
diff --git a/go.mod b/go.mod
@@ -21,6 +21,7 @@ require (
 	github.com/aws/smithy-go v1.23.2
 	github.com/brunoscheufler/aws-ecs-metadata-go v0.0.0-20220812150832-b6b31c6eeeaf
 	github.com/buildkite/bintest/v3 v3.3.0
+	github.com/buildkite/go-buildkite/v4 v4.11.0
 	github.com/buildkite/go-pipeline v0.16.0
 	github.com/buildkite/interpolate v0.1.5
 	github.com/buildkite/roko v1.4.0
@@ -112,6 +113,7 @@ require (
 	github.com/bitfield/gotestdox v0.2.2 // indirect
 	github.com/bmatcuk/doublestar/v4 v4.6.1 // indirect
 	github.com/buildkite/test-engine-client v1.6.0 // indirect
+	github.com/cenkalti/backoff v1.1.1-0.20171020064038-309aa717adbf // indirect
 	github.com/cenkalti/backoff/v5 v5.0.3 // indirect
 	github.com/cespare/xxhash/v2 v2.3.0 // indirect
 	github.com/cihub/seelog v0.0.0-20170130134532-f561c5e57575 // indirect
diff --git a/go.sum b/go.sum
@@ -132,6 +132,8 @@ github.com/brunoscheufler/aws-ecs-metadata-go v0.0.0-20220812150832-b6b31c6eeeaf
 github.com/brunoscheufler/aws-ecs-metadata-go v0.0.0-20220812150832-b6b31c6eeeaf/go.mod h1:CeKhh8xSs3WZAc50xABMxu+FlfAAd5PNumo7NfOv7EE=
 github.com/buildkite/bintest/v3 v3.3.0 h1:RTWcSaJRlOT6t/K311ejPf+0J3LE/QEODzVG3vlLnWo=
 github.com/buildkite/bintest/v3 v3.3.0/go.mod h1:btqpTsVODiJcb0NMdkkmtMQ6xoFc2W/nY5yy+3I0zcs=
+github.com/buildkite/go-buildkite/v4 v4.11.0 h1:rEvvUwITrqv433W9JWf6mj+NkkcM45s+ObhNs6C17i4=
+github.com/buildkite/go-buildkite/v4 v4.11.0/go.mod h1:DlebrRJqpZttXDjCW+MJ1QyW9AN++ZWt/UbPtKdbSSk=
 github.com/buildkite/go-pipeline v0.16.0 h1:wEgWUMRAgSg1ZnWOoA3AovtYYdTvN0dLY1zwUWmPP+4=
 github.com/buildkite/go-pipeline v0.16.0/go.mod h1:VE37qY3X5pmAKKUMoDZvPsHOQuyakB9cmXj9Qn6QasA=
 github.com/buildkite/interpolate v0.1.5 h1:v2Ji3voik69UZlbfoqzx+qfcsOKLA61nHdU79VV+tPU=
@@ -144,6 +146,8 @@ github.com/buildkite/test-engine-client v1.6.0 h1:yk/gdkFFU8B1+M16mxPNmxJgVoYffI
 github.com/buildkite/test-engine-client v1.6.0/go.mod h1:J6LrqenaJPfVCffiWW1/QxjICFb+OkqCvdCd7qAI0AE=
 github.com/buildkite/zstash v0.5.0 h1:e70mf8U2EjEB1eixXR78s6bsLgfo6bWLisVlRv58wCI=
 github.com/buildkite/zstash v0.5.0/go.mod h1:h70JfAEa2Ys1GDQQ6CNoKIMfMgJ0LZkNmQnzK710PHQ=
+github.com/cenkalti/backoff v1.1.1-0.20171020064038-309aa717adbf h1:yxlp0s+Sge9UsKEK0Bsvjiopb9XRk+vxylmZ9eGBfm8=
+github.com/cenkalti/backoff v1.1.1-0.20171020064038-309aa717adbf/go.mod h1:90ReRw6GdpyfrHakVjL/QHaoyV4aDUVVkXQJJJ3NXXM=
 github.com/cenkalti/backoff/v5 v5.0.3 h1:ZN+IMa753KfX5hd8vVaMixjnqRZ3y8CuJKRKj1xcsSM=
 github.com/cenkalti/backoff/v5 v5.0.3/go.mod h1:rkhZdG3JZukswDf7f0cwqPNk4K0sa+F97BxZthm/crw=
 github.com/cespare/xxhash/v2 v2.1.1/go.mod h1:VGX0DQ3Q6kWi7AoAeZDth3/j3BFtOZR5XLFGgcrjCOs=
diff --git a/internal/e2e/basic_test.go b/internal/e2e/basic_test.go
@@ -0,0 +1,29 @@
+//go:build e2e
+
+package e2e
+
+import (
+	"syscall"
+	"testing"
+)
+
+// TestBasicE2E runs a single-step "echo hello world" pipeline on an agent
+// started by the test and checks that the resulting build passes.
+func TestBasicE2E(t *testing.T) {
+	tc := newTestCase(t, "steps:\n  - command: echo hello world\n")
+
+	agentCmd := tc.startAgent()
+	b := tc.triggerBuild()
+
+	finalState, err := tc.waitForBuild(t.Context(), b)
+	switch {
+	case err != nil:
+		t.Fatalf("tc.waitForBuild(build %s) error = %v", b.ID, err)
+	case finalState != "passed":
+		t.Errorf("Build state = %q, want %q", finalState, "passed")
+	}
+
+	// TODO: add ability to inspect job logs
+
+	// Ask the agent to shut down now that the build has been waited for.
+	sigErr := agentCmd.Process.Signal(syscall.SIGTERM)
+	if sigErr != nil {
+		t.Errorf("agent.Process.Signal(%d) = %v", syscall.SIGTERM, sigErr)
+	}
+}
diff --git a/internal/e2e/doc.go b/internal/e2e/doc.go
@@ -0,0 +1,4 @@
+// Package e2e holds the end-to-end tests and test framework.
+// Both the test files and the framework files are tagged go:build e2e, so
+// they are not compiled or run by default (e.g. with plain `go test ./...`).
+// Pass `-tags e2e` to include them.
+package e2e
diff --git a/internal/e2e/testcase.go b/internal/e2e/testcase.go
@@ -0,0 +1,286 @@
+//go:build e2e
+
+package e2e
+
+import (
+	"cmp"
+	"context"
+	"fmt"
+	"os"
+	"os/exec"
+	"path/filepath"
+	"slices"
+	"strconv"
+	"strings"
+	"testing"
+	"text/template"
+	"time"
+
+	"github.com/buildkite/agent/v3/version"
+
+	"github.com/buildkite/go-buildkite/v4"
+)
+
+// Configuration for the end-to-end tests, read once from the environment
+// when the package is initialised.
+var (
+	// Filled in from secrets
+	// apiToken authenticates the Buildkite API client; agentToken is passed
+	// to the agent under test via --token.
+	apiToken   = os.Getenv("CI_E2E_TESTS_API_TOKEN")
+	agentToken = os.Getenv("CI_E2E_TESTS_AGENT_TOKEN")
+
+	// E2E testing config
+	// agentPath is the agent executable that startAgent runs. targetOrg and
+	// targetCluster identify the organization and cluster in which the
+	// temporary queues and pipelines are created.
+	agentPath     = os.Getenv("CI_E2E_TESTS_AGENT_PATH")
+	targetOrg     = os.Getenv("CI_E2E_TESTS_TARGET_ORG")
+	targetCluster = os.Getenv("CI_E2E_TESTS_TARGET_CLUSTER")
+
+	// Values from the Buildkite job running the tests
+	// jobID is appended to the test name to form the name of the temporary
+	// resources. When BUILDKITE_JOB_ID is unset (e.g. outside of a Buildkite
+	// job) it falls back to the current time in nanoseconds.
+	jobID = cmp.Or(
+		os.Getenv("BUILDKITE_JOB_ID"),
+		strconv.FormatInt(time.Now().UnixNano(), 10),
+	)
+	// authorEmail and authorName are used as the author of triggered builds.
+	authorEmail = os.Getenv("BUILDKITE_BUILD_CREATOR_EMAIL")
+	authorName  = os.Getenv("BUILDKITE_BUILD_CREATOR")
+)
+
+// pipelineRepo is the repository URL given to every pipeline created by
+// createPipeline.
+const pipelineRepo = "https://github.com/buildkite/agent.git"
+
+// cleanupFn is the signature of the teardown functions returned by
+// createQueue and createPipeline.
+type cleanupFn = func(context.Context) error
+
+// nopCleanup is a cleanupFn that does nothing and reports no error. It is
+// returned in place of a real cleanup when creating the resource failed.
+var nopCleanup = func(context.Context) error { return nil }
+
+// testCase bundles the information needed to run an end-to-end test.
+// Note that it embeds testing.TB - each test should create its own testCase.
+type testCase struct {
+	// TB is the test (or benchmark) that owns this test case; its methods
+	// (Fatalf, Logf, Cleanup, ...) are available directly on testCase.
+	testing.TB
+
+	// fullName is the lowercased test name joined with jobID. It is used as
+	// the queue key, pipeline name, agent name, and build message.
+	fullName string
+	// bkClient is the Buildkite API client used for all API calls.
+	bkClient *buildkite.Client
+	// pipelineConfig is the parsed pipeline config template.
+	pipelineConfig *template.Template
+	// queue is the temporary cluster queue created for this test case.
+	queue *buildkite.ClusterQueue
+	// pipeline is the temporary pipeline created for this test case.
+	pipeline *buildkite.Pipeline
+}
+
+// newTestCase creates a new test case with a given pipeline config template,
+// and sets up the temporary queue and pipeline to run it.
+//
+// The template is executed with a map containing the key "queue", whose value
+// is the key of the temporary queue, and the result is used as the pipeline
+// configuration.
+//
+// It also registers cleanups with t.Cleanup so that the queue and pipeline
+// are (usually) automatically deleted. Cleanups run in reverse order of
+// registration, so the pipeline is deleted before the queue.
+// It calls t.Fatal to end the test early if there was a failure setting up.
+func newTestCase(t testing.TB, pipelineConfigTemplate string) *testCase {
+	t.Helper()
+	ctx := t.Context()
+
+	// t.Context() is canceled just before Cleanup-registered functions are
+	// called, so the cleanups below must not use ctx directly or every delete
+	// request would fail immediately. Detach from the cancellation but bound
+	// the time spent cleaning up.
+	cleanupCtx := func() (context.Context, context.CancelFunc) {
+		return context.WithTimeout(context.WithoutCancel(ctx), 30*time.Second)
+	}
+
+	name := strings.ToLower(t.Name() + "-" + jobID)
+
+	tmpl, err := template.New("pipeline").Parse(pipelineConfigTemplate)
+	if err != nil {
+		t.Fatalf("template.New(pipeline).Parse(%q) error = %v", pipelineConfigTemplate, err)
+	}
+
+	client, err := buildkite.NewClient(
+		buildkite.WithTokenAuth(apiToken),
+		buildkite.WithUserAgent("buildkite-agent-e2e-tests/0 "+version.UserAgent()),
+	)
+	if err != nil {
+		t.Fatalf("buildkite.NewClient(...) error = %v", err)
+	}
+
+	// The queue and pipeline cleanups are kept in separate variables. Reusing
+	// one variable would make the earlier closure observe the later
+	// assignment, and the queue would never be deleted.
+	queue, deleteQueue, err := createQueue(ctx, client, name)
+	if err != nil {
+		t.Fatalf("Could not create cluster queue in org %q cluster %q: testHelper.createQueue(ctx, %q) error = %v", targetOrg, targetCluster, name, err)
+	}
+	t.Cleanup(func() {
+		cctx, cancel := cleanupCtx()
+		defer cancel()
+		if err := deleteQueue(cctx); err != nil {
+			t.Logf("Could not clean up cluster queue %q with id %s in org %q cluster %q: cleanup(ctx) error = %v", name, queue.ID, targetOrg, targetCluster, err)
+		}
+	})
+
+	var pipelineCfg strings.Builder
+	tmplInput := map[string]string{"queue": name}
+	if err := tmpl.Execute(&pipelineCfg, tmplInput); err != nil {
+		t.Fatalf("Could not execute pipeline config template: tmpl.Execute(%q) error = %v", tmplInput, err)
+	}
+
+	pipeline, deletePipeline, err := createPipeline(ctx, client, name, pipelineCfg.String())
+	if err != nil {
+		t.Fatalf("Could not create pipeline with the following config in org %q: testHelper.createPipeline(%q, pipelineCfg) error = %v\n%s", targetOrg, name, err, pipelineCfg.String())
+	}
+	t.Cleanup(func() {
+		cctx, cancel := cleanupCtx()
+		defer cancel()
+		if err := deletePipeline(cctx); err != nil {
+			t.Logf("Could not clean up pipeline %q (id = %s) in org %q: %v", name, pipeline.ID, targetOrg, err)
+		}
+	})
+
+	return &testCase{
+		TB:             t,
+		fullName:       name,
+		bkClient:       client,
+		pipelineConfig: tmpl,
+		queue:          queue,
+		pipeline:       pipeline,
+	}
+}
+
+// triggerBuild creates a new build in the target pipeline. It returns the
+// build object. It also registers cleanups with t.Cleanup so that the build is
+// (usually) automatically cancelled if it is still running.
+// It calls t.Fatal if there was an error creating the build.
+func (tc *testCase) triggerBuild() *buildkite.Build {
+	tc.Helper()
+	ctx := tc.Context()
+
+	createBuild := buildkite.CreateBuild{
+		Author: buildkite.Author{
+			Email: authorEmail,
+			Name:  cmp.Or(authorName, "Agent E2E Tests"),
+		},
+		Commit:  "HEAD",
+		Branch:  "main",
+		Message: tc.fullName,
+	}
+
+	build, _, err := tc.bkClient.Builds.Create(ctx, targetOrg, tc.pipeline.Slug, createBuild)
+	if err != nil {
+		tc.Fatalf("tc.bkClient.Builds.Create(ctx, %q, %q, %v) error = %v", targetOrg, tc.pipeline.Slug, createBuild, err)
+	}
+
+	tc.Cleanup(func() {
+		// The test context is canceled just before Cleanup-registered
+		// functions are called, so using ctx here would make the cancel
+		// request fail immediately. Detach from the cancellation but bound
+		// the time spent cleaning up.
+		cctx, cancel := context.WithTimeout(context.WithoutCancel(ctx), 30*time.Second)
+		defer cancel()
+
+		_, err := tc.bkClient.Builds.Cancel(cctx, targetOrg, tc.pipeline.Slug, build.ID)
+		if err == nil {
+			return
+		}
+		// These errors mean there is nothing left to cancel, so they are not
+		// worth logging.
+		reasons := []string{
+			"already finished",
+			"already being canceled",
+			"already been canceled",
+			"No build found",
+		}
+		ignorable := slices.ContainsFunc(reasons, func(r string) bool {
+			return strings.Contains(err.Error(), r)
+		})
+		if ignorable {
+			return
+		}
+		tc.Logf("Couldn't cancel build %s: %v", build.ID, err)
+	})
+	return &build
+}
+
+// waitForBuild polls the build once per second until it is no longer in
+// progress, and returns its state. The states passed, failed, canceled and
+// canceling end the wait successfully. The states creating, scheduled,
+// running and failing are treated as still in progress. Any other state is
+// returned along with an error.
+// It returns early with an error if the build cannot be fetched or ctx ends.
+func (tc *testCase) waitForBuild(ctx context.Context, build *buildkite.Build) (string, error) {
+	for {
+		current, _, err := tc.bkClient.Builds.Get(ctx, targetOrg, tc.pipeline.Slug, build.ID, nil)
+		if err != nil {
+			return "", err
+		}
+		switch current.State {
+		case "passed", "failed", "canceled", "canceling":
+			return current.State, nil
+
+		case "creating", "scheduled", "running", "failing":
+			// Still in progress: "creating" precedes "scheduled", and
+			// "failing" means a job has failed while others are yet to
+			// finish. Wait a second before polling again, unless ctx ends.
+			select {
+			case <-time.After(time.Second):
+			case <-ctx.Done():
+				return "", ctx.Err()
+			}
+
+		default:
+			return current.State, fmt.Errorf("unknown build state %q", current.State)
+		}
+	}
+}
+
+// createQueue makes a cluster queue keyed by name in targetCluster, for an
+// end-to-end test to run in.
+// On success it returns the queue together with a function that deletes it;
+// call that function once the test is over. On failure it returns a nil
+// queue, a no-op cleanup, and the error.
+func createQueue(ctx context.Context, client *buildkite.Client, name string) (*buildkite.ClusterQueue, cleanupFn, error) {
+	spec := buildkite.ClusterQueueCreate{
+		Key:         name,
+		Description: "Buildkite Agent E2E Test",
+	}
+	created, _, err := client.ClusterQueues.Create(ctx, targetOrg, targetCluster, spec)
+	if err != nil {
+		return nil, nopCleanup, err
+	}
+
+	remove := func(ctx context.Context) error {
+		_, delErr := client.ClusterQueues.Delete(ctx, targetOrg, targetCluster, created.ID)
+		return delErr
+	}
+	return &created, remove, nil
+}
+
+// createPipeline makes a pipeline called name in targetOrg, with the given
+// configuration, for an end-to-end test to run in. The pipeline is created
+// with GitHub trigger mode "none".
+// On success it returns the pipeline together with a function that deletes
+// it; call that function once the test is over. On failure it returns a nil
+// pipeline, a no-op cleanup, and the error.
+func createPipeline(ctx context.Context, client *buildkite.Client, name, config string) (*buildkite.Pipeline, cleanupFn, error) {
+	spec := buildkite.CreatePipeline{
+		Name:        name,
+		Repository:  pipelineRepo,
+		Description: "Buildkite Agent E2E Test",
+		ProviderSettings: &buildkite.GitHubSettings{
+			TriggerMode: "none",
+		},
+		Configuration: config,
+		ClusterID:     targetCluster,
+	}
+	created, _, err := client.Pipelines.Create(ctx, targetOrg, spec)
+	if err != nil {
+		return nil, nopCleanup, err
+	}
+
+	remove := func(ctx context.Context) error {
+		_, delErr := client.Pipelines.Delete(ctx, targetOrg, created.Slug)
+		return delErr
+	}
+	return &created, remove, nil
+}
+
+// startAgent starts a copy of the agent (at agentPath, using agentToken),
+// pointed at the test case's queue, with any extraArgs appended to the
+// command line. The agent's stdout and stderr are both sent to os.Stderr, and
+// its environment contains only HOME and PATH.
+//
+// It registers cleanup functions that kill the agent, wait for it to exit,
+// and remove the various directories (build path, hooks path, etc).
+// It calls tc.Fatalf if the directories cannot be created or the agent cannot
+// be started.
+func (tc *testCase) startAgent(extraArgs ...string) *exec.Cmd {
+	tc.Helper()
+	// Each call to TempDir returns a new directory, so call it exactly once
+	// and reuse the result in the error message.
+	parent := tc.TempDir()
+	dir, err := os.MkdirTemp(parent, tc.fullName)
+	if err != nil {
+		tc.Fatalf("Couldn't create temporary agent dir: os.MkdirTemp(%q, %q) = %v", parent, tc.fullName, err)
+	}
+	tc.Cleanup(func() {
+		if err := os.RemoveAll(dir); err != nil {
+			tc.Logf("Couldn't clean up temporary agent dir: os.RemoveAll(%q) = %v", dir, err)
+		}
+	})
+	buildPath := filepath.Join(dir, "builds")
+	hooksPath := filepath.Join(dir, "hooks")
+	socketsPath := filepath.Join(dir, "sockets")
+	pluginsPath := filepath.Join(dir, "plugins")
+	for _, path := range []string{buildPath, hooksPath, socketsPath, pluginsPath} {
+		if err := os.Mkdir(path, 0o700); err != nil {
+			tc.Fatalf("Couldn't create dir inside temporary agent dir: os.Mkdir(%q, %o) = %v", path, 0o700, err)
+		}
+	}
+
+	args := append([]string{
+		"start",
+		"--debug", "true",
+		"--token", agentToken,
+		"--name", tc.fullName,
+		"--queue", tc.queue.Key,
+		"--build-path", buildPath,
+		"--hooks-path", hooksPath,
+		"--sockets-path", socketsPath,
+		"--plugins-path", pluginsPath,
+	}, extraArgs...)
+
+	cmd := exec.CommandContext(tc.Context(), agentPath, args...)
+	// Ensure minimal environment variable shenanigans by setting only these:
+	cmd.Env = []string{
+		"HOME=" + os.Getenv("HOME"),
+		"PATH=" + os.Getenv("PATH"),
+	}
+	cmd.Stdout = os.Stderr
+	cmd.Stderr = os.Stderr
+	if err := cmd.Start(); err != nil {
+		tc.Fatalf("Couldn't start agent command %v: %v", cmd, err)
+	}
+	// Cleanups run in reverse order of registration, so this one runs before
+	// the temporary directory registered above is removed.
+	tc.Cleanup(func() {
+		if err := cmd.Cancel(); err != nil {
+			tc.Logf("agent.Cancel() error = %v", err)
+		}
+		// Wait so that the process is reaped and has exited before its
+		// directories are removed. The error is deliberately ignored: a
+		// killed agent reports a non-zero exit, and Wait reports an error if
+		// the caller has already waited on the command.
+		_ = cmd.Wait()
+	})
+	return cmd
+}

-Original file line number
+Diff line change
 	github.com/aws/smithy-go v1.23.2
 	github.com/brunoscheufler/aws-ecs-metadata-go v0.0.0-20220812150832-b6b31c6eeeaf
 	github.com/buildkite/bintest/v3 v3.3.0
 +	github.com/buildkite/go-buildkite/v4 v4.11.0
 	github.com/buildkite/go-pipeline v0.16.0
 	github.com/buildkite/interpolate v0.1.5
 	github.com/buildkite/roko v1.4.0
 	github.com/bitfield/gotestdox v0.2.2 // indirect
 	github.com/bmatcuk/doublestar/v4 v4.6.1 // indirect
 	github.com/buildkite/test-engine-client v1.6.0 // indirect
 +	github.com/cenkalti/backoff v1.1.1-0.20171020064038-309aa717adbf // indirect
 	github.com/cenkalti/backoff/v5 v5.0.3 // indirect
 	github.com/cespare/xxhash/v2 v2.3.0 // indirect
 	github.com/cihub/seelog v0.0.0-20170130134532-f561c5e57575 // indirect