From c39f6fe5f56602ca7c991ad11a99f3ae72b1938c Mon Sep 17 00:00:00 2001
From: Tyler Yahn
Date: Fri, 20 Dec 2024 14:30:06 -0800
Subject: [PATCH] Unify shutting down into an executioner utility

---
 internal/test/e2e/autosdk/compose.yaml |  33 +---
 internal/tools/executioner/Dockerfile  |   8 +
 internal/tools/executioner/main.go     | 193 +++++++++++++++++++++++++
 3 files changed, 209 insertions(+), 25 deletions(-)
 create mode 100644 internal/tools/executioner/Dockerfile
 create mode 100644 internal/tools/executioner/main.go

diff --git a/internal/test/e2e/autosdk/compose.yaml b/internal/test/e2e/autosdk/compose.yaml
index 765a642f0..a5e994f44 100644
--- a/internal/test/e2e/autosdk/compose.yaml
+++ b/internal/test/e2e/autosdk/compose.yaml
@@ -51,32 +51,15 @@ services:
         condition: service_healthy
     entrypoint: ["/usr/local/bin/runner"]
     command: -bin=/usr/local/bin/app
-  check:
-    image: busybox:latest
+  executioner:
+    build:
+      context: ../../../../
+      dockerfile: internal/tools/executioner/Dockerfile
+    image: test-executioner:latest
+    pull_policy: build
     depends_on:
       e2e:
         condition: service_completed_successfully
-    entrypoint: /bin/sh
     command:
-      - -c
-      - |
-        data() {
-          wget -O - http://collector:8888/metrics \
-            | grep otelcol_exporter_sent_spans \
-            | grep 'exporter="file/trace"' \
-            | grep -o '[^ ]*$'
-        }
-
-        while [ "$(data)" -ne 3 ]
-        do
-          echo "Waiting on spans..."
-          sleep 2
-        done
-        echo "Received 3 spans, stopping."
-        exit 0
-  shutdown-sidecar:
-    image: busybox:latest
-    depends_on:
-      check:
-        condition: service_completed_successfully
-    entrypoint: /bin/sh -c "while ! wget -q -O - http://collector:8080/shutdown; do sleep 2; done; exit 0"
+      - -collector-address=http://collector
+      - -span-count=3
diff --git a/internal/tools/executioner/Dockerfile b/internal/tools/executioner/Dockerfile
new file mode 100644
index 000000000..2c4973a33
--- /dev/null
+++ b/internal/tools/executioner/Dockerfile
@@ -0,0 +1,8 @@
+FROM golang:1.23
+
+WORKDIR /usr/src/go.opentelemetry.io/auto/internal/tools/executioner
+
+COPY . /usr/src/go.opentelemetry.io/auto/
+RUN CGO_ENABLED=0 go build -a -installsuffix cgo -o /usr/local/bin/executioner ./...
+
+ENTRYPOINT ["/usr/local/bin/executioner"]
diff --git a/internal/tools/executioner/main.go b/internal/tools/executioner/main.go
new file mode 100644
index 000000000..7be6bdac4
--- /dev/null
+++ b/internal/tools/executioner/main.go
@@ -0,0 +1,193 @@
+// Copyright The OpenTelemetry Authors
+// SPDX-License-Identifier: Apache-2.0
+
+// Command executioner waits until an OpenTelemetry Collector reports that it
+// has exported an expected number of spans and then asks it to shut down.
+package main
+
+import (
+	"bufio"
+	"context"
+	"errors"
+	"flag"
+	"fmt"
+	"io"
+	"net/http"
+	"os"
+	"os/signal"
+	"strconv"
+	"strings"
+	"syscall"
+	"time"
+)
+
+const (
+	telemetryPath = "/metrics"
+	shutdownPath  = "/shutdown"
+	metricName    = "otelcol_exporter_sent_spans"
+	exporterAttr  = `exporter="file/trace"`
+
+	// requestTimeout bounds every HTTP request so that an unresponsive
+	// collector cannot hang the executioner.
+	requestTimeout = 10 * time.Second
+)
+
+// client is used for all requests. Unlike http.DefaultClient it has a timeout.
+var client = &http.Client{Timeout: requestTimeout}
+
+func main() {
+	if err := run(); err != nil {
+		fmt.Fprintln(os.Stderr, "Error:", err)
+		os.Exit(1)
+	}
+}
+
+// run parses the command-line flags, waits for the collector to report the
+// requested span count, and then asks the collector to shut down. It returns
+// an error if the flags are invalid or the shutdown request fails.
+func run() error {
+	collectorAddress := flag.String("collector-address", "http://collector", "Address of the collector")
+	spanCount := flag.Int("span-count", 0, "Number of spans to check before shutting down the collector")
+	checkLimit := flag.Int("limit", 5, "Maximum number of times to check the span count")
+	interval := flag.Duration("interval", 2*time.Second, "Duration between span count checks")
+	flag.Parse()
+
+	if *spanCount < 0 {
+		return errors.New("span-count must not be negative")
+	}
+
+	// TODO: have these ports be configurable.
+	telemetryURL := fmt.Sprintf("%s:8888%s", *collectorAddress, telemetryPath)
+	shutdownURL := fmt.Sprintf("%s:8080%s", *collectorAddress, shutdownPath)
+
+	// Stop waiting for spans when interrupted or terminated.
+	ctx, stop := signal.NotifyContext(context.Background(), os.Interrupt, syscall.SIGTERM)
+	defer stop()
+
+	if *spanCount == 0 {
+		fmt.Println("Span count is 0. Skipping span count check.")
+	} else {
+		fmt.Printf("Checking collector at %s for %d spans\n", telemetryURL, *spanCount)
+		waitForSpans(ctx, telemetryURL, *spanCount, *checkLimit, *interval)
+	}
+
+	// ctx is already canceled if a signal ended the wait, and a request made
+	// with a canceled context fails immediately. Use a fresh context so the
+	// collector is still told to shut down.
+	shutdownCtx, cancel := context.WithTimeout(context.Background(), requestTimeout)
+	defer cancel()
+	return sendShutdownSignal(shutdownCtx, shutdownURL)
+}
+
+// waitForSpans polls url until the collector reports at least target spans,
+// limit checks have been made, or ctx is canceled. It pauses for interval
+// between checks. The outcome is only logged because the caller shuts the
+// collector down in every case.
+func waitForSpans(ctx context.Context, url string, target, limit int, interval time.Duration) {
+	for i := 0; i < limit; i++ {
+		if ctx.Err() != nil {
+			fmt.Println("Received termination signal. Exiting.")
+			return
+		}
+
+		reached, err := checkSpanCount(ctx, url, target)
+		switch {
+		case err != nil:
+			fmt.Printf("Error checking span count: %v\n", err)
+		case reached:
+			fmt.Printf("Span count of %d reached.\n", target)
+			return
+		}
+
+		// Wait before checking again, but wake up early on a signal.
+		select {
+		case <-ctx.Done():
+			fmt.Println("Received termination signal. Exiting.")
+			return
+		case <-time.After(interval):
+		}
+	}
+
+	fmt.Println("Reached check limit without meeting span count requirement.")
+}
+
+// checkSpanCount fetches the collector's metrics from url and reports whether
+// the sent-spans metric of the file/trace exporter has reached targetCount.
+// It returns false and a nil error if the metric is not reported yet.
+func checkSpanCount(ctx context.Context, url string, targetCount int) (bool, error) {
+	req, err := http.NewRequestWithContext(ctx, http.MethodGet, url, nil)
+	if err != nil {
+		return false, fmt.Errorf("failed to create request: %w", err)
+	}
+
+	resp, err := client.Do(req)
+	if err != nil {
+		return false, fmt.Errorf("failed to fetch telemetry data: %w", err)
+	}
+	defer resp.Body.Close()
+
+	if resp.StatusCode != http.StatusOK {
+		return false, fmt.Errorf("unexpected status code: %d", resp.StatusCode)
+	}
+
+	count, found, err := sentSpans(resp.Body)
+	if err != nil {
+		return false, err
+	}
+	return found && count >= float64(targetCount), nil
+}
+
+// sentSpans scans the Prometheus text-format metrics in r for the first line
+// that starts with metricName and contains exporterAttr, and returns its
+// value. The returned bool is false if there is no such line.
+func sentSpans(r io.Reader) (float64, bool, error) {
+	scanner := bufio.NewScanner(r)
+	for scanner.Scan() {
+		line := scanner.Text()
+		if !strings.HasPrefix(line, metricName) || !strings.Contains(line, exporterAttr) {
+			continue
+		}
+
+		fields := strings.Fields(line)
+		if len(fields) < 2 {
+			continue
+		}
+
+		// Sample values are floating-point numbers in the text format (for
+		// example "3" or "3e+06"), so they cannot reliably be parsed as integers.
+		value, err := strconv.ParseFloat(fields[len(fields)-1], 64)
+		if err != nil {
+			return 0, false, fmt.Errorf("failed to parse span count: %w", err)
+		}
+		return value, true, nil
+	}
+	if err := scanner.Err(); err != nil {
+		return 0, false, fmt.Errorf("failed to read telemetry response body: %w", err)
+	}
+
+	return 0, false, nil
+}
+
+// sendShutdownSignal asks the collector to shut down by sending a POST
+// request to url. It returns an error if the request cannot be sent or the
+// response status is not 200 OK.
+func sendShutdownSignal(ctx context.Context, url string) error {
+	fmt.Printf("Sending shutdown signal to %s\n", url)
+	req, err := http.NewRequestWithContext(ctx, http.MethodPost, url, nil)
+	if err != nil {
+		return fmt.Errorf("failed to create shutdown request: %w", err)
+	}
+
+	resp, err := client.Do(req)
+	if err != nil {
+		return fmt.Errorf("failed to send shutdown request: %w", err)
+	}
+	defer resp.Body.Close()
+
+	if resp.StatusCode != http.StatusOK {
+		return fmt.Errorf("unexpected status code: %d", resp.StatusCode)
+	}
+
+	fmt.Println("Shutdown signal sent successfully.")
+	return nil
+}