elastic · fearful-symmetry · Mar 22, 2024 · Mar 21, 2024 · Mar 21, 2024 · Mar 21, 2024
@@ -223,15 +223,15 @@ steps:
       provider: "gcp"
       machineType: "n1-standard-8"
 
-  # - label: "Extended runtime leak tests"
-  #   key: "extended-integration-tests"
-  #   command: ".buildkite/scripts/steps/integration_tests.sh stateful integration:TestForResourceLeaks"
-  #   artifact_paths:
-  #     - "build/TEST-**"
-  #     - "build/diagnostics/*"
-  #   agents:
-  #     provider: "gcp"
-  #     machineType: "n1-standard-8"
+  - label: "Extended runtime leak tests"
+    key: "extended-integration-tests"
+    command: ".buildkite/scripts/steps/integration_tests.sh stateful integration:TestForResourceLeaks"
+    artifact_paths:
+      - "build/TEST-**"
+      - "build/diagnostics/*"
+    agents:
+      provider: "gcp"
+      machineType: "n1-standard-8"
 
   - label: "Integration tests"
     key: "integration-tests"

@@ -78,7 +78,7 @@ func TestLongRunningAgentForLeaks(t *testing.T) {
 	}
 
 	suite.Run(t, &ExtendedRunner{info: info,
-		healthCheckTime:        time.Minute * 3,
+		healthCheckTime:        time.Minute * 6,
 		healthCheckRefreshTime: time.Second * 20,
 		resourceWatchers: []StatusWatcher{ // select which tests to run
 			&handleMonitor{},
@@ -229,13 +229,14 @@ func (runner *ExtendedRunner) TestHandleLeak() {
 // CheckHealthAtStartup ensures all the beats and agent are healthy and working before we continue
 func (runner *ExtendedRunner) CheckHealthAtStartup(ctx context.Context) {
 	// because we need to separately fetch the PIDs, wait until everything is healthy before we look for running beats
+	compDebugName := ""
 	require.Eventually(runner.T(), func() bool {
 		allHealthy := true
 		status, err := runner.agentFixture.ExecStatus(ctx)
 
 		apacheMatch := "logfile-apache"
 		foundApache := false
-		systemMatch := "metrics-default"
+		systemMatch := "system/metrics"
 		foundSystem := false
 
 		require.NoError(runner.T(), err)
@@ -253,11 +254,12 @@ func (runner *ExtendedRunner) CheckHealthAtStartup(ctx context.Context) {
 			}
 			runner.T().Logf("component state: %s", comp.Message)
 			if comp.State != int(cproto.State_HEALTHY) {
+				compDebugName = comp.Name
 				allHealthy = false
 			}
 		}
 		return allHealthy && foundApache && foundSystem
-	}, runner.healthCheckTime, runner.healthCheckRefreshTime, "install never became healthy")
+	}, runner.healthCheckTime, runner.healthCheckRefreshTime, "install never became healthy: components did not return a healthy state: %s", compDebugName)
 }
 
 /*