Block silent detection pass and classify Claude embedded 429 rate limits (#31081)

Copilot · web-flow · commit a54a6e71075e · 2026-05-08T13:58:05.000-07:00
diff --git a/actions/setup/js/claude_harness.cjs b/actions/setup/js/claude_harness.cjs
@@ -61,7 +61,11 @@ const MAX_DELAY_MS = 60000;
 const OVERLOADED_ERROR_PATTERN = /overloaded_error|"overloaded"/i;
 
 // Pattern to detect Anthropic rate-limit errors (HTTP 429).
-const RATE_LIMIT_ERROR_PATTERN = /rate_limit_error|429 Too Many Requests/i;
+// Claude CLI may surface this as:
+//   - transport-style text (e.g. "429 Too Many Requests")
+//   - embedded stream-json result fields (e.g. "api_error_status":429)
+//   - human-readable message text ("rate limit")
+const RATE_LIMIT_ERROR_PATTERN = /rate_limit_error|429 Too Many Requests|"api_error_status"\s*:\s*429|request rejected \(429\)|rate limit/i;
 
 // Pattern to detect a clean max-turns exit from Claude Code.
 // Claude Code emits a JSON result object with "subtype":"error_max_turns" when the
@@ -341,6 +345,7 @@ if (typeof module !== "undefined" && module.exports) {
   module.exports = {
     resolveClaudePromptFileArgs,
     stripPromptFileArgs,
+    isRateLimitError,
     isMaxTurnsExit,
     isNoDeferredMarkerError,
   };
diff --git a/actions/setup/js/claude_harness.test.cjs b/actions/setup/js/claude_harness.test.cjs
@@ -5,7 +5,7 @@ import os from "os";
 import path from "path";
 
 const require = createRequire(import.meta.url);
-const { resolveClaudePromptFileArgs, stripPromptFileArgs, isMaxTurnsExit, isNoDeferredMarkerError } = require("./claude_harness.cjs");
+const { resolveClaudePromptFileArgs, stripPromptFileArgs, isRateLimitError, isMaxTurnsExit, isNoDeferredMarkerError } = require("./claude_harness.cjs");
 
 describe("claude_harness.cjs", () => {
   describe("resolveClaudePromptFileArgs", () => {
@@ -108,6 +108,20 @@ describe("claude_harness.cjs", () => {
     });
   });
 
+  describe("isRateLimitError", () => {
+    it("returns true for stream-json api_error_status 429", () => {
+      expect(isRateLimitError('{"type":"result","subtype":"success","is_error":true,"api_error_status":429}')).toBe(true);
+    });
+
+    it("returns true for stream-json request rejected 429 message", () => {
+      expect(isRateLimitError("API Error: Request rejected (429) · This request would exceed your account's rate limit.")).toBe(true);
+    });
+
+    it("returns false for non-rate-limit output", () => {
+      expect(isRateLimitError('{"type":"result","subtype":"success","is_error":false}')).toBe(false);
+    });
+  });
+
   describe("isNoDeferredMarkerError", () => {
     it("returns true for the canonical no-deferred-marker error message", () => {
       const output =
diff --git a/actions/setup/js/parse_threat_detection_results.cjs b/actions/setup/js/parse_threat_detection_results.cjs
@@ -263,6 +263,8 @@ async function main() {
   const logPath = path.join(threatDetectionDir, DETECTION_LOG_FILENAME);
   const runDetection = process.env.RUN_DETECTION;
   const continueOnError = process.env.GH_AW_DETECTION_CONTINUE_ON_ERROR !== "false";
+  const detectionExecutionOutcome = process.env.DETECTION_AGENTIC_EXECUTION_OUTCOME || "";
+  const detectionExecutionFailed = detectionExecutionOutcome === "failure";
   const isWarnMode = continueOnError;
 
   /**
@@ -273,8 +275,9 @@ async function main() {
    * @param {string} message - Human-readable error message
    */
   function setDetectionFailure(reason, message) {
+    const mustFail = detectionExecutionFailed && (reason === "agent_failure" || reason === "parse_error");
     core.setOutput("reason", reason);
-    if (isWarnMode) {
+    if (isWarnMode && !mustFail) {
       core.warning(`⚠️ ${message}`);
       core.setOutput("conclusion", "warning");
       core.setOutput("success", "false");
@@ -309,6 +312,7 @@ async function main() {
     core.info("&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;&#9552;");
     core.info(`📋 RUN_DETECTION env: ${JSON.stringify(runDetection)}`);
     core.info(`📋 continue-on-error: ${continueOnError}`);
+    core.info(`📋 detection execution outcome: ${JSON.stringify(detectionExecutionOutcome)}`);
     core.info(`📁 Threat detection directory: ${threatDetectionDir}`);
     core.info(`📄 Detection log path: ${logPath}`);
 
diff --git a/actions/setup/js/parse_threat_detection_results.test.cjs b/actions/setup/js/parse_threat_detection_results.test.cjs
@@ -444,6 +444,7 @@ describe("main", () => {
     // Reset environment variables
     delete process.env.RUN_DETECTION;
     delete process.env.GH_AW_DETECTION_CONTINUE_ON_ERROR;
+    delete process.env.DETECTION_AGENTIC_EXECUTION_OUTCOME;
     // Re-import to get fresh module with mocks
     mod = await import("./parse_threat_detection_results.cjs");
   });
@@ -508,6 +509,18 @@ describe("main", () => {
       expect(mockCore.setFailed).toHaveBeenCalledWith(expect.stringContaining("Detection log file not found"));
     });
 
+    it("should fail when detection execution failed even in warn mode", async () => {
+      process.env.DETECTION_AGENTIC_EXECUTION_OUTCOME = "failure";
+      mockExistsSync.mockReturnValue(false);
+
+      await mod.main();
+
+      expect(mockCore.setOutput).toHaveBeenCalledWith("conclusion", "failure");
+      expect(mockCore.setOutput).toHaveBeenCalledWith("success", "false");
+      expect(mockCore.setOutput).toHaveBeenCalledWith("reason", "agent_failure");
+      expect(mockCore.setFailed).toHaveBeenCalledWith(expect.stringContaining("Detection log file not found"));
+    });
+
     // Note: The following tests are skipped because mocking fs for CJS modules
     // is difficult in vitest (same issue as safe_output_validator.test.cjs).
     // The core parsing logic is thoroughly tested via parseDetectionLog above.
diff --git a/pkg/workflow/detection_success_test.go b/pkg/workflow/detection_success_test.go
@@ -70,6 +70,9 @@ Create an issue.
 	if !strings.Contains(detectionSection, "GH_AW_DETECTION_CONTINUE_ON_ERROR:") {
 		t.Error("Detection conclusion step missing GH_AW_DETECTION_CONTINUE_ON_ERROR env var")
 	}
+	if !strings.Contains(detectionSection, "DETECTION_AGENTIC_EXECUTION_OUTCOME: ${{ steps.detection_agentic_execution.outcome }}") {
+		t.Error("Detection conclusion step missing DETECTION_AGENTIC_EXECUTION_OUTCOME env var")
+	}
 
 	// Check that the combined parse-and-conclude step has ID detection_conclusion
 	if !strings.Contains(detectionSection, "id: detection_conclusion") {
diff --git a/pkg/workflow/threat_detection.go b/pkg/workflow/threat_detection.go
@@ -488,6 +488,7 @@ func (c *Compiler) buildDetectionConclusionStep(data *WorkflowData) []string {
 		fmt.Sprintf("        uses: %s\n", getCachedActionPin("actions/github-script", data)),
 		"        env:\n",
 		"          RUN_DETECTION: ${{ steps.detection_guard.outputs.run_detection }}\n",
+		"          DETECTION_AGENTIC_EXECUTION_OUTCOME: ${{ steps.detection_agentic_execution.outcome }}\n",
 		coeEnvLine,
 		"        with:\n",
 		"          script: |\n",
@@ -774,10 +775,11 @@ func (c *Compiler) buildResultsParsingScriptRequire() string {
   await main();
 } catch (loadErr) {
   const continueOnError = process.env.GH_AW_DETECTION_CONTINUE_ON_ERROR !== 'false';
+  const detectionExecutionFailed = process.env.DETECTION_AGENTIC_EXECUTION_OUTCOME === 'failure';
   const msg = 'ERR_SYSTEM: \u274C Unexpected error loading threat detection module: ' + (loadErr && loadErr.message ? loadErr.message : String(loadErr));
   core.error(msg);
   core.setOutput('reason', 'parse_error');
-  if (continueOnError) {
+  if (continueOnError && !detectionExecutionFailed) {
     core.warning('\u26A0\uFE0F ' + msg);
     core.setOutput('conclusion', 'warning');
     core.setOutput('success', 'false');

Original file line number	Diff line number	Diff line change
`@@ -70,6 +70,9 @@ Create an issue.`
`70`	`70`	`if !strings.Contains(detectionSection, "GH_AW_DETECTION_CONTINUE_ON_ERROR:") {`
`71`	`71`	`t.Error("Detection conclusion step missing GH_AW_DETECTION_CONTINUE_ON_ERROR env var")`
`72`	`72`	`}`
	`73`	`+ if !strings.Contains(detectionSection, "DETECTION_AGENTIC_EXECUTION_OUTCOME: ${{ steps.detection_agentic_execution.outcome }}") {`
	`74`	`+ t.Error("Detection conclusion step missing DETECTION_AGENTIC_EXECUTION_OUTCOME env var")`
	`75`	`+ }`
`73`	`76`
`74`	`77`	`// Check that the combined parse-and-conclude step has ID detection_conclusion`
`75`	`78`	`if !strings.Contains(detectionSection, "id: detection_conclusion") {`