Add AI credit cap observability attributes to OTLP conclusion spans (#38550)

Copilot · web-flow · commit 77f950f8f699 · 2026-06-11T12:49:43.000+02:00
diff --git a/actions/setup/js/ai_credits_context.cjs b/actions/setup/js/ai_credits_context.cjs
@@ -277,37 +277,40 @@ function parseAuditLogCombined(auditJsonlPathOverride) {
 }
 
 /**
+ * @param {{ logProvenance?: boolean }} [options]
  * @returns {{ aiCredits: string, maxAICredits: string, aiCreditsRateLimitError: boolean, maxAICreditsExceeded: boolean }}
  */
-function resolveAICreditsFailureState() {
+function resolveAICreditsFailureState({ logProvenance = true } = {}) {
   const stdioSignals = parseAICreditsExceededFromAgentStdio();
   const { aiCredits: auditAICredits, maxAICredits: auditMaxAICredits, rateLimitError: auditRateLimitError, maxAICreditsExceeded: auditMaxAICreditsExceeded } = parseAuditLogCombined();
   const envAICredits = parsePositiveNumberString(process.env.GH_AW_AIC);
   const envMaxAICredits = parsePositiveNumberString(process.env.GH_AW_MAX_AI_CREDITS);
 
   // Log provenance so failing issues can be diagnosed when credit data is missing.
-  if (auditAICredits) {
-    console.log(`[ai-credits] aiCredits source=audit_log value=${auditAICredits}`);
-  } else if (stdioSignals.aiCredits) {
-    console.log(`[ai-credits] aiCredits source=agent_stdio value=${stdioSignals.aiCredits}`);
-  } else if (envAICredits) {
-    console.log(`[ai-credits] aiCredits source=env(GH_AW_AIC) value=${envAICredits}`);
-  } else {
-    console.log(`[ai-credits] aiCredits source=none GH_AW_AIC=${process.env.GH_AW_AIC || "(unset)"}`);
-  }
+  if (logProvenance) {
+    if (auditAICredits) {
+      console.log(`[ai-credits] aiCredits source=audit_log value=${auditAICredits}`);
+    } else if (stdioSignals.aiCredits) {
+      console.log(`[ai-credits] aiCredits source=agent_stdio value=${stdioSignals.aiCredits}`);
+    } else if (envAICredits) {
+      console.log(`[ai-credits] aiCredits source=env(GH_AW_AIC) value=${envAICredits}`);
+    } else {
+      console.log(`[ai-credits] aiCredits source=none GH_AW_AIC=${process.env.GH_AW_AIC || "(unset)"}`);
+    }
 
-  if (auditMaxAICredits) {
-    console.log(`[ai-credits] maxAICredits source=audit_log value=${auditMaxAICredits}`);
-  } else if (stdioSignals.maxAICredits) {
-    console.log(`[ai-credits] maxAICredits source=agent_stdio value=${stdioSignals.maxAICredits}`);
-  } else if (envMaxAICredits) {
-    console.log(`[ai-credits] maxAICredits source=env(GH_AW_MAX_AI_CREDITS) value=${envMaxAICredits}`);
-  } else {
-    console.log(`[ai-credits] maxAICredits source=none GH_AW_MAX_AI_CREDITS=${process.env.GH_AW_MAX_AI_CREDITS || "(unset)"}`);
-  }
+    if (auditMaxAICredits) {
+      console.log(`[ai-credits] maxAICredits source=audit_log value=${auditMaxAICredits}`);
+    } else if (stdioSignals.maxAICredits) {
+      console.log(`[ai-credits] maxAICredits source=agent_stdio value=${stdioSignals.maxAICredits}`);
+    } else if (envMaxAICredits) {
+      console.log(`[ai-credits] maxAICredits source=env(GH_AW_MAX_AI_CREDITS) value=${envMaxAICredits}`);
+    } else {
+      console.log(`[ai-credits] maxAICredits source=none GH_AW_MAX_AI_CREDITS=${process.env.GH_AW_MAX_AI_CREDITS || "(unset)"}`);
+    }
 
-  const rawRateLimitSignalSource = auditRateLimitError ? "audit_log" : stdioSignals.rateLimitError ? "agent_stdio" : process.env.GH_AW_AI_CREDITS_RATE_LIMIT_ERROR === "true" ? "env(GH_AW_AI_CREDITS_RATE_LIMIT_ERROR)" : "none";
-  console.log(`[ai-credits] rateLimitSignal source=${rawRateLimitSignalSource}`);
+    const rawRateLimitSignalSource = auditRateLimitError ? "audit_log" : stdioSignals.rateLimitError ? "agent_stdio" : process.env.GH_AW_AI_CREDITS_RATE_LIMIT_ERROR === "true" ? "env(GH_AW_AI_CREDITS_RATE_LIMIT_ERROR)" : "none";
+    console.log(`[ai-credits] rateLimitSignal source=${rawRateLimitSignalSource}`);
+  }
 
   const aiCredits = auditAICredits || stdioSignals.aiCredits || envAICredits || "";
   const maxAICredits = auditMaxAICredits || stdioSignals.maxAICredits || envMaxAICredits || "";
diff --git a/actions/setup/js/handle_agent_failure.cjs b/actions/setup/js/handle_agent_failure.cjs
@@ -35,7 +35,7 @@ const COPILOT_SESSION_STATE_DIR = path.join(os.tmpdir(), "gh-aw", "sandbox", "ag
 // - Copilot/CAPI "CAPIError: 429" and utility-model quota text
 // - retry wrapper text that includes the canonical "Failed to get response..." phrase
 const ENGINE_RATE_LIMIT_429_RE =
-  /(?:\b429\b[\s\S]{0,120}(?:too many requests|rate[\s-]*limit)|rate_limit_(?:error|exceeded)|capierror:\s*429|failed to get response from the ai model[\s\S]{0,120}\b429\b|exceeded your rate limit for utility models)/i;
+  /(?:\b429\b[\s\S]{0,120}(?:too many requests|rate[\s-]*limit)|\brate_limit_(?:error|exceeded)\b|capierror:\s*429|failed to get response from the ai model[\s\S]{0,120}\b429\b|exceeded your rate limit for utility models)/i;
 
 /**
  * Parse action failure issue expiration from environment.
diff --git a/actions/setup/js/handle_agent_failure.test.cjs b/actions/setup/js/handle_agent_failure.test.cjs
@@ -2963,13 +2963,15 @@ describe("handle_agent_failure", () => {
       tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), "aw-test-engine-fail-guard-"));
       stdioLogPath = path.join(tmpDir, "agent-stdio.log");
       process.env.GH_AW_AGENT_OUTPUT = path.join(tmpDir, "agent_output.json");
+      process.env.GH_AW_OTEL_JSONL_PATH = path.join(tmpDir, "otel.jsonl");
       process.env.RUNNER_TEMP = tmpDir;
       ({ buildEngineFailureContext } = require("./handle_agent_failure.cjs"));
     });
 
     afterEach(() => {
       delete process.env.GH_AW_AGENT_OUTPUT;
       delete process.env.GH_AW_ENGINE_ID;
+      delete process.env.GH_AW_OTEL_JSONL_PATH;
       delete process.env.RUNNER_TEMP;
       if (fs.existsSync(tmpDir)) {
         fs.rmSync(tmpDir, { recursive: true, force: true });
diff --git a/actions/setup/js/send_otlp_span.cjs b/actions/setup/js/send_otlp_span.cjs
@@ -11,6 +11,7 @@ const { buildWorkflowRunUrl } = require("./workflow_metadata_helpers.cjs");
 const { readExperimentAssignments, EXPERIMENT_ASSIGNMENTS_PATH } = require("./experiment_helpers.cjs");
 const { parseJsonlContent } = require("./jsonl_helpers.cjs");
 const { countSteeringEventsInApiProxyJsonl } = require("./steering_helpers.cjs");
+const { resolveAICreditsFailureState } = require("./ai_credits_context.cjs");
 
 /**
  * send_otlp_span.cjs
@@ -2359,6 +2360,18 @@ async function sendJobConclusionSpan(spanName, options = {}) {
     attributes.push(...usageAttrs);
   }
 
+  const { maxAICredits, aiCreditsRateLimitError, maxAICreditsExceeded } = resolveAICreditsFailureState({ logProvenance: false });
+  const maxAICreditsValue = normalizeNonNegativeNumber(maxAICredits);
+  if (typeof maxAICreditsValue === "number") {
+    attributes.push(buildAttr("gh-aw.max_ai_credits", maxAICreditsValue));
+  }
+  if (typeof maxAICreditsExceeded === "boolean") {
+    attributes.push(buildAttr("gh-aw.max_ai_credits_exceeded", maxAICreditsExceeded));
+  }
+  if (typeof aiCreditsRateLimitError === "boolean") {
+    attributes.push(buildAttr("gh-aw.ai_credits_rate_limit_error", aiCreditsRateLimitError));
+  }
+
   const payload = buildOTLPPayload({
     traceId,
     spanId: conclusionSpanId,
diff --git a/actions/setup/js/send_otlp_span.test.cjs b/actions/setup/js/send_otlp_span.test.cjs
@@ -2523,6 +2523,8 @@ describe("sendJobConclusionSpan", () => {
     "OTEL_SERVICE_NAME",
     "GH_AW_EFFECTIVE_TOKENS",
     "GH_AW_AIC",
+    "GH_AW_MAX_AI_CREDITS",
+    "GH_AW_AI_CREDITS_RATE_LIMIT_ERROR",
     "GH_AW_INFO_VERSION",
     "GH_AW_INFO_CLI_VERSION",
     "GITHUB_AW_OTEL_TRACE_ID",
@@ -2645,6 +2647,7 @@ describe("sendJobConclusionSpan", () => {
     process.env.INPUT_JOB_NAME = "agent";
     process.env.GITHUB_AW_OTEL_TRACE_ID = "f".repeat(32);
     process.env.GITHUB_AW_OTEL_PARENT_SPAN_ID = "abcdef1234567890";
+    process.env.GH_AW_MAX_AI_CREDITS = "1000";
 
     const startMs = 1_700_000_000_000;
     const endMs = 1_700_000_005_000;
@@ -2677,6 +2680,14 @@ describe("sendJobConclusionSpan", () => {
     expect(conclusionSpan.parentSpanId).toBe("abcdef1234567890");
     expect(agentSpan.attributes).toContainEqual({ key: "gh-aw.output.item_count", value: { intValue: 2 } });
     expect(conclusionSpan.attributes).toContainEqual({ key: "gh-aw.output.item_count", value: { intValue: 2 } });
+    const agentKeys = agentSpan.attributes.map(a => a.key);
+    const conclusionKeys = conclusionSpan.attributes.map(a => a.key);
+    expect(agentKeys).not.toContain("gh-aw.max_ai_credits");
+    expect(agentKeys).not.toContain("gh-aw.max_ai_credits_exceeded");
+    expect(agentKeys).not.toContain("gh-aw.ai_credits_rate_limit_error");
+    expect(conclusionKeys).toContain("gh-aw.max_ai_credits");
+    expect(conclusionKeys).toContain("gh-aw.max_ai_credits_exceeded");
+    expect(conclusionKeys).toContain("gh-aw.ai_credits_rate_limit_error");
   });
 
   it("uses agent_cli_start_ms.txt as agent span start time when file is present", async () => {
@@ -3578,6 +3589,75 @@ describe("sendJobConclusionSpan", () => {
     expect(aicAttr.value.doubleValue).toBe(0.125);
   });
 
+  it("emits gh-aw.max_ai_credits as a numeric conclusion-span attribute when available", async () => {
+    const mockFetch = vi.fn().mockResolvedValue({ ok: true, status: 200, statusText: "OK" });
+    vi.stubGlobal("fetch", mockFetch);
+
+    process.env.GH_AW_OTLP_ENDPOINTS = JSON.stringify([{ url: "https://traces.example.com" }]);
+    process.env.GH_AW_MAX_AI_CREDITS = "1000.5";
+
+    await sendJobConclusionSpan("gh-aw.job.conclusion");
+
+    const body = JSON.parse(mockFetch.mock.calls[0][1].body);
+    const span = body.resourceSpans[0].scopeSpans[0].spans[0];
+    const maxAICreditsAttr = span.attributes.find(a => a.key === "gh-aw.max_ai_credits");
+    expect(maxAICreditsAttr).toBeDefined();
+    expect(maxAICreditsAttr.value.doubleValue).toBe(1000.5);
+  });
+
+  it("emits AI credits boolean cap/rate-limit attributes on conclusion spans when detected", async () => {
+    const mockFetch = vi.fn().mockResolvedValue({ ok: true, status: 200, statusText: "OK" });
+    vi.stubGlobal("fetch", mockFetch);
+
+    process.env.GH_AW_OTLP_ENDPOINTS = JSON.stringify([{ url: "https://traces.example.com" }]);
+
+    const stdioContent = Buffer.from("CAPIError: 429 Maximum AI credits exceeded (1002.381900 / 1000).", "utf8");
+    const stdioLogPath = "/tmp/gh-aw/agent-stdio.log";
+    const MOCK_FD = 42;
+    const existsSpy = vi.spyOn(fs, "existsSync").mockImplementation(p => p === stdioLogPath);
+    const statSpy = vi.spyOn(fs, "statSync").mockImplementation(p => {
+      if (p === stdioLogPath) return /** @type {fs.Stats} */ { size: stdioContent.length };
+      throw Object.assign(new Error("ENOENT"), { code: "ENOENT" });
+    });
+    const openSpy = vi.spyOn(fs, "openSync").mockReturnValue(/** @type {number} */ MOCK_FD);
+    const readSpy = vi.spyOn(fs, "readSync").mockImplementation((_fd, buf) => {
+      stdioContent.copy(/** @type {Buffer} */ buf);
+      return stdioContent.length;
+    });
+    const closeSpy = vi.spyOn(fs, "closeSync").mockImplementation(() => {});
+
+    try {
+      await sendJobConclusionSpan("gh-aw.job.conclusion");
+    } finally {
+      existsSpy.mockRestore();
+      statSpy.mockRestore();
+      openSpy.mockRestore();
+      readSpy.mockRestore();
+      closeSpy.mockRestore();
+    }
+
+    const body = JSON.parse(mockFetch.mock.calls[0][1].body);
+    const span = body.resourceSpans[0].scopeSpans[0].spans[0];
+    const attrs = Object.fromEntries(span.attributes.map(a => [a.key, a.value.boolValue ?? a.value.doubleValue ?? a.value.intValue ?? a.value.stringValue]));
+    expect(attrs["gh-aw.max_ai_credits_exceeded"]).toBe(true);
+    expect(attrs["gh-aw.ai_credits_rate_limit_error"]).toBe(true);
+  });
+
+  it("does not emit gh-aw.max_ai_credits when max AI credits is missing or invalid", async () => {
+    const mockFetch = vi.fn().mockResolvedValue({ ok: true, status: 200, statusText: "OK" });
+    vi.stubGlobal("fetch", mockFetch);
+
+    process.env.GH_AW_OTLP_ENDPOINTS = JSON.stringify([{ url: "https://traces.example.com" }]);
+    process.env.GH_AW_MAX_AI_CREDITS = "not-a-number";
+
+    await sendJobConclusionSpan("gh-aw.job.conclusion");
+
+    const body = JSON.parse(mockFetch.mock.calls[0][1].body);
+    const span = body.resourceSpans[0].scopeSpans[0].spans[0];
+    const keys = span.attributes.map(a => a.key);
+    expect(keys).not.toContain("gh-aw.max_ai_credits");
+  });
+
   it("emits dashboard metrics and aliases on the conclusion span", async () => {
     const mockFetch = vi.fn().mockResolvedValue({ ok: true, status: 200, statusText: "OK" });
     vi.stubGlobal("fetch", mockFetch);
diff --git a/docs/src/content/docs/reference/open-telemetry.mdx b/docs/src/content/docs/reference/open-telemetry.mdx
@@ -88,6 +88,9 @@ These attributes appear on built-in workflow setup, agent, and conclusion spans
     <tr><td><code>gh-aw.action_minutes</code></td><td>Elapsed runtime converted to minutes.</td></tr>
     <tr><td><code>gh-aw.tracker.id</code></td><td>Tracker identifier when present.</td></tr>
     <tr><td><code>gh-aw.aic</code></td><td>AI credits consumed for the run when available.</td></tr>
+    <tr><td><code>gh-aw.max_ai_credits</code></td><td>Configured maximum AI credits budget for the run, emitted on conclusion spans only when a valid numeric value is available.</td></tr>
+    <tr><td><code>gh-aw.max_ai_credits_exceeded</code></td><td>Whether the run exceeded the maximum AI credits budget (conclusion spans only).</td></tr>
+    <tr><td><code>gh-aw.ai_credits_rate_limit_error</code></td><td>Whether an AI-credits rate-limit or budget-exhaustion signal was detected (conclusion spans only).</td></tr>
     <tr><td><code>gh-aw.turns</code></td><td>Total agent turns recorded for the run.</td></tr>
     <tr><td><code>gh-aw.agent.conclusion</code></td><td>Normalized agent conclusion.</td></tr>
     <tr><td><code>gh-aw.detection.conclusion</code></td><td>Detection subsystem conclusion when present.</td></tr>
diff --git a/specs/otel-observability-spec.md b/specs/otel-observability-spec.md
@@ -455,6 +455,9 @@ This section defines the attributes each span type MUST or MAY carry.
 | `gh-aw.trigger.*` | string | Trigger context (same fields as setup span) |
 | `gh-aw.frontmatter.*` | string | Frontmatter metadata (same fields as setup span) |
 | `gh-aw.aic` | double | AI credits consumed (AIC); always emitted as a numeric attribute on agent and detection conclusion spans (0 when no usage data is available, so Sentry EAP and Tempo index the field as numeric from first emission). |
+| `gh-aw.max_ai_credits` | double | Configured max AI credits budget for the run when a valid numeric value is available. |
+| `gh-aw.max_ai_credits_exceeded` | boolean | True when a max-AI-credits hard-limit exceedance signal is detected for the run; false otherwise. |
+| `gh-aw.ai_credits_rate_limit_error` | boolean | True when an AI-credits-related rate-limit or budget-exhaustion signal is detected; false otherwise. |
 | `gh-aw.turns` | int | Number of agent turns |
 | `gh-aw.agent.conclusion` | string | Agent job outcome |
 | `gh-aw.detection.conclusion` | string | Threat detection outcome |