feat(telemetry): add agent detection tag for AI coding tools (#687)

betegon · claude · github-actions[bot] · web-flow · commit fc2ac72e0b9c · 2026-04-09T19:43:16.000+01:00
## Summary

Adds an `agent` tag to telemetry spans when the CLI is invoked by a known AI coding tool. Detection uses two strategies:

1. **Environment variables** (sync, instant) — agents inject these into child processes. Adapted from [Vercel's `@vercel/detect-agent`](https://github.com/vercel/vercel/tree/main/packages/detect-agent) (Apache-2.0).
2. **Process tree walking** (async, non-blocking) — scans parent/grandparent process names for known agent executables. Fires in the background so it never delays CLI startup.

## Supported agents (env vars)

| Agent | Env var(s) |
|-------|-----------|
| Generic override | `AI_AGENT` |
| Cursor | `CURSOR_TRACE_ID`, `CURSOR_AGENT` |
| Gemini | `GEMINI_CLI` |
| Codex | `CODEX_SANDBOX`, `CODEX_CI`, `CODEX_THREAD_ID` |
| Antigravity | `ANTIGRAVITY_AGENT` |
| Augment | `AUGMENT_AGENT` |
| OpenCode | `OPENCODE_CLIENT` |
| Claude Code | `CLAUDE_CODE`, `CLAUDECODE` |
| Cowork | `CLAUDE_CODE` or `CLAUDECODE`, plus `CLAUDE_CODE_IS_COWORK` |
| GitHub Copilot | `COPILOT_MODEL`, `COPILOT_ALLOW_ALL` |
| Goose | `GOOSE_TERMINAL` |
| Amp | `AMP_THREAD_ID` |
| Generic fallback | `AGENT` |

**Intentionally excluded:** `REPL_ID` (set in all Replit workspaces, not just AI agent sessions) and `COPILOT_GITHUB_TOKEN` (auth credential users may export persistently).

New agents can be added with a single `["ENV_VAR", "agent-name"]` line in the `ENV_VAR_AGENTS` map.

## Process tree detection (fallback)

When no env var matches, the CLI asynchronously walks the parent process tree (up to 5 levels) looking for known agent executables: `cursor`, `claude`, `goose`, `windsurf`, `amp`, `codex`, `augment`, `opencode`, `gemini`

- **Linux**: reads `/proc/<pid>/status` (in-memory filesystem, fast)
- **macOS**: uses `ps(1)` with a 500ms timeout, child process unreffed to never block exit
- **Windows**: not supported (env var detection still works)

## Detection priority

1. `AI_AGENT` env var (explicit override)
2. Agent-specific env vars (`ENV_VAR_AGENTS` map)
3. Claude Code / Cowork (conditional logic)
4. `AGENT` env var (generic fallback — explicit signal beats heuristic)
5. Process tree walking (async, best-effort — may miss very fast commands)

## Known limitations

- **Fast commands**: Process tree detection runs asynchronously. For commands completing in <50ms where no env vars are set, the tag may not be applied before the transaction ends. This is an intentional trade-off — env vars cover the vast majority of agent invocations instantly.
- **Windows**: No process tree detection (no `/proc/` or `ps`). Env var detection still works.

## Test plan

- [x] 47 unit tests covering env var detection, process tree walking, depth limits, case-insensitive matching, priority ordering, map structure validation, and real `/proc/` reads
- [ ] Manual: `CLAUDE_CODE=1 bunx sentry-cli auth status` and verify span has `agent: claude`

---------

Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
Co-authored-by: Burak Yigit Kaya <byk@sentry.io>
diff --git a/src/lib/detect-agent.ts b/src/lib/detect-agent.ts
@@ -0,0 +1,242 @@
+/**
+ * AI agent detection — determines whether the CLI is being driven by
+ * a specific AI coding agent.
+ *
+ * Detection uses two strategies:
+ * 1. **Environment variables** (sync) — agents inject these into child
+ *    processes. Adapted from Vercel's @vercel/detect-agent (Apache-2.0).
+ * 2. **Process tree walking** (async) — scan parent/grandparent process
+ *    names for known agent executables. Runs as a non-blocking background
+ *    task so it never delays CLI startup.
+ *
+ * To add a new agent, add entries to {@link ENV_VAR_AGENTS} and/or
+ * {@link PROCESS_NAME_AGENTS}.
+ */
+
+import { execFile } from "node:child_process";
+import { readFile } from "node:fs/promises";
+import { basename } from "node:path";
+
+import { getEnv } from "./env.js";
+
+/**
+ * Env var → agent name; each env var maps directly to the agent that sets it.
+ * {@link detectAgent} iterates in insertion order — the first var with a truthy value wins.
+ */
+export const ENV_VAR_AGENTS = new Map<string, string>([
+  // Cursor
+  ["CURSOR_TRACE_ID", "cursor"],
+  ["CURSOR_AGENT", "cursor"],
+  // Gemini CLI
+  ["GEMINI_CLI", "gemini"],
+  // OpenAI Codex
+  ["CODEX_SANDBOX", "codex"],
+  ["CODEX_CI", "codex"],
+  ["CODEX_THREAD_ID", "codex"],
+  // Antigravity
+  ["ANTIGRAVITY_AGENT", "antigravity"],
+  // Augment
+  ["AUGMENT_AGENT", "augment"],
+  // OpenCode
+  ["OPENCODE_CLIENT", "opencode"],
+  // Replit — no entry: REPL_ID is intentionally excluded because it's set in ALL
+  // Replit workspaces, not just when the AI agent is driving the CLI
+  // GitHub Copilot — COPILOT_GITHUB_TOKEN intentionally excluded because
+  // users may export it persistently for auth, causing false positives
+  ["COPILOT_MODEL", "github-copilot"],
+  ["COPILOT_ALLOW_ALL", "github-copilot"],
+  // Goose
+  ["GOOSE_TERMINAL", "goose"],
+  // Amp
+  ["AMP_THREAD_ID", "amp"],
+]);
+
+/**
+ * Process executable basename (lowercase) → agent name, for the process-tree fallback.
+ * Keys must be lowercase: {@link detectAgentFromProcessTree} lowercases names before an exact lookup.
+ */
+export const PROCESS_NAME_AGENTS = new Map<string, string>([
+  ["cursor", "cursor"],
+  ["claude", "claude"],
+  ["goose", "goose"],
+  ["windsurf", "windsurf"],
+  ["amp", "amp"],
+  ["codex", "codex"],
+  ["augment", "augment"],
+  ["opencode", "opencode"],
+  ["gemini", "gemini"],
+]);
+
+/** Max number of ancestors to inspect (starting at the direct parent) before giving up. */
+const MAX_ANCESTOR_DEPTH = 5;
+
+/** Pattern to extract the `Name:` value from `/proc/<pid>/status` (multiline mode). */
+const PROC_STATUS_NAME_RE = /^Name:\s+(.+)$/m;
+
+/** Pattern to extract the numeric `PPid:` value from `/proc/<pid>/status` (multiline mode). */
+const PROC_STATUS_PPID_RE = /^PPid:\s+(\d+)$/m;
+
+/** Pattern to parse trimmed `ps -o ppid=,comm=` output: "<ppid> <comm>" (comm may contain spaces). */
+const PS_PPID_COMM_RE = /^(\d+)\s+(.+)$/;
+
+/** Name + parent PID of a process, as produced by a {@link ProcessInfoProvider}. */
+type ProcessInfo = {
+  /** Executable name (e.g. "cursor", "bash"): `Name:` from /proc, or the basename of ps `comm`. */
+  name: string;
+  /** Parent process ID, or 0 if unavailable (any value ≤ 1 ends the ancestor walk). */
+  ppid: number;
+};
+
+/**
+ * Async process info provider signature; resolves to `undefined` when the PID can't be read.
+ * Default ({@link getProcessInfoFromOS}) reads `/proc/` or `ps(1)`; override via {@link setProcessInfoProvider} for testing.
+ */
+type ProcessInfoProvider = (pid: number) => Promise<ProcessInfo | undefined>;
+
+let _getProcessInfo: ProcessInfoProvider = getProcessInfoFromOS;
+
+/**
+ * Override the provider used by {@link detectAgentFromProcessTree} (module-level state).
+ * Follows the same pattern as {@link setEnv} — call with a mock in tests, reset in `afterEach`.
+ *
+ * Pass `getProcessInfoFromOS` to restore the real implementation.
+ */
+export function setProcessInfoProvider(provider: ProcessInfoProvider): void {
+  _getProcessInfo = provider;
+}
+
+/**
+ * Detect agent from environment variables only (synchronous, no I/O).
+ *
+ * Priority:
+ * 1. `AI_AGENT` env var — explicit override; its trimmed value is returned as-is
+ * 2. Agent-specific env vars from {@link ENV_VAR_AGENTS} (first truthy var wins)
+ * 3. `CLAUDECODE` / `CLAUDE_CODE` — "cowork" if `CLAUDE_CODE_IS_COWORK` is set, else "claude"
+ * 4. `AGENT` env var — generic fallback set by Goose, Amp, and others (trimmed)
+ *
+ * Returns the agent name string, or `undefined` if no agent is detected.
+ * For process tree fallback, use {@link detectAgentFromProcessTree} separately.
+ */
+export function detectAgent(): string | undefined {
+  const env = getEnv();
+
+  // 1. Highest priority: explicit override — any agent can self-identify
+  const aiAgent = env.AI_AGENT?.trim();
+  if (aiAgent) {
+    return aiAgent;
+  }
+
+  // 2. Table-driven env var check (Map iteration preserves insertion order)
+  for (const [envVar, agent] of ENV_VAR_AGENTS) {
+    if (env[envVar]) {
+      return agent;
+    }
+  }
+
+  // 3. Claude Code / Cowork — requires branching logic, so not in the map
+  if (env.CLAUDECODE || env.CLAUDE_CODE) {
+    return env.CLAUDE_CODE_IS_COWORK ? "cowork" : "claude";
+  }
+
+  // 4. Lowest priority: generic AGENT fallback (empty or whitespace-only → undefined)
+  return env.AGENT?.trim() || undefined;
+}
+
+/**
+ * Walk the ancestor process tree; resolves to the first {@link PROCESS_NAME_AGENTS} match, else `undefined`.
+ *
+ * Fully async — never blocks CLI startup. Starts at the direct parent
+ * (`process.ppid`) and inspects at most {@link MAX_ANCESTOR_DEPTH} ancestors, one at a time.
+ * Stops once the PID is ≤ 1 (init/launchd) or the provider returns no info for a PID.
+ *
+ * - **Linux**: reads `/proc/<pid>/status` (in-memory filesystem, fast).
+ * - **macOS**: uses `ps(1)` with a 500ms timeout per invocation (one invocation per ancestor).
+ * - **Windows**: not supported (env var detection still works).
+ */
+export async function detectAgentFromProcessTree(): Promise<
+  string | undefined
+> {
+  let pid = process.ppid;
+
+  for (let depth = 0; depth < MAX_ANCESTOR_DEPTH && pid > 1; depth++) {
+    const info = await _getProcessInfo(pid);
+    if (!info) {
+      break;
+    }
+
+    const agent = PROCESS_NAME_AGENTS.get(info.name.toLowerCase());
+    if (agent) {
+      return agent;
+    }
+
+    pid = info.ppid;
+  }
+
+  return;
+}
+
+/**
+ * Read process name and parent PID for a given PID; failures resolve to `undefined`.
+ *
+ * Tries `/proc/<pid>/status` first (Linux, no subprocess overhead); if that fails or
+ * lacks `Name:`/`PPid:`, falls back to `ps(1)` with a 500ms timeout (macOS, other Unix).
+ * Windows is unsupported — returns `undefined`.
+ */
+export async function getProcessInfoFromOS(
+  pid: number
+): Promise<ProcessInfo | undefined> {
+  // Linux: /proc is an in-memory filesystem — fast even though async
+  try {
+    const status = await readFile(`/proc/${pid}/status`, "utf-8");
+    const nameMatch = status.match(PROC_STATUS_NAME_RE);
+    const ppidMatch = status.match(PROC_STATUS_PPID_RE);
+    if (nameMatch?.[1] && ppidMatch?.[1]) {
+      return { name: nameMatch[1].trim(), ppid: Number(ppidMatch[1]) };
+    }
+  } catch {
+    // Not Linux or process is gone — fall through to ps
+  }
+
+  // macOS / other Unix: use ps(1) asynchronously; basename() strips any path reported in comm
+  if (process.platform !== "win32") {
+    try {
+      const result = await execFileUnreffed(
+        "ps",
+        ["-p", String(pid), "-o", "ppid=,comm="],
+        { timeout: 500 }
+      );
+      const match = result.trim().match(PS_PPID_COMM_RE);
+      if (match?.[1] && match?.[2]) {
+        return { name: basename(match[2].trim()), ppid: Number(match[1]) };
+      }
+    } catch {
+      // Process gone, ps not available, or timeout
+    }
+  }
+}
+
+/**
+ * Run `execFile` and `unref()` the child so that waiting on it is not meant to keep the CLI
+ * from exiting. Resolves with stdout (utf-8) on success; rejects with the error `execFile` reports.
+ */
+function execFileUnreffed(
+  cmd: string,
+  args: readonly string[],
+  opts: { timeout?: number }
+): Promise<string> {
+  return new Promise((resolve, reject) => {
+    const child = execFile(
+      cmd,
+      args,
+      { encoding: "utf-8", ...opts },
+      (err, stdout) => {
+        if (err) {
+          reject(err);
+        } else {
+          resolve(stdout);
+        }
+      }
+    );
+    child.unref(); // NOTE(review): unrefs the process handle only — confirm stdio pipes/timeout timer don't hold the event loop
+  });
+}
diff --git a/src/lib/telemetry.ts b/src/lib/telemetry.ts
@@ -19,9 +19,10 @@ import {
   SENTRY_CLI_DSN,
 } from "./constants.js";
 import { isReadonlyError, tryRepairAndRetry } from "./db/schema.js";
+import { detectAgent, detectAgentFromProcessTree } from "./detect-agent.js";
 import { getEnv } from "./env.js";
 import { ApiError, AuthError, OutputError } from "./errors.js";
-import { attachSentryReporter } from "./logger.js";
+import { attachSentryReporter, logger } from "./logger.js";
 import { getSentryBaseUrl, isSentrySaasUrl } from "./sentry-urls.js";
 import { getRealUsername } from "./utils.js";
 
@@ -522,6 +523,25 @@ export function initSentry(
     // Tag whether running in an interactive terminal or agent/CI environment
     Sentry.setTag("is_tty", !!process.stdout.isTTY);
 
+    // Tag which AI agent (if any) is driving the CLI.
+    // Env var detection is sync (instant). If no env var matches, fire off
+    // async process tree detection in the background — best-effort: it sets the
+    // tag only if it resolves before the transaction finishes (fast commands may miss it).
+    const agent = detectAgent();
+    if (agent) {
+      Sentry.setTag("agent", agent);
+    } else {
+      detectAgentFromProcessTree()
+        .then((processAgent) => {
+          if (processAgent) {
+            Sentry.setTag("agent", processAgent);
+          }
+        })
+        .catch((error) => {
+          logger.withTag("agent").warn("Process tree detection failed:", error);
+        });
+    }
+
     // Wire up consola → Sentry log forwarding now that the client is active
     attachSentryReporter();
 
diff --git a/test/lib/detect-agent.test.ts b/test/lib/detect-agent.test.ts