betaHi
diff --git a/README.md b/README.md
Lines changed: 3 additions & 9 deletions
diff --git a/scripts/probe-claude-cli.ts b/scripts/probe-claude-cli.ts
Lines changed: 1 addition & 4 deletions
diff --git a/scripts/probe-claude.ts b/scripts/probe-claude.ts
Lines changed: 1 addition & 4 deletions
diff --git a/src/bridges/claude/non-stream-translation.ts b/src/bridges/claude/non-stream-translation.ts
Lines changed: 5 additions & 68 deletions
diff --git a/src/bridges/claude/tool-names.ts b/src/bridges/claude/tool-names.ts
Lines changed: 0 additions & 4 deletions
diff --git a/src/bridges/codex/responses.ts b/src/bridges/codex/responses.ts
Lines changed: 11 additions & 34 deletions
diff --git a/src/lib/auto-session.ts b/src/lib/auto-session.ts
Lines changed: 20 additions & 3 deletions
diff --git a/src/lib/model-capabilities.ts b/src/lib/model-capabilities.ts
Lines changed: 5 additions & 7 deletions
diff --git a/src/lib/models-resolver.ts b/src/lib/models-resolver.ts
Lines changed: 6 additions & 0 deletions
@@ -219,6 +219,7 @@ Common:
 | `--host <host>` | Bind address. Defaults to `127.0.0.1`. |
 | `--port <port>` | Listen port. Overrides `$PORT` and the port inferred from Claude settings. |
 | `--model <model>` | Override the request model for this bridge process only; does not edit config files. |
+| `--auto` | Acquire a Copilot Auto session and attach its session token only to upstream `/chat/completions` and `/responses` requests. Codex model selection is limited to Auto-available models. |
 | `--rate-limit <seconds>` | Enforce a minimum delay between upstream requests. |
 | `--wait` | With `--rate-limit`, wait instead of returning HTTP 429. |
 
@@ -280,22 +281,15 @@ accepts upstream.
 | Model                            | Reasoning efforts                       | Notes                                  |
 | -------------------------------- | --------------------------------------- | -------------------------------------- |
 | `claude-opus-4.8`                | `medium`                                |                                        |
-| `claude-opus-4.7`                | `medium`                                | Effort sent as `output_config.effort`. |
-| `claude-opus-4.7-1m`             | `low`, `medium`, `high`, `xhigh`        | 1M-token context window, prefer use `claude-opus-4.7-[1m]` in config|
-| `claude-opus-4.7-high`           | `high`                                  | Fixed high reasoning|
-| `claude-opus-4.7-xhigh`          | `xhigh`                                 | Fixed extra-high reasoning|
+| `claude-opus-4.7`                | `low`, `medium`, `high`, `xhigh`        | Effort sent as `output_config.effort`. |
+| `claude-opus-4.7-1m`             | `low`, `medium`, `high`, `xhigh`        | 1M-token context window; prefer `claude-opus-4.7-[1m]` in config. |
 | `claude-opus-4.6`                | `low`, `medium`, `high`                 |                                        |
 | `claude-opus-4.6-1m`             | `low`, `medium`, `high`                 | 1M-token context window; prefer `claude-opus-4.6-[1m]` in config. |
 | `claude-sonnet-4.6`              | `low`, `medium`, `high`                 |                                        |
 | `claude-opus-4.5`                | —                                       | Reasoning not accepted upstream.       |
 | `claude-sonnet-4.5`              | —                                       | Reasoning not accepted upstream.       |
-| `claude-sonnet-4`                | —                                       | Reasoning not accepted upstream.       |
 | `claude-haiku-4.5`               | —                                       | Reasoning not accepted upstream.       |
 
-For Claude Opus 4.7, both Codex CLI and Claude Code can use
-`claude-opus-4.7` with reasoning effort `high` or `xhigh`; the bridge routes the
-request to the matching upstream reasoning variant.
-
 For Claude Code settings, prefer `claude-opus-4.7-[1m]` or
 `claude-opus-4.6-[1m]` when you want the CLI `/context` UI and the upstream
 model to both use 1M context. Direct API clients can use
 
@@ -19,16 +19,13 @@ const CASES: Case[] = [
   { model: "gpt-5.2-codex", efforts: ["low", "medium", "high", "xhigh"] },
   { model: "gpt-5-mini", efforts: ["low", "medium", "high"] },
   // Claude
-  { model: "claude-opus-4.7", efforts: ["medium"] },
+  { model: "claude-opus-4.7", efforts: ["low", "medium", "high", "xhigh"] },
   { model: "claude-opus-4.7-1m", efforts: ["low", "medium", "high", "xhigh"] },
-  { model: "claude-opus-4.7-high", efforts: ["high"] },
-  { model: "claude-opus-4.7-xhigh", efforts: ["xhigh"] },
   { model: "claude-opus-4.6", efforts: ["low", "medium", "high"] },
   { model: "claude-opus-4.6-1m", efforts: ["low", "medium", "high"] },
   { model: "claude-sonnet-4.6", efforts: ["low", "medium", "high"] },
   { model: "claude-opus-4.5", efforts: [null] },
   { model: "claude-sonnet-4.5", efforts: [null] },
-  { model: "claude-sonnet-4", efforts: [null] },
   { model: "claude-haiku-4.5", efforts: [null] },
   // Gemini
   { model: "gemini-3.1-pro-preview", efforts: [null] },
 
@@ -8,16 +8,13 @@ interface Case {
 }
 
 const CASES: Case[] = [
-  { model: "claude-opus-4.7", efforts: ["medium"] },
+  { model: "claude-opus-4.7", efforts: ["low", "medium", "high", "xhigh"] },
   { model: "claude-opus-4.7-1m", efforts: ["low", "medium", "high", "xhigh"] },
-  { model: "claude-opus-4.7-high", efforts: ["high"] },
-  { model: "claude-opus-4.7-xhigh", efforts: ["xhigh"] },
   { model: "claude-opus-4.6", efforts: ["low", "medium", "high"] },
   { model: "claude-opus-4.6-1m", efforts: ["low", "medium", "high"] },
   { model: "claude-sonnet-4.6", efforts: ["low", "medium", "high"] },
   { model: "claude-opus-4.5", efforts: [null] },
   { model: "claude-sonnet-4.5", efforts: [null] },
-  { model: "claude-sonnet-4", efforts: [null] },
   { model: "claude-haiku-4.5", efforts: [null] },
 ]
 
 
@@ -81,64 +81,6 @@ const normalizeClaudeModelAlias = (model: string): string => {
   return prefixed
 }
 
-function normalizeClaudeReasoningEffortForRouting(
-  value: string | undefined,
-): ClaudeOpus47Effort | undefined {
-  switch (value?.toLowerCase()) {
-    case "low":
-    case "medium":
-    case "high":
-    case "xhigh":
-    case "max": {
-      return value.toLowerCase() as ClaudeOpus47Effort
-    }
-    default: {
-      return undefined
-    }
-  }
-}
-
-const getEnvValueCaseInsensitive = (
-  env: Record<string, string>,
-  key: string,
-): string | undefined => {
-  const direct = env[key]
-  if (typeof direct === "string") {
-    return direct
-  }
-  const lower = key.toLowerCase()
-  const matched = Object.entries(env).find(([k]) => k.toLowerCase() === lower)
-  return matched?.[1]
-}
-
-const getConfiguredClaudeReasoningEffort = (
-  settings: Pick<ClaudeSettings, "env"> | undefined,
-): string | undefined =>
-  process.env.MODEL_REASONING_EFFORT
-  ?? getEnvValueCaseInsensitive(settings?.env ?? {}, "MODEL_REASONING_EFFORT")
-
-const routeClaudeOpus47ByEffort = (
-  model: string,
-  requestedEffort: string | undefined,
-): string => {
-  if (model !== "claude-opus-4.7") {
-    return model
-  }
-
-  switch (normalizeClaudeReasoningEffortForRouting(requestedEffort)) {
-    case "high": {
-      return "claude-opus-4.7-high"
-    }
-    case "xhigh":
-    case "max": {
-      return "claude-opus-4.7-xhigh"
-    }
-    default: {
-      return model
-    }
-  }
-}
-
 const getConfiguredClaudeDefaultModel = (
   settings: Pick<ClaudeSettings, "env" | "model"> | undefined,
 ): string | undefined => {
@@ -191,15 +133,10 @@ const resolveClaudeRequestedModel = (
 export function translateModelName(
   model: string,
   settings?: Pick<ClaudeSettings, "env" | "model">,
-  requestedReasoningEffort?: string,
 ): string {
   const requestedModel = resolveClaudeRequestedModel(model, settings)
   const normalizedModel = normalizeClaudeModelAlias(requestedModel)
-  const routedModel = routeClaudeOpus47ByEffort(
-    normalizedModel,
-    requestedReasoningEffort ?? getConfiguredClaudeReasoningEffort(settings),
-  )
-  return resolveUpstreamModelId(routedModel)
+  return resolveUpstreamModelId(normalizedModel)
 }
 
 function isClaudeModel(modelId: string): boolean {
@@ -275,7 +212,7 @@ function translateThinking(
   payload: AnthropicMessagesPayload,
   settings?: Pick<ClaudeSettings, "env" | "model">,
 ): ChatCompletionsPayload["thinking"] {
-  const modelId = translateModelName(payload.model, settings, payload.reasoning_effort)
+  const modelId = translateModelName(payload.model, settings)
 
   if (!isClaudeOpus47Model(modelId)) {
     return undefined
@@ -292,7 +229,7 @@ function translateOutputConfig(
   payload: AnthropicMessagesPayload,
   settings?: Pick<ClaudeSettings, "env" | "model">,
 ): ChatCompletionsPayload["output_config"] {
-  const modelId = translateModelName(payload.model, settings, payload.reasoning_effort)
+  const modelId = translateModelName(payload.model, settings)
 
   if (!isClaudeOpus47Model(modelId)) {
     return undefined
@@ -335,7 +272,7 @@ function translateReasoningEffort(
   payload: AnthropicMessagesPayload,
   settings?: Pick<ClaudeSettings, "env" | "model">,
 ): ChatCompletionsPayload["reasoning_effort"] {
-  const modelId = translateModelName(payload.model, settings, payload.reasoning_effort)
+  const modelId = translateModelName(payload.model, settings)
 
   if (isClaudeOpus47Model(modelId)) {
     return undefined
@@ -379,7 +316,7 @@ export function translateToOpenAI(
   settings?: Pick<ClaudeSettings, "env" | "model">,
   toolNameMapper?: AnthropicToolNameMapper,
 ): ChatCompletionsPayload {
-  const model = translateModelName(payload.model, settings, payload.reasoning_effort)
+  const model = translateModelName(payload.model, settings)
   const mapper = toolNameMapper ?? createAnthropicToolNameMapper(payload.tools, {
     ...getToolNameMapperOptionsForModel(model),
   })
 
@@ -31,10 +31,6 @@ export const getToolNameMapperOptionsForModel = (
     return { allowDots: false, maxNameLength: EXTENDED_TOOL_NAME_MAX_LENGTH }
   }
 
-  if (/^claude-sonnet-4(?:$|-\d{8}$)/.test(normalized)) {
-    return { allowDots: false, maxNameLength: EXTENDED_TOOL_NAME_MAX_LENGTH }
-  }
-
   if (normalized.startsWith("gemini-")) {
     return { allowDots: true, maxNameLength: EXTENDED_TOOL_NAME_MAX_LENGTH }
   }
 
@@ -36,43 +36,14 @@ const removeReasoningEffort = (reasoning: ReasoningField): ReasoningField | unde
 const isPlainObject = (value: unknown): value is Record<string, unknown> =>
   typeof value === "object" && value !== null && !Array.isArray(value)
 
-const routeClaudeOpus47ByReasoningEffort = (
-  model: string,
-  effort: unknown,
-): string => {
-  if (model !== "claude-opus-4.7") {
-    return model
-  }
-
-  switch (typeof effort === "string" ? effort.toLowerCase() : undefined) {
-    case "high": {
-      return "claude-opus-4.7-high"
-    }
-    case "xhigh":
-    case "max": {
-      return "claude-opus-4.7-xhigh"
-    }
-    default: {
-      return model
-    }
-  }
-}
-
 export const normalizeCodexResponsesRequest = (
   payload: CodexResponsesRequest,
   configuredReasoningEffort?: unknown,
 ): CodexResponsesRequest => {
   const parsed = codexResponsesRequestSchema.parse(payload) as CodexResponsesRequest
     & { reasoning?: ReasoningField; text?: TextField }
 
-  const incomingReasoning =
-    isPlainObject(parsed.reasoning) ? (parsed.reasoning as ReasoningField) : undefined
-  const requestedReasoningEffort =
-    incomingReasoning?.effort ?? configuredReasoningEffort
-  const canonical = routeClaudeOpus47ByReasoningEffort(
-    resolveModelId(parsed.model),
-    requestedReasoningEffort,
-  )
+  const canonical = resolveModelId(parsed.model)
   const capability = getModelCapability(canonical)
   if (!capability) return parsed
 
@@ -87,10 +58,11 @@ export const normalizeCodexResponsesRequest = (
 
   if ("reasoning" in next) {
     if (!isPlainObject(next.reasoning)) {
-      if (configuredReasoningEffort === undefined || configuredReasoningEffort === null) {
+      const effort = configuredReasoningEffort
+      if (effort === undefined || effort === null) {
         delete (next as Record<string, unknown>).reasoning
       } else {
-        const clamped = clampReasoningEffort(canonical, configuredReasoningEffort)
+        const clamped = clampReasoningEffort(canonical, effort)
         if (clamped) {
           next.reasoning = { effort: clamped.effort }
         }
@@ -112,8 +84,13 @@ export const normalizeCodexResponsesRequest = (
         }
       }
     }
-  } else if (configuredReasoningEffort !== undefined && configuredReasoningEffort !== null) {
-    const clamped = clampReasoningEffort(canonical, configuredReasoningEffort)
+  } else if (
+    configuredReasoningEffort !== undefined && configuredReasoningEffort !== null
+  ) {
+    const clamped = clampReasoningEffort(
+      canonical,
+      configuredReasoningEffort,
+    )
     if (clamped) {
       next.reasoning = { effort: clamped.effort }
     }
 
@@ -11,6 +11,7 @@ interface AutoSessionResponse {
 
 const AUTO_MODE_BODY = { auto_mode: { model_hints: ["auto"] } }
 const FALLBACK_REFRESH_SECONDS = 30 * 60
+let refreshTimer: ReturnType<typeof setTimeout> | undefined
 
 const parseExpiresAt = (value: number | string | undefined): number | undefined => {
   if (typeof value === "number" && Number.isFinite(value)) {
@@ -68,12 +69,16 @@ const applyAutoSession = async (config: BridgeConfig) => {
 }
 
 const scheduleAutoSessionRefresh = (config: BridgeConfig) => {
+  if (refreshTimer) {
+    clearTimeout(refreshTimer)
+  }
+
   const now = Math.floor(Date.now() / 1000)
   const expiresAt =
     runtimeState.autoExpiresAt ?? now + FALLBACK_REFRESH_SECONDS
   const refreshIn = Math.max(expiresAt - now - 60, 60)
 
-  const timer = setTimeout(async () => {
+  refreshTimer = setTimeout(async () => {
     try {
       await applyAutoSession(config)
       consola.debug("Refreshed Copilot auto-mode session token")
@@ -84,14 +89,26 @@ const scheduleAutoSessionRefresh = (config: BridgeConfig) => {
     }
   }, refreshIn * 1000)
 
-  if (typeof timer.unref === "function") {
-    timer.unref()
+  if (typeof refreshTimer.unref === "function") {
+    refreshTimer.unref()
+  }
+}
+
+export const disableAutoMode = () => {
+  if (refreshTimer) {
+    clearTimeout(refreshTimer)
+    refreshTimer = undefined
   }
+  delete runtimeState.autoMode
+  delete runtimeState.autoSessionToken
+  delete runtimeState.autoExpiresAt
+  delete runtimeState.autoAvailableModels
 }
 
 export const enableAutoMode = async (
   config: BridgeConfig,
 ): Promise<AutoSessionResponse> => {
+  disableAutoMode()
   const data = await applyAutoSession(config)
   runtimeState.autoMode = true
   scheduleAutoSessionRefresh(config)
 
@@ -102,15 +102,17 @@ export const MODEL_CAPABILITIES: ReadonlyArray<ModelCapability> = [
   // translate to /v1/chat/completions. Only opus-4.7 places effort under
   // output_config.effort; the others use the standard reasoning_effort.
   ...[
-    { id: "claude-opus-4.7", supported: ["medium"], defaultEffort: "medium" },
+    {
+      id: "claude-opus-4.7",
+      supported: ["low", "medium", "high", "xhigh"],
+      defaultEffort: "medium",
+    },
     {
       id: "claude-opus-4.7-1m-internal",
       aliases: ["claude-opus-4.7-1m"],
       supported: ["low", "medium", "high", "xhigh"],
       defaultEffort: "medium",
     },
-    { id: "claude-opus-4.7-high", supported: ["high"], defaultEffort: "high" },
-    { id: "claude-opus-4.7-xhigh", supported: ["xhigh"], defaultEffort: "xhigh" },
   ].map(
     ({ id, aliases, supported, defaultEffort }): ModelCapability => ({
       id,
@@ -163,10 +165,6 @@ export const MODEL_CAPABILITIES: ReadonlyArray<ModelCapability> = [
     id: "claude-sonnet-4.5",
     fallback: "chat-completions",
   },
-  {
-    id: "claude-sonnet-4",
-    fallback: "chat-completions",
-  },
   {
     id: "claude-haiku-4.5",
     fallback: "chat-completions",
 
@@ -74,6 +74,9 @@ const pickBestModel = (models: Array<Model>): Model | undefined =>
     (left, right) => scoreModelCandidate(right) - scoreModelCandidate(left),
   )[0]
 
+const isClaudeMajorOnlyVersion = (modelId: string): boolean =>
+  /^claude-(?:opus|sonnet|haiku)-\d+$/.test(modelId)
+
 const getBestPrefixMatches = (
   models: Array<Model>,
   aliasCandidates: Array<string>,
@@ -86,6 +89,9 @@ const getBestPrefixMatches = (
     const matchedAliasLength = Math.max(
       0,
       ...aliasCandidates.map((candidate) => {
+        if (isClaudeMajorOnlyVersion(candidate)) {
+          return 0
+        }
         const normalizedCandidate = normalizeModelId(candidate)
         return normalizedCandidate.length >= 4
           && normalizedModelId.startsWith(normalizedCandidate)
Original file line number	Diff line number	Diff line change
`@@ -31,10 +31,6 @@ export const getToolNameMapperOptionsForModel = (`
`31`	`31`	`return { allowDots: false, maxNameLength: EXTENDED_TOOL_NAME_MAX_LENGTH }`
`32`	`32`	`}`
`33`	`33`
`34`		`- if (/^claude-sonnet-4(?:$\|-\d{8}$)/.test(normalized)) {`
`35`		`- return { allowDots: false, maxNameLength: EXTENDED_TOOL_NAME_MAX_LENGTH }`
`36`		`- }`
`37`		`-`
`38`	`34`	`if (normalized.startsWith("gemini-")) {`
`39`	`35`	`return { allowDots: true, maxNameLength: EXTENDED_TOOL_NAME_MAX_LENGTH }`
`40`	`36`	`}`