fix: replace isDeepStrictEqual with navigation-aware options comparison

The select cursor highlight was broken because isDeepStrictEqual in use-select-navigation.ts and use-multi-select-state.ts would fail when options contained identity-unstable properties (JSX label elements, function onChange callbacks, computed disabled booleans). This caused the reset logic to fire on every re-render, resetting focusedValue back to the first option. Replace isDeepStrictEqual with optionsNavigateEqual which only compares properties that affect navigation behavior: value, disabled, and type. ReactNode labels and function callbacks are intentionally excluded as they are identity-unstable but don't change navigation semantics. Fixes #472
fix example agents (#438 )
2026-04-08 13:58:18 +05:30 · 2026-04-08 02:55:27 +08:00 · 2026-04-08 02:45:49 +08:00 · 2026-04-08 00:33:52 +08:00 · 2026-04-07 23:24:10 +08:00 · 2026-04-07 17:26:00 +08:00
41 changed files with 3245 additions and 179 deletions
--- a/src/commands/provider/provider.test.tsx
+++ b/src/commands/provider/provider.test.tsx
@@ -52,7 +52,11 @@ async function renderFinalFrame(node: React.ReactNode): Promise<string> {
    patchConsole: false,
  })
-  await instance.waitUntilExit()
+  // Timeout guard: if render throws before exit effect fires, don't hang
  await Promise.race([
    instance.waitUntilExit(),
    new Promise<void>(resolve => setTimeout(resolve, 3000)),
  ])
  return stripAnsi(extractLastFrame(getOutput()))
 }
--- a/src/components/CustomSelect/use-multi-select-state.ts
+++ b/src/components/CustomSelect/use-multi-select-state.ts
@@ -1,5 +1,4 @@
 import { useCallback, useState } from 'react'
 import { isDeepStrictEqual } from 'util'
 import { useRegisterOverlay } from '../../context/overlayContext.js'
 import type { InputEvent } from '../../ink/events/input-event.js'
 // eslint-disable-next-line custom-rules/prefer-use-keybindings -- raw space/arrow multiselect input
@@ -9,6 +8,7 @@ import {
  normalizeFullWidthSpace,
 } from '../../utils/stringUtils.js'
 import type { OptionWithDescription } from './select.js'
 import { optionsNavigateEqual } from './use-select-navigation.js'
 import { useSelectNavigation } from './use-select-navigation.js'
 export type UseMultiSelectStateProps<T> = {
@@ -174,7 +174,7 @@ export function useMultiSelectState<T>({
  // and the deleted ui/useMultiSelectState.ts — without this, MCPServerDesktopImportDialog
  // keeps colliding servers checked after getAllMcpConfigs() resolves.
  const [lastOptions, setLastOptions] = useState(options)
-  if (options !== lastOptions && !isDeepStrictEqual(options, lastOptions)) {
+  if (options !== lastOptions && !optionsNavigateEqual(options, lastOptions)) {
    setSelectedValues(defaultValue)
    setLastOptions(options)
  }
--- a/src/components/CustomSelect/use-select-navigation.ts
+++ b/src/components/CustomSelect/use-select-navigation.ts
@@ -6,10 +6,34 @@ import {
  useRef,
  useState,
 } from 'react'
 import { isDeepStrictEqual } from 'util'
 import OptionMap from './option-map.js'
 import type { OptionWithDescription } from './select.js'
 /**
 * Compare two option arrays for structural equality on properties that
 * affect navigation behavior. ReactNode `label` and function `onChange`
 * are intentionally excluded — they are identity-unstable (new reference
 * each render) but don't change navigation semantics.
 */
 export function optionsNavigateEqual<T>(
  a: OptionWithDescription<T>[],
  b: OptionWithDescription<T>[],
 ): boolean {
  if (a.length !== b.length) return false
  for (let i = 0; i < a.length; i++) {
    const ao = a[i]!
    const bo = b[i]!
    if (
      ao.value !== bo.value ||
      ao.disabled !== bo.disabled ||
      ao.type !== bo.type
    ) {
      return false
    }
  }
  return true
 }
 type State<T> = {
  /**
   * Map where key is option's value and value is option's index.
@@ -524,7 +548,7 @@ export function useSelectNavigation<T>({
  const [lastOptions, setLastOptions] = useState(options)
-  if (options !== lastOptions && !isDeepStrictEqual(options, lastOptions)) {
+  if (options !== lastOptions && !optionsNavigateEqual(options, lastOptions)) {
    dispatch({
      type: 'reset',
      state: createDefaultState({
--- a/src/components/ProviderManager.test.tsx
+++ b/src/components/ProviderManager.test.tsx
@@ -0,0 +1,305 @@
 import { PassThrough } from 'node:stream'
 import { afterEach, expect, mock, test } from 'bun:test'
 import React from 'react'
 import stripAnsi from 'strip-ansi'
 import { createRoot } from '../ink.js'
 import { AppStateProvider } from '../state/AppState.js'
 const SYNC_START = '\x1B[?2026h'
 const SYNC_END = '\x1B[?2026l'
 const ORIGINAL_ENV = {
  CLAUDE_CODE_USE_GITHUB: process.env.CLAUDE_CODE_USE_GITHUB,
  GITHUB_TOKEN: process.env.GITHUB_TOKEN,
  GH_TOKEN: process.env.GH_TOKEN,
 }
 function extractLastFrame(output: string): string {
  let lastFrame: string | null = null
  let cursor = 0
  while (cursor < output.length) {
    const start = output.indexOf(SYNC_START, cursor)
    if (start === -1) {
      break
    }
    const contentStart = start + SYNC_START.length
    const end = output.indexOf(SYNC_END, contentStart)
    if (end === -1) {
      break
    }
    const frame = output.slice(contentStart, end)
    if (frame.trim().length > 0) {
      lastFrame = frame
    }
    cursor = end + SYNC_END.length
  }
  return lastFrame ?? output
 }
 function createTestStreams(): {
  stdout: PassThrough
  stdin: PassThrough & {
    isTTY: boolean
    setRawMode: (mode: boolean) => void
    ref: () => void
    unref: () => void
  }
  getOutput: () => string
 } {
  let output = ''
  const stdout = new PassThrough()
  const stdin = new PassThrough() as PassThrough & {
    isTTY: boolean
    setRawMode: (mode: boolean) => void
    ref: () => void
    unref: () => void
  }
  stdin.isTTY = true
  stdin.setRawMode = () => {}
  stdin.ref = () => {}
  stdin.unref = () => {}
  ;(stdout as unknown as { columns: number }).columns = 120
  stdout.on('data', chunk => {
    output += chunk.toString()
  })
  return {
    stdout,
    stdin,
    getOutput: () => output,
  }
 }
 async function waitForCondition(
  predicate: () => boolean,
  options?: { timeoutMs?: number; intervalMs?: number },
 ): Promise<void> {
  const timeoutMs = options?.timeoutMs ?? 2000
  const intervalMs = options?.intervalMs ?? 10
  const startedAt = Date.now()
  while (Date.now() - startedAt < timeoutMs) {
    if (predicate()) {
      return
    }
    await Bun.sleep(intervalMs)
  }
  throw new Error('Timed out waiting for ProviderManager test condition')
 }
 function createDeferred<T>(): {
  promise: Promise<T>
  resolve: (value: T) => void
 } {
  let resolve!: (value: T) => void
  const promise = new Promise<T>(r => {
    resolve = r
  })
  return { promise, resolve }
 }
 function mockProviderProfilesModule(): void {
  mock.module('../utils/providerProfiles.js', () => ({
    addProviderProfile: () => null,
    applyActiveProviderProfileFromConfig: () => {},
    deleteProviderProfile: () => ({ removed: false, activeProfileId: null }),
    getActiveProviderProfile: () => null,
    getProviderPresetDefaults: () => ({
      provider: 'openai',
      name: 'Mock provider',
      baseUrl: 'http://localhost:11434/v1',
      model: 'mock-model',
      apiKey: '',
    }),
    getProviderProfiles: () => [],
    setActiveProviderProfile: () => null,
    updateProviderProfile: () => null,
  }))
 }
 function mockProviderManagerDependencies(
  syncRead: () => string | undefined,
  asyncRead: () => Promise<string | undefined>,
 ): void {
  mockProviderProfilesModule()
  mock.module('../utils/githubModelsCredentials.js', () => ({
    clearGithubModelsToken: () => ({ success: true }),
    GITHUB_MODELS_HYDRATED_ENV_MARKER: 'CLAUDE_CODE_GITHUB_TOKEN_HYDRATED',
    hydrateGithubModelsTokenFromSecureStorage: () => {},
    readGithubModelsToken: syncRead,
    readGithubModelsTokenAsync: asyncRead,
  }))
  mock.module('../utils/settings/settings.js', () => ({
    updateSettingsForSource: () => ({ error: null }),
  }))
 }
 async function waitForFrameOutput(
  getOutput: () => string,
  predicate: (output: string) => boolean,
  timeoutMs = 2500,
 ): Promise<string> {
  let output = ''
  await waitForCondition(() => {
    output = stripAnsi(extractLastFrame(getOutput()))
    return predicate(output)
  }, { timeoutMs })
  return output
 }
 async function mountProviderManager(
  ProviderManager: React.ComponentType<{
    mode: 'first-run' | 'manage'
    onDone: () => void
  }>,
 ): Promise<{
  getOutput: () => string
  dispose: () => Promise<void>
 }> {
  const { stdout, stdin, getOutput } = createTestStreams()
  const root = await createRoot({
    stdout: stdout as unknown as NodeJS.WriteStream,
    stdin: stdin as unknown as NodeJS.ReadStream,
    patchConsole: false,
  })
  root.render(
    <AppStateProvider>
      <ProviderManager
        mode="manage"
        onDone={() => {}}
      />
    </AppStateProvider>,
  )
  return {
    getOutput,
    dispose: async () => {
      root.unmount()
      stdin.end()
      stdout.end()
      await Bun.sleep(0)
    },
  }
 }
 async function renderProviderManagerFrame(
  ProviderManager: React.ComponentType<{
    mode: 'first-run' | 'manage'
    onDone: () => void
  }>,
  options?: {
    waitForOutput?: (output: string) => boolean
    timeoutMs?: number
  },
 ): Promise<string> {
  const mounted = await mountProviderManager(ProviderManager)
  const output = await waitForFrameOutput(
    mounted.getOutput,
    frame => {
      if (!options?.waitForOutput) {
        return frame.includes('Provider manager')
      }
      return options.waitForOutput(frame)
    },
    options?.timeoutMs ?? 2500,
  )
  await mounted.dispose()
  return output
 }
 afterEach(() => {
  mock.restore()
  for (const [key, value] of Object.entries(ORIGINAL_ENV)) {
    if (value === undefined) {
      delete process.env[key as keyof typeof ORIGINAL_ENV]
    } else {
      process.env[key as keyof typeof ORIGINAL_ENV] = value
    }
  }
 })
 test('ProviderManager resolves GitHub virtual provider from async storage without sync reads in render flow', async () => {
  delete process.env.CLAUDE_CODE_USE_GITHUB
  delete process.env.GITHUB_TOKEN
  delete process.env.GH_TOKEN
  const syncRead = mock(() => {
    throw new Error('sync credential read should not run in ProviderManager render flow')
  })
  const asyncRead = mock(async () => 'stored-token')
  mockProviderManagerDependencies(syncRead, asyncRead)
  const nonce = `${Date.now()}-${Math.random()}`
  const { ProviderManager } = await import(`./ProviderManager.js?ts=${nonce}`)
  const output = await renderProviderManagerFrame(ProviderManager, {
    waitForOutput: frame =>
      frame.includes('Provider manager') &&
      frame.includes('GitHub Models') &&
      frame.includes('token stored'),
  })
  expect(output).toContain('Provider manager')
  expect(output).toContain('GitHub Models')
  expect(output).toContain('token stored')
  expect(output).not.toContain('No provider profiles configured yet.')
  expect(syncRead).not.toHaveBeenCalled()
  expect(asyncRead).toHaveBeenCalled()
 })
 test('ProviderManager avoids first-frame false negative while stored-token lookup is pending', async () => {
  delete process.env.CLAUDE_CODE_USE_GITHUB
  delete process.env.GITHUB_TOKEN
  delete process.env.GH_TOKEN
  const syncRead = mock(() => {
    throw new Error('sync credential read should not run in ProviderManager render flow')
  })
  const deferredStoredToken = createDeferred<string | undefined>()
  const asyncRead = mock(async () => deferredStoredToken.promise)
  mockProviderManagerDependencies(syncRead, asyncRead)
  const nonce = `${Date.now()}-${Math.random()}`
  const { ProviderManager } = await import(`./ProviderManager.js?ts=${nonce}`)
  const mounted = await mountProviderManager(ProviderManager)
  const firstFrame = await waitForFrameOutput(
    mounted.getOutput,
    frame => frame.includes('Provider manager'),
  )
  expect(firstFrame).toContain('Checking GitHub Models credentials...')
  expect(firstFrame).not.toContain('No provider profiles configured yet.')
  deferredStoredToken.resolve('stored-token')
  const resolvedFrame = await waitForFrameOutput(
    mounted.getOutput,
    frame => frame.includes('GitHub Models') && frame.includes('token stored'),
  )
  expect(resolvedFrame).toContain('GitHub Models')
  expect(resolvedFrame).toContain('token stored')
  await mounted.dispose()
  expect(syncRead).not.toHaveBeenCalled()
  expect(asyncRead).toHaveBeenCalled()
 })
--- a/src/components/ProviderManager.tsx
+++ b/src/components/ProviderManager.tsx
@@ -20,6 +20,7 @@ import {
  GITHUB_MODELS_HYDRATED_ENV_MARKER,
  hydrateGithubModelsTokenFromSecureStorage,
  readGithubModelsToken,
  readGithubModelsTokenAsync,
 } from '../utils/githubModelsCredentials.js'
 import { isEnvTruthy } from '../utils/envUtils.js'
 import { updateSettingsForSource } from '../utils/settings/settings.js'
@@ -118,25 +119,38 @@ function profileSummary(profile: ProviderProfile, isActive: boolean): string {
  return `${providerKind} · ${profile.baseUrl} · ${profile.model} · ${keyInfo}${activeSuffix}`
 }
-function getGithubCredentialSource(
+function getGithubCredentialSourceFromEnv(
  processEnv: NodeJS.ProcessEnv = process.env,
 ): GithubCredentialSource {
  if (readGithubModelsToken()?.trim()) {
    return 'stored'
  }
  if (processEnv.GITHUB_TOKEN?.trim() || processEnv.GH_TOKEN?.trim()) {
    return 'env'
  }
  return 'none'
 }
 async function resolveGithubCredentialSource(
  processEnv: NodeJS.ProcessEnv = process.env,
 ): Promise<GithubCredentialSource> {
  const envSource = getGithubCredentialSourceFromEnv(processEnv)
  if (envSource !== 'none') {
    return envSource
  }
  if (await readGithubModelsTokenAsync()) {
    return 'stored'
  }
  return 'none'
 }
 function isGithubProviderAvailable(
  credentialSource: GithubCredentialSource,
  processEnv: NodeJS.ProcessEnv = process.env,
 ): boolean {
  if (isEnvTruthy(processEnv.CLAUDE_CODE_USE_GITHUB)) {
    return true
  }
-  return getGithubCredentialSource(processEnv) !== 'none'
+  return credentialSource !== 'none'
 }
 function getGithubProviderModel(
@@ -164,19 +178,24 @@ function getGithubProviderSummary(
 }
 export function ProviderManager({ mode, onDone }: Props): React.ReactNode {
  const initialGithubCredentialSource = getGithubCredentialSourceFromEnv()
  const initialIsGithubActive = isEnvTruthy(process.env.CLAUDE_CODE_USE_GITHUB)
  const initialHasGithubCredential = initialGithubCredentialSource !== 'none'
  const [profiles, setProfiles] = React.useState(() => getProviderProfiles())
  const [activeProfileId, setActiveProfileId] = React.useState(
    () => getActiveProviderProfile()?.id,
  )
-  const [githubProviderAvailable, setGithubProviderAvailable] = React.useState(() =>
+  const [githubProviderAvailable, setGithubProviderAvailable] = React.useState(
-    isGithubProviderAvailable(),
+    () => isGithubProviderAvailable(initialGithubCredentialSource),
  )
  const [githubCredentialSource, setGithubCredentialSource] = React.useState<GithubCredentialSource>(
-    () => getGithubCredentialSource(),
+    () => initialGithubCredentialSource,
  )
  const [isGithubActive, setIsGithubActive] = React.useState(() =>
    isEnvTruthy(process.env.CLAUDE_CODE_USE_GITHUB),
  )
  const [isGithubActive, setIsGithubActive] = React.useState(() => initialIsGithubActive)
  const [isGithubCredentialSourceResolved, setIsGithubCredentialSourceResolved] =
    React.useState(() => initialHasGithubCredential || initialIsGithubActive)
  const githubRefreshEpochRef = React.useRef(0)
  const [screen, setScreen] = React.useState<Screen>(
    mode === 'first-run' ? 'select-preset' : 'menu',
  )
@@ -196,13 +215,48 @@ export function ProviderManager({ mode, onDone }: Props): React.ReactNode {
  const currentStepKey = currentStep.key
  const currentValue = draft[currentStepKey]
  const refreshGithubProviderState = React.useCallback((): void => {
    const envCredentialSource = getGithubCredentialSourceFromEnv()
    const githubActive = isEnvTruthy(process.env.CLAUDE_CODE_USE_GITHUB)
    const canResolveFromEnv = githubActive || envCredentialSource !== 'none'
    if (canResolveFromEnv) {
      githubRefreshEpochRef.current += 1
      setGithubCredentialSource(envCredentialSource)
      setGithubProviderAvailable(isGithubProviderAvailable(envCredentialSource))
      setIsGithubActive(githubActive)
      setIsGithubCredentialSourceResolved(true)
      return
    }
    setIsGithubCredentialSourceResolved(false)
    const refreshEpoch = ++githubRefreshEpochRef.current
    void (async () => {
      const credentialSource = await resolveGithubCredentialSource()
      if (refreshEpoch !== githubRefreshEpochRef.current) {
        return
      }
      setGithubCredentialSource(credentialSource)
      setGithubProviderAvailable(isGithubProviderAvailable(credentialSource))
      setIsGithubActive(isEnvTruthy(process.env.CLAUDE_CODE_USE_GITHUB))
      setIsGithubCredentialSourceResolved(true)
    })()
  }, [])
  React.useEffect(() => {
    refreshGithubProviderState()
    return () => {
      githubRefreshEpochRef.current += 1
    }
  }, [refreshGithubProviderState])
  function refreshProfiles(): void {
    const nextProfiles = getProviderProfiles()
    setProfiles(nextProfiles)
    setActiveProfileId(getActiveProviderProfile()?.id)
-    setGithubProviderAvailable(isGithubProviderAvailable())
+    refreshGithubProviderState()
    setGithubCredentialSource(getGithubCredentialSource())
    setIsGithubActive(isEnvTruthy(process.env.CLAUDE_CODE_USE_GITHUB))
  }
  function clearStartupProviderOverrideFromUserSettings(): string | null {
@@ -640,7 +694,11 @@ export function ProviderManager({ mode, onDone }: Props): React.ReactNode {
        {statusMessage && <Text>{statusMessage}</Text>}
        <Box flexDirection="column">
          {profiles.length === 0 && !githubProviderAvailable ? (
-            <Text dimColor>No provider profiles configured yet.</Text>
+            isGithubCredentialSourceResolved ? (
              <Text dimColor>No provider profiles configured yet.</Text>
            ) : (
              <Text dimColor>Checking GitHub Models credentials...</Text>
            )
          ) : (
            <>
              {profiles.map(profile => (
--- a/src/components/agents/generateAgent.ts
+++ b/src/components/agents/generateAgent.ts
@@ -68,11 +68,11 @@ When a user describes what they want an agent to do, you will:
      assistant: "Now let me use the test-runner agent to run the tests"
    </example>
    - <example>
-      Context: User is creating an agent to respond to the word "hello" with a friendly jok.
+      Context: User is creating an agent for Claude Code product questions.
-      user: "Hello"
+      user: "How do I configure Claude Code hooks?"
-      assistant: "I'm going to use the ${AGENT_TOOL_NAME} tool to launch the greeting-responder agent to respond with a friendly joke"
+      assistant: "I'm going to use the ${AGENT_TOOL_NAME} tool to launch the claude-code-guide agent to answer the question"
      <commentary>
-      Since the user is greeting, use the greeting-responder agent to respond with a friendly joke. 
+      Since the user is asking how to use Claude Code, use the claude-code-guide agent.
      </commentary>
    </example>
  - If the user mentioned or implied that the agent should be used proactively, you should include examples of this.
--- a/src/entrypoints/cli.tsx
+++ b/src/entrypoints/cli.tsx
@@ -8,6 +8,34 @@ import {
  validateProviderEnvOrExit,
 } from '../utils/providerValidation.js'
 // OpenClaude: polyfill globalThis.File for Node < 20.
 // undici v7 references `File` at module evaluation time (webidl type
 // assertions). Node 18 lacks the global, causing a ReferenceError inside
 // the bundled __commonJS require chain which deadlocks the process when a
 // proxy is configured (configureGlobalAgents → require_undici).
 // eslint-disable-next-line custom-rules/no-top-level-side-effects
 if (typeof globalThis.File === 'undefined') {
  try {
    // Node 18.13+ exposes File in node:buffer but not as a global.
    // eslint-disable-next-line @typescript-eslint/no-require-imports
    const { File: NodeFile } = require('node:buffer')
    // @ts-expect-error -- polyfilling missing global
    globalThis.File = NodeFile
  } catch {
    // Absolute fallback: stub so `MakeTypeAssertion(File)` doesn't throw.
    // @ts-expect-error -- minimal polyfill
    globalThis.File = class File extends Blob {
      name: string
      lastModified: number
      constructor(parts: BlobPart[], name: string, opts?: FilePropertyBag) {
        super(parts, opts)
        this.name = name
        this.lastModified = opts?.lastModified ?? Date.now()
      }
    }
  }
 }
 // OpenClaude: disable experimental API betas by default.
 // Tool search (defer_loading), global cache scope, and context management
 // require internal API support not available to external accounts → 500.
--- a/src/grpc/server.ts
+++ b/src/grpc/server.ts
@@ -40,7 +40,7 @@ export class GrpcServer {
      grpc.ServerCredentials.createInsecure(),
      (error, boundPort) => {
        if (error) {
-          console.error('Failed to start gRPC server', error)
+          console.error('Failed to start gRPC server')
          return
        }
        console.log(`gRPC Server running at ${host}:${boundPort}`)
@@ -225,7 +225,7 @@ export class GrpcServer {
          call.end()
        }
      } catch (err: any) {
-        console.error("Error processing stream:", err)
+        console.error('Error processing stream')
        call.write({
          error: {
            message: err.message || "Internal server error",
--- a/src/ink/reconciler.ts
+++ b/src/ink/reconciler.ts
@@ -366,14 +366,12 @@ const reconciler = createReconciler<
  createTextInstance(
    text: string,
    _root: DOMElement,
-    hostContext: HostContext,
+    _hostContext: HostContext,
  ): TextNode {
-    if (!hostContext.isInsideText) {
+    // react-compiler memoization can reuse cached <Text> elements without
-      throw new Error(
+    // re-traversing getChildHostContext, so hostContext.isInsideText may be
-        `Text string "${text}" must be rendered inside <Text> component`,
+    // stale. Always create the text node — Ink will render it correctly
-      )
+    // regardless of the context tracking state.
    }
    return createTextNode(text)
  },
  resetTextContent() {},
--- a/src/ink/termio/osc.test.ts
+++ b/src/ink/termio/osc.test.ts
@@ -27,6 +27,21 @@ async function flushClipboardCopy(): Promise<void> {
  await new Promise(resolve => setTimeout(resolve, 0))
 }
 async function waitForExecCall(
  command: string,
  attempts = 20,
 ): Promise<(typeof execFileNoThrowMock.mock.calls)[number] | undefined> {
  for (let attempt = 0; attempt < attempts; attempt++) {
    const call = execFileNoThrowMock.mock.calls.find(([cmd]) => cmd === command)
    if (call) {
      return call
    }
    await flushClipboardCopy()
  }
  return undefined
 }
 describe('Windows clipboard fallback', () => {
  beforeEach(() => {
    execFileNoThrowMock.mockClear()
@@ -62,9 +77,7 @@ describe('Windows clipboard fallback', () => {
    await setClipboard('Привет мир')
    await flushClipboardCopy()
-    const windowsCall = execFileNoThrowMock.mock.calls.find(
+    const windowsCall = await waitForExecCall('powershell')
      ([cmd]) => cmd === 'powershell',
    )
    expect(windowsCall?.[2]).toMatchObject({
      stdin: 'ignore',
--- a/src/services/api/codexShim.test.ts
+++ b/src/services/api/codexShim.test.ts
@@ -201,6 +201,117 @@ describe('Codex request translation', () => {
    ])
  })
  test('preserves Grep tool pattern field in Codex strict schemas', () => {
    const tools = convertToolsToResponsesTools([
      {
        name: 'Grep',
        description: 'Search file contents',
        input_schema: {
          type: 'object',
          properties: {
            pattern: { type: 'string', description: 'Search pattern' },
            path: { type: 'string' },
          },
          required: ['pattern'],
          additionalProperties: false,
        },
      },
    ])
    expect(tools).toEqual([
      {
        type: 'function',
        name: 'Grep',
        description: 'Search file contents',
        parameters: {
          type: 'object',
          properties: {
            pattern: { type: 'string', description: 'Search pattern' },
            path: { type: 'string' },
          },
          required: ['pattern', 'path'],
          additionalProperties: false,
        },
        strict: true,
      },
    ])
  })
  test('preserves Glob tool pattern field in Codex strict schemas', () => {
    const tools = convertToolsToResponsesTools([
      {
        name: 'Glob',
        description: 'Find files by pattern',
        input_schema: {
          type: 'object',
          properties: {
            pattern: { type: 'string', description: 'Glob pattern' },
            path: { type: 'string' },
          },
          required: ['pattern'],
          additionalProperties: false,
        },
      },
    ])
    expect(tools).toEqual([
      {
        type: 'function',
        name: 'Glob',
        description: 'Find files by pattern',
        parameters: {
          type: 'object',
          properties: {
            pattern: { type: 'string', description: 'Glob pattern' },
            path: { type: 'string' },
          },
          required: ['pattern', 'path'],
          additionalProperties: false,
        },
        strict: true,
      },
    ])
  })
  test('strips validator pattern keyword but keeps string field named pattern in Codex schemas', () => {
    const tools = convertToolsToResponsesTools([
      {
        name: 'RegexProbe',
        description: 'Probe regex schema handling',
        input_schema: {
          type: 'object',
          properties: {
            pattern: {
              type: 'string',
              pattern: '^[a-z]+$',
            },
          },
          required: ['pattern'],
          additionalProperties: false,
        },
      },
    ])
    expect(tools).toEqual([
      {
        type: 'function',
        name: 'RegexProbe',
        description: 'Probe regex schema handling',
        parameters: {
          type: 'object',
          properties: {
            pattern: {
              type: 'string',
            },
          },
          required: ['pattern'],
          additionalProperties: false,
        },
        strict: true,
      },
    ])
  })
  test('removes unsupported uri format from strict Responses schemas', () => {
    const tools = convertToolsToResponsesTools([
      {
--- a/src/services/api/openaiShim.test.ts
+++ b/src/services/api/openaiShim.test.ts
--- a/src/services/api/openaiShim.ts
+++ b/src/services/api/openaiShim.ts
@@ -42,6 +42,10 @@ import {
 } from './providerConfig.js'
 import { sanitizeSchemaForOpenAICompat } from '../../utils/schemaSanitizer.js'
 import { redactSecretValueForDisplay } from '../../utils/providerProfile.js'
 import {
  normalizeToolArguments,
  hasToolFieldMapping,
 } from './toolArgumentNormalization.js'
 type SecretValueSource = Partial<{
  OPENAI_API_KEY: string
@@ -56,11 +60,22 @@ const GITHUB_API_VERSION = '2022-11-28'
 const GITHUB_429_MAX_RETRIES = 3
 const GITHUB_429_BASE_DELAY_SEC = 1
 const GITHUB_429_MAX_DELAY_SEC = 32
 const GEMINI_API_HOST = 'generativelanguage.googleapis.com'
 function isGithubModelsMode(): boolean {
  return isEnvTruthy(process.env.CLAUDE_CODE_USE_GITHUB)
 }
 function hasGeminiApiHost(baseUrl: string | undefined): boolean {
  if (!baseUrl) return false
  try {
    return new URL(baseUrl).hostname.toLowerCase() === GEMINI_API_HOST
  } catch {
    return false
  }
 }
 function formatRetryAfterHint(response: Response): string {
  const ra = response.headers.get('retry-after')
  return ra ? ` (Retry-After: ${ra})` : ''
@@ -180,10 +195,12 @@ function convertContentBlocks(
        // handled separately
        break
      case 'thinking':
-        // Append thinking as text with a marker for models that support reasoning
+      case 'redacted_thinking':
-        if (block.thinking) {
+        // Strip thinking blocks for OpenAI-compatible providers.
-          parts.push({ type: 'text', text: `<thinking>${block.thinking}</thinking>` })
+        // These are Anthropic-specific content types that 3P providers
-        }
+        // don't understand. Serializing them as <thinking> text corrupts
        // multi-turn context: the model sees the tags as part of its
        // previous reply and may mimic or misattribute them.
        break
      default:
        if (block.text) {
@@ -197,6 +214,13 @@ function convertContentBlocks(
  return parts
 }
 function isGeminiMode(): boolean {
  return (
    isEnvTruthy(process.env.CLAUDE_CODE_USE_GEMINI) ||
    hasGeminiApiHost(process.env.OPENAI_BASE_URL)
  )
 }
 function convertMessages(
  messages: Array<{ role: string; message?: { role?: string; content?: unknown }; content?: unknown }>,
  system: unknown,
@@ -248,6 +272,7 @@ function convertMessages(
      // Check for tool_use blocks
      if (Array.isArray(content)) {
        const toolUses = content.filter((b: { type?: string }) => b.type === 'tool_use')
        const thinkingBlock = content.find((b: { type?: string }) => b.type === 'thinking')
        const textContent = content.filter(
          (b: { type?: string }) => b.type !== 'tool_use' && b.type !== 'thinking',
        )
@@ -267,18 +292,46 @@ function convertMessages(
              name?: string
              input?: unknown
              extra_content?: Record<string, unknown>
-            }) => ({
+              signature?: string
-              id: tu.id ?? `call_${crypto.randomUUID().replace(/-/g, '')}`,
+            }, index) => {
-              type: 'function' as const,
+              const toolCall: NonNullable<OpenAIMessage['tool_calls']>[number] = {
-              function: {
+                id: tu.id ?? `call_${crypto.randomUUID().replace(/-/g, '')}`,
-                name: tu.name ?? 'unknown',
+                type: 'function' as const,
-                arguments:
+                function: {
-                  typeof tu.input === 'string'
+                  name: tu.name ?? 'unknown',
-                    ? tu.input
+                  arguments:
-                    : JSON.stringify(tu.input ?? {}),
+                    typeof tu.input === 'string'
-              },
+                      ? tu.input
-              ...(tu.extra_content ? { extra_content: tu.extra_content } : {}),
+                      : JSON.stringify(tu.input ?? {}),
-            }),
+                },
              }
              // Preserve existing extra_content if present
              if (tu.extra_content) {
                toolCall.extra_content = { ...tu.extra_content }
              }
              // Handle Gemini thought_signature
              if (isGeminiMode()) {
                // If the model provided a signature in the tool_use block itself (e.g. from a previous Turn/Step)
                // Use thinkingBlock.signature for ALL tool calls in the same assistant turn if available.
                // The API requires the same signature on every replayed function call part in a parallel set.
                const signature = tu.signature ?? (thinkingBlock as any)?.signature
                // Merge into existing google-specific metadata if present
                const existingGoogle = (toolCall.extra_content?.google as Record<string, unknown>) ?? {}
                toolCall.extra_content = {
                  ...toolCall.extra_content,
                  google: {
                    ...existingGoogle,
                    thought_signature: signature ?? "skip_thought_signature_validator"
                  }
                }
              }
              return toolCall
            },
          )
        }
@@ -397,7 +450,7 @@ function normalizeSchemaForOpenAI(
 function convertTools(
  tools: Array<{ name: string; description?: string; input_schema?: Record<string, unknown> }>,
 ): OpenAITool[] {
-  const isGemini = isEnvTruthy(process.env.CLAUDE_CODE_USE_GEMINI)
+  const isGemini = isGeminiMode()
  return tools
    .filter(t => t.name !== 'ToolSearchTool') // Not relevant for OpenAI
@@ -439,6 +492,7 @@ interface OpenAIStreamChunk {
    delta: {
      role?: string
      content?: string | null
      reasoning_content?: string | null
      tool_calls?: Array<{
        index: number
        id?: string
@@ -476,6 +530,30 @@ function convertChunkUsage(
  }
 }
 const JSON_REPAIR_SUFFIXES = [
  '}', '"}', ']}', '"]}', '}}', '"}}', ']}}', '"]}}', '"]}]}', '}]}'
 ]
 function repairPossiblyTruncatedObjectJson(raw: string): string | null {
  try {
    const parsed = JSON.parse(raw)
    return parsed && typeof parsed === 'object' && !Array.isArray(parsed)
      ? raw
      : null
  } catch {
    for (const combo of JSON_REPAIR_SUFFIXES) {
      try {
        const repaired = raw + combo
        const parsed = JSON.parse(repaired)
        if (parsed && typeof parsed === 'object' && !Array.isArray(parsed)) {
          return repaired
        }
      } catch {}
    }
    return null
  }
 }
 /**
 * Async generator that transforms an OpenAI SSE stream into
 * Anthropic-format BetaRawMessageStreamEvent objects.
@@ -486,8 +564,19 @@ async function* openaiStreamToAnthropic(
 ): AsyncGenerator<AnthropicStreamEvent> {
  const messageId = makeMessageId()
  let contentBlockIndex = 0
-  const activeToolCalls = new Map<number, { id: string; name: string; index: number; jsonBuffer: string }>()
+  const activeToolCalls = new Map<
    number,
    {
      id: string
      name: string
      index: number
      jsonBuffer: string
      normalizeAtStop: boolean
    }
  >()
  let hasEmittedContentStart = false
  let hasEmittedThinkingStart = false
  let hasClosedThinking = false
  let lastStopReason: 'tool_use' | 'max_tokens' | 'end_turn' | null = null
  let hasEmittedFinalUsage = false
  let hasProcessedFinishReason = false
@@ -544,9 +633,34 @@ async function* openaiStreamToAnthropic(
      for (const choice of chunk.choices ?? []) {
        const delta = choice.delta
        // Reasoning models (e.g. GLM-5, DeepSeek) may stream chain-of-thought
        // in `reasoning_content` before the actual reply appears in `content`.
        // Emit reasoning as a thinking block and content as a text block.
        if (delta.reasoning_content != null && delta.reasoning_content !== '') {
          if (!hasEmittedThinkingStart) {
            yield {
              type: 'content_block_start',
              index: contentBlockIndex,
              content_block: { type: 'thinking', thinking: '' },
            }
            hasEmittedThinkingStart = true
          }
          yield {
            type: 'content_block_delta',
            index: contentBlockIndex,
            delta: { type: 'thinking_delta', thinking: delta.reasoning_content },
          }
        }
        // Text content — use != null to distinguish absent field from empty string,
        // some providers send "" as first delta to signal streaming start
-        if (delta.content != null) {
+        if (delta.content != null && delta.content !== '') {
          // Close thinking block if transitioning from reasoning to content
          if (hasEmittedThinkingStart && !hasClosedThinking) {
            yield { type: 'content_block_stop', index: contentBlockIndex }
            contentBlockIndex++
            hasClosedThinking = true
          }
          if (!hasEmittedContentStart) {
            yield {
              type: 'content_block_start',
@@ -566,7 +680,12 @@ async function* openaiStreamToAnthropic(
        if (delta.tool_calls) {
          for (const tc of delta.tool_calls) {
            if (tc.id && tc.function?.name) {
-              // New tool call starting
+              // New tool call starting — close any open thinking block first
              if (hasEmittedThinkingStart && !hasClosedThinking) {
                yield { type: 'content_block_stop', index: contentBlockIndex }
                contentBlockIndex++
                hasClosedThinking = true
              }
              if (hasEmittedContentStart) {
                yield {
                  type: 'content_block_stop',
@@ -577,11 +696,14 @@ async function* openaiStreamToAnthropic(
              }
              const toolBlockIndex = contentBlockIndex
              const initialArguments = tc.function.arguments ?? ''
              const normalizeAtStop = hasToolFieldMapping(tc.function.name)
              activeToolCalls.set(tc.index, {
                id: tc.id,
                name: tc.function.name,
                index: toolBlockIndex,
-                jsonBuffer: tc.function.arguments ?? '',
+                jsonBuffer: initialArguments,
                normalizeAtStop,
              })
              yield {
@@ -593,12 +715,19 @@ async function* openaiStreamToAnthropic(
                  name: tc.function.name,
                  input: {},
                  ...(tc.extra_content ? { extra_content: tc.extra_content } : {}),
                  // Extract Gemini signature from extra_content
                  ...((tc.extra_content?.google as any)?.thought_signature
                    ? {
                        signature: (tc.extra_content.google as any)
                          .thought_signature,
                      }
                    : {}),
                },
              }
              contentBlockIndex++
              // Emit any initial arguments
-              if (tc.function.arguments) {
+              if (tc.function.arguments && !normalizeAtStop) {
                yield {
                  type: 'content_block_delta',
                  index: toolBlockIndex,
@@ -615,6 +744,11 @@ async function* openaiStreamToAnthropic(
                if (tc.function.arguments) {
                  active.jsonBuffer += tc.function.arguments
                }
                if (active.normalizeAtStop) {
                  continue
                }
                yield {
                  type: 'content_block_delta',
                  index: active.index,
@@ -633,6 +767,12 @@ async function* openaiStreamToAnthropic(
        if (choice.finish_reason && !hasProcessedFinishReason) {
          hasProcessedFinishReason = true
          // Close any open thinking block that wasn't closed by content transition
          if (hasEmittedThinkingStart && !hasClosedThinking) {
            yield { type: 'content_block_stop', index: contentBlockIndex }
            contentBlockIndex++
            hasClosedThinking = true
          }
          // Close any open content blocks
          if (hasEmittedContentStart) {
            yield {
@@ -642,16 +782,44 @@ async function* openaiStreamToAnthropic(
          }
          // Close active tool calls
          for (const [, tc] of activeToolCalls) {
            if (tc.normalizeAtStop) {
              let partialJson: string
              if (choice.finish_reason === 'length') {
                // Truncated by max tokens — preserve raw buffer to avoid
                // turning an incomplete tool call into an executable command
                partialJson = tc.jsonBuffer
              } else {
                const repairedStructuredJson = repairPossiblyTruncatedObjectJson(
                  tc.jsonBuffer,
                )
                if (repairedStructuredJson) {
                  partialJson = repairedStructuredJson
                } else {
                  partialJson = JSON.stringify(
                    normalizeToolArguments(tc.name, tc.jsonBuffer),
                  )
                }
              }
              yield {
                type: 'content_block_delta',
                index: tc.index,
                delta: {
                  type: 'input_json_delta',
                  partial_json: partialJson,
                },
              }
              yield { type: 'content_block_stop', index: tc.index }
              continue
            }
            let suffixToAdd = ''
            if (tc.jsonBuffer) {
              try {
                JSON.parse(tc.jsonBuffer)
              } catch {
                const str = tc.jsonBuffer.trimEnd()
-                const combinations = [
+                for (const combo of JSON_REPAIR_SUFFIXES) {
                  '}', '"}', ']}', '"]}', '}}', '"}}', ']}}', '"]}}', '"]}]}', '}]}'
                ]
                for (const combo of combinations) {
                  try {
                    JSON.parse(str + combo)
                    suffixToAdd = combo
@@ -930,7 +1098,7 @@ class OpenAIShimMessages {
      ...(options?.headers ?? {}),
    }
-    const isGemini = isEnvTruthy(process.env.CLAUDE_CODE_USE_GEMINI)
+    const isGemini = isGeminiMode()
    const apiKey =
      this.providerOverride?.apiKey ?? process.env.OPENAI_API_KEY ?? ''
    // Detect Azure endpoints by hostname (not raw URL) to prevent bypass via
@@ -1043,6 +1211,7 @@ class OpenAIShimMessages {
            | string
            | null
            | Array<{ type?: string; text?: string }>
          reasoning_content?: string | null
          tool_calls?: Array<{
            id: string
            function: { name: string; arguments: string }
@@ -1064,7 +1233,17 @@ class OpenAIShimMessages {
    const choice = data.choices?.[0]
    const content: Array<Record<string, unknown>> = []
-    const rawContent = choice?.message?.content
+    // Some reasoning models (e.g. GLM-5) put their reply in reasoning_content
    // while content stays null — emit reasoning as a thinking block, then
    // fall back to it for visible text if content is empty.
    const reasoningText = choice?.message?.reasoning_content
    if (typeof reasoningText === 'string' && reasoningText) {
      content.push({ type: 'thinking', thinking: reasoningText })
    }
    const rawContent =
      choice?.message?.content !== '' && choice?.message?.content != null
        ? choice?.message?.content
        : choice?.message?.reasoning_content
    if (typeof rawContent === 'string' && rawContent) {
      content.push({ type: 'text', text: rawContent })
    } else if (Array.isArray(rawContent) && rawContent.length > 0) {
@@ -1087,18 +1266,20 @@ class OpenAIShimMessages {
    if (choice?.message?.tool_calls) {
      for (const tc of choice.message.tool_calls) {
-        let input: unknown
+        const input = normalizeToolArguments(
-        try {
+          tc.function.name,
-          input = JSON.parse(tc.function.arguments)
+          tc.function.arguments,
-        } catch {
+        )
          input = { raw: tc.function.arguments }
        }
        content.push({
          type: 'tool_use',
          id: tc.id,
          name: tc.function.name,
          input,
          ...(tc.extra_content ? { extra_content: tc.extra_content } : {}),
          // Extract Gemini signature from extra_content
          ...((tc.extra_content?.google as any)?.thought_signature
            ? { signature: (tc.extra_content.google as any).thought_signature }
            : {}),
        })
      }
    }
--- a/src/services/api/toolArgumentNormalization.test.ts
+++ b/src/services/api/toolArgumentNormalization.test.ts
@@ -0,0 +1,180 @@
 import { describe, expect, test } from 'bun:test'
 import { normalizeToolArguments } from './toolArgumentNormalization'
 describe('normalizeToolArguments', () => {
  describe('Bash tool', () => {
    test('wraps plain string into { command }', () => {
      expect(normalizeToolArguments('Bash', 'pwd')).toEqual({ command: 'pwd' })
    })
    test('wraps multi-word command', () => {
      expect(normalizeToolArguments('Bash', 'ls -la /tmp')).toEqual({
        command: 'ls -la /tmp',
      })
    })
    test('passes through structured JSON object', () => {
      expect(
        normalizeToolArguments('Bash', '{"command":"echo hi"}'),
      ).toEqual({ command: 'echo hi' })
    })
    test('returns empty object for blank string', () => {
      expect(normalizeToolArguments('Bash', '')).toEqual({})
      expect(normalizeToolArguments('Bash', '   ')).toEqual({})
    })
    test('returns parsed blank for JSON-encoded blank string', () => {
      expect(normalizeToolArguments('Bash', '""')).toEqual('')
      expect(normalizeToolArguments('Bash', '"  "')).toEqual('  ')
    })
    test('returns empty object for malformed structured object literal', () => {
      expect(normalizeToolArguments('Bash', '{ "command": "pwd"')).toEqual({})
    })
    test.each([
      ['{command:"pwd"}'],
      ["{'command':'pwd'}"],
      ['{command: pwd}'],
    ])(
      'returns empty object for malformed object-shaped string %s (does not wrap into command)',
      (input) => {
        expect(normalizeToolArguments('Bash', input)).toEqual({})
      },
    )
    test.each([
      ['false', false],
      ['null', null],
      ['[]', [] as unknown[]],
      ['0', 0],
      ['true', true],
      ['123', 123],
    ])(
      'preserves JSON literal %s as-is (does not wrap into command)',
      (input, expected) => {
        expect(normalizeToolArguments('Bash', input)).toEqual(expected)
      },
    )
    test('wraps JSON-encoded string into { command }', () => {
      expect(normalizeToolArguments('Bash', '"pwd"')).toEqual({
        command: 'pwd',
      })
    })
  })
  describe('undefined arguments', () => {
    test('returns empty object for undefined', () => {
      expect(normalizeToolArguments('Bash', undefined)).toEqual({})
      expect(normalizeToolArguments('UnknownTool', undefined)).toEqual({})
    })
  })
  describe('Read tool', () => {
    test('wraps plain string into { file_path }', () => {
      expect(normalizeToolArguments('Read', '/home/user/file.txt')).toEqual({
        file_path: '/home/user/file.txt',
      })
    })
    test('wraps JSON-encoded string into { file_path }', () => {
      expect(normalizeToolArguments('Read', '"/home/user/file.txt"')).toEqual({
        file_path: '/home/user/file.txt',
      })
    })
    test('passes through structured JSON object', () => {
      expect(
        normalizeToolArguments('Read', '{"file_path":"/tmp/f.txt","limit":10}'),
      ).toEqual({ file_path: '/tmp/f.txt', limit: 10 })
    })
  })
  describe('Write tool', () => {
    test('wraps plain string into { file_path }', () => {
      expect(normalizeToolArguments('Write', '/tmp/out.txt')).toEqual({
        file_path: '/tmp/out.txt',
      })
    })
    test('passes through structured JSON object', () => {
      expect(
        normalizeToolArguments(
          'Write',
          '{"file_path":"/tmp/out.txt","content":"hello"}',
        ),
      ).toEqual({ file_path: '/tmp/out.txt', content: 'hello' })
    })
  })
  describe('Edit tool', () => {
    test('wraps plain string into { file_path }', () => {
      expect(normalizeToolArguments('Edit', '/tmp/edit.ts')).toEqual({
        file_path: '/tmp/edit.ts',
      })
    })
    test('passes through structured JSON object', () => {
      expect(
        normalizeToolArguments(
          'Edit',
          '{"file_path":"/tmp/f.ts","old_string":"a","new_string":"b"}',
        ),
      ).toEqual({ file_path: '/tmp/f.ts', old_string: 'a', new_string: 'b' })
    })
  })
  describe('Glob tool', () => {
    test('wraps plain string into { pattern }', () => {
      expect(normalizeToolArguments('Glob', '**/*.ts')).toEqual({
        pattern: '**/*.ts',
      })
    })
    test('passes through structured JSON object', () => {
      expect(
        normalizeToolArguments('Glob', '{"pattern":"*.js","path":"/src"}'),
      ).toEqual({ pattern: '*.js', path: '/src' })
    })
  })
  describe('Grep tool', () => {
    test('wraps plain string into { pattern }', () => {
      expect(normalizeToolArguments('Grep', 'TODO')).toEqual({
        pattern: 'TODO',
      })
    })
    test('passes through structured JSON object', () => {
      expect(
        normalizeToolArguments('Grep', '{"pattern":"fixme","path":"/src"}'),
      ).toEqual({ pattern: 'fixme', path: '/src' })
    })
  })
  describe('unknown tools', () => {
    test('returns empty object for plain string (no known field mapping)', () => {
      expect(normalizeToolArguments('UnknownTool', 'some value')).toEqual({})
    })
    test('passes through structured JSON object', () => {
      expect(
        normalizeToolArguments('UnknownTool', '{"key":"val"}'),
      ).toEqual({ key: 'val' })
    })
    test('preserves JSON literals as-is', () => {
      expect(normalizeToolArguments('UnknownTool', 'false')).toEqual(false)
      expect(normalizeToolArguments('UnknownTool', 'null')).toEqual(null)
      expect(normalizeToolArguments('UnknownTool', '[]')).toEqual([])
    })
    test('returns parsed string for JSON-encoded string on unknown tools', () => {
      expect(normalizeToolArguments('UnknownTool', '"hello"')).toEqual(
        'hello',
      )
    })
  })
 })
--- a/src/services/api/toolArgumentNormalization.ts
+++ b/src/services/api/toolArgumentNormalization.ts
@@ -0,0 +1,69 @@
 const STRING_ARGUMENT_TOOL_FIELDS: Record<string, string> = {
  Bash: 'command',
  Read: 'file_path',
  Write: 'file_path',
  Edit: 'file_path',
  Glob: 'pattern',
  Grep: 'pattern',
 }
 function isBlankString(value: string): boolean {
  return value.trim().length === 0
 }
 function isLikelyStructuredObjectLiteral(value: string): boolean {
  // Match object-like patterns with key-value syntax:
  // {"key":, {key:, {'key':, { "key" :, etc.
  // But NOT bash compound commands like { pwd; } or { echo hi; }
  return /^\s*\{\s*['"]?\w+['"]?\s*:/.test(value)
 }
 function isRecord(value: unknown): value is Record<string, unknown> {
  return typeof value === 'object' && value !== null && !Array.isArray(value)
 }
 function getPlainStringToolArgumentField(toolName: string): string | null {
  return STRING_ARGUMENT_TOOL_FIELDS[toolName] ?? null
 }
 export function hasToolFieldMapping(toolName: string): boolean {
  return toolName in STRING_ARGUMENT_TOOL_FIELDS
 }
 function wrapPlainStringToolArguments(
  toolName: string,
  value: string,
 ): Record<string, string> | null {
  const field = getPlainStringToolArgumentField(toolName)
  if (!field) return null
  return { [field]: value }
 }
 export function normalizeToolArguments(
  toolName: string,
  rawArguments: string | undefined,
 ): unknown {
  if (rawArguments === undefined) return {}
  try {
    const parsed = JSON.parse(rawArguments)
    if (isRecord(parsed)) {
      return parsed
    }
    // Parsed as a non-object JSON value (string, number, boolean, null, array)
    if (typeof parsed === 'string' && !isBlankString(parsed)) {
      return wrapPlainStringToolArguments(toolName, parsed) ?? parsed
    }
    // For blank strings, booleans, null, arrays — pass through as-is
    // and let Zod schema validation produce a meaningful error
    return parsed
  } catch {
    // rawArguments is not valid JSON — treat as a plain string
    if (isBlankString(rawArguments) || isLikelyStructuredObjectLiteral(rawArguments)) {
      // Blank or looks like a malformed object literal — don't wrap into
      // a tool field to avoid turning garbage into executable input
      return {}
    }
    return wrapPlainStringToolArguments(toolName, rawArguments) ?? {}
  }
 }
--- a/src/services/compact/microCompact.test.ts
+++ b/src/services/compact/microCompact.test.ts
@@ -0,0 +1,127 @@
 import { describe, expect, test } from 'bun:test'
 import type { Message } from '../../types/message.js'
 import { createAssistantMessage, createUserMessage } from '../../utils/messages.js'
 // We test the exported collectCompactableToolIds behavior indirectly via
 // the public microcompactMessages + time-based path. But first we need to
 // verify the core predicate: MCP tools (prefixed 'mcp__') should be
 // compactable alongside the built-in tool set.
 // Import internals we can test
 import { evaluateTimeBasedTrigger } from './microCompact.js'
 /**
 * Helper: build a minimal assistant message with a tool_use block.
 */
 function assistantWithToolUse(toolName: string, toolId: string): Message {
  return createAssistantMessage({
    content: [
      {
        type: 'tool_use' as const,
        id: toolId,
        name: toolName,
        input: {},
      },
    ],
  })
 }
 /**
 * Helper: build a user message with a tool_result block.
 */
 function userWithToolResult(toolId: string, output: string): Message {
  return createUserMessage({
    content: [
      {
        type: 'tool_result' as const,
        tool_use_id: toolId,
        content: output,
      },
    ],
  })
 }
 describe('microCompact MCP tool compaction', () => {
  // We can't easily unit-test the private isCompactableTool directly,
  // but we can test the full time-based microcompact path which exercises
  // collectCompactableToolIds → isCompactableTool under the hood.
  // The time-based path is the simplest to trigger: it content-clears
  // old tool results when the gap since last assistant message exceeds
  // the threshold.
  // However, evaluateTimeBasedTrigger depends on config (GrowthBook).
  // So instead, let's test the observable behavior by importing the
  // microcompactMessages function and checking that MCP tool_use blocks
  // are collected.
  // Since collectCompactableToolIds is not exported, we test the predicate
  // behavior by verifying that the module loads without error and that
  // built-in and MCP tools are treated consistently.
  test('module exports load correctly', async () => {
    const mod = await import('./microCompact.js')
    expect(mod.microcompactMessages).toBeFunction()
    expect(mod.estimateMessageTokens).toBeFunction()
    expect(mod.evaluateTimeBasedTrigger).toBeFunction()
  })
  test('estimateMessageTokens counts MCP tool_use blocks', async () => {
    const { estimateMessageTokens } = await import('./microCompact.js')
    const builtinMessages: Message[] = [
      assistantWithToolUse('Read', 'tool-builtin-1'),
      userWithToolResult('tool-builtin-1', 'file contents here'),
    ]
    const mcpMessages: Message[] = [
      assistantWithToolUse('mcp__github__get_file_contents', 'tool-mcp-1'),
      userWithToolResult('tool-mcp-1', 'file contents here'),
    ]
    const builtinTokens = estimateMessageTokens(builtinMessages)
    const mcpTokens = estimateMessageTokens(mcpMessages)
    // Both should produce non-zero estimates
    expect(builtinTokens).toBeGreaterThan(0)
    expect(mcpTokens).toBeGreaterThan(0)
    // The tool_result content is identical, so token estimates should be
    // similar (tool_use name differs slightly, so not exactly equal)
    expect(Math.abs(builtinTokens - mcpTokens)).toBeLessThan(50)
  })
  test('microcompactMessages processes MCP tools without error', async () => {
    const { microcompactMessages } = await import('./microCompact.js')
    const messages: Message[] = [
      assistantWithToolUse('mcp__slack__send_message', 'tool-mcp-2'),
      userWithToolResult('tool-mcp-2', 'Message sent successfully'),
      assistantWithToolUse('mcp__github__create_pull_request', 'tool-mcp-3'),
      userWithToolResult('tool-mcp-3', JSON.stringify({ number: 42, url: 'https://github.com/org/repo/pull/42' })),
    ]
    // Should not throw — MCP tools should be handled gracefully
    const result = await microcompactMessages(messages)
    expect(result).toBeDefined()
    expect(result.messages).toBeDefined()
    expect(result.messages.length).toBe(messages.length)
  })
  test('microcompactMessages processes mixed built-in and MCP tools', async () => {
    const { microcompactMessages } = await import('./microCompact.js')
    const messages: Message[] = [
      assistantWithToolUse('Read', 'tool-read-1'),
      userWithToolResult('tool-read-1', 'some file content'),
      assistantWithToolUse('mcp__playwright__screenshot', 'tool-mcp-4'),
      userWithToolResult('tool-mcp-4', 'base64-encoded-screenshot-data'.repeat(100)),
      assistantWithToolUse('Bash', 'tool-bash-1'),
      userWithToolResult('tool-bash-1', 'command output'),
    ]
    const result = await microcompactMessages(messages)
    expect(result).toBeDefined()
    expect(result.messages.length).toBe(messages.length)
  })
 })
--- a/src/services/compact/microCompact.ts
+++ b/src/services/compact/microCompact.ts
@@ -37,7 +37,7 @@ export const TIME_BASED_MC_CLEARED_MESSAGE = '[Old tool result content cleared]'
 const IMAGE_MAX_TOKEN_SIZE = 2000
-// Only compact these tools
+// Only compact these built-in tools (MCP tools are also compactable via prefix match)
 const COMPACTABLE_TOOLS = new Set<string>([
  FILE_READ_TOOL_NAME,
  ...SHELL_TOOL_NAMES,
@@ -49,7 +49,13 @@ const COMPACTABLE_TOOLS = new Set<string>([
  FILE_WRITE_TOOL_NAME,
 ])
-// --- Cached microcompact state (internal-only, gated by feature('CACHED_MICROCOMPACT')) ---
+const MCP_TOOL_PREFIX = 'mcp__'
 function isCompactableTool(name: string): boolean {
  return COMPACTABLE_TOOLS.has(name) || name.startsWith(MCP_TOOL_PREFIX)
 }
 // --- Cached microcompact state (gated by feature('CACHED_MICROCOMPACT')) ---
 // Lazy-initialized cached MC module and state to avoid importing in external builds.
 // The imports and state live inside feature() checks for dead code elimination.
@@ -231,7 +237,7 @@ function collectCompactableToolIds(messages: Message[]): string[] {
      Array.isArray(message.message.content)
    ) {
      for (const block of message.message.content) {
-        if (block.type === 'tool_use' && COMPACTABLE_TOOLS.has(block.name)) {
+        if (block.type === 'tool_use' && isCompactableTool(block.name)) {
          ids.push(block.id)
        }
      }
--- a/src/services/tools/toolExecution.test.ts
+++ b/src/services/tools/toolExecution.test.ts
@@ -0,0 +1,33 @@
 import { describe, expect, test } from 'bun:test'
 import { SkillTool } from '../../tools/SkillTool/SkillTool.js'
 import {
  getSchemaValidationErrorOverride,
  getSchemaValidationToolUseResult,
 } from './toolExecution.js'
 describe('getSchemaValidationErrorOverride', () => {
  test('returns actionable missing-skill error for SkillTool', () => {
    expect(getSchemaValidationErrorOverride(SkillTool, {})).toBe(
      'Missing skill name. Pass the slash command name as the skill parameter (e.g., skill: "commit" for /commit, skill: "review-pr" for /review-pr).',
    )
  })
  test('does not override unrelated tool schema failures', () => {
    expect(getSchemaValidationErrorOverride({ name: 'Read' } as never, {})).toBe(
      null,
    )
  })
  test('does not override SkillTool when skill is present', () => {
    expect(
      getSchemaValidationErrorOverride(SkillTool, { skill: 'commit' }),
    ).toBe(null)
  })
  test('uses the actionable override for structured toolUseResult too', () => {
    expect(getSchemaValidationToolUseResult(SkillTool, {} as never)).toBe(
      'InputValidationError: Missing skill name. Pass the slash command name as the skill parameter (e.g., skill: "commit" for /commit, skill: "review-pr" for /review-pr).',
    )
  })
 })
--- a/src/services/tools/toolExecution.ts
+++ b/src/services/tools/toolExecution.ts
@@ -43,6 +43,7 @@ import { FILE_READ_TOOL_NAME } from '../../tools/FileReadTool/prompt.js'
 import { FILE_WRITE_TOOL_NAME } from '../../tools/FileWriteTool/prompt.js'
 import { NOTEBOOK_EDIT_TOOL_NAME } from '../../tools/NotebookEditTool/constants.js'
 import { POWERSHELL_TOOL_NAME } from '../../tools/PowerShellTool/toolName.js'
 import { SKILL_TOOL_NAME } from '../../tools/SkillTool/constants.js'
 import { parseGitCommitId } from '../../tools/shared/gitOperationTracking.js'
 import {
  isDeferredTool,
@@ -596,6 +597,31 @@ export function buildSchemaNotSentHint(
  )
 }
 export function getSchemaValidationErrorOverride(
  tool: Tool,
  input: unknown,
 ): string | null {
  if (tool.name !== SKILL_TOOL_NAME || !input || typeof input !== 'object') {
    return null
  }
  const skill = (input as { skill?: unknown }).skill
  if (skill === undefined || skill === null) {
    return 'Missing skill name. Pass the slash command name as the skill parameter (e.g., skill: "commit" for /commit, skill: "review-pr" for /review-pr).'
  }
  return null
 }
 export function getSchemaValidationToolUseResult(
  tool: Tool,
  input: unknown,
  fallbackMessage?: string,
 ): string {
  const override = getSchemaValidationErrorOverride(tool, input)
  return `InputValidationError: ${override ?? fallbackMessage ?? ''}`
 }
 async function checkPermissionsAndCallTool(
  tool: Tool,
  toolUseID: string,
@@ -614,7 +640,9 @@ async function checkPermissionsAndCallTool(
  // Validate input types with zod (surprisingly, the model is not great at generating valid input)
  const parsedInput = tool.inputSchema.safeParse(input)
  if (!parsedInput.success) {
-    let errorContent = formatZodValidationError(tool.name, parsedInput.error)
+    const fallbackErrorContent = formatZodValidationError(tool.name, parsedInput.error)
    let errorContent =
      getSchemaValidationErrorOverride(tool, input) ?? fallbackErrorContent
    const schemaHint = buildSchemaNotSentHint(
      tool,
@@ -672,7 +700,11 @@ async function checkPermissionsAndCallTool(
              tool_use_id: toolUseID,
            },
          ],
-          toolUseResult: `InputValidationError: ${parsedInput.error.message}`,
+          toolUseResult: getSchemaValidationToolUseResult(
            tool,
            input,
            parsedInput.error.message,
          ),
          sourceToolAssistantUUID: assistantMessage.uuid,
        }),
      },
--- a/src/tools/AgentTool/prompt.ts
+++ b/src/tools/AgentTool/prompt.ts
@@ -156,34 +156,24 @@ ${AGENT_TOOL_NAME}({
  const currentExamples = `Example usage:
 <example_agent_descriptions>
-"test-runner": use this agent after you are done writing code to run tests
+"claude-code-guide": use this agent when the user asks how Claude Code works or how to use its features
-"greeting-responder": use this agent to respond to user greetings with a friendly joke
+"statusline-setup": use this agent to configure the user's Claude Code status line setting
 </example_agent_descriptions>
 <example>
-user: "Please write a function that checks if a number is prime"
+user: "How do I configure Claude Code hooks?"
 assistant: I'm going to use the ${FILE_WRITE_TOOL_NAME} tool to write the following code:
 <code>
 function isPrime(n) {
  if (n <= 1) return false
  for (let i = 2; i * i <= n; i++) {
    if (n % i === 0) return false
  }
  return true
 }
 </code>
 <commentary>
-Since a significant piece of code was written and the task was completed, now use the test-runner agent to run the tests
+This is a Claude Code usage question, so use the claude-code-guide agent
 </commentary>
-assistant: Uses the ${AGENT_TOOL_NAME} tool to launch the test-runner agent
+assistant: Uses the ${AGENT_TOOL_NAME} tool to launch the claude-code-guide agent
 </example>
 <example>
-user: "Hello"
+user: "Set up my Claude Code status line"
 <commentary>
-Since the user is greeting, use the greeting-responder agent to respond with a friendly joke
+This matches the statusline-setup agent, so use it to configure the setting
 </commentary>
-assistant: "I'm going to use the ${AGENT_TOOL_NAME} tool to launch the greeting-responder agent"
+assistant: "I'm going to use the ${AGENT_TOOL_NAME} tool to launch the statusline-setup agent"
 </example>
 `
--- a/src/tools/SkillTool/SkillTool.test.ts
+++ b/src/tools/SkillTool/SkillTool.test.ts
@@ -0,0 +1,31 @@
 import { describe, expect, test } from 'bun:test'
 import { SkillTool } from './SkillTool.js'
 describe('SkillTool missing parameter handling', () => {
  test('missing skill stays required at the schema level', async () => {
    const parsed = SkillTool.inputSchema.safeParse({})
    expect(parsed.success).toBe(false)
  })
  test('validateInput still returns an actionable error when called with missing skill', async () => {
    const result = await SkillTool.validateInput?.({} as never, {
      options: { tools: [] },
      messages: [],
    } as never)
    expect(result).toEqual({
      result: false,
      message:
        'Missing skill name. Pass the slash command name as the skill parameter (e.g., skill: "commit" for /commit, skill: "review-pr" for /review-pr).',
      errorCode: 1,
    })
  })
  test('valid skill input still parses and validates', async () => {
    const parsed = SkillTool.inputSchema.safeParse({ skill: 'commit' })
    expect(parsed.success).toBe(true)
  })
 })
--- a/src/tools/SkillTool/SkillTool.ts
+++ b/src/tools/SkillTool/SkillTool.ts
@@ -352,6 +352,16 @@ export const SkillTool: Tool<InputSchema, Output, Progress> = buildTool({
  toAutoClassifierInput: ({ skill }) => skill ?? '',
  async validateInput({ skill }, context): Promise<ValidationResult> {
    if (!skill || typeof skill !== 'string') {
      return {
        result: false,
        message:
          'Missing skill name. Pass the slash command name as the skill parameter ' +
          '(e.g., skill: "commit" for /commit, skill: "review-pr" for /review-pr).',
        errorCode: 1,
      }
    }
    // Skills are just skill names, no arguments
    const trimmed = skill.trim()
    if (!trimmed) {
@@ -434,7 +444,7 @@ export const SkillTool: Tool<InputSchema, Output, Progress> = buildTool({
    context,
  ): Promise<PermissionDecision> {
    // Skills are just skill names, no arguments
-    const trimmed = skill.trim()
+    const trimmed = skill ?? ''
    // Remove leading slash if present (for compatibility)
    const commandName = trimmed.startsWith('/') ? trimmed.substring(1) : trimmed
@@ -592,7 +602,7 @@ export const SkillTool: Tool<InputSchema, Output, Progress> = buildTool({
    // - Skill is a prompt-based skill
    // Skills are just names, with optional arguments
-    const trimmed = skill.trim()
+    const trimmed = skill ?? ''
    // Remove leading slash if present (for compatibility)
    const commandName = trimmed.startsWith('/') ? trimmed.substring(1) : trimmed
--- a/src/utils/api.test.ts
+++ b/src/utils/api.test.ts
@@ -1,6 +1,7 @@
 import { expect, test } from 'bun:test'
 import { z } from 'zod/v4'
 import { getEmptyToolPermissionContext, type Tool, type Tools } from '../Tool.js'
 import { SkillTool } from '../tools/SkillTool/SkillTool.js'
 import { toolToAPISchema } from './api.js'
 test('toolToAPISchema preserves provider-specific schema keywords in input_schema', async () => {
@@ -64,3 +65,16 @@ test('toolToAPISchema preserves provider-specific schema keywords in input_schem
    },
  })
 })
 test('toolToAPISchema keeps skill required for SkillTool', async () => {
  const schema = await toolToAPISchema(SkillTool, {
    getToolPermissionContext: async () => getEmptyToolPermissionContext(),
    tools: [] as unknown as Tools,
    agents: [],
  })
  expect((schema as { input_schema: unknown }).input_schema).toMatchObject({
    type: 'object',
    required: ['skill'],
  })
 })
--- a/src/utils/context.test.ts
+++ b/src/utils/context.test.ts
@@ -94,3 +94,22 @@ test('gpt-5.4 family keeps large max output overrides within provider limits', (
  expect(getMaxOutputTokensForModel('gpt-5.4-mini')).toBe(128_000)
  expect(getMaxOutputTokensForModel('gpt-5.4-nano')).toBe(128_000)
 })
 test('MiniMax-M2.7 uses explicit provider-specific context and output caps', () => {
  process.env.CLAUDE_CODE_USE_OPENAI = '1'
  delete process.env.CLAUDE_CODE_MAX_OUTPUT_TOKENS
  expect(getContextWindowForModel('MiniMax-M2.7')).toBe(204_800)
  expect(getModelMaxOutputTokens('MiniMax-M2.7')).toEqual({
    default: 131_072,
    upperLimit: 131_072,
  })
  expect(getMaxOutputTokensForModel('MiniMax-M2.7')).toBe(131_072)
 })
 test('unknown openai-compatible models still use the conservative fallback window', () => {
  process.env.CLAUDE_CODE_USE_OPENAI = '1'
  delete process.env.CLAUDE_CODE_MAX_OUTPUT_TOKENS
  expect(getContextWindowForModel('some-unknown-3p-model')).toBe(8_000)
 })
--- a/src/utils/context.ts
+++ b/src/utils/context.ts
@@ -72,16 +72,23 @@ export function getContextWindowForModel(
    return 1_000_000
  }
-  // OpenAI-compatible provider — use known context windows for the model
+  // OpenAI-compatible provider — use known context windows for the model.
-  if (
+  // Unknown models get a conservative 8k default so auto-compact triggers
  // before hitting a hard context_window_exceeded error.
  const isOpenAIProvider =
    isEnvTruthy(process.env.CLAUDE_CODE_USE_OPENAI) ||
    isEnvTruthy(process.env.CLAUDE_CODE_USE_GEMINI) ||
    isEnvTruthy(process.env.CLAUDE_CODE_USE_GITHUB)
-  ) {
+  if (isOpenAIProvider) {
    const openaiWindow = getOpenAIContextWindow(model)
    if (openaiWindow !== undefined) {
      return openaiWindow
    }
    console.error(
      `[context] Warning: model "${model}" not in context window table — using conservative 8k default. ` +
      'Add it to src/utils/model/openaiContextWindows.ts for accurate compaction.',
    )
    return 8_000
  }
  const cap = getModelCapability(model)
--- a/src/utils/conversationRecovery.hooks.test.ts
+++ b/src/utils/conversationRecovery.hooks.test.ts
@@ -69,3 +69,93 @@ test('loadConversationForResume rejects oversized transcripts before resume hook
  )
  expect(hookSpy).not.toHaveBeenCalled()
 })
 test('deserializeMessagesWithInterruptDetection strips thinking blocks only for OpenAI-compatible providers', async () => {
  const serializedMessages = [
    user(id(10), 'hello'),
    {
      type: 'assistant',
      uuid: id(11),
      parentUuid: id(10),
      timestamp: ts,
      cwd: '/tmp',
      sessionId,
      version: 'test',
      message: {
        role: 'assistant',
        content: [
          { type: 'thinking', thinking: 'secret reasoning' },
          { type: 'text', text: 'visible reply' },
        ],
      },
    },
    {
      type: 'assistant',
      uuid: id(12),
      parentUuid: id(11),
      timestamp: ts,
      cwd: '/tmp',
      sessionId,
      version: 'test',
      message: {
        role: 'assistant',
        content: [{ type: 'thinking', thinking: 'only hidden reasoning' }],
      },
    },
    user(id(13), 'follow up'),
  ]
  mock.module('./model/providers.js', () => ({
    getAPIProvider: () => 'openai',
    isOpenAICompatibleProvider: (provider: string) =>
      provider === 'openai' ||
      provider === 'gemini' ||
      provider === 'github' ||
      provider === 'codex',
  }))
  const openaiModule = await import(`./conversationRecovery.ts?provider=openai-${Date.now()}`)
  const thirdParty = openaiModule.deserializeMessagesWithInterruptDetection(serializedMessages as never[])
  const thirdPartyAssistantMessages = thirdParty.messages.filter(
    message => message.type === 'assistant',
  )
  expect(thirdPartyAssistantMessages).toHaveLength(2)
  expect(thirdPartyAssistantMessages[0]?.message?.content).toEqual([
    { type: 'text', text: 'visible reply' },
  ])
  expect(
    JSON.stringify(thirdPartyAssistantMessages.map(message => message.message?.content)),
  ).not.toContain('secret reasoning')
  expect(
    JSON.stringify(thirdPartyAssistantMessages.map(message => message.message?.content)),
  ).not.toContain('only hidden reasoning')
  mock.restore()
  mock.module('./model/providers.js', () => ({
    getAPIProvider: () => 'bedrock',
    isOpenAICompatibleProvider: (provider: string) =>
      provider === 'openai' ||
      provider === 'gemini' ||
      provider === 'github' ||
      provider === 'codex',
  }))
  const bedrockModule = await import(`./conversationRecovery.ts?provider=bedrock-${Date.now()}`)
  const anthropicCompatible = bedrockModule.deserializeMessagesWithInterruptDetection(serializedMessages as never[])
  const anthropicAssistantMessages = anthropicCompatible.messages.filter(
    message => message.type === 'assistant',
  )
  expect(anthropicAssistantMessages).toHaveLength(2)
  expect(anthropicAssistantMessages[0]?.message?.content).toEqual([
    { type: 'thinking', thinking: 'secret reasoning' },
    { type: 'text', text: 'visible reply' },
  ])
  expect(
    JSON.stringify(anthropicAssistantMessages.map(message => message.message?.content)),
  ).toContain('secret reasoning')
  expect(
    JSON.stringify(anthropicAssistantMessages.map(message => message.message?.content)),
  ).not.toContain('only hidden reasoning')
 })
--- a/src/utils/conversationRecovery.test.ts
+++ b/src/utils/conversationRecovery.test.ts
@@ -13,6 +13,7 @@ const originalSimple = process.env.CLAUDE_CODE_SIMPLE
 const sessionId = '00000000-0000-4000-8000-000000001999'
 const ts = '2026-04-02T00:00:00.000Z'
 function id(n: number): string {
  return `00000000-0000-4000-8000-${String(n).padStart(12, '0')}`
 }
@@ -76,4 +77,3 @@ test('loadConversationForResume rejects oversized reconstructed transcripts', as
    'Reconstructed transcript is too large to resume safely',
  )
 })
--- a/src/utils/conversationRecovery.ts
+++ b/src/utils/conversationRecovery.ts
@@ -24,6 +24,7 @@ import {
  type FileHistorySnapshot,
 } from './fileHistory.js'
 import { logError } from './log.js'
 import { getAPIProvider } from './model/providers.js'
 import {
  createAssistantMessage,
  createUserMessage,
@@ -177,6 +178,25 @@ export type DeserializeResult = {
  turnInterruptionState: TurnInterruptionState
 }
 /**
 * Remove thinking/redacted_thinking content blocks from assistant messages.
 * Messages that become empty after stripping are removed entirely.
 */
 function stripThinkingBlocks(messages: NormalizedMessage[]): NormalizedMessage[] {
  return messages.reduce<NormalizedMessage[]>((acc, msg) => {
    if (msg.type !== 'assistant' || !Array.isArray(msg.message?.content)) {
      acc.push(msg)
      return acc
    }
    const filtered = msg.message.content.filter(
      (block: { type?: string }) => block.type !== 'thinking' && block.type !== 'redacted_thinking',
    )
    if (filtered.length === 0) return acc
    acc.push({ ...msg, message: { ...msg.message, content: filtered } })
    return acc
  }, [])
 }
 /**
 * Deserializes messages from a log file into the format expected by the REPL.
 * Filters unresolved tool uses, orphaned thinking messages, and appends a
@@ -227,10 +247,19 @@ export function deserializeMessagesWithInterruptDetection(
      filteredToolUses,
    ) as NormalizedMessage[]
    // Strip thinking/redacted_thinking content blocks from assistant messages
    // when resuming against a 3P provider. These Anthropic-specific blocks cause
    // 400 errors or context corruption on OpenAI-compatible providers (issue #248 finding 5).
    const provider = getAPIProvider()
    const isThirdPartyProvider = provider !== 'firstParty' && provider !== 'bedrock' && provider !== 'vertex' && provider !== 'foundry'
    const thinkingStripped = isThirdPartyProvider
      ? stripThinkingBlocks(filteredThinking)
      : filteredThinking
    // Filter out assistant messages with only whitespace text content.
    // This can happen when model outputs "\n\n" before thinking, user cancels mid-stream.
    const filteredMessages = filterWhitespaceOnlyAssistantMessages(
-      filteredThinking,
+      thinkingStripped,
    ) as NormalizedMessage[]
    const internalState = detectTurnInterruption(filteredMessages)
--- a/src/utils/dragDropPaths.test.ts
+++ b/src/utils/dragDropPaths.test.ts
@@ -4,6 +4,10 @@ import { tmpdir } from 'os'
 import { join } from 'path'
 import { extractDraggedFilePaths } from './dragDropPaths.js'
 function escapeFinderDraggedPath(filePath: string): string {
  return filePath.replace(/([\\ ])/g, '\\$1')
 }
 describe('extractDraggedFilePaths', () => {
  // Paths that exist on any system.
  const thisFile = import.meta.path
@@ -80,6 +84,12 @@ describe('extractDraggedFilePaths', () => {
    })
  })
  test('escapeFinderDraggedPath escapes spaces and backslashes', () => {
    expect(escapeFinderDraggedPath('/tmp/my\\notes file.txt')).toBe(
      '/tmp/my\\\\notes\\ file.txt',
    )
  })
  // Backslash-escaped paths are a Finder/macOS + Linux convention — on
  // Windows the shell-escape step is skipped, so these cases do not apply.
  if (process.platform !== 'win32') {
@@ -92,7 +102,7 @@ describe('extractDraggedFilePaths', () => {
      test('resolves an escaped real file with a space in its name', () => {
        // Raw form matches what a terminal delivers on Finder drag.
-        const escaped = spacedFile.replace(/ /g, '\\ ')
+        const escaped = escapeFinderDraggedPath(spacedFile)
        expect(extractDraggedFilePaths(escaped)).toEqual([spacedFile])
      })
    })
--- a/src/utils/githubModelsCredentials.hydrate.test.ts
+++ b/src/utils/githubModelsCredentials.hydrate.test.ts
@@ -41,7 +41,7 @@ describe('hydrateGithubModelsTokenFromSecureStorage', () => {
    }))
    const { hydrateGithubModelsTokenFromSecureStorage } = await import(
-      './githubModelsCredentials.js'
+      './githubModelsCredentials.js?hydrate=sets-token'
    )
    hydrateGithubModelsTokenFromSecureStorage()
    expect(process.env.GITHUB_TOKEN).toBe('stored-secret')
@@ -62,7 +62,7 @@ describe('hydrateGithubModelsTokenFromSecureStorage', () => {
    }))
    const { hydrateGithubModelsTokenFromSecureStorage } = await import(
-      './githubModelsCredentials.js'
+      './githubModelsCredentials.js?hydrate=preserve-existing'
    )
    hydrateGithubModelsTokenFromSecureStorage()
    expect(process.env.GITHUB_TOKEN).toBe('already')
--- a/src/utils/githubModelsCredentials.test.ts
+++ b/src/utils/githubModelsCredentials.test.ts
@@ -1,13 +1,11 @@
 import { describe, expect, test } from 'bun:test'
 import {
  clearGithubModelsToken,
  readGithubModelsToken,
  saveGithubModelsToken,
 } from './githubModelsCredentials.js'
 describe('readGithubModelsToken', () => {
-  test('returns undefined in bare mode', () => {
+  test('returns undefined in bare mode', async () => {
    const { readGithubModelsToken } = await import(
      './githubModelsCredentials.js?read-bare-mode'
    )
    const prev = process.env.CLAUDE_CODE_SIMPLE
    process.env.CLAUDE_CODE_SIMPLE = '1'
    expect(readGithubModelsToken()).toBeUndefined()
@@ -20,7 +18,11 @@ describe('readGithubModelsToken', () => {
 })
 describe('saveGithubModelsToken / clearGithubModelsToken', () => {
-  test('save returns failure in bare mode', () => {
+  test('save returns failure in bare mode', async () => {
    const { saveGithubModelsToken } = await import(
      './githubModelsCredentials.js?save-bare-mode'
    )
    const prev = process.env.CLAUDE_CODE_SIMPLE
    process.env.CLAUDE_CODE_SIMPLE = '1'
    const r = saveGithubModelsToken('abc')
@@ -33,7 +35,11 @@ describe('saveGithubModelsToken / clearGithubModelsToken', () => {
    }
  })
-  test('clear succeeds in bare mode', () => {
+  test('clear succeeds in bare mode', async () => {
    const { clearGithubModelsToken } = await import(
      './githubModelsCredentials.js?clear-bare-mode'
    )
    const prev = process.env.CLAUDE_CODE_SIMPLE
    process.env.CLAUDE_CODE_SIMPLE = '1'
    expect(clearGithubModelsToken().success).toBe(true)
--- a/src/utils/githubModelsCredentials.ts
+++ b/src/utils/githubModelsCredentials.ts
@@ -23,6 +23,19 @@ export function readGithubModelsToken(): string | undefined {
  }
 }
 export async function readGithubModelsTokenAsync(): Promise<string | undefined> {
  if (isBareMode()) return undefined
  try {
    const data = (await getSecureStorage().readAsync()) as
      | ({ githubModels?: GithubModelsCredentialBlob } & Record<string, unknown>)
      | null
    const t = data?.githubModels?.accessToken?.trim()
    return t || undefined
  } catch {
    return undefined
  }
 }
 /**
 * If GitHub Models mode is on and no token is in the environment, copy the
 * stored token into process.env so the OpenAI shim and validation see it.
--- a/src/utils/model/modelOptions.github.test.ts
+++ b/src/utils/model/modelOptions.github.test.ts
@@ -1,7 +1,17 @@
-import { afterEach, expect, mock, test } from 'bun:test'
+import { afterEach, beforeEach, expect, mock, test } from 'bun:test'
 import { resetModelStringsForTestingOnly } from '../../bootstrap/state.js'
 import { saveGlobalConfig } from '../config.js'
 async function importFreshModelOptionsModule() {
  mock.restore()
  mock.module('./providers.js', () => ({
    getAPIProvider: () => 'github',
  }))
  const nonce = `${Date.now()}-${Math.random()}`
  return import(`./modelOptions.js?ts=${nonce}`)
 }
 const originalEnv = {
  CLAUDE_CODE_USE_GITHUB: process.env.CLAUDE_CODE_USE_GITHUB,
  CLAUDE_CODE_USE_OPENAI: process.env.CLAUDE_CODE_USE_OPENAI,
@@ -14,6 +24,20 @@ const originalEnv = {
  ANTHROPIC_CUSTOM_MODEL_OPTION: process.env.ANTHROPIC_CUSTOM_MODEL_OPTION,
 }
 beforeEach(() => {
  mock.restore()
  delete process.env.CLAUDE_CODE_USE_GITHUB
  delete process.env.CLAUDE_CODE_USE_OPENAI
  delete process.env.CLAUDE_CODE_USE_GEMINI
  delete process.env.CLAUDE_CODE_USE_BEDROCK
  delete process.env.CLAUDE_CODE_USE_VERTEX
  delete process.env.CLAUDE_CODE_USE_FOUNDRY
  delete process.env.OPENAI_MODEL
  delete process.env.OPENAI_BASE_URL
  delete process.env.ANTHROPIC_CUSTOM_MODEL_OPTION
  resetModelStringsForTestingOnly()
 })
 afterEach(() => {
  process.env.CLAUDE_CODE_USE_GITHUB = originalEnv.CLAUDE_CODE_USE_GITHUB
  process.env.CLAUDE_CODE_USE_OPENAI = originalEnv.CLAUDE_CODE_USE_OPENAI
@@ -34,17 +58,9 @@ afterEach(() => {
    providerProfiles: [],
    activeProviderProfileId: undefined,
  }))
  resetModelStringsForTestingOnly()
 })
 async function importFreshModelOptionsModule() {
  mock.restore()
  mock.module('./providers.js', () => ({
    getAPIProvider: () => 'github',
  }))
  const nonce = `${Date.now()}-${Math.random()}`
  return import(`./modelOptions.js?ts=${nonce}`)
 }
 test('GitHub provider exposes only default + GitHub model in /model options', async () => {
  process.env.CLAUDE_CODE_USE_GITHUB = '1'
  delete process.env.CLAUDE_CODE_USE_OPENAI
@@ -58,7 +74,9 @@ test('GitHub provider exposes only default + GitHub model in /model options', as
  const { getModelOptions } = await importFreshModelOptionsModule()
  const options = getModelOptions(false)
-  const nonDefault = options.filter(option => option.value !== null)
+  const nonDefault = options.filter(
    (option: { value: unknown }) => option.value !== null,
  )
  expect(nonDefault.length).toBe(1)
  expect(nonDefault[0]?.value).toBe('github:copilot')
--- a/src/utils/model/openaiContextWindows.ts
+++ b/src/utils/model/openaiContextWindows.ts
@@ -44,6 +44,10 @@ const OPENAI_CONTEXT_WINDOWS: Record<string, number> = {
  'mistral-large-latest':     131_072,
  'mistral-small-latest':     131_072,
  // MiniMax
  'MiniMax-M2.7':             204_800,
  'minimax-m2.7':             204_800,
  // Google (via OpenRouter)
  'google/gemini-2.0-flash':1_048_576,
  'google/gemini-2.5-pro':  1_048_576,
@@ -110,6 +114,10 @@ const OPENAI_MAX_OUTPUT_TOKENS: Record<string, number> = {
  'mistral-large-latest':     32_768,
  'mistral-small-latest':     32_768,
  // MiniMax
  'MiniMax-M2.7':            131_072,
  'minimax-m2.7':            131_072,
  // Google (via OpenRouter)
  'google/gemini-2.0-flash':   8_192,
  'google/gemini-2.5-pro':    65_536,
--- a/src/utils/providerFlag.test.ts
+++ b/src/utils/providerFlag.test.ts
@@ -1,4 +1,4 @@
-import { describe, expect, test, afterEach } from 'bun:test'
+import { afterEach, beforeEach, describe, expect, test } from 'bun:test'
 import {
  parseProviderFlag,
  applyProviderFlag,
@@ -8,18 +8,26 @@ import {
 const originalEnv = { ...process.env }
 const RESET_KEYS = [
  'CLAUDE_CODE_USE_OPENAI',
  'CLAUDE_CODE_USE_GEMINI',
  'CLAUDE_CODE_USE_GITHUB',
  'CLAUDE_CODE_USE_BEDROCK',
  'CLAUDE_CODE_USE_VERTEX',
  'OPENAI_BASE_URL',
  'OPENAI_API_KEY',
  'OPENAI_MODEL',
  'GEMINI_MODEL',
 ] as const
 beforeEach(() => {
  for (const key of RESET_KEYS) {
    delete process.env[key]
  }
 })
 afterEach(() => {
-  for (const key of [
+  for (const key of RESET_KEYS) {
    'CLAUDE_CODE_USE_OPENAI',
    'CLAUDE_CODE_USE_GEMINI',
    'CLAUDE_CODE_USE_GITHUB',
    'CLAUDE_CODE_USE_BEDROCK',
    'CLAUDE_CODE_USE_VERTEX',
    'OPENAI_BASE_URL',
    'OPENAI_API_KEY',
    'OPENAI_MODEL',
    'GEMINI_MODEL',
  ]) {
    if (originalEnv[key] === undefined) delete process.env[key]
    else process.env[key] = originalEnv[key]
  }
--- a/src/utils/providerProfiles.test.ts
+++ b/src/utils/providerProfiles.test.ts
@@ -2,6 +2,10 @@ import { afterEach, describe, expect, mock, test } from 'bun:test'
 import type { ProviderProfile } from './config.js'
 async function importFreshProvidersModule() {
  return import(`./model/providers.ts?ts=${Date.now()}-${Math.random()}`)
 }
 const originalEnv = { ...process.env }
 const RESTORED_KEYS = [
@@ -96,24 +100,26 @@ function buildProfile(overrides: Partial<ProviderProfile> = {}): ProviderProfile
 describe('applyProviderProfileToProcessEnv', () => {
  test('openai profile clears competing gemini/github flags', async () => {
-    const { applyProviderProfileToProcessEnv, getAPIProvider } =
+    const { applyProviderProfileToProcessEnv } =
      await importFreshProviderProfileModules()
    process.env.CLAUDE_CODE_USE_GEMINI = '1'
    process.env.CLAUDE_CODE_USE_GITHUB = '1'
    applyProviderProfileToProcessEnv(buildProfile())
    const { getAPIProvider: getFreshAPIProvider } =
      await importFreshProvidersModule()
    expect(process.env.CLAUDE_CODE_USE_GEMINI).toBeUndefined()
    expect(process.env.CLAUDE_CODE_USE_GITHUB).toBeUndefined()
-    expect(process.env.CLAUDE_CODE_USE_OPENAI).toBe('1')
+    expect(String(process.env.CLAUDE_CODE_USE_OPENAI)).toBe('1')
    expect(process.env.CLAUDE_CODE_PROVIDER_PROFILE_ENV_APPLIED_ID).toBe(
      'provider_test',
    )
-    expect(getAPIProvider()).toBe('openai')
+    expect(getFreshAPIProvider()).toBe('openai')
  })
  test('anthropic profile clears competing gemini/github flags', async () => {
-    const { applyProviderProfileToProcessEnv, getAPIProvider } =
+    const { applyProviderProfileToProcessEnv } =
      await importFreshProviderProfileModules()
    process.env.CLAUDE_CODE_USE_GEMINI = '1'
    process.env.CLAUDE_CODE_USE_GITHUB = '1'
@@ -125,11 +131,13 @@ describe('applyProviderProfileToProcessEnv', () => {
        model: 'claude-sonnet-4-6',
      }),
    )
    const { getAPIProvider: getFreshAPIProvider } =
      await importFreshProvidersModule()
    expect(process.env.CLAUDE_CODE_USE_GEMINI).toBeUndefined()
    expect(process.env.CLAUDE_CODE_USE_GITHUB).toBeUndefined()
    expect(process.env.CLAUDE_CODE_USE_OPENAI).toBeUndefined()
-    expect(getAPIProvider()).toBe('firstParty')
+    expect(getFreshAPIProvider()).toBe('firstParty')
  })
 })
@@ -177,7 +185,7 @@ describe('applyActiveProviderProfileFromConfig', () => {
    } as any)
    expect(applied).toBeUndefined()
-    expect(process.env.CLAUDE_CODE_USE_OPENAI).toBe('1')
+    expect(String(process.env.CLAUDE_CODE_USE_OPENAI)).toBe('1')
    expect(process.env.OPENAI_BASE_URL).toBe('http://localhost:11434/v1')
    expect(process.env.OPENAI_MODEL).toBe('qwen2.5:3b')
  })
@@ -267,7 +275,7 @@ describe('applyActiveProviderProfileFromConfig', () => {
    } as any)
    expect(applied?.id).toBe('saved_openai')
-    expect(process.env.CLAUDE_CODE_USE_OPENAI).toBe('1')
+    expect(String(process.env.CLAUDE_CODE_USE_OPENAI)).toBe('1')
    expect(process.env.OPENAI_BASE_URL).toBe('https://api.openai.com/v1')
    expect(process.env.OPENAI_MODEL).toBe('gpt-4o')
  })
@@ -286,10 +294,10 @@ describe('persistActiveProviderProfileModel', () => {
      model: 'kimi-k2.5:cloud',
    })
-      saveMockGlobalConfig(current => ({
+    saveMockGlobalConfig(current => ({
-        ...current,
+      ...current,
-        providerProfiles: [activeProfile],
+      providerProfiles: [activeProfile],
-        activeProviderProfileId: activeProfile.id,
+      activeProviderProfileId: activeProfile.id,
    }))
    applyProviderProfileToProcessEnv(activeProfile)
@@ -303,7 +311,7 @@ describe('persistActiveProviderProfileModel', () => {
    )
    const saved = getProviderProfiles().find(
-      profile => profile.id === activeProfile.id,
+      (profile: ProviderProfile) => profile.id === activeProfile.id,
    )
    expect(saved?.model).toBe('minimax-m2.5:cloud')
  })
@@ -333,7 +341,7 @@ describe('persistActiveProviderProfileModel', () => {
    expect(process.env.OPENAI_MODEL).toBe('cli-model')
    const saved = getProviderProfiles().find(
-      profile => profile.id === activeProfile.id,
+      (profile: ProviderProfile) => profile.id === activeProfile.id,
    )
    expect(saved?.model).toBe('minimax-m2.5:cloud')
  })
@@ -414,7 +422,7 @@ describe('deleteProviderProfile', () => {
    expect(result.activeProfileId).toBeUndefined()
    expect(process.env.CLAUDE_CODE_PROVIDER_PROFILE_ENV_APPLIED).toBeUndefined()
-    expect(process.env.CLAUDE_CODE_USE_OPENAI).toBe('1')
+    expect(String(process.env.CLAUDE_CODE_USE_OPENAI)).toBe('1')
    expect(process.env.OPENAI_BASE_URL).toBe('http://localhost:11434/v1')
    expect(process.env.OPENAI_MODEL).toBe('qwen2.5:3b')
  })
--- a/src/utils/ripgrep.test.ts
+++ b/src/utils/ripgrep.test.ts
@@ -1,11 +1,52 @@
 import { expect, test } from 'bun:test'
 import path from 'path'
-import { wrapRipgrepUnavailableError } from './ripgrep.ts'
+import { resolveRipgrepConfig, wrapRipgrepUnavailableError } from './ripgrep.js'
 const MOCK_BUILTIN_PATH = path.normalize(
  process.platform === 'win32'
    ? `vendor/ripgrep/${process.arch}-win32/rg.exe`
    : `vendor/ripgrep/${process.arch}-${process.platform}/rg`,
 )
 test('ripgrepCommand falls back to system rg when builtin binary is missing', () => {
  const config = resolveRipgrepConfig({
    userWantsSystemRipgrep: false,
    bundledMode: false,
    builtinCommand: MOCK_BUILTIN_PATH,
    builtinExists: false,
    systemExecutablePath: '/usr/bin/rg',
    processExecPath: '/fake/bun',
  })
  expect(config).toMatchObject({
    mode: 'system',
    command: 'rg',
    args: [],
  })
 })
 test('ripgrepCommand keeps builtin mode when bundled binary exists', () => {
  const config = resolveRipgrepConfig({
    userWantsSystemRipgrep: false,
    bundledMode: false,
    builtinCommand: MOCK_BUILTIN_PATH,
    builtinExists: true,
    systemExecutablePath: '/usr/bin/rg',
    processExecPath: '/fake/bun',
  })
  expect(config).toMatchObject({
    mode: 'builtin',
    command: MOCK_BUILTIN_PATH,
    args: [],
  })
 })
 test('wrapRipgrepUnavailableError explains missing packaged fallback', () => {
  const error = wrapRipgrepUnavailableError(
    { code: 'ENOENT', message: 'spawn rg ENOENT' },
-    { mode: 'builtin', command: 'C:\\fake\\vendor\\ripgrep\\rg.exe' },
+    { mode: 'builtin', command: 'C:\\fake\\vendor\\ripgrep\\rg.exe', args: [] },
    'win32',
  )
@@ -18,7 +59,7 @@ test('wrapRipgrepUnavailableError explains missing packaged fallback', () => {
 test('wrapRipgrepUnavailableError explains missing system ripgrep', () => {
  const error = wrapRipgrepUnavailableError(
    { code: 'ENOENT', message: 'spawn rg ENOENT' },
-    { mode: 'system', command: 'rg' },
+    { mode: 'system', command: 'rg', args: [] },
    'linux',
  )
--- a/src/utils/ripgrep.ts
+++ b/src/utils/ripgrep.ts
@@ -1,5 +1,6 @@
 import type { ChildProcess, ExecFileException } from 'child_process'
 import { execFile, spawn } from 'child_process'
 import { existsSync } from 'fs'
 import memoize from 'lodash-es/memoize.js'
 import { homedir } from 'os'
 import * as path from 'path'
@@ -30,40 +31,72 @@ type RipgrepConfig = {
 type RipgrepErrorLike = Pick<NodeJS.ErrnoException, 'code' | 'message'>
-const getRipgrepConfig = memoize((): RipgrepConfig => {
+function isErrnoException(error: unknown): error is NodeJS.ErrnoException {
-  const userWantsSystemRipgrep = isEnvDefinedFalsy(
+  return error instanceof Error
-    process.env.USE_BUILTIN_RIPGREP,
+}
  )
-  // Try system ripgrep if user wants it
+type ResolveRipgrepConfigArgs = {
-  if (userWantsSystemRipgrep) {
+  userWantsSystemRipgrep: boolean
-    const { cmd: systemPath } = findExecutable('rg', [])
+  bundledMode: boolean
-    if (systemPath !== 'rg') {
+  builtinCommand: string
-      // SECURITY: Use command name 'rg' instead of systemPath to prevent PATH hijacking
+  builtinExists: boolean
-      // If we used systemPath, a malicious ./rg.exe in current directory could be executed
+  systemExecutablePath: string
-      // Using just 'rg' lets the OS resolve it safely with NoDefaultCurrentDirectoryInExePath protection
+  processExecPath?: string
-      return { mode: 'system', command: 'rg', args: [] }
+}
-    }
+
 export function resolveRipgrepConfig({
  userWantsSystemRipgrep,
  bundledMode,
  builtinCommand,
  builtinExists,
  systemExecutablePath,
  processExecPath = process.execPath,
 }: ResolveRipgrepConfigArgs): RipgrepConfig {
  if (userWantsSystemRipgrep && systemExecutablePath !== 'rg') {
    // SECURITY: Use command name 'rg' instead of systemExecutablePath to prevent PATH hijacking
    return { mode: 'system', command: 'rg', args: [] }
  }
-  // In bundled (native) mode, ripgrep is statically compiled into bun-internal
+  if (bundledMode) {
  // and dispatches based on argv[0]. We spawn ourselves with argv0='rg'.
  if (isInBundledMode()) {
    return {
      mode: 'embedded',
-      command: process.execPath,
+      command: processExecPath,
      args: ['--no-config'],
      argv0: 'rg',
    }
  }
  if (builtinExists) {
    return { mode: 'builtin', command: builtinCommand, args: [] }
  }
  if (systemExecutablePath !== 'rg') {
    return { mode: 'system', command: 'rg', args: [] }
  }
  return { mode: 'builtin', command: builtinCommand, args: [] }
 }
 const getRipgrepConfig = memoize((): RipgrepConfig => {
  const userWantsSystemRipgrep = isEnvDefinedFalsy(
    process.env.USE_BUILTIN_RIPGREP,
  )
  const bundledMode = isInBundledMode()
  const rgRoot = path.resolve(__dirname, 'vendor', 'ripgrep')
-  const command =
+  const builtinCommand =
    process.platform === 'win32'
      ? path.resolve(rgRoot, `${process.arch}-win32`, 'rg.exe')
      : path.resolve(rgRoot, `${process.arch}-${process.platform}`, 'rg')
  const builtinExists = existsSync(builtinCommand)
  const { cmd: systemExecutablePath } = findExecutable('rg', [])
-  return { mode: 'builtin', command, args: [] }
+  return resolveRipgrepConfig({
    userWantsSystemRipgrep,
    bundledMode,
    builtinCommand,
    builtinExists,
    systemExecutablePath,
  })
 })
 export function ripgrepCommand(): {
@@ -324,7 +357,9 @@ async function ripGrepFileCount(
      if (settled) return
      settled = true
      reject(
-        err.code === 'ENOENT' ? wrapRipgrepUnavailableError(err) : err,
+        isErrnoException(err) && err.code === 'ENOENT'
          ? wrapRipgrepUnavailableError(err)
          : err,
      )
    })
  })
@@ -388,7 +423,9 @@ export async function ripGrepStream(
      if (settled) return
      settled = true
      reject(
-        err.code === 'ENOENT' ? wrapRipgrepUnavailableError(err) : err,
+        isErrnoException(err) && err.code === 'ENOENT'
          ? wrapRipgrepUnavailableError(err)
          : err,
      )
    })
  })
@@ -436,7 +473,9 @@ export async function ripGrep(
      const CRITICAL_ERROR_CODES = ['ENOENT', 'EACCES', 'EPERM']
      if (CRITICAL_ERROR_CODES.includes(error.code as string)) {
        reject(
-          error.code === 'ENOENT' ? wrapRipgrepUnavailableError(error) : error,
+          isErrnoException(error) && error.code === 'ENOENT'
            ? wrapRipgrepUnavailableError(error)
            : error,
        )
        return
      }
--- a/src/utils/schemaSanitizer.test.ts
+++ b/src/utils/schemaSanitizer.test.ts
@@ -0,0 +1,68 @@
 import { describe, expect, test } from 'bun:test'
 import { sanitizeSchemaForOpenAICompat } from './schemaSanitizer'
 describe('sanitizeSchemaForOpenAICompat', () => {
  test('preserves Grep-like properties.pattern while keeping it required', () => {
    const schema = {
      type: 'object',
      properties: {
        pattern: {
          type: 'string',
          description: 'The regular expression pattern to search for in file contents',
        },
        path: { type: 'string' },
        glob: { type: 'string' },
      },
      required: ['pattern'],
    }
    const sanitized = sanitizeSchemaForOpenAICompat(schema)
    const properties = sanitized.properties as Record<string, unknown> | undefined
    expect(Object.keys(properties ?? {})).toEqual(['pattern', 'path', 'glob'])
    expect(properties?.pattern).toEqual({
      type: 'string',
      description: 'The regular expression pattern to search for in file contents',
    })
    expect(sanitized.required).toEqual(['pattern'])
  })
  test('preserves Glob-like properties.pattern while keeping it required', () => {
    const schema = {
      type: 'object',
      properties: {
        pattern: {
          type: 'string',
          description: 'The glob pattern to match files against',
        },
        path: { type: 'string' },
      },
      required: ['pattern'],
    }
    const sanitized = sanitizeSchemaForOpenAICompat(schema)
    const properties = sanitized.properties as Record<string, unknown> | undefined
    expect(Object.keys(properties ?? {})).toEqual(['pattern', 'path'])
    expect(properties?.pattern).toEqual({
      type: 'string',
      description: 'The glob pattern to match files against',
    })
    expect(sanitized.required).toEqual(['pattern'])
  })
  test('strips JSON Schema validator pattern from string schemas', () => {
    const schema = {
      type: 'string',
      pattern: '^[a-z]+$',
      minLength: 1,
    }
    const sanitized = sanitizeSchemaForOpenAICompat(schema)
    expect(sanitized).toEqual({
      type: 'string',
    })
  })
 })
--- a/src/utils/schemaSanitizer.ts
+++ b/src/utils/schemaSanitizer.ts
@@ -33,6 +33,15 @@ function stripSchemaKeywords(schema: unknown, keywords: Set<string>): unknown {
  const result: Record<string, unknown> = {}
  for (const [key, value] of Object.entries(schema)) {
    if (key === 'properties' && isSchemaRecord(value)) {
      const sanitizedProps: Record<string, unknown> = {}
      for (const [propName, propSchema] of Object.entries(value)) {
        sanitizedProps[propName] = stripSchemaKeywords(propSchema, keywords)
      }
      result[key] = sanitizedProps
      continue
    }
    if (keywords.has(key)) {
      continue
    }
@@ -215,10 +224,13 @@ export function sanitizeSchemaForOpenAICompat(
    }
  }
-  if (Array.isArray(record.required) && isSchemaRecord(record.properties)) {
+  const properties = isSchemaRecord(record.properties)
    ? record.properties
    : undefined
  if (Array.isArray(record.required) && properties) {
    record.required = record.required.filter(
-      (value): value is string =>
+      (value): value is string => typeof value === 'string' && value in properties,
        typeof value === 'string' && value in record.properties,
    )
  }
--- a/src/utils/staticRender.tsx
+++ b/src/utils/staticRender.tsx
@@ -97,8 +97,12 @@ export function renderToAnsiString(node: React.ReactNode, columns?: number): Pro
      patchConsole: false
    });
-    // Wait for the component to exit naturally
+    // Wait for the component to exit naturally, with a timeout guard so
-    await instance.waitUntilExit();
+    // tests never hang indefinitely if a render error prevents exit().
    await Promise.race([
      instance.waitUntilExit(),
      new Promise<void>(resolve => setTimeout(resolve, 3000)),
    ]);
    // Extract only the first frame's content to avoid duplication
    // (Ink outputs multiple frames in non-TTY mode)
Author	SHA1	Message	Date
OpenClaude Worker 3	d51256df6f	fix: replace isDeepStrictEqual with navigation-aware options comparison The select cursor highlight was broken because isDeepStrictEqual in use-select-navigation.ts and use-multi-select-state.ts would fail when options contained identity-unstable properties (JSX label elements, function onChange callbacks, computed disabled booleans). This caused the reset logic to fire on every re-render, resetting focusedValue back to the first option. Replace isDeepStrictEqual with optionsNavigateEqual which only compares properties that affect navigation behavior: value, disabled, and type. ReactNode labels and function callbacks are intentionally excluded as they are identity-unstable but don't change navigation semantics. Fixes #472	2026-04-08 13:58:18 +05:30
lunamonke	3188f6ac66	fix example agents (#438 )	2026-04-08 02:55:27 +08:00
Kevin Codex	69ea1f1e4a	fix: restore default context window for unknown 3p models (#494 ) * fix: restore default context window for unknown 3p models * fix: add MiniMax context metadata	2026-04-08 02:45:49 +08:00
KRATOS	f9ce81bfb3	fix: handle missing skill parameter in SkillTool (#485 ) * fix: handle missing skill parameter in SkillTool * fix: preserve SkillTool schema contract * fix: align SkillTool schema error output	2026-04-08 00:33:52 +08:00
Juan Camilo Auriti	4975cfc2e0	fix: strip Anthropic params from 3P resume paths (#479 ) * fix: strip Anthropic-specific params from 3P provider paths Three silent failure modes affecting all third-party provider users: 1. Thinking blocks serialized as <thinking> text corrupt multi-turn context — strip them instead of converting to raw text tags. 2. Unknown models fall through to 200k context window default, so auto-compact never triggers — use conservative 8k for unknown 3P models with a warning log. 3. Session resume with thinking blocks causes 400 or context corruption on 3P providers — strip thinking/redacted_thinking content blocks from deserialized messages when resuming against a non-Anthropic provider. Addresses findings 2, 3, and 5 from #248. * test: align resume stripping expectation with orphan-thinking filter * test: isolate provider env in conversation recovery tests * test: move provider-sensitive resume coverage behind module mocks * test: trim extra blank lines in conversation recovery test Keep the focused provider-resume test diff clean so the regression branch stays easy to review. Co-Authored-By: Claude Opus 4.6 <noreply@openclaude.dev> --------- Co-authored-by: Claude Opus 4.6 <noreply@openclaude.dev>	2026-04-07 23:24:10 +08:00
ibaaaaal	600c01faf7	fix: restore Grep and Glob reliability on OpenAI paths (#461 ) * fix: restore Grep and Glob reliability on OpenAI paths Preserve Grep and Glob pattern fields during OpenAI/Codex schema sanitization, and fall back to system ripgrep when the packaged binary is missing. This keeps search tool schemas intact and improves Linux usability for npm/source installs. Co-Authored-By: Claude Opus 4.6 <noreply@openclaude.dev> * test: clean up ripgrep fallback test helpers Remove the unused ripgrepCommand import and normalize mocked builtin ripgrep paths so the test behaves consistently across platforms. Co-Authored-By: Claude Opus 4.6 <noreply@openclaude.dev> * test: remove duplicate Codex URI schema case Drop the duplicated WebFetch URI-format test in codexShim.test.ts so test names stay unique and failures remain easier to read. Co-Authored-By: Claude Opus 4.6 <noreply@openclaude.dev> * test: stabilize ripgrep fallback coverage Avoid fs/module mocking in ripgrep fallback tests by extracting the config selection logic into a pure helper. This preserves the fallback coverage while removing the test interaction that caused the narrowed Bun hang repro. Co-Authored-By: Claude Opus 4.6 <noreply@openclaude.dev> * test: tighten ripgrep and schema coverage Align the ripgrep fallback test with the actual auto-fallback branch, clean up strict typing in schema sanitizer tests, and tighten ripgrep error narrowing for type safety. Co-Authored-By: Claude Opus 4.6 <noreply@openclaude.dev> --------- Co-authored-by: Claude Opus 4.6 <noreply@openclaude.dev>	2026-04-07 17:26:00 +08:00
makskopchan-tech	b07bafa5bd	Security code scanning (#459 ) * fix: address code scanning alerts Parse Gemini hostnames instead of matching raw URL substrings, redact gRPC error logs, and harden the Finder drag-drop test escape helper so the flagged paths are fixed without regressing working behavior. * Potential fix for pull request finding 'CodeQL / Clear-text logging of sensitive information' Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com> * fix: restore safe grpc error summaries A later autofix commit removed the exported gRPC error summarizer while the new regression test still imported it. Restore the safe name/code-only summary so CI stays green without reintroducing clear-text logging. * fix: keep grpc logging generic Remove the stale helper/test pair and keep the gRPC startup and stream logs free of error-derived data so the CodeQL clear-text logging alert stays closed while the rest of the security fixes remain intact. --------- Co-authored-by: OpenClaude Worker 3 <worker-3@openclaude.local> Co-authored-by: Vasanth T <148849890+Vasanthdev2004@users.noreply.github.com> Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com>	2026-04-07 16:03:16 +08:00
changjiaoxigua	85aa8b0985	fix: add File polyfill for Node < 20 to prevent startup deadlock with proxy (#442 ) When a proxy is configured, configureGlobalAgents() loads undici to set a global dispatcher. However, undici v7.24.6 requires Node.js >= 20.18.1 and references globalThis.File at module evaluation time for webidl type assertions. Node 18 lacks the File global, causing ReferenceError inside the bundled __commonJS require chain, which deadlocks due to unresolved circular dependencies in the module initialization. Fix by polyfilling globalThis.File early in cli.tsx entrypoint, before any undici code loads. Try node:buffer.File (available in Node 18.13+), fallback to minimal Blob-based stub. Fixes: bun run start hangs indefinitely when HTTP_PROXY/HTTPS_PROXY is set Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>	2026-04-07 16:02:05 +08:00
Vasanth T	e365cb4010	fix: address code scanning alerts (#434 ) * fix: address code scanning alerts Parse Gemini hostnames instead of matching raw URL substrings, redact gRPC error logs, and harden the Finder drag-drop test escape helper so the flagged paths are fixed without regressing working behavior. * Potential fix for pull request finding 'CodeQL / Clear-text logging of sensitive information' Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com> * fix: restore safe grpc error summaries A later autofix commit removed the exported gRPC error summarizer while the new regression test still imported it. Restore the safe name/code-only summary so CI stays green without reintroducing clear-text logging. * fix: keep grpc logging generic Remove the stale helper/test pair and keep the gRPC startup and stream logs free of error-derived data so the CodeQL clear-text logging alert stays closed while the rest of the security fixes remain intact. --------- Co-authored-by: OpenClaude Worker 3 <worker-3@openclaude.local> Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com>	2026-04-07 00:43:09 +08:00
CRABHIVE	52d33a87a0	fix: include MCP tool results in microcompact to reduce token waste (#348 ) ## Summary - Added `isCompactableTool()` helper in `microCompact.ts` that matches both the existing COMPACTABLE_TOOLS set and any tool prefixed `mcp__` - MCP tool results were never compacted because the hardcoded allowlist only contained 9 built-in tools — MCP tools fell through and persisted in full for the entire session, wasting 10-500K tokens/session ## Impact - user-facing impact: long sessions using MCP servers (GitHub, Slack, Playwright, etc.) will compact stale MCP tool results, reducing token usage and delaying autocompact triggers - developer/maintainer impact: new MCP servers are automatically covered via prefix match — no need to update the allowlist per-server ## Testing - [x] `bun run build` - [x] `bun run smoke` - [x] focused tests: `bun test src/services/compact/microCompact.test.ts` - module exports load correctly - estimateMessageTokens counts MCP tool_use blocks - microcompactMessages processes MCP tools without error - microcompactMessages processes mixed built-in and MCP tools ## Notes - provider/model path tested: n/a (compaction logic is model-agnostic) - screenshots attached (if UI changed): n/a - follow-up work or known limitations: subagent results and thinking blocks are still not compacted (separate RFCs) https://claude.ai/code/session_01D7kprMn4c66a5WrZscF7rv Co-authored-by: Claude <noreply@anthropic.com>	2026-04-06 23:13:20 +08:00
KRATOS	b4bd95b477	fix: normalize malformed Bash tool arguments from OpenAI-compatible providers (#385 ) * fix: normalize malformed Bash tool arguments from OpenAI-compatible providers * fix: keep invalid Bash tool args from becoming commands * fix: preserve malformed Bash JSON literals * test: stabilize rebased PR 385 checks * test: isolate provider profile env assertions * fix: extend tool argument normalization to all tools and harden edge cases - Extend STRING_ARGUMENT_TOOL_FIELDS to normalize Read, Write, Edit, Glob, and Grep plain-string arguments (fixes "Invalid tool parameters" errors reported by VennDev) - Normalize streaming Bash args regardless of finish_reason, not only when finish_reason is 'tool_calls' - Broaden isLikelyStructuredObjectLiteral to catch malformed object-shaped strings like {command:"pwd"} and {'command':'pwd'} (fixes CR2 from Vasanthdev2004) - Apply blank/object-literal guard to all tools, not just Bash - Extract duplicated JSON repair suffix combinations into shared constant - Add 32 isolated unit tests for toolArgumentNormalization Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com> * fix: skip streaming normalization on finish_reason length Truncated tool calls (finish_reason: 'length') now preserve the raw buffer instead of normalizing into executable commands, preventing incomplete commands from becoming runnable. Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com> * fix: comprehensive tool argument normalization hardening - Remove all { raw: ... } returns that caused InputValidationError with z.strictObject schemas — return {} instead for clean Zod errors - Extend normalizeAtStop buffering to all mapped tools (Read, Write, Edit, Glob, Grep) so streaming paths also get normalized - Make repairPossiblyTruncatedObjectJson generic — repair any valid JSON object, not just ones with a command field - Export hasToolFieldMapping for streaming normalizeAtStop decision - Skip normalization on finish_reason: length to preserve raw truncated buffer - Update all test expectations to match new behavior Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com> --------- Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>	2026-04-06 22:08:45 +08:00
Otávio Carvalho	1e057025d6	Fix GLM-5 and other reasoning models appearing to hang via OpenAI shim (#365 ) * Fix GLM-5 and other reasoning models appearing to hang via OpenAI shim Reasoning models like GLM-5 and DeepSeek stream chain-of-thought in `reasoning_content` while `content` stays empty (""). The OpenAI shim only read `delta.content`, so it saw empty strings and never emitted any Anthropic stream events — causing the UI to appear frozen. - Add `reasoning_content` to streaming chunk and non-streaming response types - Emit `reasoning_content` as thinking blocks (thinking_delta) in streaming mode - Properly transition from thinking to text blocks when content phase begins - Fall back to `reasoning_content` in non-streaming mode when content is null Fixes #214 Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com> * Fix non-streaming reasoning_content fallback and add tests - Use explicit empty-string check instead of \|\| for content fallback so content: "" doesn't leak reasoning_content as visible text - Close thinking block before tool call blocks in streaming path - Add non-streaming and streaming reasoning_content tests Co-Authored-By: GLM-5.1 <noreply@openclaude.dev> * Fix flaky Ink reconciler tests caused by react-compiler memoization Remove hard throw in createTextInstance that crashed when hostContext.isInsideText was stale due to react-compiler element caching. Add timeout guards to prevent test hangs when render errors prevent exit() from firing. Co-Authored-By: Claude GLM-5.1 <noreply@openclaude.dev> --------- Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com> Co-authored-by: GLM-5.1 <noreply@openclaude.dev>	2026-04-06 22:02:29 +08:00
Agent_J	aff2bd87e4	fix: avoid sync github credential reads in provider manager (#428 ) * fix: avoid sync github credential reads in provider manager * test: stabilize provider manager async credential test * fix: avoid first-frame github provider false negative --------- Co-authored-by: KRATOS <84986124+gnanam1990@users.noreply.github.com>	2026-04-06 21:29:53 +08:00
hsain9357	72e6a945fe	Fixed gemini error Function call is missing a thought_signature in functionCall parts (#426 ) * docs(docs): add agent guidance and repository instructions - Created `AGENTS.md` and `CLAUDE.md` to provide high-signal guidance for AI agents and developers working in the repository. - Outlined critical developer commands for building, testing, and running diagnostics using `bun`. - Documented the repository architecture, source entrypoints, and core service logic. - Defined framework-specific quirks, including module stubbing for internal modules and macro versioning. - Established style and workflow guidelines regarding telemetry, environment variables, and security scan requirements. * feat(api): support gemini thought signatures in openai shim - Added `isGeminiMode` utility to detect Gemini backends via `CLAUDE_CODE_USE_GEMINI` or `OPENAI_BASE_URL`. - Updated `convertMessages` to extract `thought_signature` from thinking blocks and inject them into tool calls. - Implemented a fallback mechanism that provides a `skip_thought_signature_validator` string to avoid 400 validation errors when a signature is missing. - Enhanced `openaiStreamToAnthropic` and `OpenAIShimMessages` to correctly preserve and pass through Gemini-specific metadata in `extra_content`. * refactor(api): improve gemini metadata handling and remove redundant docs - Updated `src/services/api/openaiShim.ts` to merge existing `google`-specific metadata within `extra_content` instead of overwriting it. - Simplified the `thought_signature` assignment logic to use a fallback value of `skip_thought_signature_validator` when no signature is provided. - Deleted `AGENTS.md` and `CLAUDE.md` files to eliminate redundant agent guidance documentation. * fix(api): propagate gemini thought signatures to all parallel tool calls - Removed the index constraint when assigning the `signature` from a `thinkingBlock` to tool calls in `openaiShim.ts`. - Ensured that the `thought_signature` is applied to every tool call in a parallel set, rather than just the first one. - Aligned the shim with Gemini API requirements, which mandate that the same signature must be present on every replayed function call part within an assistant turn.	2026-04-06 21:04:49 +08:00