fix: prevent agent communication bounds from hiding CI regressions

Tighten the UDS auth, framing, and response-reader boundaries while keeping the AgentSummary lifecycle covered so Codecov and CI fail on real regressions instead of missing coverage. The poorMode settings mock mirrors unrelated real settings defaults to avoid Bun mock retention changing later permission tests. Constraint: PR #369 must fix Codecov/CI precisely without warning suppression, fallback masking, or mock pollution Rejected: Delete AgentSummary lifecycle coverage | would hide Codecov loss and stale-summary behavior Rejected: Store inline UDS rejection in a hidden input sentinel | cloned observable inputs can drop it and bypass rejection Rejected: Ignore malformed UDS frames until timeout | leaves client slots and SendMessage calls open to exhaustion Confidence: high Scope-risk: moderate Directive: Keep empty #token= markers rejected; do not require a non-empty token value in hasInlineUdsToken Tested: bun test packages/builtin-tools/src/tools/SendMessageTool/__tests__/udsRecipientSanitization.test.ts src/utils/__tests__/udsMessaging.test.ts src/utils/__tests__/udsResponseReader.test.ts src/utils/__tests__/ndjsonFramer.test.ts Tested: bunx tsc --noEmit --pretty false Tested: bun run lint Tested: bun test --coverage --coverage-reporter lcov --coverage-dir coverage Tested: bun run test:all Tested: bun audit Tested: bun run build Tested: bun run build:vite Not-tested: GitHub-hosted Codecov upload until pushed PR checks rerun
fix: harden bounded agent communication review fixes
2026-06-15 21:05:51 +00:00 · 2026-04-27 14:51:22 +08:00 · 2026-04-27 10:32:18 +08:00 · 2026-04-26 21:44:42 +08:00
60 changed files with 4121 additions and 3904 deletions
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
  "name": "claude-code-best",
-  "version": "1.10.4",
+  "version": "1.10.2",
  "description": "Reverse-engineered Anthropic Claude Code CLI — interactive AI coding assistant in the terminal",
  "type": "module",
  "author": "claude-code-best <claude-code-best@proton.me>",
--- a/packages/@ant/model-provider/src/index.ts
+++ b/packages/@ant/model-provider/src/index.ts
@@ -61,10 +61,3 @@ export { anthropicMessagesToOpenAI } from './shared/openaiConvertMessages.js'
 export type { ConvertMessagesOptions } from './shared/openaiConvertMessages.js'
 export { anthropicToolsToOpenAI, anthropicToolChoiceToOpenAI } from './shared/openaiConvertTools.js'
 export { adaptOpenAIStreamToAnthropic } from './shared/openaiStreamAdapter.js'
-
-// Codex provider utilities
-export { normalizeCodexCallId, resolveCodexCallId, createCodexFallbackCallId } from './providers/codex/callIds.js'
-export { resolveCodexModel, resolveCodexMaxTokens } from './providers/codex/modelMapping.js'
-export { anthropicMessagesToCodexInput } from './providers/codex/convertMessages.js'
-export type { CodexImageConversionOptions } from './providers/codex/convertMessages.js'
-export { anthropicToolsToCodex } from './providers/codex/convertTools.js'
--- a/packages/@ant/model-provider/src/providers/codex/tests/modelMapping.test.ts
+++ b/packages/@ant/model-provider/src/providers/codex/tests/modelMapping.test.ts
@@ -1,94 +0,0 @@
-import { describe, expect, test, beforeEach, afterEach } from 'bun:test'
-import { resolveCodexModel } from '../modelMapping.js'
-
-describe('resolveCodexModel', () => {
-  const originalEnv = {
-    CODEX_MODEL: process.env.CODEX_MODEL,
-    CODEX_DEFAULT_HAIKU_MODEL: process.env.CODEX_DEFAULT_HAIKU_MODEL,
-    CODEX_DEFAULT_SONNET_MODEL: process.env.CODEX_DEFAULT_SONNET_MODEL,
-    CODEX_DEFAULT_OPUS_MODEL: process.env.CODEX_DEFAULT_OPUS_MODEL,
-  }
-
-  beforeEach(() => {
-    delete process.env.CODEX_MODEL
-    delete process.env.CODEX_DEFAULT_HAIKU_MODEL
-    delete process.env.CODEX_DEFAULT_SONNET_MODEL
-    delete process.env.CODEX_DEFAULT_OPUS_MODEL
-  })
-
-  afterEach(() => {
-    Object.assign(process.env, originalEnv)
-  })
-
-  test('CODEX_MODEL env var overrides all', () => {
-    process.env.CODEX_MODEL = 'my-custom-model'
-    expect(resolveCodexModel('claude-sonnet-4-6')).toBe('my-custom-model')
-  })
-
-  test('CODEX_DEFAULT_SONNET_MODEL overrides default map', () => {
-    process.env.CODEX_DEFAULT_SONNET_MODEL = 'my-sonnet'
-    expect(resolveCodexModel('claude-sonnet-4-6')).toBe('my-sonnet')
-  })
-
-  test('CODEX_DEFAULT_HAIKU_MODEL overrides default map', () => {
-    process.env.CODEX_DEFAULT_HAIKU_MODEL = 'my-haiku'
-    expect(resolveCodexModel('claude-haiku-4-5-20251001')).toBe('my-haiku')
-  })
-
-  test('CODEX_DEFAULT_OPUS_MODEL overrides default map', () => {
-    process.env.CODEX_DEFAULT_OPUS_MODEL = 'my-opus'
-    expect(resolveCodexModel('claude-opus-4-6')).toBe('my-opus')
-  })
-
-  test('maps known sonnet model via DEFAULT_MODEL_MAP', () => {
-    expect(resolveCodexModel('claude-sonnet-4-6')).toBe('gpt-5.4-mini')
-  })
-
-  test('maps known haiku model via DEFAULT_MODEL_MAP', () => {
-    expect(resolveCodexModel('claude-haiku-4-5-20251001')).toBe('gpt-5.4-nano')
-  })
-
-  test('maps known opus model via DEFAULT_MODEL_MAP', () => {
-    expect(resolveCodexModel('claude-opus-4-6')).toBe('gpt-5.4')
-  })
-
-  test('maps legacy sonnet models', () => {
-    expect(resolveCodexModel('claude-sonnet-4-20250514')).toBe('gpt-5.4-mini')
-    expect(resolveCodexModel('claude-3-5-sonnet-20241022')).toBe('gpt-5.4-mini')
-  })
-
-  test('maps legacy haiku models', () => {
-    expect(resolveCodexModel('claude-3-5-haiku-20241022')).toBe('gpt-5.4-nano')
-  })
-
-  test('maps legacy opus models', () => {
-    expect(resolveCodexModel('claude-opus-4-20250514')).toBe('gpt-5.4')
-    expect(resolveCodexModel('claude-opus-4-5-20251101')).toBe('gpt-5.4')
-  })
-
-  test('uses family default for unrecognized haiku model', () => {
-    expect(resolveCodexModel('claude-haiku-99')).toBe('gpt-5.4-nano')
-  })
-
-  test('uses family default for unrecognized sonnet model', () => {
-    expect(resolveCodexModel('claude-sonnet-99')).toBe('gpt-5.4-mini')
-  })
-
-  test('uses family default for unrecognized opus model', () => {
-    expect(resolveCodexModel('claude-opus-99')).toBe('gpt-5.4')
-  })
-
-  test('passes through unknown model name without family', () => {
-    expect(resolveCodexModel('some-random-model')).toBe('some-random-model')
-  })
-
-  test('strips [1m] suffix', () => {
-    expect(resolveCodexModel('claude-sonnet-4-6[1m]')).toBe('gpt-5.4-mini')
-  })
-
-  test('CODEX_MODEL takes precedence over family-specific vars', () => {
-    process.env.CODEX_MODEL = 'global-override'
-    process.env.CODEX_DEFAULT_SONNET_MODEL = 'family-override'
-    expect(resolveCodexModel('claude-sonnet-4-6')).toBe('global-override')
-  })
-})
--- a/packages/@ant/model-provider/src/providers/codex/callIds.ts
+++ b/packages/@ant/model-provider/src/providers/codex/callIds.ts
@@ -1,31 +0,0 @@
-import { createHash } from 'crypto'
-
-const MAX_CODEX_CALL_ID_LENGTH = 96
-
-export function normalizeCodexCallId(value: unknown): string | null {
-  if (typeof value !== 'string') {
-    return null
-  }
-
-  const sanitized = value
-    .trim()
-    .replace(/\s+/g, '_')
-    .replace(/[^A-Za-z0-9._:-]/g, '_')
-    .replace(/_+/g, '_')
-    .slice(0, MAX_CODEX_CALL_ID_LENGTH)
-
-  return sanitized.length > 0 ? sanitized : null
-}
-
-export function createCodexFallbackCallId(seed: string): string {
-  const hash = createHash('sha1')
-    .update(seed.length > 0 ? seed : 'codex-call')
-    .digest('hex')
-    .slice(0, 24)
-
-  return `call_${hash}`
-}
-
-export function resolveCodexCallId(value: unknown, seed: string): string {
-  return normalizeCodexCallId(value) ?? createCodexFallbackCallId(seed)
-}
--- a/packages/@ant/model-provider/src/providers/codex/convertMessages.ts
+++ b/packages/@ant/model-provider/src/providers/codex/convertMessages.ts
@@ -1,392 +0,0 @@
-import type {
-  ResponseFunctionToolCallOutputItem,
-  ResponseInputImage,
-  ResponseInputItem,
-  ResponseInputText,
-} from 'openai/resources/responses/responses.mjs'
-import type { Message } from '../../types/index.js'
-import {
-  normalizeCodexCallId,
-  resolveCodexCallId,
-} from './callIds.js'
-
-type ContentBlock = {
-  type: string
-  text?: string
-  source?: {
-    type?: string
-    data?: string
-    media_type?: string
-    url?: string
-  }
-}
-
-type ToolUseLikeBlock = {
-  type: 'tool_use'
-  id: string
-  name: string
-  input: unknown
-}
-
-type ToolResultLikeBlock = {
-  type: 'tool_result'
-  tool_use_id: string
-  content?: string | ReadonlyArray<ContentBlock>
-}
-
-export type CodexImageConversionOptions = {
-  resolveBase64ImageUrl?: (
-    data: string,
-    mediaType?: string,
-  ) => Promise<string | null>
-}
-
-type CodexCallIdState = {
-  byOriginalId: Map<string, string>
-  sequence: number
-}
-
-function createInputText(text: string): ResponseInputText {
-  return {
-    type: 'input_text',
-    text,
-  }
-}
-
-function createInputImage(imageUrl: string): ResponseInputImage {
-  return {
-    type: 'input_image',
-    image_url: imageUrl,
-    detail: 'high',
-  }
-}
-
-function getUnsupportedBlockText(type: string): string | null {
-  switch (type) {
-    case 'image':
-      return '[Image omitted: codex gateway currently requires remote image URLs. Configure CODEX_IMGBB_API_KEY to auto-convert local images.]'
-    case 'document':
-      return '[Document omitted: codex gateway does not support document replay.]'
-    default:
-      return null
-  }
-}
-
-function getImageUrl(block: ContentBlock): string | null {
-  const source = block.source
-  if (!source) {
-    return null
-  }
-
-  if (source.type === 'url' && typeof source.url === 'string' && source.url.length > 0) {
-    return source.url
-  }
-
-  return null
-}
-
-async function resolveImageUrl(
-  block: ContentBlock,
-  options: CodexImageConversionOptions,
-): Promise<string | null> {
-  const directUrl = getImageUrl(block)
-  if (directUrl) {
-    return directUrl
-  }
-
-  if (block.source?.type !== 'base64') {
-    return null
-  }
-
-  if (options.resolveBase64ImageUrl && typeof block.source.data === 'string') {
-    const uploadedUrl = await options.resolveBase64ImageUrl(
-      block.source.data,
-      block.source.media_type,
-    )
-    if (uploadedUrl) {
-      return uploadedUrl
-    }
-  }
-  return null
-}
-
-async function convertBlocksToInputContent(
-  content: ReadonlyArray<ContentBlock>,
-  options: CodexImageConversionOptions,
-): Promise<Array<ResponseInputText | ResponseInputImage>> {
-  const output: Array<ResponseInputText | ResponseInputImage> = []
-
-  for (const block of content) {
-    if (block.type === 'text' && block.text) {
-      output.push(createInputText(block.text))
-      continue
-    }
-
-    if (block.type === 'image') {
-      const imageUrl = await resolveImageUrl(block, options)
-      if (imageUrl) {
-        output.push(createInputImage(imageUrl))
-        continue
-      }
-    }
-
-    const fallback = getUnsupportedBlockText(block.type)
-    if (fallback) {
-      output.push(createInputText(fallback))
-    }
-  }
-
-  return output
-}
-
-async function convertToolResultOutput(
-  content: string | ReadonlyArray<ContentBlock> | undefined,
-  options: CodexImageConversionOptions,
-): Promise<ResponseFunctionToolCallOutputItem['output']> {
-  if (!content) {
-    return ''
-  }
-
-  if (typeof content === 'string') {
-    return content
-  }
-
-  const output = await convertBlocksToInputContent(content, options)
-
-  if (output.length === 0) {
-    return ''
-  }
-
-  if (output.length === 1 && output[0].type === 'input_text') {
-    return output[0].text
-  }
-
-  return output
-}
-
-function pushUserMessage(
-  items: ResponseInputItem[],
-  textParts: string[],
-  imageUrls: string[] = [],
-): void {
-  const text = textParts.join('\n').trim()
-  if (text.length === 0 && imageUrls.length === 0) {
-    return
-  }
-
-  items.push({
-    type: 'message',
-    role: 'user',
-    content: [
-      ...(text.length > 0 ? [createInputText(text)] : []),
-      ...imageUrls.map(createInputImage),
-    ],
-  } as unknown as ResponseInputItem)
-}
-
-function pushAssistantMessage(
-  items: ResponseInputItem[],
-  textParts: string[],
-): void {
-  const text = textParts.join('\n').trim()
-  if (text.length === 0) {
-    return
-  }
-
-  items.push({
-    type: 'message',
-    role: 'assistant',
-    content: [
-      {
-        type: 'output_text',
-        text,
-        annotations: [],
-      },
-    ],
-  } as unknown as ResponseInputItem)
-}
-
-function stringifyToolInput(input: unknown): string {
-  if (typeof input === 'string') {
-    return input
-  }
-
-  try {
-    return JSON.stringify(input ?? {})
-  } catch {
-    return '{}'
-  }
-}
-
-function createCodexCallIdState(): CodexCallIdState {
-  return {
-    byOriginalId: new Map(),
-    sequence: 0,
-  }
-}
-
-function resolveAssistantCallId(
-  block: ToolUseLikeBlock,
-  state: CodexCallIdState,
-): string {
-  const originalId = typeof block.id === 'string' ? block.id : ''
-  const seed = `${block.name}:${stringifyToolInput(block.input)}:${state.sequence}`
-  const callId = resolveCodexCallId(originalId, seed)
-
-  if (originalId.length > 0) {
-    state.byOriginalId.set(originalId, callId)
-  }
-  state.sequence += 1
-
-  return callId
-}
-
-function resolveToolResultCallId(
-  toolUseId: unknown,
-  state: CodexCallIdState,
-): string | null {
-  if (typeof toolUseId !== 'string') {
-    return null
-  }
-
-  return state.byOriginalId.get(toolUseId) ?? normalizeCodexCallId(toolUseId)
-}
-
-async function convertUserContentToInputItems(
-  items: ResponseInputItem[],
-  content: ReadonlyArray<string | ContentBlock>,
-  options: CodexImageConversionOptions,
-  callIdState: CodexCallIdState,
-): Promise<void> {
-  const textParts: string[] = []
-  const imageUrls: string[] = []
-
-  for (const block of content) {
-    if (typeof block === 'string') {
-      textParts.push(block)
-      continue
-    }
-
-    if (block.type === 'tool_result') {
-      pushUserMessage(items, textParts, imageUrls)
-      textParts.length = 0
-      imageUrls.length = 0
-
-      const toolResultBlock = block as ToolResultLikeBlock
-      const callId = resolveToolResultCallId(
-        toolResultBlock.tool_use_id,
-        callIdState,
-      )
-      if (!callId) {
-        continue
-      }
-
-      items.push({
-        type: 'function_call_output',
-        call_id: callId,
-        output: await convertToolResultOutput(toolResultBlock.content, options),
-      })
-      continue
-    }
-
-    if (block.type === 'text' && block.text) {
-      textParts.push(block.text)
-      continue
-    }
-
-    if (block.type === 'image') {
-      const imageUrl = await resolveImageUrl(block, options)
-      if (imageUrl) {
-        imageUrls.push(imageUrl)
-        continue
-      }
-    }
-
-    const fallback = getUnsupportedBlockText(block.type)
-    if (fallback) {
-      textParts.push(fallback)
-    }
-  }
-
-  pushUserMessage(items, textParts, imageUrls)
-}
-
-function convertAssistantContentToInputItems(
-  items: ResponseInputItem[],
-  content: ReadonlyArray<string | ContentBlock>,
-  callIdState: CodexCallIdState,
-): void {
-  const textParts: string[] = []
-
-  for (const block of content) {
-    if (typeof block === 'string') {
-      textParts.push(block)
-      continue
-    }
-
-    if (block.type === 'tool_use') {
-      pushAssistantMessage(items, textParts)
-      textParts.length = 0
-
-      const toolUseBlock = block as unknown as ToolUseLikeBlock
-      items.push({
-        type: 'function_call',
-        call_id: resolveAssistantCallId(toolUseBlock, callIdState),
-        name: toolUseBlock.name,
-        arguments: stringifyToolInput(toolUseBlock.input),
-      })
-      continue
-    }
-
-    if (block.type === 'text' && block.text) {
-      textParts.push(block.text)
-    }
-  }
-
-  pushAssistantMessage(items, textParts)
-}
-
-export async function anthropicMessagesToCodexInput(
-  messages: Message[],
-  options: CodexImageConversionOptions = {},
-): Promise<ResponseInputItem[]> {
-  const items: ResponseInputItem[] = []
-  const callIdState = createCodexCallIdState()
-
-  for (const message of messages) {
-    if (message.type !== 'user' && message.type !== 'assistant') {
-      continue
-    }
-
-    const apiMessage = message.message
-    if (!apiMessage?.content) {
-      continue
-    }
-
-    if (typeof apiMessage.content === 'string') {
-      if (message.type === 'user') {
-        pushUserMessage(items, [apiMessage.content])
-      } else {
-        pushAssistantMessage(items, [apiMessage.content])
-      }
-      continue
-    }
-
-    if (message.type === 'user') {
-      await convertUserContentToInputItems(
-        items,
-        apiMessage.content as ReadonlyArray<string | ContentBlock>,
-        options,
-        callIdState,
-      )
-    } else {
-      convertAssistantContentToInputItems(
-        items,
-        apiMessage.content as ReadonlyArray<string | ContentBlock>,
-        callIdState,
-      )
-    }
-  }
-
-  return items
-}
--- a/packages/@ant/model-provider/src/providers/codex/convertTools.ts
+++ b/packages/@ant/model-provider/src/providers/codex/convertTools.ts
@@ -1,39 +0,0 @@
-import type { BetaToolUnion } from '@anthropic-ai/sdk/resources/beta/messages/messages.mjs'
-import type { Tool as CodexTool } from 'openai/resources/responses/responses.mjs'
-
-function isClientFunctionTool(
-  tool: BetaToolUnion,
-): tool is BetaToolUnion & {
-  name: string
-  description?: string
-  input_schema?: { [key: string]: unknown }
-  strict?: boolean
-  defer_loading?: boolean
-} {
-  const value = tool as unknown as Record<string, unknown>
-  return typeof value.name === 'string'
-}
-
-export function anthropicToolsToCodex(
-  tools: BetaToolUnion[],
-): CodexTool[] {
-  return tools.flatMap(tool => {
-    const value = tool as unknown as Record<string, unknown>
-    if (
-      value.type === 'advisor_20260301' ||
-      value.type === 'computer_20250124' ||
-      !isClientFunctionTool(tool)
-    ) {
-      return []
-    }
-
-    return [{
-      type: 'function',
-      name: tool.name,
-      description: tool.description,
-      parameters: tool.input_schema ?? {},
-      strict: tool.strict ?? null,
-      ...(tool.defer_loading && { defer_loading: true }),
-    }]
-  })
-}
--- a/packages/@ant/model-provider/src/providers/codex/modelMapping.ts
+++ b/packages/@ant/model-provider/src/providers/codex/modelMapping.ts
@@ -1,85 +0,0 @@
-/**
- * Default mapping from Anthropic model names to Codex (OpenAI Responses API) model names.
- * Used only when CODEX_DEFAULT_{FAMILY}_MODEL env vars are not set.
- */
-const DEFAULT_MODEL_MAP: Record<string, string> = {
-  'claude-sonnet-4-20250514': 'gpt-5.4-mini',
-  'claude-sonnet-4-5-20250929': 'gpt-5.4-mini',
-  'claude-sonnet-4-6': 'gpt-5.4-mini',
-  'claude-3-7-sonnet-20250219': 'gpt-5.4-mini',
-  'claude-3-5-sonnet-20241022': 'gpt-5.4-mini',
-  'claude-opus-4-20250514': 'gpt-5.4',
-  'claude-opus-4-1-20250805': 'gpt-5.4',
-  'claude-opus-4-5-20251101': 'gpt-5.4',
-  'claude-opus-4-6': 'gpt-5.4',
-  'claude-haiku-4-5-20251001': 'gpt-5.4-nano',
-  'claude-3-5-haiku-20241022': 'gpt-5.4-nano',
-}
-
-/**
- * Default model for each family when an exact match is not in DEFAULT_MODEL_MAP.
- */
-const DEFAULT_FAMILY_MAP: Record<string, string> = {
-  haiku: 'gpt-5.4-nano',
-  sonnet: 'gpt-5.4-mini',
-  opus: 'gpt-5.4',
-}
-
-function getModelFamily(model: string): 'haiku' | 'sonnet' | 'opus' | null {
-  if (/haiku/i.test(model)) return 'haiku'
-  if (/opus/i.test(model)) return 'opus'
-  if (/sonnet/i.test(model)) return 'sonnet'
-  return null
-}
-
-/**
- * Resolve the Codex (OpenAI Responses API) model name for a given Anthropic model.
- *
- * Priority:
- * 1. CODEX_MODEL env var (override all)
- * 2. CODEX_DEFAULT_{FAMILY}_MODEL env var (e.g. CODEX_DEFAULT_SONNET_MODEL)
- * 3. DEFAULT_MODEL_MAP lookup (exact Anthropic model name match)
- * 4. DEFAULT_FAMILY_MAP lookup (family-based default)
- * 5. Pass through original model name
- */
-export function resolveCodexModel(model: string): string {
-  if (process.env.CODEX_MODEL) {
-    return process.env.CODEX_MODEL
-  }
-
-  const cleanModel = model.replace(/\[1m\]$/, '')
-  const family = getModelFamily(cleanModel)
-  if (family) {
-    const familyOverride = process.env[`CODEX_DEFAULT_${family.toUpperCase()}_MODEL`]
-    if (familyOverride) {
-      return familyOverride
-    }
-  }
-
-  const mapped = DEFAULT_MODEL_MAP[cleanModel]
-  if (mapped) {
-    return mapped
-  }
-
-  if (family) {
-    return DEFAULT_FAMILY_MAP[family]
-  }
-
-  return cleanModel
-}
-
-export function resolveCodexMaxTokens(
-  upperLimit: number,
-  maxOutputTokensOverride?: number,
-): number {
-  return (
-    maxOutputTokensOverride ??
-    (process.env.CODEX_MAX_TOKENS
-      ? parseInt(process.env.CODEX_MAX_TOKENS, 10) || undefined
-      : undefined) ??
-    (process.env.CLAUDE_CODE_MAX_OUTPUT_TOKENS
-      ? parseInt(process.env.CLAUDE_CODE_MAX_OUTPUT_TOKENS, 10) || undefined
-      : undefined) ??
-    upperLimit
-  )
-}
--- a/packages/builtin-tools/src/tools/AgentTool/tests/filterIncompleteToolCalls.test.ts
+++ b/packages/builtin-tools/src/tools/AgentTool/tests/filterIncompleteToolCalls.test.ts
@@ -0,0 +1,180 @@
+import { describe, expect, test } from 'bun:test'
+import type { Message } from 'src/types/message.js'
+import { filterIncompleteToolCalls } from '../filterIncompleteToolCalls.js'
+
+describe('filterIncompleteToolCalls', () => {
+  test('drops assistant tool uses that do not have matching results', () => {
+    const messages = [
+      {
+        type: 'assistant',
+        uuid: 'a1',
+        message: {
+          role: 'assistant',
+          content: [{ type: 'tool_use', id: 'missing', name: 'Read' }],
+        },
+      },
+      {
+        type: 'user',
+        uuid: 'u1',
+        message: { role: 'user', content: 'continue' },
+      },
+    ] as unknown as Message[]
+
+    expect(
+      filterIncompleteToolCalls(messages).map(message => String(message.uuid)),
+    ).toEqual(['u1'])
+  })
+
+  test('preserves assistant text when dropping orphan tool uses', () => {
+    const messages = [
+      {
+        type: 'assistant',
+        uuid: 'a1',
+        message: {
+          role: 'assistant',
+          content: [
+            { type: 'text', text: 'I will read the file.' },
+            { type: 'tool_use', id: 'missing', name: 'Read' },
+          ],
+        },
+      },
+    ] as unknown as Message[]
+
+    const filtered = filterIncompleteToolCalls(messages)
+    expect(filtered).toHaveLength(1)
+    const first = filtered[0]!
+    const content = first.message!.content
+    expect(
+      Array.isArray(content) ? content.map(block => block.type) : [],
+    ).toEqual(['text'])
+  })
+
+  test('keeps completed parallel tool calls when dropping an orphan', () => {
+    const messages = [
+      {
+        type: 'assistant',
+        uuid: 'a1',
+        message: {
+          role: 'assistant',
+          content: [
+            { type: 'tool_use', id: 'done', name: 'Read' },
+            { type: 'tool_use', id: 'missing', name: 'Grep' },
+          ],
+        },
+      },
+      {
+        type: 'user',
+        uuid: 'u1',
+        message: {
+          role: 'user',
+          content: [{ type: 'tool_result', tool_use_id: 'done', content: 'ok' }],
+        },
+      },
+    ] as unknown as Message[]
+
+    const filtered = filterIncompleteToolCalls(messages)
+    expect(filtered.map(message => String(message.uuid))).toEqual(['a1', 'u1'])
+    const first = filtered[0]!
+    const content = first.message!.content
+    expect(
+      Array.isArray(content)
+        ? content.map(block =>
+            block.type === 'tool_use' ? block.id : block.type,
+          )
+        : [],
+    ).toEqual(['done'])
+  })
+
+  test('keeps assistant tool uses that have matching results', () => {
+    const messages = [
+      {
+        type: 'assistant',
+        uuid: 'a1',
+        message: {
+          role: 'assistant',
+          content: [{ type: 'tool_use', id: 'done', name: 'Read' }],
+        },
+      },
+      {
+        type: 'user',
+        uuid: 'u1',
+        message: {
+          role: 'user',
+          content: [{ type: 'tool_result', tool_use_id: 'done', content: 'ok' }],
+        },
+      },
+    ] as unknown as Message[]
+
+    expect(
+      filterIncompleteToolCalls(messages).map(message => String(message.uuid)),
+    ).toEqual(['a1', 'u1'])
+  })
+
+  test('drops orphan tool results when their tool use was removed', () => {
+    const messages = [
+      {
+        type: 'user',
+        uuid: 'u1',
+        message: {
+          role: 'user',
+          content: [
+            { type: 'tool_result', tool_use_id: 'missing', content: 'late' },
+          ],
+        },
+      },
+    ] as unknown as Message[]
+
+    expect(filterIncompleteToolCalls(messages)).toEqual([])
+  })
+
+  test('keeps user text while dropping orphan tool results', () => {
+    const messages = [
+      {
+        type: 'assistant',
+        uuid: 'a1',
+        message: { role: 'assistant', content: 'done' },
+      },
+      {
+        type: 'user',
+        uuid: 'u1',
+        message: {
+          role: 'user',
+          content: [
+            { type: 'text', text: 'keep this' },
+            { type: 'tool_result', tool_use_id: 'missing', content: 'late' },
+          ],
+        },
+      },
+    ] as unknown as Message[]
+
+    const filtered = filterIncompleteToolCalls(messages)
+    expect(filtered.map(message => String(message.uuid))).toEqual(['a1', 'u1'])
+    const content = filtered[1]!.message!.content
+    expect(Array.isArray(content) ? content : []).toEqual([
+      { type: 'text', text: 'keep this' },
+    ])
+  })
+
+  test('drops malformed tool blocks without ids', () => {
+    const messages = [
+      {
+        type: 'assistant',
+        uuid: 'a1',
+        message: {
+          role: 'assistant',
+          content: [{ type: 'tool_use', name: 'Read' }],
+        },
+      },
+      {
+        type: 'user',
+        uuid: 'u1',
+        message: {
+          role: 'user',
+          content: [{ type: 'tool_result', content: 'late' }],
+        },
+      },
+    ] as unknown as Message[]
+
+    expect(filterIncompleteToolCalls(messages)).toEqual([])
+  })
+})
--- a/packages/builtin-tools/src/tools/AgentTool/filterIncompleteToolCalls.ts
+++ b/packages/builtin-tools/src/tools/AgentTool/filterIncompleteToolCalls.ts
@@ -0,0 +1,110 @@
+import type {
+  AssistantMessage,
+  Message,
+  UserMessage,
+} from 'src/types/message.js'
+
+/**
+ * Removes invalid or orphaned tool_use/tool_result blocks while preserving
+ * completed tool-call pairs. This is intentionally block-level, not
+ * message-level, so completed parallel tool calls stay paired with results.
+ */
+export function filterIncompleteToolCalls(messages: Message[]): Message[] {
+  const toolUseIdsWithResults = new Set<string>()
+
+  for (const message of messages) {
+    if (message?.type === 'user') {
+      const userMessage = message as UserMessage
+      const content = userMessage.message.content
+      if (Array.isArray(content)) {
+        for (const block of content) {
+          if (block.type === 'tool_result' && block.tool_use_id) {
+            toolUseIdsWithResults.add(block.tool_use_id)
+          }
+        }
+      }
+    }
+  }
+
+  const retainedToolUseIds = new Set<string>()
+  const withoutOrphanToolUses: Message[] = []
+
+  for (const message of messages) {
+    if (message?.type === 'assistant') {
+      const assistantMessage = message as AssistantMessage
+      const content = assistantMessage.message.content
+      if (Array.isArray(content)) {
+        let changed = false
+        const filteredContent = content.filter(block => {
+          if (block.type !== 'tool_use') return true
+          if (!block.id) {
+            changed = true
+            return false
+          }
+          if (toolUseIdsWithResults.has(block.id)) {
+            retainedToolUseIds.add(block.id)
+            return true
+          }
+          changed = true
+          return false
+        })
+
+        if (!changed) {
+          withoutOrphanToolUses.push(message)
+          continue
+        }
+        if (filteredContent.length > 0) {
+          withoutOrphanToolUses.push({
+            ...assistantMessage,
+            message: {
+              ...assistantMessage.message,
+              content: filteredContent,
+            },
+          })
+        }
+        continue
+      }
+    }
+    withoutOrphanToolUses.push(message)
+  }
+
+  const filteredMessages: Message[] = []
+  for (const message of withoutOrphanToolUses) {
+    if (message?.type !== 'user') {
+      filteredMessages.push(message)
+      continue
+    }
+    const userMessage = message as UserMessage
+    const content = userMessage.message.content
+    if (!Array.isArray(content)) {
+      filteredMessages.push(message)
+      continue
+    }
+    let changed = false
+    const filteredContent = content.filter(block => {
+      if (block.type !== 'tool_result') return true
+      if (!block.tool_use_id) {
+        changed = true
+        return false
+      }
+      if (retainedToolUseIds.has(block.tool_use_id)) return true
+      changed = true
+      return false
+    })
+    if (!changed) {
+      filteredMessages.push(message)
+      continue
+    }
+    if (filteredContent.length > 0) {
+      filteredMessages.push({
+        ...userMessage,
+        message: {
+          ...userMessage.message,
+          content: filteredContent,
+        },
+      })
+    }
+  }
+
+  return filteredMessages
+}
--- a/packages/builtin-tools/src/tools/AgentTool/runAgent.ts
+++ b/packages/builtin-tools/src/tools/AgentTool/runAgent.ts
@@ -86,8 +86,11 @@ import {
 import type { ContentReplacementState } from 'src/utils/toolResultStorage.js'
 import { createAgentId } from 'src/utils/uuid.js'
 import { resolveAgentTools } from './agentToolUtils.js'
+import { filterIncompleteToolCalls } from './filterIncompleteToolCalls.js'
 import { type AgentDefinition, isBuiltInAgent } from './loadAgentsDir.js'

+export { filterIncompleteToolCalls } from './filterIncompleteToolCalls.js'
+
 /**
 * Initialize agent-specific MCP servers
 * Agents can define their own MCP servers in their frontmatter that are additive
@@ -886,50 +889,6 @@ export async function* runAgent({
  }
 }

-/**
- * Filters out assistant messages with incomplete tool calls (tool uses without results).
- * This prevents API errors when sending messages with orphaned tool calls.
- */
-export function filterIncompleteToolCalls(messages: Message[]): Message[] {
-  // Build a set of tool use IDs that have results
-  const toolUseIdsWithResults = new Set<string>()
-
-  for (const message of messages) {
-    if (message?.type === 'user') {
-      const userMessage = message as UserMessage
-      const content = userMessage.message.content
-      if (Array.isArray(content)) {
-        for (const block of content) {
-          if (block.type === 'tool_result' && block.tool_use_id) {
-            toolUseIdsWithResults.add(block.tool_use_id)
-          }
-        }
-      }
-    }
-  }
-
-  // Filter out assistant messages that contain tool calls without results
-  return messages.filter(message => {
-    if (message?.type === 'assistant') {
-      const assistantMessage = message as AssistantMessage
-      const content = assistantMessage.message.content
-      if (Array.isArray(content)) {
-        // Check if this assistant message has any tool uses without results
-        const hasIncompleteToolCall = content.some(
-          block =>
-            block.type === 'tool_use' &&
-            block.id &&
-            !toolUseIdsWithResults.has(block.id),
-        )
-        // Exclude messages with incomplete tool calls
-        return !hasIncompleteToolCall
-      }
-    }
-    // Keep all non-assistant messages and assistant messages without tool calls
-    return true
-  })
-}
-
 async function getAgentSystemPrompt(
  agentDefinition: AgentDefinition,
  toolUseContext: Pick<ToolUseContext, 'options'>,
--- a/packages/builtin-tools/src/tools/ListPeersTool/ListPeersTool.ts
+++ b/packages/builtin-tools/src/tools/ListPeersTool/ListPeersTool.ts
@@ -84,22 +84,48 @@ Use this tool to discover messaging targets before sending cross-session message
    // UDS socket directory. The implementation scans for live sockets
    // and optionally includes Remote Control bridge peers.
    const peers: PeerInfo[] = []
+    const seen = new Set<string>()
+    const addPeer = (peer: PeerInfo): void => {
+      if (seen.has(peer.address)) return
+      seen.add(peer.address)
+      peers.push(peer)
+    }

-    // Discovery is handled by the UDS messaging subsystem initialized in setup.ts.
-    // Return discovered peers from the app state.
-    const appState = context.getAppState()
-    const messagingSocketPath = (appState as Record<string, unknown>).messagingSocketPath as string | undefined
+    /* eslint-disable @typescript-eslint/no-require-imports */
+    const udsMessaging =
+      require('src/utils/udsMessaging.js') as typeof import('src/utils/udsMessaging.js')
+    const udsClient =
+      require('src/utils/udsClient.js') as typeof import('src/utils/udsClient.js')
+    const bridgePeers =
+      require('src/bridge/peerSessions.js') as typeof import('src/bridge/peerSessions.js')
+    /* eslint-enable @typescript-eslint/no-require-imports */
+
+    const messagingSocketPath = udsMessaging.getUdsMessagingSocketPath()
    if (messagingSocketPath) {
      // Self entry for reference
      if (_input.include_self) {
-        peers.push({
-          address: `uds:${messagingSocketPath}`,
+        addPeer({
+          address: udsMessaging.formatUdsAddress(messagingSocketPath),
          name: 'self',
          pid: process.pid,
        })
      }
    }

+    for (const peer of await udsClient.listPeers()) {
+      if (!peer.messagingSocketPath) continue
+      addPeer({
+        address: udsMessaging.formatUdsAddress(peer.messagingSocketPath),
+        name: peer.name ?? peer.kind,
+        cwd: peer.cwd,
+        pid: peer.pid,
+      })
+    }
+
+    for (const peer of await bridgePeers.listBridgePeers()) {
+      addPeer(peer)
+    }
+
    return {
      data: { peers },
    }
--- a/packages/builtin-tools/src/tools/SendMessageTool/SendMessageTool.ts
+++ b/packages/builtin-tools/src/tools/SendMessageTool/SendMessageTool.ts
@@ -130,6 +130,41 @@ export type SendMessageToolOutput =
  | RequestOutput
  | ResponseOutput

+const UDS_INLINE_TOKEN_MARKER = '#token='
+
+function stripInlineUdsToken(target: string): string {
+  const markerIndex = target.indexOf(UDS_INLINE_TOKEN_MARKER)
+  return markerIndex === -1 ? target : target.slice(0, markerIndex)
+}
+
+function hasInlineUdsToken(to: string): boolean {
+  const addr = parseAddress(to)
+  // Empty-token markers are still inline-token attempts. Observable input
+  // redaction preserves "#token=" so cloned inputs remain rejected.
+  return (
+    addr.scheme === 'uds' && addr.target.includes(UDS_INLINE_TOKEN_MARKER)
+  )
+}
+
+function recipientForDisplay(to: string): string {
+  const addr = parseAddress(to)
+  if (addr.scheme !== 'uds') return to
+  return `uds:${stripInlineUdsToken(addr.target)}`
+}
+
+function redactInlineUdsTokenForRejection(to: string): string {
+  const addr = parseAddress(to)
+  if (addr.scheme !== 'uds') return to
+  const markerIndex = addr.target.indexOf(UDS_INLINE_TOKEN_MARKER)
+  if (markerIndex === -1) return to
+  return `uds:${addr.target.slice(0, markerIndex)}${UDS_INLINE_TOKEN_MARKER}`
+}
+
+function redactObservableInlineUdsToken(input: { to: string }): void {
+  if (!hasInlineUdsToken(input.to)) return
+  input.to = redactInlineUdsTokenForRejection(input.to)
+}
+
 function findTeammateColor(
  appState: {
    teamContext?: { teammates: { [id: string]: { color?: string } } }
@@ -541,15 +576,17 @@ export const SendMessageTool: Tool<InputSchema, SendMessageToolOutput> =
    },

    backfillObservableInput(input) {
-      if ('type' in input) return
      if (typeof input.to !== 'string') return

+      redactObservableInlineUdsToken(input as { to: string })
+      if ('type' in input) return
+
      if (input.to === '*') {
        input.type = 'broadcast'
        if (typeof input.message === 'string') input.content = input.message
      } else if (typeof input.message === 'string') {
        input.type = 'message'
-        input.recipient = input.to
+        input.recipient = recipientForDisplay(input.to)
        input.content = input.message
      } else if (typeof input.message === 'object' && input.message !== null) {
        const msg = input.message as {
@@ -560,7 +597,7 @@ export const SendMessageTool: Tool<InputSchema, SendMessageToolOutput> =
          feedback?: string
        }
        input.type = msg.type
-        input.recipient = input.to
+        input.recipient = recipientForDisplay(input.to)
        if (msg.request_id !== undefined) input.request_id = msg.request_id
        if (msg.approve !== undefined) input.approve = msg.approve
        const content = msg.reason ?? msg.feedback
@@ -569,16 +606,20 @@ export const SendMessageTool: Tool<InputSchema, SendMessageToolOutput> =
    },

    toAutoClassifierInput(input) {
+      const recipient = recipientForDisplay(input.to)
      if (typeof input.message === 'string') {
-        return `to ${input.to}: ${input.message}`
+        return `to ${recipient}: ${input.message}`
      }
      switch (input.message.type) {
        case 'shutdown_request':
-          return `shutdown_request to ${input.to}`
+          return `shutdown_request to ${recipient}`
        case 'shutdown_response':
          return `shutdown_response ${input.message.approve ? 'approve' : 'reject'} ${input.message.request_id}`
        case 'plan_approval_response':
-          return `plan_approval ${input.message.approve ? 'approve' : 'reject'} to ${input.to}`
+          const planApprovalDecision = input.message.approve
+            ? 'approve'
+            : 'reject'
+          return `plan_approval ${planApprovalDecision} to ${recipient}`
      }
    },

@@ -630,6 +671,17 @@ export const SendMessageTool: Tool<InputSchema, SendMessageToolOutput> =
          errorCode: 9,
        }
      }
+      if (
+        addr.scheme === 'uds' &&
+        hasInlineUdsToken(input.to)
+      ) {
+        return {
+          result: false,
+          message:
+            'uds addresses must not include inline auth tokens; use the ListPeers address',
+          errorCode: 9,
+        }
+      }
      if (input.to.includes('@')) {
        return {
          result: false,
@@ -753,6 +805,19 @@ export const SendMessageTool: Tool<InputSchema, SendMessageToolOutput> =
    },

    async call(input, context, canUseTool, assistantMessage) {
+      if (typeof input.message === 'string') {
+        const addr = parseAddress(input.to)
+        if (addr.scheme === 'uds' && hasInlineUdsToken(input.to)) {
+          return {
+            data: {
+              success: false,
+              message:
+                'uds addresses must not include inline auth tokens; use the ListPeers address',
+            },
+          }
+        }
+      }
+
      if (feature('UDS_INBOX') && typeof input.message === 'string') {
        const addr = parseAddress(input.to)
        if (addr.scheme === 'bridge') {
--- a/packages/builtin-tools/src/tools/SendMessageTool/tests/udsRecipientSanitization.test.ts
+++ b/packages/builtin-tools/src/tools/SendMessageTool/tests/udsRecipientSanitization.test.ts
@@ -0,0 +1,181 @@
+import { describe, expect, test } from 'bun:test'
+import { SendMessageTool } from '../SendMessageTool.js'
+
+describe('SendMessageTool UDS recipient handling', () => {
+  test('redacts inline UDS tokens before classifier and observable paths', async () => {
+    const tokenAddress = 'uds:/tmp/peer.sock#token=secret-token'
+
+    const observableInput = {
+      to: tokenAddress,
+      message: 'hello',
+    } as Record<string, unknown>
+    SendMessageTool.backfillObservableInput!(observableInput)
+
+    expect(observableInput.recipient).toBe('uds:/tmp/peer.sock')
+    expect(observableInput.to).toBe('uds:/tmp/peer.sock#token=')
+    expect(JSON.stringify(observableInput)).not.toContain('secret-token')
+    expect(
+      SendMessageTool.toAutoClassifierInput({
+        to: tokenAddress,
+        message: 'hello',
+      }),
+    ).toBe('to uds:/tmp/peer.sock: hello')
+  })
+
+  test('keeps redacted UDS token rejection through observable backfill', async () => {
+    const observableInput = {
+      to: 'uds:/tmp/peer.sock#token=secret-token',
+      message: {
+        type: 'plan_approval_response',
+        request_id: 'req-1',
+        approve: false,
+        reason: 'needs tests',
+      },
+    } as Record<string, unknown>
+
+    SendMessageTool.backfillObservableInput!(observableInput)
+
+    expect(observableInput.to).toBe('uds:/tmp/peer.sock#token=')
+    expect(observableInput.recipient).toBe('uds:/tmp/peer.sock')
+    expect(observableInput.type).toBe('plan_approval_response')
+    expect(observableInput.request_id).toBe('req-1')
+    expect(observableInput.approve).toBe(false)
+    expect(observableInput.content).toBe('needs tests')
+    expect(JSON.stringify(observableInput)).not.toContain('secret-token')
+
+    const result = await SendMessageTool.validateInput!(
+      observableInput as never,
+      {} as never,
+    )
+
+    expect(result.result).toBe(false)
+    if (result.result !== false) {
+      throw new Error('expected validation to reject redacted inline UDS token')
+    }
+    expect(result.message).toContain('inline auth tokens')
+  })
+
+  test('keeps inline-token rejection when observable input is cloned', async () => {
+    const observableInput = {
+      to: 'uds:/tmp/peer.sock#token=secret-token',
+      message: 'hello',
+    } as Record<string, unknown>
+
+    SendMessageTool.backfillObservableInput!(observableInput)
+    const clonedInput = {
+      to: observableInput.to,
+      message: observableInput.message,
+      summary: 'hello peer',
+    }
+
+    const validation = await SendMessageTool.validateInput!(
+      clonedInput as never,
+      {} as never,
+    )
+    const result = await SendMessageTool.call(
+      clonedInput as never,
+      {} as never,
+      undefined as never,
+      undefined as never,
+    )
+
+    expect(validation.result).toBe(false)
+    expect(result.data.success).toBe(false)
+    expect(JSON.stringify(clonedInput)).not.toContain('secret-token')
+    expect(JSON.stringify(result)).not.toContain('secret-token')
+  })
+
+  test('redacts UDS tokens in structured classifier text', async () => {
+    const to = 'uds:/tmp/peer.sock#token=secret-token'
+
+    expect(
+      SendMessageTool.toAutoClassifierInput({
+        to,
+        message: { type: 'shutdown_request' },
+      }),
+    ).toBe('shutdown_request to uds:/tmp/peer.sock')
+    expect(
+      SendMessageTool.toAutoClassifierInput({
+        to,
+        message: {
+          type: 'plan_approval_response',
+          request_id: 'req-1',
+          approve: true,
+        },
+      }),
+    ).toBe('plan_approval approve to uds:/tmp/peer.sock')
+    expect(
+      SendMessageTool.toAutoClassifierInput({
+        to,
+        message: {
+          type: 'plan_approval_response',
+          request_id: 'req-2',
+          approve: false,
+        },
+      }),
+    ).toBe('plan_approval reject to uds:/tmp/peer.sock')
+    expect(
+      SendMessageTool.toAutoClassifierInput({
+        to,
+        message: {
+          type: 'shutdown_response',
+          request_id: 'shutdown-1',
+          approve: false,
+        },
+      }),
+    ).toBe('shutdown_response reject shutdown-1')
+  })
+
+  test('redacts from the first inline UDS token marker', async () => {
+    const tokenAddress = 'uds:/tmp/peer.sock#token=first#token=second'
+
+    const observableInput = {
+      to: tokenAddress,
+      message: 'hello',
+    } as Record<string, unknown>
+    SendMessageTool.backfillObservableInput!(observableInput)
+
+    expect(observableInput.to).toBe('uds:/tmp/peer.sock#token=')
+    expect(observableInput.recipient).toBe('uds:/tmp/peer.sock')
+    expect(JSON.stringify(observableInput)).not.toContain('first')
+    expect(JSON.stringify(observableInput)).not.toContain('second')
+    expect(
+      SendMessageTool.toAutoClassifierInput({
+        to: tokenAddress,
+        message: 'hello',
+      }),
+    ).toBe('to uds:/tmp/peer.sock: hello')
+  })
+
+  test('rejects inline UDS tokens during validation', async () => {
+    const result = await SendMessageTool.validateInput!(
+      {
+        to: 'uds:/tmp/peer.sock#token=secret-token',
+        message: 'hello',
+      },
+      {} as never,
+    )
+
+    expect(result.result).toBe(false)
+    if (result.result !== false) {
+      throw new Error('expected validation to reject inline UDS token')
+    }
+    expect(result.message).toContain('inline auth tokens')
+    expect(JSON.stringify(result)).not.toContain('secret-token')
+  })
+
+  test('rejects inline UDS tokens during execution without leaking them', async () => {
+    const result = await SendMessageTool.call(
+      {
+        to: 'uds:/tmp/peer.sock#token=secret-token',
+        message: 'hello',
+      },
+      {} as never,
+      undefined as never,
+      undefined as never,
+    )
+
+    expect(result.data.success).toBe(false)
+    expect(JSON.stringify(result)).not.toContain('secret-token')
+  })
+})
--- a/src/bridge/peerSessions.ts
+++ b/src/bridge/peerSessions.ts
@@ -6,6 +6,38 @@ import { getBridgeAccessToken } from './bridgeConfig.js'
 import { getReplBridgeHandle } from './replBridgeHandle.js'
 import { toCompatSessionId } from './sessionIdCompat.js'

+export type BridgePeerSession = {
+  address: string
+  name?: string
+  cwd?: string
+  pid?: number
+}
+
+/**
+ * List locally registered sessions that have published a Remote Control
+ * session ID. The PID registry is the local source of truth for bridge peers
+ * already known to this machine; SendMessage can use these bridge:<id>
+ * addresses when the current process has an active bridge handle.
+ */
+export async function listBridgePeers(): Promise<BridgePeerSession[]> {
+  const { listAllLiveSessions } = await import('../utils/udsClient.js')
+  const sessions = await listAllLiveSessions()
+  const peers: BridgePeerSession[] = []
+
+  for (const session of sessions) {
+    if (session.pid === process.pid || !session.bridgeSessionId) continue
+    const compatId = toCompatSessionId(session.bridgeSessionId)
+    peers.push({
+      address: `bridge:${compatId}`,
+      name: session.name ?? session.kind,
+      cwd: session.cwd,
+      pid: session.pid,
+    })
+  }
+
+  return peers
+}
+
 /**
 * Send a plain-text message to another Claude session via the bridge API.
 *
--- a/src/cli/print.ts
+++ b/src/cli/print.ts
@@ -2763,13 +2763,37 @@ function runHeadlessStreaming(
  // when a message arrives via the UDS socket in headless mode.
  if (feature('UDS_INBOX')) {
    /* eslint-disable @typescript-eslint/no-require-imports */
-    const { setOnEnqueue } = require('../utils/udsMessaging.js')
+    const { drainInbox, setOnEnqueue } =
+      require('../utils/udsMessaging.js') as typeof import('../utils/udsMessaging.js')
    /* eslint-enable @typescript-eslint/no-require-imports */
+
+    const enqueueUdsInboxMessages = (): boolean => {
+      const entries = drainInbox()
+      for (const entry of entries) {
+        const value =
+          typeof entry.message.data === 'string'
+            ? entry.message.data
+            : jsonStringify(entry.message.data)
+        enqueue({
+          mode: 'prompt',
+          value,
+          uuid: randomUUID(),
+        })
+      }
+      return entries.length > 0
+    }
+
    setOnEnqueue(() => {
      if (!inputClosed) {
-        void run()
+        if (enqueueUdsInboxMessages()) {
+          void run()
+        }
      }
    })
+
+    if (enqueueUdsInboxMessages()) {
+      void run()
+    }
  }

  // Cron scheduler: runs scheduled_tasks.json tasks in SDK/-p mode.
--- a/src/commands/clear/conversation.ts
+++ b/src/commands/clear/conversation.ts
@@ -10,10 +10,6 @@ import {
  getOriginalCwd,
  getSessionId,
  regenerateSessionId,
-  resetCostState,
-  setLastAPIRequest,
-  setLastAPIRequestMessages,
-  setLastClassifierRequests,
 } from '../../bootstrap/state.js'
 import type { SDKStatusMessage } from '../../entrypoints/sdk/coreTypes.js'
 import {
@@ -148,14 +144,6 @@ export async function clearConversation({
  // tracking) is retained so those agents keep functioning.
  clearSessionCaches(preservedAgentIds)

-  // Clear large STATE-held data that outlives the message array.
-  // lastAPIRequestMessages can hold the full post-compaction conversation
-  // (hundreds of KB–MB) for /share; resetCostState clears modelUsage.
-  setLastAPIRequest(null)
-  setLastAPIRequestMessages(null)
-  setLastClassifierRequests(null)
-  resetCostState()
-
  setCwd(getOriginalCwd())
  readFileState.clear()
  discoveredSkillNames?.clear()
--- a/src/commands/peers/peers.ts
+++ b/src/commands/peers/peers.ts
@@ -1,6 +1,9 @@
 import type { LocalCommandCall } from '../../types/command.js'
 import { listPeers, isPeerAlive } from '../../utils/udsClient.js'
-import { getUdsMessagingSocketPath } from '../../utils/udsMessaging.js'
+import {
+  formatUdsAddress,
+  getUdsMessagingSocketPath,
+} from '../../utils/udsMessaging.js'

 export const call: LocalCommandCall = async (_args, _context) => {
  const mySocket = getUdsMessagingSocketPath()
@@ -29,11 +32,11 @@ export const call: LocalCommandCall = async (_args, _context) => {
        ? `  started: ${formatAge(peer.startedAt)}`
        : ''

-      lines.push(
-        `  [${status}] PID ${peer.pid} (${label})${cwd}${age}`,
-      )
+      lines.push(`  [${status}] PID ${peer.pid} (${label})${cwd}${age}`)
      if (peer.messagingSocketPath) {
-        lines.push(`           socket: ${peer.messagingSocketPath}`)
+        lines.push(
+          `           socket: ${formatUdsAddress(peer.messagingSocketPath)}`,
+        )
      }
      if (peer.sessionId) {
        lines.push(`           session: ${peer.sessionId}`)
@@ -43,7 +46,7 @@ export const call: LocalCommandCall = async (_args, _context) => {

  lines.push('')
  lines.push(
-    'To message a peer: use SendMessage with to="uds:<socket-path>"',
+    'To message a peer: use SendMessage with the shown uds:<socket-path> address',
  )

  return { type: 'text', value: lines.join('\n') }
--- a/src/commands/poor/tests/poorMode.test.ts
+++ b/src/commands/poor/tests/poorMode.test.ts
@@ -5,7 +5,8 @@
 * After the fix, it reads from / writes to settings.json via
 * getInitialSettings() and updateSettingsForSource().
 */
-import { describe, expect, test, beforeEach, mock } from 'bun:test'
+import { afterAll, describe, expect, test, beforeEach, mock } from 'bun:test'
+import * as settingsModule from '../../../utils/settings/settings.js'

 // ── Mocks must be declared before the module under test is imported ──────────

@@ -13,24 +14,48 @@ let mockSettings: Record<string, unknown> = {}
 let lastUpdate: { source: string; patch: Record<string, unknown> } | null = null

 mock.module('src/utils/settings/settings.js', () => ({
+  loadManagedFileSettings: () => ({ settings: null, errors: [] }),
+  getManagedFileSettingsPresence: () => ({
+    hasBase: false,
+    hasDropIns: false,
+  }),
+  parseSettingsFile: () => ({ settings: null, errors: [] }),
+  getSettingsRootPathForSource: () => '',
+  getSettingsFilePathForSource: () => undefined,
+  getRelativeSettingsFilePathForSource: () => '',
  getInitialSettings: () => mockSettings,
+  getSettingsForSource: () => mockSettings,
+  getPolicySettingsOrigin: () => null,
+  getSettingsWithErrors: () => ({ settings: mockSettings, errors: [] }),
+  getSettingsWithSources: () => ({ effective: mockSettings, sources: [] }),
+  getSettings_DEPRECATED: () => mockSettings,
+  settingsMergeCustomizer: () => undefined,
+  getManagedSettingsKeysForLogging: () => [],
+  // Keep unrelated exports aligned with the real settings module so this
+  // full-surface mock cannot change later test files if Bun keeps it alive.
+  hasAutoModeOptIn: () => true,
+  hasSkipDangerousModePermissionPrompt: () => false,
+  getAutoModeConfig: () => undefined,
+  getUseAutoModeDuringPlan: () => true,
+  rawSettingsContainsKey: (key: string) => key in mockSettings,
  updateSettingsForSource: (source: string, patch: Record<string, unknown>) => {
    lastUpdate = { source, patch }
    mockSettings = { ...mockSettings, ...patch }
  },
 }))

-// Import AFTER mocks are registered
-const { isPoorModeActive, setPoorMode } = await import('../poorMode.js')
+afterAll(() => {
+  mock.restore()
+  mock.module('src/utils/settings/settings.js', () => settingsModule)
+})

-// ── Helpers ──────────────────────────────────────────────────────────────────
-
-/** Reset module-level singleton between tests by re-importing a fresh copy. */
-async function freshModule() {
-  // Bun caches modules; we manipulate the exported functions directly since
-  // the singleton `poorModeActive` is reset to null only on first import.
-  // Instead we test the observable behaviour through set/get pairs.
-}
+// Import AFTER mocks are registered. The query suffix gives this file its own
+// module instance so cross-file poorMode.js mocks cannot replace the subject
+// under test during Bun's shared coverage run.
+const poorModeModulePath = '../poorMode.js?poorModeTest'
+const { isPoorModeActive, setPoorMode } = (await import(
+  poorModeModulePath
+)) as typeof import('../poorMode.js')

 // ── Tests ────────────────────────────────────────────────────────────────────

--- a/src/commands/provider.ts
+++ b/src/commands/provider.ts
@@ -15,8 +15,6 @@ function getEnvVarForProvider(provider: string): string {
      return 'CLAUDE_CODE_USE_FOUNDRY'
    case 'gemini':
      return 'CLAUDE_CODE_USE_GEMINI'
-    case 'codex':
-      return 'CLAUDE_CODE_USE_CODEX'
    case 'grok':
      return 'CLAUDE_CODE_USE_GROK'
    default:
@@ -53,7 +51,6 @@ const call: LocalCommandCall = async (args, context) => {
    delete process.env.CLAUDE_CODE_USE_VERTEX
    delete process.env.CLAUDE_CODE_USE_FOUNDRY
    delete process.env.CLAUDE_CODE_USE_OPENAI
-    delete process.env.CLAUDE_CODE_USE_CODEX
    delete process.env.CLAUDE_CODE_USE_GEMINI
    delete process.env.CLAUDE_CODE_USE_GROK
    return {
@@ -66,7 +63,6 @@ const call: LocalCommandCall = async (args, context) => {
  const validProviders = [
    'anthropic',
    'openai',
-    'codex',
    'gemini',
    'grok',
    'bedrock',
@@ -97,18 +93,6 @@ const call: LocalCommandCall = async (args, context) => {
    }
  }

-  if (arg === 'codex') {
-    const mergedEnv = getMergedEnv()
-    const hasKey = !!mergedEnv.CODEX_API_KEY
-    if (!hasKey) {
-      updateSettingsForSource('userSettings', { modelType: 'codex' })
-      return {
-        type: 'text',
-        value: `Switched to OpenAI Responses provider.\nWarning: Missing env var: CODEX_API_KEY\nConfigure via /login, settings.json env, or set manually.`,
-      }
-    }
-  }
-
  // Check env vars when switching to grok (including settings.env)
  if (arg === 'grok') {
    const mergedEnv = getMergedEnv()
@@ -139,24 +123,19 @@ const call: LocalCommandCall = async (args, context) => {
  // Handle different provider types
  // - 'anthropic', 'openai', 'gemini' are stored in settings.json (persistent)
  // - 'bedrock', 'vertex', 'foundry' are env-only (do NOT touch settings.json)
-  if (arg === 'anthropic' || arg === 'openai' || arg === 'codex' || arg === 'gemini' || arg === 'grok') {
+  if (arg === 'anthropic' || arg === 'openai' || arg === 'gemini' || arg === 'grok') {
    // Clear any cloud provider env vars to avoid conflicts
    delete process.env.CLAUDE_CODE_USE_BEDROCK
    delete process.env.CLAUDE_CODE_USE_VERTEX
    delete process.env.CLAUDE_CODE_USE_FOUNDRY
    delete process.env.CLAUDE_CODE_USE_OPENAI
-    delete process.env.CLAUDE_CODE_USE_CODEX
    delete process.env.CLAUDE_CODE_USE_GEMINI
    delete process.env.CLAUDE_CODE_USE_GROK
    // Update settings.json
    updateSettingsForSource('userSettings', { modelType: arg })
    // Ensure settings.env gets applied to process.env
    applyConfigEnvironmentVariables()
-    const message =
-      arg === 'codex' && !getMergedEnv().CODEX_IMGBB_API_KEY
-        ? `API provider set to ${arg}.\nOptional: set CODEX_IMGBB_API_KEY to enable local image uploads for image understanding.`
-        : `API provider set to ${arg}.`
-    return { type: 'text', value: message }
+    return { type: 'text', value: `API provider set to ${arg}.` }
  } else {
    // Cloud providers: set env vars only, do NOT touch settings.json
    delete process.env.CLAUDE_CODE_USE_OPENAI
@@ -178,9 +157,9 @@ const provider = {
  type: 'local',
  name: 'provider',
  description:
-    'Switch API provider (anthropic/openai/codex/gemini/grok/bedrock/vertex/foundry)',
+    'Switch API provider (anthropic/openai/gemini/grok/bedrock/vertex/foundry)',
  aliases: ['api'],
-  argumentHint: '[anthropic|openai|codex|gemini|grok|bedrock|vertex|foundry|unset]',
+  argumentHint: '[anthropic|openai|gemini|grok|bedrock|vertex|foundry|unset]',
  supportsNonInteractive: true,
  load: () => Promise.resolve({ call }),
 } satisfies Command
--- a/src/components/ConsoleOAuthFlow.tsx
+++ b/src/components/ConsoleOAuthFlow.tsx
@@ -55,14 +55,6 @@ type OAuthStatus =
      opusModel: string
      activeField: 'base_url' | 'api_key' | 'haiku_model' | 'sonnet_model' | 'opus_model'
    } // Gemini Generate Content API platform
-  | {
-      state: 'codex_responses_api'
-      baseUrl: string
-      apiKey: string
-      model: string
-      imgbbApiKey: string
-      activeField: 'base_url' | 'api_key' | 'model' | 'imgbb_api_key'
-    } // Codex / Responses API platform
  | { state: 'ready_to_start' } // Flow started, waiting for browser to open
  | { state: 'waiting_for_login'; url: string } // Browser opened, waiting for user to login
  | { state: 'creating_api_key' } // Got access token, creating API key
@@ -464,7 +456,7 @@ function OAuthStatusMessage({
                {
                  label: (
                    <Text>
-                      Anthropic Compatible -{' '}
+                      Anthropic Compatible ·{' '}
                      <Text dimColor>Configure your own API endpoint</Text>
                      {'\n'}
                    </Text>
@@ -474,7 +466,7 @@ function OAuthStatusMessage({
                {
                  label: (
                    <Text>
-                      OpenAI Compatible -{' '}
+                      OpenAI Compatible ·{' '}
                      <Text dimColor>
                        Ollama, DeepSeek, vLLM, One API, etc.
                      </Text>
@@ -486,17 +478,7 @@ function OAuthStatusMessage({
                {
                  label: (
                    <Text>
-                      Codex Responses API -{' '}
-                      <Text dimColor>OpenAI Codex via Responses API</Text>
-                      {'\n'}
-                    </Text>
-                  ),
-                  value: 'codex_responses_api',
-                },
-                {
-                  label: (
-                    <Text>
-                      Gemini API -{' '}
+                      Gemini API ·{' '}
                      <Text dimColor>Google Gemini native REST/SSE</Text>
                      {'\n'}
                    </Text>
@@ -506,7 +488,7 @@ function OAuthStatusMessage({
                {
                  label: (
                    <Text>
-                      Claude account with subscription -{' '}
+                      Claude account with subscription ·{' '}
                      <Text dimColor>Pro, Max, Team, or Enterprise</Text>
                      {process.env.USER_TYPE === 'ant' && (
                        <Text>
@@ -527,7 +509,7 @@ function OAuthStatusMessage({
                {
                  label: (
                    <Text>
-                      Anthropic Console account -{' '}
+                      Anthropic Console account ·{' '}
                      <Text dimColor>API usage billing</Text>
                      {'\n'}
                    </Text>
@@ -537,7 +519,7 @@ function OAuthStatusMessage({
                {
                  label: (
                    <Text>
-                      3rd-party platform -{' '}
+                      3rd-party platform ·{' '}
                      <Text dimColor>
                        Amazon Bedrock, Microsoft Foundry, or Vertex AI
                      </Text>
@@ -581,16 +563,6 @@ function OAuthStatusMessage({
                    opusModel: process.env.GEMINI_DEFAULT_OPUS_MODEL ?? '',
                    activeField: 'base_url',
                  })
-                } else if (value === 'codex_responses_api') {
-                  logEvent('tengu_codex_responses_api_selected', {})
-                  setOAuthStatus({
-                    state: 'codex_responses_api',
-                    baseUrl: process.env.CODEX_BASE_URL ?? '',
-                    apiKey: process.env.CODEX_API_KEY ?? '',
-                    model: process.env.CODEX_MODEL ?? '',
-                    imgbbApiKey: process.env.CODEX_IMGBB_API_KEY ?? '',
-                    activeField: 'base_url',
-                  })
                } else if (value === 'platform') {
                  logEvent('tengu_oauth_platform_selected', {})
                  setOAuthStatus({ state: 'platform_setup' })
@@ -825,7 +797,7 @@ function OAuthStatusMessage({
              {renderRow('opus_model', 'Opus     ')}
            </Box>
            <Text dimColor>
-              ↑↓/Tab to switch - Enter on last field to save - Esc to go back
+              ↑↓/Tab to switch · Enter on last field to save · Esc to go back
            </Text>
          </Box>
        )
@@ -1064,7 +1036,7 @@ function OAuthStatusMessage({
              {renderOpenAIRow('opus_model', 'Opus     ')}
            </Box>
            <Text dimColor>
-              ↑↓/Tab to switch - Enter on last field to save - Esc to go back
+              ↑↓/Tab to switch · Enter on last field to save · Esc to go back
            </Text>
          </Box>
        )
@@ -1297,254 +1269,7 @@ function OAuthStatusMessage({
              {renderGeminiRow('opus_model', 'Opus     ')}
            </Box>
            <Text dimColor>
-              ↑↓/Tab to switch - Enter on last field to save - Esc to go back
-            </Text>
-          </Box>
-        )
-      }
-
-    case 'codex_responses_api':
-      {
-        type CodexField = 'base_url' | 'api_key' | 'model' | 'imgbb_api_key'
-        const CODEX_FIELDS: CodexField[] = [
-          'base_url',
-          'api_key',
-          'model',
-          'imgbb_api_key',
-        ]
-        const cp = oauthStatus as {
-          state: 'codex_responses_api'
-          activeField: CodexField
-          baseUrl: string
-          apiKey: string
-          model: string
-          imgbbApiKey: string
-        }
-        const { activeField, baseUrl, apiKey, model, imgbbApiKey } = cp
-        const codexDisplayValues: Record<CodexField, string> = {
-          base_url: baseUrl,
-          api_key: apiKey,
-          model,
-          imgbb_api_key: imgbbApiKey,
-        }
-
-        const [codexInputValue, setCodexInputValue] = useState(
-          () => codexDisplayValues[activeField],
-        )
-        const [codexInputCursorOffset, setCodexInputCursorOffset] = useState(
-          () => codexDisplayValues[activeField].length,
-        )
-
-        const buildCodexState = useCallback(
-          (field: CodexField, value: string, newActive?: CodexField) => {
-            const state = {
-              state: 'codex_responses_api' as const,
-              activeField: newActive ?? activeField,
-              baseUrl,
-              apiKey,
-              model,
-              imgbbApiKey,
-            }
-            switch (field) {
-              case 'base_url':
-                return { ...state, baseUrl: value }
-              case 'api_key':
-                return { ...state, apiKey: value }
-              case 'model':
-                return { ...state, model: value }
-              case 'imgbb_api_key':
-                return { ...state, imgbbApiKey: value }
-            }
-          },
-          [activeField, apiKey, baseUrl, imgbbApiKey, model],
-        )
-
-        const doCodexSave = useCallback(() => {
-          const finalVals = {
-            ...codexDisplayValues,
-            [activeField]: codexInputValue,
-          }
-          if (!finalVals.base_url || !finalVals.api_key || !finalVals.model) {
-            setOAuthStatus({
-              state: 'error',
-              message:
-                'Codex setup requires CODEX_BASE_URL, CODEX_API_KEY, and CODEX_MODEL.',
-              toRetry: {
-                state: 'codex_responses_api',
-                baseUrl: finalVals.base_url,
-                apiKey: finalVals.api_key,
-                model: finalVals.model,
-                imgbbApiKey: finalVals.imgbb_api_key,
-                activeField,
-              },
-            })
-            return
-          }
-
-          try {
-            new URL(finalVals.base_url)
-          } catch {
-            setOAuthStatus({
-              state: 'error',
-              message:
-                'Invalid base URL: please enter a full URL including protocol (e.g., https://code.ylsagi.com/codex)',
-              toRetry: {
-                state: 'codex_responses_api',
-                baseUrl: finalVals.base_url,
-                apiKey: finalVals.api_key,
-                model: finalVals.model,
-                imgbbApiKey: finalVals.imgbb_api_key,
-                activeField: 'base_url',
-              },
-            })
-            return
-          }
-
-          const env: Record<string, string | undefined> = {
-            CODEX_BASE_URL: finalVals.base_url,
-            CODEX_API_KEY: finalVals.api_key,
-            CODEX_MODEL: finalVals.model,
-            CODEX_IMGBB_API_KEY: finalVals.imgbb_api_key || undefined,
-          }
-          const { error } = updateSettingsForSource('userSettings', {
-            modelType: 'codex' as any,
-            env,
-          } as any)
-          if (error) {
-            setOAuthStatus({
-              state: 'error',
-              message: `Failed to save: ${error.message}`,
-              toRetry: {
-                state: 'codex_responses_api',
-                baseUrl: finalVals.base_url,
-                apiKey: finalVals.api_key,
-                model: finalVals.model,
-                imgbbApiKey: finalVals.imgbb_api_key,
-                activeField,
-              },
-            })
-            return
-          }
-
-          for (const [key, value] of Object.entries(env)) {
-            if (value === undefined) {
-              delete process.env[key]
-            } else {
-              process.env[key] = value
-            }
-          }
-          setOAuthStatus({ state: 'success' })
-          void onDone()
-        }, [activeField, codexDisplayValues, codexInputValue, onDone])
-
-        const handleCodexEnter = useCallback(() => {
-          const idx = CODEX_FIELDS.indexOf(activeField)
-          if (idx === CODEX_FIELDS.length - 1) {
-            setOAuthStatus(buildCodexState(activeField, codexInputValue))
-            doCodexSave()
-          } else {
-            const next = CODEX_FIELDS[idx + 1]!
-            setOAuthStatus(buildCodexState(activeField, codexInputValue, next))
-            setCodexInputValue(codexDisplayValues[next] ?? '')
-            setCodexInputCursorOffset((codexDisplayValues[next] ?? '').length)
-          }
-        }, [
-          activeField,
-          buildCodexState,
-          codexDisplayValues,
-          codexInputValue,
-          doCodexSave,
-        ])
-
-        useKeybinding(
-          'tabs:next',
-          () => {
-            const idx = CODEX_FIELDS.indexOf(activeField)
-            if (idx < CODEX_FIELDS.length - 1) {
-              const next = CODEX_FIELDS[idx + 1]!
-              setOAuthStatus(buildCodexState(activeField, codexInputValue, next))
-              setCodexInputValue(codexDisplayValues[next] ?? '')
-              setCodexInputCursorOffset((codexDisplayValues[next] ?? '').length)
-            }
-          },
-          { context: 'FormField' },
-        )
-        useKeybinding(
-          'tabs:previous',
-          () => {
-            const idx = CODEX_FIELDS.indexOf(activeField)
-            if (idx > 0) {
-              const prev = CODEX_FIELDS[idx - 1]!
-              setOAuthStatus(buildCodexState(activeField, codexInputValue, prev))
-              setCodexInputValue(codexDisplayValues[prev] ?? '')
-              setCodexInputCursorOffset((codexDisplayValues[prev] ?? '').length)
-            }
-          },
-          { context: 'FormField' },
-        )
-        useKeybinding(
-          'confirm:no',
-          () => {
-            setOAuthStatus({ state: 'idle' })
-          },
-          { context: 'Confirmation' },
-        )
-
-        const codexColumns = useTerminalSize().columns - 20
-
-        const renderCodexRow = (
-          field: CodexField,
-          label: string,
-          opts?: { mask?: boolean },
-        ) => {
-          const active = activeField === field
-          const value = codexDisplayValues[field]
-          return (
-            <Box>
-              <Text
-                backgroundColor={active ? 'suggestion' : undefined}
-                color={active ? 'inverseText' : undefined}
-              >
-                {` ${label} `}
-              </Text>
-              <Text> </Text>
-              {active ? (
-                <TextInput
-                  value={codexInputValue}
-                  onChange={setCodexInputValue}
-                  onSubmit={handleCodexEnter}
-                  cursorOffset={codexInputCursorOffset}
-                  onChangeCursorOffset={setCodexInputCursorOffset}
-                  columns={codexColumns}
-                  mask={opts?.mask ? '*' : undefined}
-                  focus={true}
-                />
-              ) : value ? (
-                <Text color="success">
-                  {opts?.mask
-                    ? value.slice(0, 8) + '\u00b7'.repeat(Math.max(0, value.length - 8))
-                    : value}
-                </Text>
-              ) : null}
-            </Box>
-          )
-        }
-
-        return (
-          <Box flexDirection="column" gap={1}>
-            <Text bold>Codex Responses API Setup</Text>
-            <Text dimColor>
-              Configure a Codex-compatible Responses API endpoint. ImgBB is optional
-              and enables local image uploads for image understanding.
-            </Text>
-            <Box flexDirection="column" gap={1}>
-              {renderCodexRow('base_url', 'Base URL ')}
-              {renderCodexRow('api_key', 'API Key  ', { mask: true })}
-              {renderCodexRow('model', 'Model    ')}
-              {renderCodexRow('imgbb_api_key', 'ImgBB Key', { mask: true })}
-            </Box>
-            <Text dimColor>
-              ↑↓/Tab to switch - Enter on last field to save - Esc to go back
+              ↑↓/Tab to switch · Enter on last field to save · Esc to go back
            </Text>
          </Box>
        )
@@ -1570,19 +1295,19 @@ function OAuthStatusMessage({
            <Box flexDirection="column" marginTop={1}>
              <Text bold>Documentation:</Text>
              <Text>
-                - Amazon Bedrock:{' '}
+                · Amazon Bedrock:{' '}
                <Link url="https://code.claude.com/docs/en/amazon-bedrock">
                  https://code.claude.com/docs/en/amazon-bedrock
                </Link>
              </Text>
              <Text>
-                - Microsoft Foundry:{' '}
+                · Microsoft Foundry:{' '}
                <Link url="https://code.claude.com/docs/en/microsoft-foundry">
                  https://code.claude.com/docs/en/microsoft-foundry
                </Link>
              </Text>
              <Text>
-                - Vertex AI:{' '}
+                · Vertex AI:{' '}
                <Link url="https://code.claude.com/docs/en/google-vertex-ai">
                  https://code.claude.com/docs/en/google-vertex-ai
                </Link>
--- a/src/components/Onboarding.tsx
+++ b/src/components/Onboarding.tsx
@@ -15,7 +15,6 @@ import { normalizeApiKeyForConfig } from '../utils/authPortable.js'
 import { getCustomApiKeyStatus } from '../utils/config.js'
 import { env } from '../utils/env.js'
 import { isRunningOnHomespace } from '../utils/envUtils.js'
-import { gracefulShutdownSync } from '../utils/gracefulShutdown.js'
 import { PreflightStep } from '../utils/preflightChecks.js'
 import type { ThemeSetting } from '../utils/theme.js'
 import { ApproveApiKey } from './ApproveApiKey.js'
@@ -75,9 +74,7 @@ export function Onboarding({ onDone }: Props): React.ReactNode {
    goToNextStep()
  }

-  const exitState = useExitOnCtrlCDWithKeybindings(() =>
-    gracefulShutdownSync(0),
-  )
+  const exitState = useExitOnCtrlCDWithKeybindings()

  // Define all onboarding steps
  const themeStep = (
--- a/src/components/ThemePicker.tsx
+++ b/src/components/ThemePicker.tsx
@@ -75,12 +75,9 @@ export function ThemePicker({
    },
    { context: 'ThemePicker' },
  )
-  // When onboarding owns exit handling, keep this hook inactive so its
-  // ThemePicker-scoped keybindings don't swallow the parent Global handler.
+  // Always call the hook to follow React rules, but conditionally assign the exit handler
  const exitState = useExitOnCtrlCDWithKeybindings(
-    undefined,
-    undefined,
-    !skipExitHandling,
+    skipExitHandling ? () => {} : undefined,
  )

  const themeOptions: { label: string; value: ThemeSetting }[] = [
--- a/src/screens/REPL.tsx
+++ b/src/screens/REPL.tsx
@@ -3051,22 +3051,12 @@ export function REPL({
            // are O(n) per render, so drop everything before the previous
            // boundary to keep n bounded across multi-day sessions.
            if (isFullscreenEnvEnabled()) {
-              setMessages(old => {
-                const postBoundary = getMessagesAfterCompactBoundary(old, {
+              setMessages(old => [
+                ...getMessagesAfterCompactBoundary(old, {
                  includeSnipped: true,
-                })
-                // Hard cap: keep at most 500 messages in fullscreen scrollback
-                // to prevent unbounded memory growth in multi-day sessions.
-                // normalizeMessages/applyGrouping are O(n), and Ink fiber
-                // trees cost ~250KB RSS per message. Without this cap,
-                // scrollback after several compactions can reach thousands
-                // of messages (observed: 13k+, 1GB+ heap).
-                const MAX_FULLSCREEN_SCROLLBACK = 500
-                const kept = postBoundary.length > MAX_FULLSCREEN_SCROLLBACK
-                  ? postBoundary.slice(-MAX_FULLSCREEN_SCROLLBACK)
-                  : postBoundary
-                return [...kept, newMessage]
-              });
+                }),
+                newMessage,
+              ]);
            } else {
              setMessages(() => [newMessage]);
            }
@@ -3092,23 +3082,17 @@ export function REPL({
            // history). Replacing those leaves the AgentTool UI stuck at
            // "Initializing…" because it renders the full progress trail.
            setMessages(oldMessages => {
+              const last = oldMessages.at(-1);
+              const lastData = last?.data as Record<string, unknown> | undefined;
              const newData = newMessage.data as Record<string, unknown>;
-              // Scan backwards to find the last ephemeral progress with matching
-              // parentToolUseID and type. Previously only checked the last message,
-              // so interleaved non-ephemeral messages caused duplicate progress
-              // entries to accumulate (observed 13k+ entries in sleep-heavy sessions).
-              for (let i = oldMessages.length - 1; i >= 0; i--) {
-                const m = oldMessages[i]!
-                if (m.type !== 'progress') break
-                const mData = m.data as Record<string, unknown> | undefined
-                if (
-                  m.parentToolUseID === newMessage.parentToolUseID &&
-                  mData?.type === newData.type
-                ) {
-                  const copy = oldMessages.slice();
-                  copy[i] = newMessage;
-                  return copy;
-                }
+              if (
+                last?.type === 'progress' &&
+                last.parentToolUseID === newMessage.parentToolUseID &&
+                lastData?.type === newData.type
+              ) {
+                const copy = oldMessages.slice();
+                copy[copy.length - 1] = newMessage;
+                return copy;
              }
              return [...oldMessages, newMessage];
            });
--- a/src/services/AgentSummary/tests/agentSummary.test.ts
+++ b/src/services/AgentSummary/tests/agentSummary.test.ts
@@ -0,0 +1,212 @@
+import { beforeEach, describe, expect, test } from 'bun:test'
+import { asAgentId } from '../../../types/ids.js'
+import type { Message } from '../../../types/message.js'
+import type {
+  CacheSafeParams,
+  ForkedAgentResult,
+} from '../../../utils/forkedAgent.js'
+import {
+  type AgentSummaryDependencies,
+  startAgentSummarization,
+} from '../agentSummary.js'
+
+const transcriptMessages = [
+  { type: 'user', message: { content: 'start' }, uuid: 'u1' },
+  {
+    type: 'assistant',
+    message: { content: [{ type: 'text', text: 'working' }] },
+    uuid: 'a1',
+  },
+  { type: 'user', message: { content: 'continue' }, uuid: 'u2' },
+] as unknown as Message[]
+
+type ForkCall = {
+  cacheSafeParams: CacheSafeParams
+}
+
+describe('startAgentSummarization', () => {
+  let scheduled: (() => void | Promise<void>) | undefined
+  let handle: { stop: () => void } | undefined
+  let forkCalls: ForkCall[]
+  let updateCalls: Array<{ taskId: string; summary: string }>
+  let transcriptMessagesForTest: Message[]
+  let debugLogs: string[]
+  let loggedErrors: Error[]
+  let clearedHandles: unknown[]
+
+  function startTestSummarization(
+    dependencies: AgentSummaryDependencies = {},
+  ): { stop: () => void } {
+    return startAgentSummarization(
+      'task-1',
+      asAgentId('a0000000000000000'),
+      {
+        forkContextMessages: [
+          { type: 'user', message: { content: 'stale' }, uuid: 'old' },
+        ],
+        model: 'claude-test',
+      } as unknown as CacheSafeParams,
+      () => undefined,
+      {
+        clearTimeout: ((timeoutId: unknown) => {
+          clearedHandles.push(timeoutId)
+        }) as typeof clearTimeout,
+        getAgentTranscript: async () => ({
+          messages: transcriptMessagesForTest,
+          contentReplacements: [],
+        }),
+        isPoorModeActive: () => false,
+        logError: error => {
+          loggedErrors.push(
+            error instanceof Error ? error : new Error(String(error)),
+          )
+        },
+        logForDebugging: message => {
+          debugLogs.push(message)
+        },
+        runForkedAgent: async (args: ForkCall) => {
+          forkCalls.push(args)
+          return {
+            messages: [
+              {
+                type: 'assistant',
+                message: {
+                  content: [{ type: 'text', text: 'Reading udsClient.ts' }],
+                },
+              },
+            ],
+          } as unknown as ForkedAgentResult
+        },
+        setTimeout: ((callback: TimerHandler) => {
+          if (typeof callback !== 'function') {
+            throw new Error('Expected timer callback')
+          }
+          scheduled = callback as () => void | Promise<void>
+          return 1 as unknown as ReturnType<typeof setTimeout>
+        }) as unknown as typeof setTimeout,
+        updateAgentSummary: (taskId: string, summary: string) => {
+          updateCalls.push({ taskId, summary })
+        },
+        ...dependencies,
+      },
+    )
+  }
+
+  beforeEach(() => {
+    forkCalls = []
+    updateCalls = []
+    scheduled = undefined
+    handle = undefined
+    transcriptMessagesForTest = transcriptMessages
+    debugLogs = []
+    loggedErrors = []
+    clearedHandles = []
+  })
+
+  test('summarizes bounded transcript once and skips unchanged fingerprints', async () => {
+    handle = startTestSummarization()
+
+    expect(typeof scheduled).toBe('function')
+    await scheduled!()
+
+    expect(forkCalls).toHaveLength(1)
+    expect(updateCalls).toEqual([
+      { taskId: 'task-1', summary: 'Reading udsClient.ts' },
+    ])
+
+    const forkContext = forkCalls[0].cacheSafeParams.forkContextMessages ?? []
+    expect(forkContext.map(message => String(message.uuid))).toEqual([
+      'u1',
+      'a1',
+      'u2',
+    ])
+    expect(forkContext.some(message => String(message.uuid) === 'old')).toBe(
+      false,
+    )
+
+    await scheduled!()
+
+    expect(forkCalls).toHaveLength(1)
+    expect(updateCalls).toHaveLength(1)
+  })
+
+  test('skips summarization when filtering leaves too little bounded context', async () => {
+    transcriptMessagesForTest = [
+      { type: 'user', message: { content: 'start' }, uuid: 'u1' },
+      {
+        type: 'assistant',
+        uuid: 'a1',
+        message: {
+          content: [{ type: 'tool_use', id: 'missing', name: 'Read' }],
+        },
+      },
+      { type: 'user', message: { content: 'continue' }, uuid: 'u2' },
+    ] as unknown as Message[]
+
+    handle = startTestSummarization()
+
+    expect(typeof scheduled).toBe('function')
+    await scheduled!()
+
+    expect(forkCalls).toEqual([])
+    expect(updateCalls).toEqual([])
+    expect(debugLogs).toContain(
+      '[AgentSummary] Skipping summary for task-1: no bounded context available',
+    )
+  })
+
+  test('skips summarization before building context when transcript is too short', async () => {
+    transcriptMessagesForTest = transcriptMessages.slice(0, 2)
+    handle = startTestSummarization()
+
+    expect(typeof scheduled).toBe('function')
+    await scheduled!()
+
+    expect(forkCalls).toEqual([])
+    expect(updateCalls).toEqual([])
+    expect(debugLogs).toContain(
+      '[AgentSummary] Skipping summary for task-1: not enough messages (2)',
+    )
+  })
+
+  test('skips and reschedules while poor mode is active', async () => {
+    handle = startTestSummarization({
+      isPoorModeActive: () => true,
+    })
+
+    expect(typeof scheduled).toBe('function')
+    await scheduled!()
+
+    expect(forkCalls).toEqual([])
+    expect(updateCalls).toEqual([])
+    expect(debugLogs).toContain(
+      '[AgentSummary] Skipping summary — poor mode active',
+    )
+  })
+
+  test('logs summary errors and keeps the next timer owned by the summarizer', async () => {
+    const error = new Error('fork failed')
+    handle = startTestSummarization({
+      runForkedAgent: async () => {
+        throw error
+      },
+    })
+
+    expect(typeof scheduled).toBe('function')
+    await scheduled!()
+
+    expect(loggedErrors).toEqual([error])
+    expect(updateCalls).toEqual([])
+  })
+
+  test('stop clears the pending summary timer', () => {
+    handle = startTestSummarization()
+
+    handle.stop()
+
+    expect(debugLogs).toContain(
+      '[AgentSummary] Stopping summarization for task-1',
+    )
+    expect(clearedHandles).toEqual([1])
+  })
+})
--- a/src/services/AgentSummary/tests/summaryContext.test.ts
+++ b/src/services/AgentSummary/tests/summaryContext.test.ts
@@ -0,0 +1,268 @@
+import { describe, expect, test } from 'bun:test'
+import type { Message } from '../../../types/message.js'
+import {
+  buildSummaryContext,
+  estimateMessageChars,
+  getSummaryContextFingerprint,
+  MAX_SUMMARY_CONTEXT_CHARS,
+  selectSummaryContextMessages,
+} from '../summaryContext.js'
+
+function makeMessage(
+  type: 'user' | 'assistant',
+  uuid: string,
+  content: string,
+): Message {
+  return {
+    type,
+    uuid,
+    message: {
+      role: type,
+      content,
+    },
+  } as unknown as Message
+}
+
+describe('selectSummaryContextMessages', () => {
+  test('keeps a bounded recent suffix that starts with a user message', () => {
+    const messages = [
+      makeMessage('assistant', 'a0', 'older assistant'),
+      makeMessage('user', 'u1', 'first prompt'),
+      makeMessage('assistant', 'a1', 'first response'),
+      makeMessage('user', 'u2', 'second prompt'),
+      makeMessage('assistant', 'a2', 'second response'),
+    ]
+
+    const selected = selectSummaryContextMessages(messages, {
+      maxMessages: 3,
+      maxChars: 1_000,
+    })
+
+    expect(selected.map(message => String(message.uuid))).toEqual(['u2', 'a2'])
+  })
+
+  test('returns no context when the newest message exceeds the byte budget', () => {
+    const messages = [
+      makeMessage('user', 'u1', 'first prompt'),
+      makeMessage('assistant', 'a1', 'x'.repeat(100)),
+    ]
+
+    const selected = selectSummaryContextMessages(messages, {
+      maxMessages: 10,
+      maxChars: 10,
+    })
+
+    expect(selected).toEqual([])
+  })
+
+  test('uses serialized message size for nested content budgets', () => {
+    const messages = [
+      makeMessage('user', 'u1', 'first prompt'),
+      {
+        ...makeMessage('assistant', 'a1', 'short'),
+        nested: {
+          payload: Array.from({ length: 50 }, (_value, index) => ({
+            index,
+            text: 'x'.repeat(20),
+          })),
+        },
+      } as unknown as Message,
+    ]
+
+    const selected = selectSummaryContextMessages(messages, {
+      maxMessages: 10,
+      maxChars: 200,
+    })
+
+    expect(selected).toEqual([])
+  })
+
+  test('stops at an older oversized message after keeping the recent suffix', () => {
+    const messages = [
+      makeMessage('user', 'u1', 'x'.repeat(5_000)),
+      makeMessage('user', 'u2', 'small prompt'),
+      makeMessage('assistant', 'a2', 'small answer'),
+    ]
+
+    const selected = selectSummaryContextMessages(messages, {
+      maxMessages: 10,
+      maxChars: 1_000,
+    })
+
+    expect(selected.map(message => String(message.uuid))).toEqual(['u2', 'a2'])
+  })
+
+  test('drops leading orphan tool results after bounding', () => {
+    const messages = [
+      makeMessage('assistant', 'a0', 'older assistant'),
+      {
+        type: 'user',
+        uuid: 'u1',
+        message: {
+          role: 'user',
+          content: [
+            { type: 'tool_result', tool_use_id: 'tool-1', content: 'ok' },
+          ],
+        },
+      } as unknown as Message,
+      makeMessage('assistant', 'a1', 'after orphan'),
+      makeMessage('user', 'u2', 'next prompt'),
+    ]
+
+    const selected = selectSummaryContextMessages(messages, {
+      maxMessages: 3,
+      maxChars: 1_000,
+    })
+
+    expect(selected.map(message => String(message.uuid))).toEqual(['u2'])
+  })
+})
+
+describe('getSummaryContextFingerprint', () => {
+  test('estimates circular messages as unbounded', () => {
+    const circular = makeMessage('assistant', 'a1', 'cycle') as Message & {
+      self?: unknown
+    }
+    circular.self = circular
+
+    expect(estimateMessageChars(circular)).toBe(Number.POSITIVE_INFINITY)
+  })
+
+  test('ignores non-json primitive fields in size estimates', () => {
+    const message = makeMessage('assistant', 'a1', 'metadata') as Message & {
+      skipUndefined?: undefined
+      skipFunction?: () => void
+      skipSymbol?: symbol
+    }
+    message.skipUndefined = undefined
+    message.skipFunction = () => undefined
+    message.skipSymbol = Symbol('ignored')
+
+    expect(estimateMessageChars(message)).toBeGreaterThan(0)
+  })
+
+  test('treats unsupported top-level primitives as zero-size estimates', () => {
+    expect(
+      estimateMessageChars((() => undefined) as unknown as Message),
+    ).toBe(0)
+    expect(estimateMessageChars(1n as unknown as Message)).toBe(0)
+  })
+
+  test('returns null for an empty transcript', () => {
+    expect(getSummaryContextFingerprint([])).toBeNull()
+  })
+
+  test('changes when the transcript grows', () => {
+    const messages = [
+      makeMessage('user', 'u1', 'first prompt'),
+      makeMessage('assistant', 'a1', 'first response'),
+    ]
+
+    const first = getSummaryContextFingerprint(messages)
+    const second = getSummaryContextFingerprint([
+      ...messages,
+      makeMessage('user', 'u2', 'next prompt'),
+    ])
+    expect(first?.startsWith('2:a1:')).toBe(true)
+    expect(second?.startsWith('3:u2:')).toBe(true)
+    expect(first).not.toBe(second)
+  })
+
+  test('changes when message content changes under the same uuid', () => {
+    const first = getSummaryContextFingerprint([
+      makeMessage('user', 'u1', 'first prompt'),
+      makeMessage('assistant', 'a1', 'first response'),
+    ])
+    const second = getSummaryContextFingerprint([
+      makeMessage('user', 'u1', 'first prompt'),
+      makeMessage('assistant', 'a1', 'updated response'),
+    ])
+
+    expect(first).not.toBe(second)
+  })
+
+  test('includes a truncation marker for oversized primitive values', () => {
+    const prefix = 'x'.repeat(MAX_SUMMARY_CONTEXT_CHARS + 100)
+    const first = getSummaryContextFingerprint([
+      makeMessage('assistant', 'a1', `${prefix}a`),
+    ])
+    const second = getSummaryContextFingerprint([
+      makeMessage('assistant', 'a1', `${prefix}b`),
+    ])
+
+    expect(first).not.toBe(second)
+  })
+
+  test('fingerprints circular message references without recursing forever', () => {
+    const circular = makeMessage('assistant', 'a1', 'cycle') as Message & {
+      self?: unknown
+    }
+    circular.self = circular
+
+    expect(getSummaryContextFingerprint([circular])).toContain(':a1:')
+  })
+})
+
+describe('buildSummaryContext', () => {
+  test('returns bounded messages and fingerprint for summarizable context', () => {
+    const messages = [
+      { type: 'user', uuid: 'u1', message: { content: 'start' } },
+      {
+        type: 'assistant',
+        uuid: 'a1',
+        message: { content: [{ type: 'text', text: 'working' }] },
+      },
+      { type: 'user', uuid: 'u2', message: { content: 'continue' } },
+    ] as unknown as Message[]
+
+    const result = buildSummaryContext(messages, null)
+
+    expect(result.skipReason).toBeUndefined()
+    expect(result.messages.map(message => String(message.uuid))).toEqual([
+      'u1',
+      'a1',
+      'u2',
+    ])
+    expect(result.fingerprint).toContain('3:u2:')
+  })
+
+  test('reports unchanged contexts by fingerprint', () => {
+    const messages = [
+      { type: 'user', uuid: 'u1', message: { content: 'start' } },
+      {
+        type: 'assistant',
+        uuid: 'a1',
+        message: { content: [{ type: 'text', text: 'working' }] },
+      },
+      { type: 'user', uuid: 'u2', message: { content: 'continue' } },
+    ] as unknown as Message[]
+    const first = buildSummaryContext(messages, null)
+
+    const second = buildSummaryContext(messages, first.fingerprint)
+
+    expect(second.skipReason).toBe('unchanged')
+    expect(second.fingerprint).toBe(first.fingerprint)
+  })
+
+  test('filters incomplete tool calls before deciding context is too small', () => {
+    const messages = [
+      { type: 'user', uuid: 'u1', message: { content: 'start' } },
+      {
+        type: 'assistant',
+        uuid: 'a1',
+        message: {
+          content: [{ type: 'tool_use', id: 'missing', name: 'Read' }],
+        },
+      },
+      { type: 'user', uuid: 'u2', message: { content: 'continue' } },
+    ] as unknown as Message[]
+
+    const result = buildSummaryContext(messages, null)
+
+    expect(result.skipReason).toBe('too_small')
+    expect(result.messages.map(message => String(message.uuid))).toEqual([
+      'u1',
+      'u2',
+    ])
+  })
+})
--- a/src/services/AgentSummary/tests/summaryPrompt.test.ts
+++ b/src/services/AgentSummary/tests/summaryPrompt.test.ts
@@ -0,0 +1,34 @@
+import { describe, expect, test } from 'bun:test'
+import {
+  buildSummaryPrompt,
+  createSummaryPromptMessage,
+} from '../summaryPrompt.js'
+
+describe('buildSummaryPrompt', () => {
+  test('builds the first summary prompt without previous-summary pressure', () => {
+    const prompt = buildSummaryPrompt(null)
+
+    expect(prompt).toContain('Describe your most recent action')
+    expect(prompt).toContain('Good: "Reading runAgent.ts"')
+    expect(prompt).not.toContain('Previous:')
+  })
+
+  test('asks for a new summary when a previous one exists', () => {
+    const prompt = buildSummaryPrompt('Reading udsMessaging.ts')
+
+    expect(prompt).toContain('Previous: "Reading udsMessaging.ts"')
+    expect(prompt).toContain('say something NEW')
+  })
+})
+
+describe('createSummaryPromptMessage', () => {
+  test('creates the minimal user message shape used by forked summaries', () => {
+    const message = createSummaryPromptMessage('Summarize progress')
+
+    expect(message.type).toBe('user')
+    expect(message.message.role).toBe('user')
+    expect(message.message.content).toBe('Summarize progress')
+    expect(message.uuid).toBeString()
+    expect(message.timestamp).toBeString()
+  })
+})
--- a/src/services/AgentSummary/agentSummary.ts
+++ b/src/services/AgentSummary/agentSummary.ts
@@ -13,7 +13,6 @@
 import type { TaskContext } from '../../Task.js'
 import { isPoorModeActive } from '../../commands/poor/poorMode.js'
 import { updateAgentSummary } from '../../tasks/LocalAgentTask/LocalAgentTask.js'
-import { filterIncompleteToolCalls } from '@claude-code-best/builtin-tools/tools/AgentTool/runAgent.js'
 import type { AgentId } from '../../types/ids.js'
 import { logForDebugging } from '../../utils/debug.js'
 import {
@@ -21,34 +20,32 @@ import {
  runForkedAgent,
 } from '../../utils/forkedAgent.js'
 import { logError } from '../../utils/log.js'
-import { createUserMessage } from '../../utils/messages.js'
 import { getAgentTranscript } from '../../utils/sessionStorage.js'
+import { buildSummaryContext } from './summaryContext.js'
+import {
+  buildSummaryPrompt,
+  createSummaryPromptMessage,
+} from './summaryPrompt.js'

 const SUMMARY_INTERVAL_MS = 30_000

-function buildSummaryPrompt(previousSummary: string | null): string {
-  const prevLine = previousSummary
-    ? `\nPrevious: "${previousSummary}" — say something NEW.\n`
-    : ''
-
-  return `Describe your most recent action in 3-5 words using present tense (-ing). Name the file or function, not the branch. Do not use tools.
-${prevLine}
-Good: "Reading runAgent.ts"
-Good: "Fixing null check in validate.ts"
-Good: "Running auth module tests"
-Good: "Adding retry logic to fetchUser"
-
-Bad (past tense): "Analyzed the branch diff"
-Bad (too vague): "Investigating the issue"
-Bad (too long): "Reviewing full branch diff and AgentTool.tsx integration"
-Bad (branch name): "Analyzed adam/background-summary branch diff"`
-}
+export type AgentSummaryDependencies = Partial<{
+  clearTimeout: typeof clearTimeout
+  getAgentTranscript: typeof getAgentTranscript
+  isPoorModeActive: typeof isPoorModeActive
+  logError: typeof logError
+  logForDebugging: typeof logForDebugging
+  runForkedAgent: typeof runForkedAgent
+  setTimeout: typeof setTimeout
+  updateAgentSummary: typeof updateAgentSummary
+}>

 export function startAgentSummarization(
  taskId: string,
  agentId: AgentId,
  cacheSafeParams: CacheSafeParams,
  setAppState: TaskContext['setAppState'],
+  dependencies: AgentSummaryDependencies = {},
 ): { stop: () => void } {
  // Drop forkContextMessages from the closure — runSummary rebuilds it each
  // tick from getAgentTranscript(). Without this, the original fork messages
@@ -58,39 +55,67 @@ export function startAgentSummarization(
  let timeoutId: ReturnType<typeof setTimeout> | null = null
  let stopped = false
  let previousSummary: string | null = null
+  let lastHandledTranscriptFingerprint: string | null = null
+  const clearTimeoutImpl = dependencies.clearTimeout ?? clearTimeout
+  const getAgentTranscriptImpl =
+    dependencies.getAgentTranscript ?? getAgentTranscript
+  const isPoorModeActiveImpl =
+    dependencies.isPoorModeActive ?? isPoorModeActive
+  const logErrorImpl = dependencies.logError ?? logError
+  const logForDebuggingImpl =
+    dependencies.logForDebugging ?? logForDebugging
+  const runForkedAgentImpl = dependencies.runForkedAgent ?? runForkedAgent
+  const setTimeoutImpl = dependencies.setTimeout ?? setTimeout
+  const updateAgentSummaryImpl =
+    dependencies.updateAgentSummary ?? updateAgentSummary

  async function runSummary(): Promise<void> {
    if (stopped) return
-    if (isPoorModeActive()) {
-      logForDebugging('[AgentSummary] Skipping summary — poor mode active')
+    if (isPoorModeActiveImpl()) {
+      logForDebuggingImpl('[AgentSummary] Skipping summary — poor mode active')
      scheduleNext()
      return
    }

-    logForDebugging(`[AgentSummary] Timer fired for agent ${agentId}`)
+    logForDebuggingImpl(`[AgentSummary] Timer fired for agent ${agentId}`)

    try {
      // Read current messages from transcript
-      const transcript = await getAgentTranscript(agentId)
+      const transcript = await getAgentTranscriptImpl(agentId)
      if (!transcript || transcript.messages.length < 3) {
        // Not enough context yet — finally block will schedule next attempt
-        logForDebugging(
+        logForDebuggingImpl(
          `[AgentSummary] Skipping summary for ${taskId}: not enough messages (${transcript?.messages.length ?? 0})`,
        )
        return
      }

-      // Filter to clean message state
-      const cleanMessages = filterIncompleteToolCalls(transcript.messages)
+      const summaryContext = buildSummaryContext(
+        transcript.messages,
+        lastHandledTranscriptFingerprint,
+      )
+      if (summaryContext.skipReason === 'unchanged') {
+        logForDebuggingImpl(
+          `[AgentSummary] Skipping summary for ${taskId}: transcript unchanged`,
+        )
+        return
+      }
+
+      if (summaryContext.skipReason === 'too_small') {
+        logForDebuggingImpl(
+          `[AgentSummary] Skipping summary for ${taskId}: no bounded context available`,
+        )
+        return
+      }

      // Build fork params with current messages
      const forkParams: CacheSafeParams = {
        ...baseParams,
-        forkContextMessages: cleanMessages,
+        forkContextMessages: summaryContext.messages,
      }

-      logForDebugging(
-        `[AgentSummary] Forking for summary, ${cleanMessages.length} messages in context`,
+      logForDebuggingImpl(
+        `[AgentSummary] Forking for summary, ${summaryContext.messages.length} messages in context`,
      )

      // Create abort controller for this summary
@@ -112,9 +137,9 @@ export function startAgentSummarization(
      // ContentReplacementState is cloned by default in createSubagentContext
      // from forkParams.toolUseContext (the subagent's LIVE state captured at
      // onCacheSafeParams time). No explicit override needed.
-      const result = await runForkedAgent({
+      const result = await runForkedAgentImpl({
        promptMessages: [
-          createUserMessage({ content: buildSummaryPrompt(previousSummary) }),
+          createSummaryPromptMessage(buildSummaryPrompt(previousSummary)),
        ],
        cacheSafeParams: forkParams,
        canUseTool,
@@ -136,21 +161,24 @@ export function startAgentSummarization(
          )
          continue
        }
-        const contentArr = Array.isArray(msg.message!.content) ? msg.message!.content : []
+        const contentArr = Array.isArray(msg.message!.content)
+          ? msg.message!.content
+          : []
        const textBlock = contentArr.find(b => b.type === 'text')
        if (textBlock?.type === 'text' && textBlock.text.trim()) {
          const summaryText = textBlock.text.trim()
-          logForDebugging(
+          logForDebuggingImpl(
            `[AgentSummary] Summary result for ${taskId}: ${summaryText}`,
          )
+          lastHandledTranscriptFingerprint = summaryContext.fingerprint
          previousSummary = summaryText
-          updateAgentSummary(taskId, summaryText, setAppState)
+          updateAgentSummaryImpl(taskId, summaryText, setAppState)
          break
        }
      }
    } catch (e) {
      if (!stopped && e instanceof Error) {
-        logError(e)
+        logErrorImpl(e)
      }
    } finally {
      summaryAbortController = null
@@ -163,14 +191,14 @@ export function startAgentSummarization(

  function scheduleNext(): void {
    if (stopped) return
-    timeoutId = setTimeout(runSummary, SUMMARY_INTERVAL_MS)
+    timeoutId = setTimeoutImpl(runSummary, SUMMARY_INTERVAL_MS)
  }

  function stop(): void {
-    logForDebugging(`[AgentSummary] Stopping summarization for ${taskId}`)
+    logForDebuggingImpl(`[AgentSummary] Stopping summarization for ${taskId}`)
    stopped = true
    if (timeoutId) {
-      clearTimeout(timeoutId)
+      clearTimeoutImpl(timeoutId)
      timeoutId = null
    }
    if (summaryAbortController) {
--- a/src/services/AgentSummary/summaryContext.ts
+++ b/src/services/AgentSummary/summaryContext.ts
@@ -0,0 +1,219 @@
+import { createHash } from 'node:crypto'
+import { filterIncompleteToolCalls } from '@claude-code-best/builtin-tools/tools/AgentTool/filterIncompleteToolCalls.js'
+import type { Message } from '../../types/message.js'
+
+export const MAX_SUMMARY_CONTEXT_MESSAGES = 120
+export const MAX_SUMMARY_CONTEXT_CHARS = 200_000
+
+function estimateJsonChars(
+  value: unknown,
+  limit: number,
+  seen = new Set<object>(),
+): number {
+  if (value === null) return 4
+  switch (typeof value) {
+    case 'string':
+      return value.length + 2
+    case 'number':
+    case 'boolean':
+      return String(value).length
+    case 'undefined':
+    case 'function':
+    case 'symbol':
+      return 0
+    case 'object': {
+      if (seen.has(value)) return Number.POSITIVE_INFINITY
+      seen.add(value)
+      let total = 2
+      if (Array.isArray(value)) {
+        for (let index = 0; index < value.length; index++) {
+          total += String(index).length + 3
+          total += estimateJsonChars(value[index], limit - total, seen)
+          if (total > limit) return total
+        }
+      } else {
+        const record = value as Record<string, unknown>
+        for (const key in record) {
+          if (!Object.hasOwn(record, key)) continue
+          total += key.length + 3
+          total += estimateJsonChars(record[key], limit - total, seen)
+          if (total > limit) return total
+        }
+      }
+      seen.delete(value)
+      return total
+    }
+  }
+  return 0
+}
+
+function updateFingerprintHash(
+  hash: ReturnType<typeof createHash>,
+  value: unknown,
+  limit: { remaining: number },
+  seen = new Set<object>(),
+): void {
+  if (limit.remaining <= 0) return
+  if (value === null || typeof value !== 'object') {
+    const text = String(value)
+    const consumed = Math.min(text.length, limit.remaining)
+    if (consumed <= 0) return
+    hash.update(typeof value)
+    hash.update(':')
+    hash.update(text.slice(0, consumed))
+    if (consumed < text.length) {
+      hash.update(`#truncated:${text.length}:${text.slice(-64)}`)
+    }
+    limit.remaining -= consumed
+    return
+  }
+  if (seen.has(value)) {
+    hash.update('[Circular]')
+    return
+  }
+  seen.add(value)
+  if (Array.isArray(value)) {
+    for (let index = 0; index < value.length; index++) {
+      if (limit.remaining <= 0) break
+      const key = String(index)
+      hash.update(key)
+      limit.remaining -= key.length
+      updateFingerprintHash(hash, value[index], limit, seen)
+    }
+  } else {
+    const record = value as Record<string, unknown>
+    for (const key in record) {
+      if (limit.remaining <= 0) break
+      if (!Object.hasOwn(record, key)) continue
+      hash.update(key)
+      limit.remaining -= key.length
+      updateFingerprintHash(hash, record[key], limit, seen)
+    }
+  }
+  seen.delete(value)
+}
+
+export function estimateMessageChars(
+  message: Message,
+  limit = Number.POSITIVE_INFINITY,
+): number {
+  const estimated = estimateJsonChars(message, limit)
+  if (!Number.isFinite(estimated)) {
+    return Number.POSITIVE_INFINITY
+  }
+  return estimated
+}
+
+function hasToolResultBlock(message: Message): boolean {
+  if (message.type !== 'user') return false
+  const content = message.message?.content
+  return (
+    Array.isArray(content) &&
+    content.some(block => {
+      return Boolean(
+        block &&
+          typeof block === 'object' &&
+          'type' in block &&
+          block.type === 'tool_result',
+      )
+    })
+  )
+}
+
+export function getSummaryContextFingerprint(
+  messages: Message[],
+): string | null {
+  const lastMessage = messages.at(-1)
+  if (!lastMessage) return null
+  const hash = createHash('sha256')
+  updateFingerprintHash(hash, messages, {
+    remaining: MAX_SUMMARY_CONTEXT_CHARS,
+  })
+  return `${messages.length}:${lastMessage.uuid}:${hash.digest('hex').slice(0, 16)}`
+}
+
+export function selectSummaryContextMessages(
+  messages: Message[],
+  limits: {
+    maxMessages?: number
+    maxChars?: number
+  } = {},
+): Message[] {
+  const maxMessages = limits.maxMessages ?? MAX_SUMMARY_CONTEXT_MESSAGES
+  const maxChars = limits.maxChars ?? MAX_SUMMARY_CONTEXT_CHARS
+  if (maxMessages <= 0 || maxChars <= 0) return []
+
+  const selected: Message[] = []
+  let selectedChars = 0
+
+  for (let i = messages.length - 1; i >= 0; i--) {
+    const message = messages[i]
+    if (!message) continue
+
+    const messageChars = estimateMessageChars(message, maxChars - selectedChars)
+    if (messageChars > maxChars) {
+      if (selected.length === 0) return []
+      break
+    }
+
+    if (
+      selected.length >= maxMessages ||
+      selectedChars + messageChars > maxChars
+    ) {
+      break
+    }
+
+    selected.unshift(message)
+    selectedChars += messageChars
+  }
+
+  while (selected.length > 0) {
+    const first = selected[0]
+    if (!first) break
+    if (first.type !== 'user' || hasToolResultBlock(first)) {
+      selected.shift()
+      continue
+    }
+    break
+  }
+
+  return selected
+}
+
+export type SummaryContextBuildResult = {
+  messages: Message[]
+  fingerprint: string | null
+  skipReason?: 'too_small' | 'unchanged'
+}
+
+export function buildSummaryContext(
+  messages: Message[],
+  previousFingerprint: string | null,
+): SummaryContextBuildResult {
+  const cleanMessages = filterIncompleteToolCalls(messages)
+  const boundedMessages = filterIncompleteToolCalls(
+    selectSummaryContextMessages(cleanMessages),
+  )
+  const fingerprint = getSummaryContextFingerprint(boundedMessages)
+
+  if (fingerprint && fingerprint === previousFingerprint) {
+    return {
+      messages: boundedMessages,
+      fingerprint,
+      skipReason: 'unchanged',
+    }
+  }
+
+  if (boundedMessages.length < 3) {
+    return {
+      messages: boundedMessages,
+      fingerprint,
+      skipReason: 'too_small',
+    }
+  }
+
+  return {
+    messages: boundedMessages,
+    fingerprint,
+  }
+}
--- a/src/services/AgentSummary/summaryPrompt.ts
+++ b/src/services/AgentSummary/summaryPrompt.ts
@@ -0,0 +1,32 @@
+import { randomUUID, type UUID } from 'node:crypto'
+import type { UserMessage } from '../../types/message.js'
+
+export function buildSummaryPrompt(previousSummary: string | null): string {
+  const prevLine = previousSummary
+    ? `\nPrevious: "${previousSummary}" — say something NEW.\n`
+    : ''
+
+  return `Describe your most recent action in 3-5 words using present tense (-ing). Name the file or function, not the branch. Do not use tools.
+${prevLine}
+Good: "Reading runAgent.ts"
+Good: "Fixing null check in validate.ts"
+Good: "Running auth module tests"
+Good: "Adding retry logic to fetchUser"
+
+Bad (past tense): "Analyzed the branch diff"
+Bad (too vague): "Investigating the issue"
+Bad (too long): "Reviewing full branch diff and AgentTool.tsx integration"
+Bad (branch name): "Analyzed adam/background-summary branch diff"`
+}
+
+export function createSummaryPromptMessage(content: string): UserMessage {
+  return {
+    type: 'user',
+    message: {
+      role: 'user',
+      content,
+    },
+    uuid: randomUUID() as UUID,
+    timestamp: new Date().toISOString(),
+  }
+}
--- a/src/services/api/claude.ts
+++ b/src/services/api/claude.ts
@@ -1347,12 +1347,6 @@ async function* queryModel(
    return
  }

-  if (getAPIProvider() === 'codex') {
-    const { queryModelCodex } = await import('./codex/index.js')
-    yield* queryModelCodex(messagesForAPI, systemPrompt, filteredTools, signal, options)
-    return
-  }
-
  if (getAPIProvider() === 'gemini') {
    const { queryModelGemini } = await import('./gemini/index.js')
    yield* queryModelGemini(
--- a/src/services/api/codex/tests/conversion.test.ts
+++ b/src/services/api/codex/tests/conversion.test.ts
@@ -1,407 +0,0 @@
-import { describe, expect, test } from 'bun:test'
-import { createAssistantMessage, createUserMessage } from '../../../../utils/messages.js'
-import { anthropicMessagesToCodexInput, anthropicToolsToCodex } from '@ant/model-provider'
-
-describe('anthropicMessagesToCodexInput', () => {
-  test('replays assistant tool calls and user tool results in order', async () => {
-    const assistant = createAssistantMessage({
-      content: [
-        'I will inspect the file.',
-        {
-          type: 'tool_use',
-          id: 'tool_1',
-          name: 'Read',
-          input: { file_path: 'README.md' },
-        },
-        'Then I will summarize.',
-      ] as any,
-    })
-    const user = createUserMessage({
-      content: [
-        {
-          type: 'tool_result',
-          tool_use_id: 'tool_1',
-          content: [
-            { type: 'text', text: 'file contents' },
-            { type: 'text', text: 'second line' },
-          ],
-        },
-        'Please continue.',
-      ] as any,
-    })
-
-    const items = await anthropicMessagesToCodexInput([assistant, user])
-
-    expect(items).toHaveLength(5)
-    expect(items[0]).toMatchObject({
-      type: 'message',
-      role: 'assistant',
-    })
-    expect(items[0]).not.toHaveProperty('id')
-    expect(items[0]).not.toHaveProperty('status')
-    expect(items[1]).toMatchObject({
-      type: 'function_call',
-      call_id: 'tool_1',
-      name: 'Read',
-      arguments: '{"file_path":"README.md"}',
-    })
-    expect(items[1]).not.toHaveProperty('id')
-    expect(items[1]).not.toHaveProperty('status')
-    expect(items[2]).toMatchObject({
-      type: 'message',
-      role: 'assistant',
-    })
-    expect(items[2]).not.toHaveProperty('id')
-    expect(items[2]).not.toHaveProperty('status')
-    expect(items[3]).toMatchObject({
-      type: 'function_call_output',
-      call_id: 'tool_1',
-      output: [
-        { type: 'input_text', text: 'file contents' },
-        { type: 'input_text', text: 'second line' },
-      ],
-    })
-    expect(items[3]).not.toHaveProperty('id')
-    expect(items[3]).not.toHaveProperty('status')
-    expect(items[4]).toMatchObject({
-      type: 'message',
-      role: 'user',
-    })
-  })
-
-  test('normalizes tool call ids consistently across assistant replay and tool results', async () => {
-    const assistant = createAssistantMessage({
-      content: [
-        {
-          type: 'tool_use',
-          id: ' tool 1 / weird ',
-          name: 'Read',
-          input: { file_path: 'README.md' },
-        },
-      ] as any,
-    })
-    const user = createUserMessage({
-      content: [
-        {
-          type: 'tool_result',
-          tool_use_id: ' tool 1 / weird ',
-          content: 'ok',
-        },
-      ] as any,
-    })
-
-    const items = await anthropicMessagesToCodexInput([assistant, user])
-
-    expect(items[0]).toMatchObject({
-      type: 'function_call',
-      call_id: 'tool_1_weird',
-    })
-    expect(items[1]).toMatchObject({
-      type: 'function_call_output',
-      call_id: 'tool_1_weird',
-      output: 'ok',
-    })
-  })
-
-  test('creates a deterministic fallback tool call id when assistant replay is missing one', async () => {
-    const assistant = createAssistantMessage({
-      content: [
-        {
-          type: 'tool_use',
-          id: '',
-          name: 'Read',
-          input: { file_path: 'README.md' },
-        },
-      ] as any,
-    })
-
-    const items = await anthropicMessagesToCodexInput([assistant])
-
-    expect(items[0]).toMatchObject({
-      type: 'function_call',
-      name: 'Read',
-      arguments: '{"file_path":"README.md"}',
-    })
-    expect((items[0] as any).call_id).toMatch(/^call_[a-f0-9]{24}$/)
-  })
-
-  test('degrades unsupported user media blocks to text placeholders', async () => {
-    const user = createUserMessage({
-      content: [
-        { type: 'text', text: 'Inspect the attachment.' },
-        {
-          type: 'image',
-          source: {
-            type: 'base64',
-            media_type: 'image/png',
-            data: 'abc',
-          },
-        },
-      ] as any,
-    })
-
-    const items = await anthropicMessagesToCodexInput([user])
-
-    expect(items).toEqual([
-      {
-        type: 'message',
-        role: 'user',
-        content: [
-          {
-            type: 'input_text',
-            text:
-              'Inspect the attachment.\n[Image omitted: codex gateway currently requires remote image URLs. Configure CODEX_IMGBB_API_KEY to auto-convert local images.]',
-          },
-        ],
-      },
-    ])
-  })
-
-  test('passes through remote image URLs for user messages', async () => {
-    const user = createUserMessage({
-      content: [
-        { type: 'text', text: 'Read the image.' },
-        {
-          type: 'image',
-          source: {
-            type: 'url',
-            url: 'https://example.com/vision.png',
-          },
-        },
-      ] as any,
-    })
-
-    const items = await anthropicMessagesToCodexInput([user])
-
-    expect(items).toEqual([
-      {
-        type: 'message',
-        role: 'user',
-        content: [
-          {
-            type: 'input_text',
-            text: 'Read the image.',
-          },
-          {
-            type: 'input_image',
-            image_url: 'https://example.com/vision.png',
-            detail: 'high',
-          },
-        ],
-      },
-    ])
-  })
-
-  test('converts base64 user images through the configured inline resolver', async () => {
-    const user = createUserMessage({
-      content: [
-        { type: 'text', text: 'Read the image.' },
-        {
-          type: 'image',
-          source: {
-            type: 'base64',
-            media_type: 'image/png',
-            data: 'abc',
-          },
-        },
-      ] as any,
-    })
-
-    const items = await anthropicMessagesToCodexInput([user], {
-      resolveBase64ImageUrl: async (data, mediaType) =>
-        data === 'abc' && mediaType === 'image/png'
-          ? 'https://example.com/inline-uploaded.png'
-          : null,
-    })
-
-    expect(items).toEqual([
-      {
-        type: 'message',
-        role: 'user',
-        content: [
-          {
-            type: 'input_text',
-            text: 'Read the image.',
-          },
-          {
-            type: 'input_image',
-            image_url: 'https://example.com/inline-uploaded.png',
-            detail: 'high',
-          },
-        ],
-      },
-    ])
-  })
-
-  test('passes through remote image URLs inside tool results', async () => {
-    const assistant = createAssistantMessage({
-      content: [
-        {
-          type: 'tool_use',
-          id: 'tool_vision',
-          name: 'Read',
-          input: { file_path: '/tmp/screenshot.png' },
-        },
-      ] as any,
-    })
-    const user = createUserMessage({
-      content: [
-        {
-          type: 'tool_result',
-          tool_use_id: 'tool_vision',
-          content: [
-            { type: 'text', text: 'Screenshot attached.' },
-            {
-              type: 'image',
-              source: {
-                type: 'url',
-                url: 'https://example.com/tool-screenshot.png',
-              },
-            },
-          ],
-        },
-      ] as any,
-    })
-
-    const items = await anthropicMessagesToCodexInput([assistant, user])
-
-    expect(items[1]).toEqual({
-      type: 'function_call_output',
-      call_id: 'tool_vision',
-      output: [
-        { type: 'input_text', text: 'Screenshot attached.' },
-        {
-          type: 'input_image',
-          image_url: 'https://example.com/tool-screenshot.png',
-          detail: 'high',
-        },
-      ],
-    })
-  })
-
-  test('degrades unsupported tool result images to text placeholders', async () => {
-    const assistant = createAssistantMessage({
-      content: [
-        {
-          type: 'tool_use',
-          id: 'tool_vision',
-          name: 'Read',
-          input: { file_path: '/tmp/screenshot.png' },
-        },
-      ] as any,
-    })
-    const user = createUserMessage({
-      content: [
-        {
-          type: 'tool_result',
-          tool_use_id: 'tool_vision',
-          content: [
-            {
-              type: 'image',
-              source: {
-                type: 'base64',
-                media_type: 'image/png',
-                data: 'abc',
-              },
-            },
-          ],
-        },
-      ] as any,
-    })
-
-    const items = await anthropicMessagesToCodexInput([assistant, user])
-
-    expect(items[1]).toEqual({
-      type: 'function_call_output',
-      call_id: 'tool_vision',
-      output:
-        '[Image omitted: codex gateway currently requires remote image URLs. Configure CODEX_IMGBB_API_KEY to auto-convert local images.]',
-    })
-  })
-
-  test('converts base64 tool result images through the configured inline resolver', async () => {
-    const assistant = createAssistantMessage({
-      content: [
-        {
-          type: 'tool_use',
-          id: 'tool_vision',
-          name: 'Read',
-          input: { file_path: '/tmp/screenshot.png' },
-        },
-      ] as any,
-    })
-    const user = createUserMessage({
-      content: [
-        {
-          type: 'tool_result',
-          tool_use_id: 'tool_vision',
-          content: [
-            {
-              type: 'image',
-              source: {
-                type: 'base64',
-                media_type: 'image/png',
-                data: 'abc',
-              },
-            },
-          ],
-        },
-      ] as any,
-    })
-
-    const items = await anthropicMessagesToCodexInput([assistant, user], {
-      resolveBase64ImageUrl: async (data, mediaType) =>
-        data === 'abc' && mediaType === 'image/png'
-          ? 'https://example.com/tool-inline-uploaded.png'
-          : null,
-    })
-
-    expect(items[1]).toEqual({
-      type: 'function_call_output',
-      call_id: 'tool_vision',
-      output: [
-        {
-          type: 'input_image',
-          image_url: 'https://example.com/tool-inline-uploaded.png',
-          detail: 'high',
-        },
-      ],
-    })
-  })
-})
-
-describe('anthropicToolsToCodex', () => {
-  test('converts only client function tools', () => {
-    const tools = anthropicToolsToCodex([
-      {
-        name: 'Read',
-        description: 'Read a file',
-        input_schema: {
-          type: 'object',
-          properties: {
-            file_path: { type: 'string' },
-          },
-        },
-        strict: true,
-      } as any,
-      {
-        type: 'advisor_20260301',
-      } as any,
-    ])
-
-    expect(tools).toEqual([
-      {
-        type: 'function',
-        name: 'Read',
-        description: 'Read a file',
-        parameters: {
-          type: 'object',
-          properties: {
-            file_path: { type: 'string' },
-          },
-        },
-        strict: true,
-      },
-    ])
-  })
-})
--- a/src/services/api/codex/tests/errors.test.ts
+++ b/src/services/api/codex/tests/errors.test.ts
@@ -1,103 +0,0 @@
-import { afterEach, describe, expect, test } from 'bun:test'
-import {
-  getCodexConfigurationError,
-  normalizeCodexError,
-} from '../errors.js'
-
-const originalCodexApiKey = process.env.CODEX_API_KEY
-
-afterEach(() => {
-  if (originalCodexApiKey === undefined) {
-    delete process.env.CODEX_API_KEY
-  } else {
-    process.env.CODEX_API_KEY = originalCodexApiKey
-  }
-})
-
-describe('getCodexConfigurationError', () => {
-  test('reports missing CODEX_API_KEY clearly', () => {
-    delete process.env.CODEX_API_KEY
-
-    expect(getCodexConfigurationError()).toEqual({
-      content:
-        'Missing CODEX_API_KEY. Configure it in settings or your environment before using the codex provider.',
-      error: 'authentication_failed',
-    })
-  })
-
-  test('returns null when CODEX_API_KEY is present', () => {
-    process.env.CODEX_API_KEY = 'test-key'
-
-    expect(getCodexConfigurationError()).toBeNull()
-  })
-})
-
-describe('normalizeCodexError', () => {
-  test('maps authentication failures', () => {
-    expect(
-      normalizeCodexError({
-        status: 401,
-        message: 'invalid_api_key',
-      }),
-    ).toEqual({
-      content:
-        'Codex authentication failed (401). Verify CODEX_API_KEY and CODEX_BASE_URL.',
-      error: 'authentication_failed',
-    })
-  })
-
-  test('maps missing endpoint failures', () => {
-    expect(
-      normalizeCodexError({
-        status: 404,
-        message: 'Not Found',
-      }),
-    ).toEqual({
-      content:
-        'Codex endpoint not found (404). Verify CODEX_BASE_URL points to a Responses API root.',
-      error: 'invalid_request',
-    })
-  })
-
-  test('maps rate limits', () => {
-    expect(
-      normalizeCodexError({
-        status: 429,
-        message: 'Too Many Requests',
-      }),
-    ).toEqual({
-      content:
-        'Codex rate limit reached (429). Retry shortly or reduce request volume.',
-      error: 'rate_limit',
-    })
-  })
-
-  test('maps upstream gateway 502 errors', () => {
-    expect(
-      normalizeCodexError({
-        status: 502,
-        message: 'Upstream request failed',
-      }),
-    ).toEqual({
-      content:
-        'Codex gateway returned 502 Upstream request failed. This usually means a transient gateway issue or incomplete Responses API compatibility during tool replay.',
-      error: 'server_error',
-    })
-  })
-
-  test('passes through Codex preflight errors as invalid requests', () => {
-    expect(
-      normalizeCodexError(new Error('Codex preflight: input must be an array.')),
-    ).toEqual({
-      content: 'Codex preflight: input must be an array.',
-      error: 'invalid_request',
-    })
-  })
-
-  test('falls back to generic API error text', () => {
-    expect(normalizeCodexError(new Error('socket hang up'))).toEqual({
-      content: 'API Error: socket hang up',
-      error: 'unknown',
-    })
-  })
-})
--- a/src/services/api/codex/tests/imageUpload.test.ts
+++ b/src/services/api/codex/tests/imageUpload.test.ts
@@ -1,103 +0,0 @@
-import { afterEach, beforeEach, describe, expect, test } from 'bun:test'
-import { uploadCodexBase64Image } from '../imageUpload.js'
-
-describe('codex image upload', () => {
-  const originalFetch = globalThis.fetch
-  const originalImgbbApiKey = process.env.CODEX_IMGBB_API_KEY
-  const originalUploadTimeout = process.env.CODEX_IMAGE_UPLOAD_TIMEOUT_MS
-  const originalLegacyTimeout = process.env.CODEX_IMAGE_URL_TIMEOUT_MS
-
-  beforeEach(() => {
-    process.env.CODEX_IMGBB_API_KEY = 'imgbb-test-key'
-    delete process.env.CODEX_IMAGE_UPLOAD_TIMEOUT_MS
-    delete process.env.CODEX_IMAGE_URL_TIMEOUT_MS
-  })
-
-  afterEach(() => {
-    globalThis.fetch = originalFetch
-    if (originalImgbbApiKey === undefined) {
-      delete process.env.CODEX_IMGBB_API_KEY
-    } else {
-      process.env.CODEX_IMGBB_API_KEY = originalImgbbApiKey
-    }
-    if (originalUploadTimeout === undefined) {
-      delete process.env.CODEX_IMAGE_UPLOAD_TIMEOUT_MS
-    } else {
-      process.env.CODEX_IMAGE_UPLOAD_TIMEOUT_MS = originalUploadTimeout
-    }
-    if (originalLegacyTimeout === undefined) {
-      delete process.env.CODEX_IMAGE_URL_TIMEOUT_MS
-    } else {
-      process.env.CODEX_IMAGE_URL_TIMEOUT_MS = originalLegacyTimeout
-    }
-  })
-
-  test('uploads inline base64 images to ImgBB and caches the result', async () => {
-    let fetchCalls = 0
-    globalThis.fetch = (async (input: string | URL | Request) => {
-      fetchCalls += 1
-      expect(String(input)).toBe(
-        'https://api.imgbb.com/1/upload?key=imgbb-test-key',
-      )
-      return new Response(
-        JSON.stringify({ data: { url: 'https://i.ibb.co/base64.png' } }),
-        { status: 200 },
-      )
-    }) as unknown as typeof fetch
-
-    const first = await uploadCodexBase64Image('YWJj', 'image/png')
-    const second = await uploadCodexBase64Image('YWJj', 'image/png')
-
-    expect(first).toBe('https://i.ibb.co/base64.png')
-    expect(second).toBe('https://i.ibb.co/base64.png')
-    expect(fetchCalls).toBe(1)
-  })
-
-  test('prefers ImgBB derived variants before the raw url', async () => {
-    globalThis.fetch = (async () =>
-      new Response(
-        JSON.stringify({
-          data: {
-            url: 'https://i.ibb.co/raw/base64.png',
-            image: { url: 'https://i.ibb.co/image/base64.png' },
-            thumb: { url: 'https://i.ibb.co/thumb/base64.png' },
-            medium: { url: 'https://i.ibb.co/medium/base64.png' },
-          },
-        }),
-        { status: 200 },
-      )) as unknown as typeof fetch
-
-    const url = await uploadCodexBase64Image('ZGVm', 'image/png')
-
-    expect(url).toBe('https://i.ibb.co/medium/base64.png')
-  })
-
-  test('prefers the new upload timeout env name over the legacy one', async () => {
-    let aborted = false
-    process.env.CODEX_IMAGE_UPLOAD_TIMEOUT_MS = '1'
-    process.env.CODEX_IMAGE_URL_TIMEOUT_MS = '1000'
-    globalThis.fetch = (async (
-      _input: string | URL | Request,
-      init?: RequestInit,
-    ) => {
-      const signal = init?.signal
-      if (!(signal instanceof AbortSignal)) {
-        throw new Error('Expected AbortSignal')
-      }
-
-      await new Promise<void>(resolve => {
-        signal.addEventListener('abort', () => {
-          aborted = true
-          resolve()
-        })
-      })
-
-      throw new Error('aborted')
-    }) as unknown as typeof fetch
-
-    const url = await uploadCodexBase64Image('Z2hp', 'image/png')
-
-    expect(url).toBeNull()
-    expect(aborted).toBe(true)
-  })
-})
--- a/src/services/api/codex/tests/preflight.test.ts
+++ b/src/services/api/codex/tests/preflight.test.ts
@@ -1,51 +0,0 @@
-import { describe, expect, test } from 'bun:test'
-import { sanitizeCodexRequest } from '../preflight.js'
-
-describe('sanitizeCodexRequest', () => {
-  test('normalizes function call ids and tool names', () => {
-    const request = sanitizeCodexRequest({
-      model: 'gpt-5.4',
-      input: [
-        {
-          type: 'function_call',
-          call_id: ' tool 1 / weird ',
-          name: ' Read ',
-          arguments: '{}',
-        },
-      ] as any,
-      tools: [
-        {
-          type: 'function',
-          name: ' Read ',
-          parameters: null,
-        },
-      ] as any,
-    } as any)
-
-    expect(request.input?.[0]).toMatchObject({
-      type: 'function_call',
-      call_id: 'tool_1_weird',
-      name: 'Read',
-    })
-    expect(request.tools?.[0]).toMatchObject({
-      type: 'function',
-      name: 'Read',
-      parameters: {},
-    })
-  })
-
-  test('rejects invalid function_call_output without call_id', () => {
-    expect(() =>
-      sanitizeCodexRequest({
-        model: 'gpt-5.4',
-        input: [
-          {
-            type: 'function_call_output',
-            call_id: '   ',
-            output: 'ok',
-          },
-        ] as any,
-      } as any),
-    ).toThrow('Codex preflight: function_call_output.call_id is required.')
-  })
-})
--- a/src/services/api/codex/tests/streaming.test.ts
+++ b/src/services/api/codex/tests/streaming.test.ts
@@ -1,451 +0,0 @@
-import { afterEach, beforeEach, describe, expect, mock, test } from 'bun:test'
-import type { Response, ResponseStreamEvent } from 'openai/resources/responses/responses.mjs'
-import { asSystemPrompt } from '../../../../utils/systemPromptType.js'
-
-type StreamRun = {
-  events?: ResponseStreamEvent[]
-  finalResponse?: Response
-  error?: unknown
-}
-
-let streamRuns: StreamRun[] = []
-let createRuns: StreamRun[] = []
-let lastRequestBody: any
-let lastCreateRequestBody: any
-
-function makeResponse(overrides: Partial<Response> = {}): Response {
-  return {
-    id: 'resp_test',
-    object: 'response',
-    created_at: 0,
-    status: 'completed',
-    model: 'gpt-5.4',
-    output: [],
-    parallel_tool_calls: false,
-    store: false,
-    temperature: 1,
-    tool_choice: 'auto',
-    top_p: 1,
-    truncation: 'disabled',
-    usage: {
-      input_tokens: 12,
-      output_tokens: 8,
-      total_tokens: 20,
-      input_tokens_details: {
-        cached_tokens: 0,
-      },
-      output_tokens_details: {
-        reasoning_tokens: 0,
-      },
-    },
-    ...overrides,
-  } as Response
-}
-
-function makeStream(run: StreamRun) {
-  return {
-    async *[Symbol.asyncIterator]() {
-      for (const event of run.events ?? []) {
-        yield event
-      }
-    },
-    finalResponse: async () => {
-      if (run.error) {
-        throw run.error
-      }
-      return run.finalResponse ?? makeResponse()
-    },
-  }
-}
-
-function makeCreateStream(run: StreamRun) {
-  return {
-    async *[Symbol.asyncIterator]() {
-      if (run.error) {
-        throw run.error
-      }
-      for (const event of run.events ?? []) {
-        yield event
-      }
-    },
-  }
-}
-
-mock.module('../client.js', () => ({
-  getCodexClient: () => ({
-    responses: {
-      stream: (body: any) => {
-        lastRequestBody = body
-        const run = streamRuns.shift()
-        if (!run) {
-          throw new Error('unexpected stream call')
-        }
-        if (run.error && !run.events) {
-          throw run.error
-        }
-        return makeStream(run)
-      },
-      create: async (body: any) => {
-        lastCreateRequestBody = body
-        const run = createRuns.shift()
-        if (!run) {
-          throw new Error('unexpected create call')
-        }
-        return makeCreateStream(run)
-      },
-    },
-  }),
-}))
-
-// Mock only model resolution — conversion functions can use real implementations
-// since the client mock controls API responses.
-mock.module('@ant/model-provider', () => {
-  // Import the real module to preserve conversion functions
-  const real = require('@ant/model-provider')
-  return {
-    ...real,
-    resolveCodexModel: () => 'gpt-5.4',
-    resolveCodexMaxTokens: () => 4096,
-  }
-})
-
-mock.module('../../../../utils/context.js', () => ({
-  MODEL_CONTEXT_WINDOW_DEFAULT: 200_000,
-  COMPACT_MAX_OUTPUT_TOKENS: 20_000,
-  CAPPED_DEFAULT_MAX_TOKENS: 8_000,
-  ESCALATED_MAX_TOKENS: 64_000,
-  is1mContextDisabled: () => false,
-  has1mContext: () => false,
-  modelSupports1M: () => false,
-  getContextWindowForModel: () => 200_000,
-  getSonnet1mExpTreatmentEnabled: () => false,
-  calculateContextPercentages: () => ({}),
-  getModelMaxOutputTokens: () => ({ upperLimit: 4096 }),
-  getMaxThinkingTokensForModel: () => 0,
-}))
-
-mock.module('../../../../utils/api.js', () => ({
-  toolToAPISchema: async () => ({}),
-  appendSystemContext: () => {},
-  prependUserContext: () => {},
-  logAPIPrefix: () => {},
-  splitSysPromptPrefix: () => ({ prefix: '', rest: [] }),
-  logContextMetrics: async () => {},
-  normalizeToolInput: (input: any) => input,
-  normalizeToolInputForAPI: (input: any) => input,
-}))
-
-mock.module('src/utils/debug.ts', () => ({
-  getMinDebugLogLevel: () => 'debug' as const,
-  isDebugMode: () => false,
-  enableDebugLogging: () => false,
-  getDebugFilter: () => null,
-  isDebugToStdErr: () => false,
-  getDebugFilePath: () => null as string | null,
-  setHasFormattedOutput: () => {},
-  getHasFormattedOutput: () => false,
-  flushDebugLogs: async () => {},
-  logForDebugging: () => {},
-  getDebugLogPath: () => '/tmp/mock-debug.log',
-  logAntError: () => {},
-}))
-
-mock.module('../../../../services/langfuse/tracing.js', () => ({
-  createTrace: () => null,
-  recordLLMObservation: () => {},
-  recordToolObservation: () => {},
-  createToolBatchSpan: () => null,
-  endToolBatchSpan: () => {},
-  createSubagentTrace: () => null,
-  createChildSpan: () => null,
-  endTrace: () => {},
-}))
-
-mock.module('../../../../services/langfuse/convert.js', () => ({
-  convertMessagesToLangfuse: () => [],
-  convertOutputToLangfuse: () => [],
-  convertToolsToLangfuse: () => [],
-}))
-
-async function runQuery(
-  nextStreamRuns: StreamRun[],
-  nextCreateRuns: StreamRun[] = [],
-  systemPrompt = asSystemPrompt([]),
-) {
-  streamRuns = [...nextStreamRuns]
-  createRuns = [...nextCreateRuns]
-
-  const { queryModelCodex } = await import('../index.js')
-  const assistantMessages: any[] = []
-  const streamEvents: any[] = []
-
-  const options: any = {
-    model: 'gpt-5.4',
-    agents: [],
-    querySource: 'main_loop',
-    getToolPermissionContext: async () => ({
-      alwaysAllow: [],
-      alwaysDeny: [],
-      needsPermission: [],
-      mode: 'default',
-      isBypassingPermissions: false,
-    }),
-  }
-
-  for await (const item of queryModelCodex(
-    [],
-    systemPrompt,
-    [],
-    new AbortController().signal,
-    options,
-  )) {
-    if (item.type === 'assistant') {
-      assistantMessages.push(item)
-    } else if (item.type === 'stream_event') {
-      streamEvents.push(item)
-    }
-  }
-
-  return { assistantMessages, streamEvents }
-}
-
-describe('queryModelCodex streaming fallback', () => {
-  const originalCodexApiKey = process.env.CODEX_API_KEY
-
-  beforeEach(() => {
-    process.env.CODEX_API_KEY = 'test-key'
-  })
-
-  afterEach(() => {
-    streamRuns = []
-    createRuns = []
-    lastRequestBody = undefined
-    lastCreateRequestBody = undefined
-    if (originalCodexApiKey === undefined) {
-      delete process.env.CODEX_API_KEY
-    } else {
-      process.env.CODEX_API_KEY = originalCodexApiKey
-    }
-  })
-
-  test('builds the final assistant text from streamed blocks when final snapshots are empty', async () => {
-    const response = makeResponse()
-    const events: ResponseStreamEvent[] = [
-      { type: 'response.created', response } as any,
-      {
-        type: 'response.output_item.added',
-        output_index: 0,
-        item: {
-          type: 'message',
-          id: 'msg_1',
-          role: 'assistant',
-          content: [],
-          status: 'in_progress',
-        },
-      } as any,
-      {
-        type: 'response.output_text.delta',
-        output_index: 0,
-        item_id: 'msg_1',
-        delta: 'hello',
-      } as any,
-      {
-        type: 'response.output_text.done',
-        output_index: 0,
-        item_id: 'msg_1',
-        text: 'hello world',
-      } as any,
-      { type: 'response.completed', response } as any,
-    ]
-
-    const { assistantMessages, streamEvents } = await runQuery([
-      { events, finalResponse: response },
-    ])
-
-    expect(assistantMessages).toHaveLength(1)
-    expect(assistantMessages[0].message.content).toEqual([
-      { type: 'text', text: 'hello world' },
-    ])
-    expect(assistantMessages[0].message.stop_reason).toBe('end_turn')
-    expect(
-      streamEvents.find((item: any) => item.event.type === 'message_delta')?.event.delta
-        .stop_reason,
-    ).toBe('end_turn')
-  })
-
-  test('builds tool_use blocks from streamed arguments when final snapshots are empty', async () => {
-    const response = makeResponse()
-    const events: ResponseStreamEvent[] = [
-      { type: 'response.created', response } as any,
-      {
-        type: 'response.output_item.added',
-        output_index: 0,
-        item: {
-          type: 'function_call',
-          id: 'fc_1',
-          call_id: 'call_1',
-          name: 'Read',
-          arguments: '',
-          status: 'in_progress',
-        },
-      } as any,
-      {
-        type: 'response.function_call_arguments.delta',
-        output_index: 0,
-        item_id: 'fc_1',
-        delta: '{"file_path":"README.md"}',
-      } as any,
-      {
-        type: 'response.function_call_arguments.done',
-        output_index: 0,
-        item_id: 'fc_1',
-        arguments: '{"file_path":"README.md"}',
-      } as any,
-      { type: 'response.completed', response } as any,
-    ]
-
-    const { assistantMessages, streamEvents } = await runQuery([
-      { events, finalResponse: response },
-    ])
-
-    expect(assistantMessages).toHaveLength(1)
-    expect(assistantMessages[0].message.content).toEqual([
-      {
-        type: 'tool_use',
-        id: 'call_1',
-        name: 'Read',
-        input: { file_path: 'README.md' },
-      },
-    ])
-    expect(assistantMessages[0].message.stop_reason).toBe('tool_use')
-    expect(
-      streamEvents.find((item: any) => item.event.type === 'message_delta')?.event.delta
-        .stop_reason,
-    ).toBe('tool_use')
-  })
-
-  test('sends system prompt via top-level instructions instead of system messages', async () => {
-    const response = makeResponse({
-      output: [
-        {
-          type: 'message',
-          role: 'assistant',
-          content: [{ type: 'output_text', text: 'ok' }],
-          status: 'completed',
-        } as any,
-      ],
-      output_text: 'ok',
-    })
-
-    const events: ResponseStreamEvent[] = [
-      { type: 'response.created', response } as any,
-      { type: 'response.completed', response } as any,
-    ]
-
-    await runQuery(
-      [{ events, finalResponse: response }],
-      [],
-      asSystemPrompt(['system one', 'system two']),
-    )
-
-    expect(lastRequestBody.instructions).toBe('system one\n\nsystem two')
-    expect(lastRequestBody.input).toEqual([])
-  })
-
-  test('continues incomplete responses and aggregates usage across attempts', async () => {
-    const incompleteResponse = makeResponse({
-      status: 'incomplete',
-      incomplete_details: { reason: 'max_output_tokens' } as any,
-      usage: {
-        input_tokens: 10,
-        output_tokens: 4,
-        total_tokens: 14,
-        input_tokens_details: { cached_tokens: 1 },
-        output_tokens_details: { reasoning_tokens: 0 },
-      } as any,
-      output: [
-        {
-          type: 'message',
-          role: 'assistant',
-          content: [{ type: 'output_text', text: 'hello ' }],
-          status: 'incomplete',
-        } as any,
-      ],
-    })
-    const completedResponse = makeResponse({
-      usage: {
-        input_tokens: 20,
-        output_tokens: 6,
-        total_tokens: 26,
-        input_tokens_details: { cached_tokens: 2 },
-        output_tokens_details: { reasoning_tokens: 0 },
-      } as any,
-      output: [
-        {
-          type: 'message',
-          role: 'assistant',
-          content: [{ type: 'output_text', text: 'world' }],
-          status: 'completed',
-        } as any,
-      ],
-    })
-
-    const { assistantMessages } = await runQuery([
-      {
-        events: [
-          { type: 'response.created', response: incompleteResponse } as any,
-          { type: 'response.incomplete', response: incompleteResponse } as any,
-        ],
-        finalResponse: incompleteResponse,
-      },
-      {
-        events: [
-          { type: 'response.created', response: completedResponse } as any,
-          { type: 'response.completed', response: completedResponse } as any,
-        ],
-        finalResponse: completedResponse,
-      },
-    ])
-
-    expect(assistantMessages).toHaveLength(1)
-    expect(assistantMessages[0].message.content).toEqual([
-      { type: 'text', text: 'hello world' },
-    ])
-    expect(assistantMessages[0].message.usage).toMatchObject({
-      input_tokens: 30,
-      output_tokens: 10,
-      cache_read_input_tokens: 3,
-    })
-  })
-
-  test('falls back to responses.create(stream:true) when helper streaming fails', async () => {
-    const fallbackResponse = makeResponse({
-      output: [
-        {
-          type: 'message',
-          role: 'assistant',
-          content: [{ type: 'output_text', text: 'fallback ok' }],
-          status: 'completed',
-        } as any,
-      ],
-    })
-
-    const { assistantMessages } = await runQuery(
-      [{ error: new Error('helper stream failed') }],
-      [
-        {
-          events: [
-            { type: 'response.created', response: fallbackResponse } as any,
-            { type: 'response.completed', response: fallbackResponse } as any,
-          ],
-        },
-      ],
-    )
-
-    expect(lastCreateRequestBody.stream).toBe(true)
-    expect(assistantMessages).toHaveLength(1)
-    expect(assistantMessages[0].message.content).toEqual([
-      { type: 'text', text: 'fallback ok' },
-    ])
-  })
-})
--- a/src/services/api/codex/client.ts
+++ b/src/services/api/codex/client.ts
@@ -1,57 +0,0 @@
-import OpenAI from 'openai'
-import { openaiAdapter } from 'src/services/providerUsage/adapters/openai.js'
-import { updateProviderBuckets } from 'src/services/providerUsage/store.js'
-import { getProxyFetchOptions } from 'src/utils/proxy.js'
-
-export const DEFAULT_CODEX_BASE_URL = 'https://api.openai.com/v1'
-
-let cachedClient: OpenAI | null = null
-
-function wrapFetchForUsage(base: typeof fetch): typeof fetch {
-  const wrapped = async (
-    ...args: Parameters<typeof fetch>
-  ): Promise<Response> => {
-    const res = await base(...args)
-    try {
-      updateProviderBuckets('codex', openaiAdapter.parseHeaders(res.headers))
-    } catch {
-      // Usage tracking must not affect the request path.
-    }
-    return res
-  }
-  return wrapped as unknown as typeof fetch
-}
-
-export function getCodexClient(options?: {
-  maxRetries?: number
-  fetchOverride?: typeof fetch
-}): OpenAI {
-  if (cachedClient && !options?.fetchOverride) {
-    return cachedClient
-  }
-
-  const apiKey = process.env.CODEX_API_KEY || ''
-  const baseURL = process.env.CODEX_BASE_URL || DEFAULT_CODEX_BASE_URL
-  const baseFetch = options?.fetchOverride ?? (globalThis.fetch as typeof fetch)
-  const wrappedFetch = wrapFetchForUsage(baseFetch)
-
-  const client = new OpenAI({
-    apiKey,
-    baseURL,
-    maxRetries: options?.maxRetries ?? 0,
-    timeout: parseInt(process.env.API_TIMEOUT_MS || String(600 * 1000), 10),
-    dangerouslyAllowBrowser: true,
-    fetchOptions: getProxyFetchOptions({ forAnthropicAPI: false }),
-    fetch: wrappedFetch,
-  })
-
-  if (!options?.fetchOverride) {
-    cachedClient = client
-  }
-
-  return client
-}
-
-export function clearCodexClientCache(): void {
-  cachedClient = null
-}
--- a/src/services/api/codex/errors.ts
+++ b/src/services/api/codex/errors.ts
@@ -1,114 +0,0 @@
-import type { SDKAssistantMessageError } from '../../../entrypoints/agentSdkTypes.js'
-
-type CodexErrorLike = {
-  status?: unknown
-  message?: unknown
-  error?: {
-    message?: unknown
-  }
-}
-
-export type NormalizedCodexError = {
-  content: string
-  error: SDKAssistantMessageError
-}
-
-function readErrorStatus(error: unknown): number | null {
-  if (
-    typeof error === 'object' &&
-    error !== null &&
-    typeof (error as CodexErrorLike).status === 'number'
-  ) {
-    return (error as CodexErrorLike).status as number
-  }
-
-  return null
-}
-
-function readErrorMessage(error: unknown): string {
-  if (error instanceof Error && error.message.length > 0) {
-    return error.message
-  }
-
-  if (typeof error === 'object' && error !== null) {
-    const value = error as CodexErrorLike
-    if (typeof value.message === 'string' && value.message.length > 0) {
-      return value.message
-    }
-    if (
-      typeof value.error?.message === 'string' &&
-      value.error.message.length > 0
-    ) {
-      return value.error.message
-    }
-  }
-
-  return String(error)
-}
-
-export function getCodexConfigurationError(): NormalizedCodexError | null {
-  if (!process.env.CODEX_API_KEY) {
-    return {
-      content:
-        'Missing CODEX_API_KEY. Configure it in settings or your environment before using the codex provider.',
-      error: 'authentication_failed',
-    }
-  }
-
-  return null
-}
-
-export function normalizeCodexError(error: unknown): NormalizedCodexError {
-  const status = readErrorStatus(error)
-  const message = readErrorMessage(error)
-
-  if (/^Codex preflight:/i.test(message)) {
-    return {
-      content: message,
-      error: 'invalid_request',
-    }
-  }
-
-  if (status === 401 || status === 403) {
-    return {
-      content: `Codex authentication failed (${status}). Verify CODEX_API_KEY and CODEX_BASE_URL.`,
-      error: 'authentication_failed',
-    }
-  }
-
-  if (status === 404) {
-    return {
-      content:
-        'Codex endpoint not found (404). Verify CODEX_BASE_URL points to a Responses API root.',
-      error: 'invalid_request',
-    }
-  }
-
-  if (status === 429) {
-    return {
-      content:
-        'Codex rate limit reached (429). Retry shortly or reduce request volume.',
-      error: 'rate_limit',
-    }
-  }
-
-  if (status === 502 && /upstream request failed/i.test(message)) {
-    return {
-      content:
-        'Codex gateway returned 502 Upstream request failed. This usually means a transient gateway issue or incomplete Responses API compatibility during tool replay.',
-      error: 'server_error',
-    }
-  }
-
-  if (status !== null && status >= 500) {
-    return {
-      content: `Codex server error (${status}): ${message}`,
-      error: 'server_error',
-    }
-  }
-
-  return {
-    content: `API Error: ${message}`,
-    error: 'unknown',
-  }
-}
--- a/src/services/api/codex/imageUpload.ts
+++ b/src/services/api/codex/imageUpload.ts
@@ -1,132 +0,0 @@
-import { createHash } from 'crypto'
-import { logForDebugging } from '../../../utils/debug.js'
-
-const resolvedImageUrls = new Map<string, string>()
-const DEFAULT_TIMEOUT_MS = 30_000
-const IMGBB_UPLOAD_URL = 'https://api.imgbb.com/1/upload'
-
-type ImgbbVariant = {
-  url?: unknown
-}
-
-type ImgbbPayload = {
-  data?: {
-    url?: unknown
-    display_url?: unknown
-    image?: ImgbbVariant
-    medium?: ImgbbVariant
-    thumb?: ImgbbVariant
-  }
-}
-
-function getUploadTimeoutMs(): number {
-  const raw =
-    process.env.CODEX_IMAGE_UPLOAD_TIMEOUT_MS ??
-    process.env.CODEX_IMAGE_URL_TIMEOUT_MS
-  if (!raw) {
-    return DEFAULT_TIMEOUT_MS
-  }
-
-  const parsed = Number.parseInt(raw, 10)
-  return Number.isFinite(parsed) && parsed > 0 ? parsed : DEFAULT_TIMEOUT_MS
-}
-
-function getCacheKey(prefix: string, value: string): string {
-  return `${prefix}:${createHash('sha256').update(value).digest('hex')}`
-}
-
-function getImgbbApiKey(): string | null {
-  const apiKey = process.env.CODEX_IMGBB_API_KEY?.trim()
-  return apiKey && apiKey.length > 0 ? apiKey : null
-}
-
-function pickImgbbImageUrl(payload: ImgbbPayload): string | null {
-  const candidates = [
-    payload.data?.medium?.url,
-    payload.data?.thumb?.url,
-    payload.data?.image?.url,
-    payload.data?.url,
-    payload.data?.display_url,
-  ]
-
-  for (const candidate of candidates) {
-    if (typeof candidate === 'string' && candidate.length > 0) {
-      return candidate
-    }
-  }
-
-  return null
-}
-
-async function withTimeout<T>(
-  run: (signal: AbortSignal) => Promise<T>,
-): Promise<T> {
-  const controller = new AbortController()
-  const timeout = setTimeout(() => controller.abort(), getUploadTimeoutMs())
-
-  try {
-    return await run(controller.signal)
-  } finally {
-    clearTimeout(timeout)
-  }
-}
-
-async function uploadToImgbb(
-  base64Image: string,
-): Promise<string | null> {
-  const apiKey = getImgbbApiKey()
-  if (!apiKey) {
-    return null
-  }
-
-  try {
-    const url = await withTimeout(async signal => {
-      const body = new FormData()
-      body.append('image', base64Image)
-
-      const response = await fetch(`${IMGBB_UPLOAD_URL}?key=${encodeURIComponent(apiKey)}`, {
-        method: 'POST',
-        body,
-        signal,
-      })
-
-      if (!response.ok) {
-        logForDebugging(
-          `[Codex] ImgBB upload failed: ${response.status} ${response.statusText}`,
-        )
-        return null
-      }
-
-      return pickImgbbImageUrl((await response.json()) as ImgbbPayload)
-    })
-
-    if (!url) {
-      logForDebugging('[Codex] ImgBB upload produced no usable URL.')
-      return null
-    }
-
-    return url
-  } catch (error) {
-    logForDebugging(`[Codex] Failed to upload image to ImgBB: ${error}`)
-    return null
-  }
-}
-
-export async function uploadCodexBase64Image(
-  data: string,
-  mediaType: string = 'image/png',
-): Promise<string | null> {
-  const cacheKey = getCacheKey('base64', `${mediaType}:${data}`)
-  const cached = resolvedImageUrls.get(cacheKey)
-  if (cached) {
-    return cached
-  }
-
-  const url = await uploadToImgbb(data)
-  if (!url) {
-    return null
-  }
-
-  resolvedImageUrls.set(cacheKey, url)
-  return url
-}
--- a/src/services/api/codex/index.ts
+++ b/src/services/api/codex/index.ts
@@ -1,304 +0,0 @@
-import type { BetaToolUnion } from '@anthropic-ai/sdk/resources/beta/messages/messages.mjs'
-import type {
-  Response,
-  ResponseCreateParamsNonStreaming,
-} from 'openai/resources/responses/responses.mjs'
-import { appendFileSync } from 'fs'
-import type { SystemPrompt } from '../../../utils/systemPromptType.js'
-import type {
-  AssistantMessage,
-  Message,
-  StreamEvent,
-  SystemAPIErrorMessage,
-} from '../../../types/message.js'
-import type { Tools } from '../../../Tool.js'
-import type { SDKAssistantMessageError } from '../../../entrypoints/agentSdkTypes.js'
-import { toolToAPISchema } from '../../../utils/api.js'
-import {
-  createAssistantAPIErrorMessage,
-  normalizeMessagesForAPI,
-} from '../../../utils/messages.js'
-import { logForDebugging } from '../../../utils/debug.js'
-import { getModelMaxOutputTokens } from '../../../utils/context.js'
-import type { Options } from '../claude.js'
-import { recordLLMObservation } from '../../../services/langfuse/tracing.js'
-import {
-  convertMessagesToLangfuse,
-  convertOutputToLangfuse,
-  convertToolsToLangfuse,
-} from '../../../services/langfuse/convert.js'
-import {
-  anthropicMessagesToCodexInput,
-  anthropicToolsToCodex,
-  resolveCodexMaxTokens,
-  resolveCodexModel,
-} from '@ant/model-provider'
-import { getCodexClient } from './client.js'
-import { uploadCodexBase64Image } from './imageUpload.js'
-import {
-  getCodexConfigurationError,
-  normalizeCodexError,
-} from './errors.js'
-import { sanitizeCodexRequest } from './preflight.js'
-import {
-  addCodexUsage,
-  type CodexStreamResult,
-  type CodexUsage,
-  rawAssistantBlocksToAssistantMessage,
-  type RawAssistantBlock,
-  streamCodexAttempt,
-} from './streaming.js'
-
-const MAX_CODEX_CONTINUATIONS = 3
-
-function dumpCodexPayload(
-  body: ResponseCreateParamsNonStreaming,
-): void {
-  const path = process.env.CODEX_DEBUG_PAYLOADS
-  if (!path) {
-    return
-  }
-
-  appendFileSync(
-    path,
-    `${JSON.stringify({ timestamp: new Date().toISOString(), body }, null, 2)}\n`,
-  )
-}
-
-function appendRawAssistantBlocks(
-  target: RawAssistantBlock[],
-  source: RawAssistantBlock[],
-): void {
-  for (const block of source) {
-    const lastBlock = target.at(-1)
-
-    if (lastBlock?.type === 'text' && block.type === 'text') {
-      lastBlock.text += block.text
-      continue
-    }
-
-    if (
-      lastBlock?.type === 'tool_use' &&
-      block.type === 'tool_use' &&
-      lastBlock.id === block.id &&
-      lastBlock.name === block.name &&
-      block.input.startsWith(lastBlock.input)
-    ) {
-      lastBlock.input = block.input
-      continue
-    }
-
-    target.push({ ...block })
-  }
-}
-
-export async function* queryModelCodex(
-  messages: Message[],
-  systemPrompt: SystemPrompt,
-  tools: Tools,
-  signal: AbortSignal,
-  options: Options,
-): AsyncGenerator<
-  StreamEvent | AssistantMessage | SystemAPIErrorMessage,
-  void
-> {
-  try {
-    const configurationError = getCodexConfigurationError()
-    if (configurationError) {
-      yield createAssistantAPIErrorMessage({
-        content: configurationError.content,
-        apiError: 'api_error',
-        error: configurationError.error,
-      })
-      return
-    }
-
-    const model = resolveCodexModel(options.model)
-    const messagesForAPI = normalizeMessagesForAPI(messages, tools)
-    const toolSchemas = await Promise.all(
-      tools.map(tool =>
-        toolToAPISchema(tool, {
-          getToolPermissionContext: options.getToolPermissionContext,
-          tools,
-          agents: options.agents,
-          allowedAgentTypes: options.allowedAgentTypes,
-          model: options.model,
-        }),
-      ),
-    )
-    const codexTools = anthropicToolsToCodex(toolSchemas as BetaToolUnion[])
-    const { upperLimit } = getModelMaxOutputTokens(model)
-    const maxTokens = resolveCodexMaxTokens(
-      upperLimit,
-      options.maxOutputTokensOverride,
-    )
-
-    const client = getCodexClient({
-      maxRetries: 0,
-      fetchOverride: options.fetchOverride as typeof fetch | undefined,
-    })
-    const start = Date.now()
-    const collectedMessages: AssistantMessage[] = []
-    let totalUsage: CodexUsage = {
-      input_tokens: 0,
-      output_tokens: 0,
-      cache_creation_input_tokens: 0,
-      cache_read_input_tokens: 0,
-    }
-
-    const aggregateBlocks: RawAssistantBlock[] = []
-    let replayMessages = messagesForAPI
-    let partialMessage: AssistantMessage['message'] | undefined
-    let finalResponse: Response | undefined
-    let terminalIncompleteResponse: Response | undefined
-
-    for (
-      let attempt = 0;
-      attempt <= MAX_CODEX_CONTINUATIONS;
-      attempt += 1
-    ) {
-      const input = await anthropicMessagesToCodexInput(replayMessages, {
-        resolveBase64ImageUrl: uploadCodexBase64Image,
-      })
-      const requestBody = sanitizeCodexRequest({
-        model,
-        input,
-        store: false,
-        parallel_tool_calls: false,
-        max_output_tokens: maxTokens,
-        ...(systemPrompt.length > 0 && {
-          instructions: systemPrompt.join('\n\n'),
-        }),
-        ...(codexTools.length > 0 && {
-          tools: codexTools,
-        }),
-        ...(options.temperatureOverride !== undefined && {
-          temperature: options.temperatureOverride,
-        }),
-      } satisfies ResponseCreateParamsNonStreaming)
-
-      if (attempt === 0) {
-        logForDebugging(
-          `[Codex] Calling model=${model}, inputItems=${input.length}, tools=${codexTools.length}`,
-        )
-        dumpCodexPayload(requestBody)
-      } else {
-        logForDebugging(
-          `[Codex] Continuing incomplete response attempt ${attempt}/${MAX_CODEX_CONTINUATIONS}`,
-        )
-      }
-
-      const attemptStream = streamCodexAttempt({
-        client,
-        requestBody,
-        signal,
-        start,
-        emitPrimaryEvents: attempt === 0,
-      })
-
-      let attemptResult: CodexStreamResult | undefined
-      while (true) {
-        const next = await attemptStream.next()
-        if (next.done) {
-          attemptResult = next.value
-          break
-        }
-        yield next.value
-      }
-
-      if (!attemptResult?.response) {
-        continue
-      }
-
-      partialMessage = partialMessage ?? attemptResult.partialMessage
-      finalResponse = attemptResult.response
-      terminalIncompleteResponse = attemptResult.incompleteResponse
-      totalUsage = addCodexUsage(totalUsage, attemptResult.response)
-
-      if (attemptResult.assistantBlocks.length === 0) {
-        break
-      }
-
-      appendRawAssistantBlocks(aggregateBlocks, attemptResult.assistantBlocks)
-
-      const shouldContinue =
-        attemptResult.incompleteResponse !== undefined &&
-        attempt < MAX_CODEX_CONTINUATIONS
-
-      if (!shouldContinue) {
-        break
-      }
-
-      const continuationMessage = rawAssistantBlocksToAssistantMessage(
-        attemptResult.assistantBlocks,
-        attemptResult.response,
-        tools,
-        options.agentId,
-      )
-      replayMessages = [...replayMessages, continuationMessage]
-    }
-
-    if (finalResponse) {
-      if (aggregateBlocks.length === 0) {
-        yield createAssistantAPIErrorMessage({
-          content: 'Codex returned an empty streamed response.',
-          apiError: 'api_error',
-          error: 'unknown',
-        })
-        return
-      }
-
-      const assistantMessage = rawAssistantBlocksToAssistantMessage(
-        aggregateBlocks,
-        finalResponse,
-        tools,
-        options.agentId,
-      )
-      assistantMessage.message.usage = totalUsage as any
-      collectedMessages.push(assistantMessage)
-      yield assistantMessage
-
-      recordLLMObservation(options.langfuseTrace ?? null, {
-        model,
-        provider: process.env.CODEX_LOGIN_METHOD === 'chatgpt_subscription'
-          ? 'codex-chatgpt'
-          : 'codex',
-        input: convertMessagesToLangfuse(messagesForAPI, systemPrompt),
-        output: convertOutputToLangfuse(collectedMessages),
-        usage: totalUsage,
-        startTime: new Date(start),
-        endTime: new Date(),
-        completionStartTime:
-          partialMessage !== undefined ? new Date(start) : undefined,
-        tools: convertToolsToLangfuse(toolSchemas as unknown[]),
-      })
-    } else {
-      yield createAssistantAPIErrorMessage({
-        content: 'Codex returned an empty streamed response.',
-        apiError: 'api_error',
-        error: 'unknown',
-      })
-      return
-    }
-
-    if (
-      terminalIncompleteResponse?.incomplete_details?.reason ===
-      'max_output_tokens'
-    ) {
-      yield createAssistantAPIErrorMessage({
-        content: `Output truncated: response exceeded the ${maxTokens} token limit. Set CODEX_MAX_TOKENS or CLAUDE_CODE_MAX_OUTPUT_TOKENS to override.`,
-        apiError: 'max_output_tokens',
-        error: 'max_output_tokens' as unknown as SDKAssistantMessageError,
-      })
-    }
-  } catch (error) {
-    const errorMessage = error instanceof Error ? error.message : String(error)
-    const normalizedError = normalizeCodexError(error)
-    logForDebugging(`[Codex] Error: ${errorMessage}`, { level: 'error' })
-    yield createAssistantAPIErrorMessage({
-      content: normalizedError.content,
-      apiError: 'api_error',
-      error: normalizedError.error,
-    })
-  }
-}
--- a/src/services/api/codex/preflight.ts
+++ b/src/services/api/codex/preflight.ts
@@ -1,151 +0,0 @@
-import type {
-  ResponseCreateParamsNonStreaming,
-  ResponseCreateParamsStreaming,
-  ResponseInputItem,
-  Tool,
-} from 'openai/resources/responses/responses.mjs'
-import { normalizeCodexCallId } from '@ant/model-provider'
-
-function isRecord(value: unknown): value is Record<string, unknown> {
-  return typeof value === 'object' && value !== null && !Array.isArray(value)
-}
-
-function assertString(value: unknown, label: string): string {
-  if (typeof value !== 'string') {
-    throw new Error(`Codex preflight: ${label} must be a string.`)
-  }
-
-  return value
-}
-
-function sanitizeMessageItem(item: Record<string, unknown>): ResponseInputItem {
-  const role = assertString(item.role, 'message.role')
-  const content = item.content
-
-  if ((role !== 'user' && role !== 'assistant') || !Array.isArray(content)) {
-    throw new Error('Codex preflight: message items require role and content array.')
-  }
-
-  return item as unknown as ResponseInputItem
-}
-
-function sanitizeFunctionCallItem(item: Record<string, unknown>): ResponseInputItem {
-  const callId = normalizeCodexCallId(item.call_id)
-  const name = assertString(item.name, 'function_call.name').trim()
-  const argumentsValue = item.arguments
-
-  if (!callId) {
-    throw new Error('Codex preflight: function_call.call_id is required.')
-  }
-  if (name.length === 0) {
-    throw new Error('Codex preflight: function_call.name is required.')
-  }
-  if (typeof argumentsValue !== 'string') {
-    throw new Error('Codex preflight: function_call.arguments must be a string.')
-  }
-
-  return {
-    ...item,
-    call_id: callId,
-    name,
-    arguments: argumentsValue,
-  } as ResponseInputItem
-}
-
-function sanitizeFunctionCallOutputItem(
-  item: Record<string, unknown>,
-): ResponseInputItem {
-  const callId = normalizeCodexCallId(item.call_id)
-  const output = item.output
-
-  if (!callId) {
-    throw new Error('Codex preflight: function_call_output.call_id is required.')
-  }
-  if (
-    typeof output !== 'string' &&
-    !(Array.isArray(output) && output.every(part => isRecord(part)))
-  ) {
-    throw new Error(
-      'Codex preflight: function_call_output.output must be a string or content array.',
-    )
-  }
-
-  return {
-    ...item,
-    call_id: callId,
-  } as ResponseInputItem
-}
-
-function sanitizeInputItem(item: unknown): ResponseInputItem {
-  if (!isRecord(item) || typeof item.type !== 'string') {
-    throw new Error('Codex preflight: each input item requires a type.')
-  }
-
-  switch (item.type) {
-    case 'message':
-      return sanitizeMessageItem(item)
-    case 'function_call':
-      return sanitizeFunctionCallItem(item)
-    case 'function_call_output':
-      return sanitizeFunctionCallOutputItem(item)
-    default:
-      throw new Error(`Codex preflight: unsupported input item type "${item.type}".`)
-  }
-}
-
-function sanitizeTool(tool: unknown): Tool {
-  if (!isRecord(tool) || tool.type !== 'function') {
-    throw new Error('Codex preflight: only function tools are supported.')
-  }
-
-  const name = assertString(tool.name, 'tool.name').trim()
-  const parameters = isRecord(tool.parameters) ? tool.parameters : {}
-
-  if (name.length === 0) {
-    throw new Error('Codex preflight: tool.name is required.')
-  }
-
-  return {
-    ...tool,
-    type: 'function',
-    name,
-    parameters,
-  } as Tool
-}
-
-export function sanitizeCodexRequest(
-  request: ResponseCreateParamsNonStreaming,
-): ResponseCreateParamsNonStreaming {
-  if (typeof request.model !== 'string' || request.model.trim().length === 0) {
-    throw new Error('Codex preflight: model is required.')
-  }
-
-  if (
-    request.instructions !== undefined &&
-    request.instructions !== null &&
-    typeof request.instructions !== 'string'
-  ) {
-    throw new Error('Codex preflight: instructions must be a string.')
-  }
-
-  if (!Array.isArray(request.input)) {
-    throw new Error('Codex preflight: input must be an array.')
-  }
-
-  return {
-    ...request,
-    model: request.model.trim(),
-    instructions: request.instructions?.trim() || undefined,
-    input: request.input.map(sanitizeInputItem),
-    tools: request.tools?.map(sanitizeTool),
-  }
-}
-
-export function toStreamingCodexRequest(
-  request: ResponseCreateParamsNonStreaming,
-): ResponseCreateParamsStreaming {
-  return {
-    ...request,
-    stream: true,
-  }
-}
--- a/src/services/api/codex/streaming.ts
+++ b/src/services/api/codex/streaming.ts
@@ -1,681 +0,0 @@
-import { randomUUID } from 'crypto'
-import type {
-  Response,
-  ResponseCreateParamsNonStreaming,
-  ResponseFunctionToolCall,
-  ResponseOutputItem,
-  ResponseOutputMessage,
-  ResponseStreamEvent,
-} from 'openai/resources/responses/responses.mjs'
-import type { AssistantMessage, StreamEvent } from '../../../types/message.js'
-import type { Tools } from '../../../Tool.js'
-import {
-  createAssistantMessage,
-  normalizeContentFromAPI,
-} from '../../../utils/messages.js'
-import { getCodexClient } from './client.js'
-import { resolveCodexCallId } from '@ant/model-provider'
-import { toStreamingCodexRequest } from './preflight.js'
-
-export type RawAssistantBlock =
-  | { type: 'text'; text: string }
-  | { type: 'tool_use'; id: string; name: string; input: string }
-
-export type CodexUsage = {
-  input_tokens: number
-  output_tokens: number
-  cache_creation_input_tokens: number
-  cache_read_input_tokens: number
-}
-
-export type CodexStreamResult = {
-  response?: Response
-  incompleteResponse?: Response
-  partialMessage?: AssistantMessage['message']
-  assistantBlocks: RawAssistantBlock[]
-}
-
-type CodexStreamState = {
-  contentBlocks: Record<number, RawAssistantBlock>
-  completedBlocks: Array<RawAssistantBlock | undefined>
-  partialMessage?: AssistantMessage['message']
-  finalResponse?: Response
-  incompleteResponse?: Response
-  failedResponse?: Response
-}
-
-export function getCodexUsage(
-  response: Pick<Response, 'usage'> | null | undefined,
-): CodexUsage {
-  return {
-    input_tokens: response?.usage?.input_tokens ?? 0,
-    output_tokens: response?.usage?.output_tokens ?? 0,
-    cache_creation_input_tokens: 0,
-    cache_read_input_tokens:
-      response?.usage?.input_tokens_details.cached_tokens ?? 0,
-  }
-}
-
-export function addCodexUsage(
-  total: CodexUsage,
-  response: Pick<Response, 'usage'> | null | undefined,
-): CodexUsage {
-  const usage = getCodexUsage(response)
-
-  return {
-    input_tokens: total.input_tokens + usage.input_tokens,
-    output_tokens: total.output_tokens + usage.output_tokens,
-    cache_creation_input_tokens:
-      total.cache_creation_input_tokens + usage.cache_creation_input_tokens,
-    cache_read_input_tokens:
-      total.cache_read_input_tokens + usage.cache_read_input_tokens,
-  }
-}
-
-function createPartialAssistantMessage(
-  response: Response,
-): AssistantMessage['message'] {
-  return {
-    id: response.id,
-    type: 'message',
-    role: 'assistant',
-    content: [],
-    model: response.model,
-    stop_reason: null,
-    stop_sequence: null,
-    usage: getCodexUsage(response) as any,
-  } as AssistantMessage['message']
-}
-
-function createToolUseBlock(
-  item: Partial<ResponseFunctionToolCall> & { id?: string },
-): RawAssistantBlock {
-  return {
-    type: 'tool_use',
-    id: resolveCodexCallId(
-      item.call_id ?? item.id,
-      `tool:${item.name ?? ''}:${item.arguments ?? ''}:${item.id ?? ''}`,
-    ),
-    name: item.name ?? '',
-    input: item.arguments ?? '',
-  }
-}
-
-function getCompletedTextFromItem(item: ResponseOutputItem): string | null {
-  if (item.type !== 'message' || item.role !== 'assistant') {
-    return null
-  }
-
-  for (const content of (item as ResponseOutputMessage).content) {
-    if (content.type === 'output_text' && content.text.length > 0) {
-      return content.text
-    }
-    if (content.type === 'refusal' && content.refusal.length > 0) {
-      return content.refusal
-    }
-  }
-
-  return null
-}
-
-function getCompletedAssistantBlocks(
-  blocks: Array<RawAssistantBlock | undefined>,
-): RawAssistantBlock[] {
-  return blocks.filter(
-    (block): block is RawAssistantBlock => block !== undefined,
-  )
-}
-
-function getCodexStopReason(
-  response: Pick<Response, 'incomplete_details'>,
-  blocks: RawAssistantBlock[],
-): string {
-  if (response.incomplete_details?.reason === 'max_output_tokens') {
-    return 'max_tokens'
-  }
-
-  return blocks.some(block => block.type === 'tool_use') ? 'tool_use' : 'end_turn'
-}
-
-function emitTrailingTextDelta(
-  output: StreamEvent[],
-  index: number,
-  currentText: string,
-  finalText: string,
-): void {
-  if (!finalText.startsWith(currentText)) {
-    return
-  }
-
-  const delta = finalText.slice(currentText.length)
-  if (delta.length === 0) {
-    return
-  }
-
-  output.push({
-    type: 'stream_event',
-    event: {
-      type: 'content_block_delta',
-      index,
-      delta: {
-        type: 'text_delta',
-        text: delta,
-      },
-    } as any,
-  } as StreamEvent)
-}
-
-function emitTrailingToolDelta(
-  output: StreamEvent[],
-  index: number,
-  currentInput: string,
-  finalInput: string,
-): void {
-  if (!finalInput.startsWith(currentInput)) {
-    return
-  }
-
-  const delta = finalInput.slice(currentInput.length)
-  if (delta.length === 0) {
-    return
-  }
-
-  output.push({
-    type: 'stream_event',
-    event: {
-      type: 'content_block_delta',
-      index,
-      delta: {
-        type: 'input_json_delta',
-        partial_json: delta,
-      },
-    } as any,
-  } as StreamEvent)
-}
-
-function responseToRawAssistantBlocks(response: Response): RawAssistantBlock[] {
-  const blocks: RawAssistantBlock[] = []
-
-  for (const item of response.output) {
-    if (item.type === 'function_call') {
-      const functionCall = item as ResponseFunctionToolCall
-      blocks.push({
-        type: 'tool_use',
-        id: resolveCodexCallId(
-          functionCall.call_id,
-          `output:${functionCall.name}:${functionCall.arguments}`,
-        ),
-        name: functionCall.name,
-        input: functionCall.arguments,
-      })
-      continue
-    }
-
-    if (item.type !== 'message' || item.role !== 'assistant') {
-      continue
-    }
-
-    for (const content of (item as ResponseOutputMessage).content) {
-      if (content.type === 'output_text' && content.text.length > 0) {
-        blocks.push({
-          type: 'text',
-          text: content.text,
-        })
-      } else if (content.type === 'refusal' && content.refusal.length > 0) {
-        blocks.push({
-          type: 'text',
-          text: content.refusal,
-        })
-      }
-    }
-  }
-
-  if (
-    blocks.length === 0 &&
-    typeof response.output_text === 'string' &&
-    response.output_text.length > 0
-  ) {
-    blocks.push({
-      type: 'text',
-      text: response.output_text,
-    })
-  }
-
-  return blocks
-}
-
-export function rawAssistantBlocksToAssistantMessage(
-  rawBlocks: RawAssistantBlock[],
-  response: Pick<Response, 'id' | 'model' | 'usage' | 'incomplete_details'>,
-  tools: Tools,
-  agentId?: string,
-): AssistantMessage {
-  const content = normalizeContentFromAPI(
-    rawBlocks as any,
-    tools,
-    agentId as any,
-  )
-
-  const assistantMessage = createAssistantMessage({
-    content: content as any,
-    usage: {
-      input_tokens: response.usage?.input_tokens ?? 0,
-      output_tokens: response.usage?.output_tokens ?? 0,
-      cache_creation_input_tokens: 0,
-      cache_read_input_tokens:
-        response.usage?.input_tokens_details.cached_tokens ?? 0,
-    } as any,
-  })
-
-  assistantMessage.message.id = response.id
-  assistantMessage.message.model = response.model
-  assistantMessage.message.stop_reason = getCodexStopReason(response, rawBlocks) as any
-  assistantMessage.message.stop_sequence = null
-  assistantMessage.uuid = randomUUID()
-  assistantMessage.timestamp = new Date().toISOString()
-
-  return assistantMessage
-}
-
-function handleCodexStreamEvent(params: {
-  event: ResponseStreamEvent
-  partialMessage: AssistantMessage['message'] | undefined
-  contentBlocks: Record<number, RawAssistantBlock>
-  completedBlocks: Array<RawAssistantBlock | undefined>
-  start: number
-}): {
-  output: StreamEvent[]
-  partialMessage: AssistantMessage['message'] | undefined
-  finalResponse?: Response
-  failedResponse?: Response
-  incompleteResponse?: Response
-} {
-  const { event, start } = params
-  const output: StreamEvent[] = []
-  const contentBlocks = params.contentBlocks
-  const completedBlocks = params.completedBlocks
-  let partialMessage = params.partialMessage
-  let finalResponse: Response | undefined
-  let failedResponse: Response | undefined
-  let incompleteResponse: Response | undefined
-
-  const ensureMessageStart = (response: Response): void => {
-    if (partialMessage) {
-      return
-    }
-
-    partialMessage = createPartialAssistantMessage(response)
-    output.push({
-      type: 'stream_event',
-      event: {
-        type: 'message_start',
-        message: partialMessage,
-      } as any,
-      ttftMs: Date.now() - start,
-    } as StreamEvent)
-  }
-
-  const ensureTextBlock = (index: number): RawAssistantBlock => {
-    const existing = contentBlocks[index]
-    if (existing) {
-      return existing
-    }
-
-    const block: RawAssistantBlock = { type: 'text', text: '' }
-    contentBlocks[index] = block
-    output.push({
-      type: 'stream_event',
-      event: {
-        type: 'content_block_start',
-        index,
-        content_block: { type: 'text', text: '' },
-      } as any,
-    } as StreamEvent)
-    return block
-  }
-
-  const ensureToolUseBlock = (
-    index: number,
-    item?: Partial<ResponseFunctionToolCall> & { id?: string },
-  ): RawAssistantBlock => {
-    const existing = contentBlocks[index]
-    if (existing) {
-      return existing
-    }
-
-    const block = createToolUseBlock(item ?? {})
-    contentBlocks[index] = block
-    const toolBlock = block as Extract<RawAssistantBlock, { type: 'tool_use' }>
-    output.push({
-      type: 'stream_event',
-      event: {
-        type: 'content_block_start',
-        index,
-        content_block: {
-          type: 'tool_use',
-          id: toolBlock.id,
-          name: toolBlock.name,
-          input: '',
-        },
-      } as any,
-    } as StreamEvent)
-    return block
-  }
-
-  const emitCompletedBlock = (index: number): void => {
-    const block = contentBlocks[index]
-    if (!block) {
-      return
-    }
-    completedBlocks[index] = { ...block }
-    output.push({
-      type: 'stream_event',
-      event: {
-        type: 'content_block_stop',
-        index,
-      } as any,
-    } as StreamEvent)
-    delete contentBlocks[index]
-  }
-
-  switch (event.type) {
-    case 'response.created':
-    case 'response.in_progress':
-      ensureMessageStart(event.response)
-      break
-    case 'response.output_item.added':
-      if (event.item.type === 'function_call') {
-        ensureToolUseBlock(event.output_index, event.item)
-      } else if (event.item.type === 'message' && event.item.role === 'assistant') {
-        ensureTextBlock(event.output_index)
-      }
-      break
-    case 'response.output_text.delta':
-    case 'response.refusal.delta': {
-      const block = ensureTextBlock(event.output_index)
-      if (block.type === 'text') {
-        block.text += event.delta
-      }
-      output.push({
-        type: 'stream_event',
-        event: {
-          type: 'content_block_delta',
-          index: event.output_index,
-          delta: {
-            type: 'text_delta',
-            text: event.delta,
-          },
-        } as any,
-      } as StreamEvent)
-      break
-    }
-    case 'response.function_call_arguments.delta': {
-      const block = ensureToolUseBlock(event.output_index, { id: event.item_id })
-      if (block.type === 'tool_use') {
-        block.input += event.delta
-      }
-      output.push({
-        type: 'stream_event',
-        event: {
-          type: 'content_block_delta',
-          index: event.output_index,
-          delta: {
-            type: 'input_json_delta',
-            partial_json: event.delta,
-          },
-        } as any,
-      } as StreamEvent)
-      break
-    }
-    case 'response.output_text.done':
-    case 'response.refusal.done': {
-      const block = ensureTextBlock(event.output_index)
-      const finalText = event.type === 'response.output_text.done'
-        ? event.text
-        : event.refusal
-      if (block.type === 'text') {
-        emitTrailingTextDelta(output, event.output_index, block.text, finalText)
-        block.text = finalText
-      }
-      emitCompletedBlock(event.output_index)
-      break
-    }
-    case 'response.function_call_arguments.done': {
-      const block = ensureToolUseBlock(event.output_index, {
-        id: event.item_id,
-        name: event.name,
-      })
-      if (block.type === 'tool_use') {
-        if (event.name) {
-          block.name = event.name
-        }
-        emitTrailingToolDelta(output, event.output_index, block.input, event.arguments)
-        block.input = event.arguments
-      }
-      emitCompletedBlock(event.output_index)
-      break
-    }
-    case 'response.output_item.done':
-      if (
-        event.item.type === 'message' &&
-        event.item.role === 'assistant' &&
-        contentBlocks[event.output_index]
-      ) {
-        const finalText = getCompletedTextFromItem(event.item)
-        if (finalText !== null) {
-          const block = contentBlocks[event.output_index]
-          if (block.type === 'text') {
-            emitTrailingTextDelta(output, event.output_index, block.text, finalText)
-            block.text = finalText
-          }
-        }
-        emitCompletedBlock(event.output_index)
-      } else if (
-        event.item.type === 'function_call' &&
-        contentBlocks[event.output_index]
-      ) {
-        const block = contentBlocks[event.output_index]
-        if (block.type === 'tool_use') {
-          block.id = resolveCodexCallId(
-            event.item.call_id,
-            `done:${event.item.name}:${event.item.arguments}:${event.item.id}`,
-          )
-          block.name = event.item.name
-          emitTrailingToolDelta(
-            output,
-            event.output_index,
-            block.input,
-            event.item.arguments,
-          )
-          block.input = event.item.arguments
-        }
-        emitCompletedBlock(event.output_index)
-      }
-      break
-    case 'response.completed':
-    case 'response.incomplete': {
-      ensureMessageStart(event.response)
-      if (event.type === 'response.completed') {
-        finalResponse = event.response
-      } else {
-        incompleteResponse = event.response
-      }
-      const assistantBlocks = getCompletedAssistantBlocks(completedBlocks)
-      output.push({
-        type: 'stream_event',
-        event: {
-          type: 'message_delta',
-          delta: {
-            stop_reason: getCodexStopReason(event.response, assistantBlocks),
-            stop_sequence: null,
-          },
-          usage: getCodexUsage(event.response),
-        } as any,
-      } as StreamEvent)
-      output.push({
-        type: 'stream_event',
-        event: {
-          type: 'message_stop',
-        } as any,
-      } as StreamEvent)
-      break
-    }
-    case 'response.failed':
-      failedResponse = event.response
-      break
-    case 'error':
-      throw new Error(event.message)
-  }
-
-  return {
-    output,
-    partialMessage,
-    finalResponse,
-    failedResponse,
-    incompleteResponse,
-  }
-}
-
-function selectResponse(
-  state: CodexStreamState,
-  streamedResponse?: Response,
-): CodexStreamResult {
-  const response =
-    [streamedResponse, state.finalResponse, state.incompleteResponse, state.failedResponse]
-      .find(
-        candidate =>
-          candidate !== undefined &&
-          responseToRawAssistantBlocks(candidate).length > 0,
-      ) ??
-    streamedResponse ??
-    state.finalResponse ??
-    state.incompleteResponse ??
-    state.failedResponse
-
-  return {
-    response,
-    incompleteResponse: state.incompleteResponse,
-    partialMessage: state.partialMessage,
-    assistantBlocks:
-      response !== undefined && responseToRawAssistantBlocks(response).length > 0
-        ? responseToRawAssistantBlocks(response)
-        : getCompletedAssistantBlocks(state.completedBlocks),
-  }
-}
-
-async function consumeCodexStream(
-  events: AsyncIterable<ResponseStreamEvent>,
-  start: number,
-): Promise<CodexStreamState> {
-  const state: CodexStreamState = {
-    contentBlocks: {},
-    completedBlocks: [],
-  }
-
-  for await (const event of events) {
-    const handled = handleCodexStreamEvent({
-      event,
-      partialMessage: state.partialMessage,
-      contentBlocks: state.contentBlocks,
-      completedBlocks: state.completedBlocks,
-      start,
-    })
-
-    state.partialMessage = handled.partialMessage
-    state.finalResponse = handled.finalResponse ?? state.finalResponse
-    state.incompleteResponse =
-      handled.incompleteResponse ?? state.incompleteResponse
-    state.failedResponse = handled.failedResponse ?? state.failedResponse
-  }
-
-  return state
-}
-
-export async function* streamCodexAttempt(params: {
-  client: ReturnType<typeof getCodexClient>
-  requestBody: ResponseCreateParamsNonStreaming
-  signal: AbortSignal
-  start: number
-  emitPrimaryEvents?: boolean
-}): AsyncGenerator<StreamEvent, CodexStreamResult, void> {
-  let primaryError: unknown
-  let primaryResult: CodexStreamResult | undefined
-
-  try {
-    const stream = params.client.responses.stream(
-      params.requestBody as unknown as Parameters<
-        typeof params.client.responses.stream
-      >[0],
-      { signal: params.signal },
-    )
-
-    const state: CodexStreamState = {
-      contentBlocks: {},
-      completedBlocks: [],
-    }
-
-    for await (const event of stream) {
-      const handled = handleCodexStreamEvent({
-        event,
-        partialMessage: state.partialMessage,
-        contentBlocks: state.contentBlocks,
-        completedBlocks: state.completedBlocks,
-        start: params.start,
-      })
-
-      state.partialMessage = handled.partialMessage
-      state.finalResponse = handled.finalResponse ?? state.finalResponse
-      state.incompleteResponse =
-        handled.incompleteResponse ?? state.incompleteResponse
-      state.failedResponse = handled.failedResponse ?? state.failedResponse
-
-      if (params.emitPrimaryEvents !== false) {
-        yield* handled.output
-      }
-    }
-
-    let streamedResponse: Response | undefined
-    try {
-      streamedResponse = await stream.finalResponse()
-    } catch {
-      streamedResponse = undefined
-    }
-
-    primaryResult = selectResponse(state, streamedResponse)
-    if (primaryResult.assistantBlocks.length > 0 || primaryResult.response) {
-      return primaryResult
-    }
-  } catch (error) {
-    primaryError = error
-  }
-
-  try {
-    const fallbackStream = await params.client.responses.create(
-      toStreamingCodexRequest(params.requestBody),
-      { signal: params.signal },
-    )
-
-    const fallbackState = await consumeCodexStream(
-      fallbackStream as AsyncIterable<ResponseStreamEvent>,
-      params.start,
-    )
-    const fallbackResult = selectResponse(fallbackState)
-
-    if (fallbackResult.assistantBlocks.length > 0 || fallbackResult.response) {
-      return fallbackResult
-    }
-  } catch (fallbackError) {
-    if (primaryError) {
-      throw primaryError
-    }
-    throw fallbackError
-  }
-
-  if (primaryError) {
-    throw primaryError
-  }
-
-  return primaryResult ?? {
-    assistantBlocks: [],
-  }
-}
--- a/src/services/langfuse/tracing.ts
+++ b/src/services/langfuse/tracing.ts
@@ -57,8 +57,6 @@ const PROVIDER_GENERATION_NAMES: Record<string, string> = {
  vertex: 'ChatVertexAnthropic',
  foundry: 'ChatFoundry',
  openai: 'ChatOpenAI',
-  'codex': 'ChatOpenAIResponses',
-  'codex-chatgpt': 'ChatCodex',
  gemini: 'ChatGoogleGenerativeAI',
  grok: 'ChatXAI',
 }
--- a/src/utils/tests/ndjsonFramer.test.ts
+++ b/src/utils/tests/ndjsonFramer.test.ts
@@ -0,0 +1,153 @@
+import { EventEmitter } from 'node:events'
+import type { Socket } from 'node:net'
+import { describe, expect, test } from 'bun:test'
+import { attachNdjsonFramer } from '../ndjsonFramer.js'
+
+type TestSocket = Socket & {
+  destroyed: boolean
+  emitData: (chunk: Buffer) => void
+}
+
+function createTestSocket(): TestSocket {
+  const emitter = new EventEmitter() as TestSocket
+  emitter.destroyed = false
+  emitter.destroy = ((_error?: Error) => {
+    emitter.destroyed = true
+    emitter.emit('close')
+    return emitter
+  }) as TestSocket['destroy']
+  emitter.emitData = (chunk: Buffer) => {
+    emitter.emit('data', chunk)
+  }
+  return emitter
+}
+
+describe('attachNdjsonFramer', () => {
+  test('accepts a complete frame at the configured byte limit', () => {
+    const socket = createTestSocket()
+    const messages: unknown[] = []
+    const errors: Error[] = []
+
+    attachNdjsonFramer(
+      socket,
+      msg => messages.push(msg),
+      text => JSON.parse(text) as unknown,
+      {
+        maxFrameBytes: Buffer.byteLength('{"a":1}', 'utf8'),
+        onFrameError: error => errors.push(error),
+      },
+    )
+
+    socket.emitData(Buffer.from('{"a":1}\n'))
+
+    expect(messages).toEqual([{ a: 1 }])
+    expect(errors).toEqual([])
+    expect(socket.destroyed).toBe(false)
+  })
+
+  test('destroys a complete frame over the configured byte limit', () => {
+    const socket = createTestSocket()
+    const messages: unknown[] = []
+    const errors: Error[] = []
+
+    attachNdjsonFramer(
+      socket,
+      msg => messages.push(msg),
+      text => JSON.parse(text) as unknown,
+      {
+        maxFrameBytes: 8,
+        onFrameError: error => errors.push(error),
+      },
+    )
+
+    socket.emitData(Buffer.from('{"long":true}\n'))
+
+    expect(messages).toEqual([])
+    expect(errors[0]?.message).toContain('NDJSON frame exceeded')
+    expect(socket.destroyed).toBe(true)
+  })
+
+  test('destroys oversized no-newline input before a frame can form', () => {
+    const socket = createTestSocket()
+    const messages: unknown[] = []
+    const errors: Error[] = []
+
+    attachNdjsonFramer(
+      socket,
+      msg => messages.push(msg),
+      text => JSON.parse(text) as unknown,
+      {
+        maxFrameBytes: 8,
+        onFrameError: error => errors.push(error),
+      },
+    )
+
+    socket.emitData(Buffer.from('x'.repeat(9)))
+
+    expect(messages).toEqual([])
+    expect(errors[0]?.message).toContain('NDJSON frame exceeded')
+    expect(socket.destroyed).toBe(true)
+  })
+
+  test('lets callers own oversized-frame shutdown when configured', () => {
+    const socket = createTestSocket()
+    const errors: Error[] = []
+
+    attachNdjsonFramer(
+      socket,
+      () => undefined,
+      text => JSON.parse(text) as unknown,
+      {
+        maxFrameBytes: 8,
+        onFrameError: error => errors.push(error),
+        destroyOnFrameError: false,
+      },
+    )
+
+    socket.emitData(Buffer.from('{"long":true}\n'))
+
+    expect(errors[0]?.message).toContain('NDJSON frame exceeded')
+    expect(socket.destroyed).toBe(false)
+  })
+
+  test('reports malformed non-empty frames without changing default compatibility', () => {
+    const socket = createTestSocket()
+    const messages: unknown[] = []
+    const errors: Error[] = []
+
+    attachNdjsonFramer(
+      socket,
+      msg => messages.push(msg),
+      text => JSON.parse(text) as unknown,
+      {
+        onInvalidFrame: error => errors.push(error),
+      },
+    )
+
+    socket.emitData(Buffer.from('{not-json\n'))
+
+    expect(messages).toEqual([])
+    expect(errors).toHaveLength(1)
+    expect(socket.destroyed).toBe(false)
+  })
+
+  test('destroys malformed frames when configured by the caller', () => {
+    const socket = createTestSocket()
+    const errors: Error[] = []
+
+    attachNdjsonFramer(
+      socket,
+      () => undefined,
+      text => JSON.parse(text) as unknown,
+      {
+        destroyOnInvalidFrame: true,
+        onInvalidFrame: error => errors.push(error),
+      },
+    )
+
+    socket.emitData(Buffer.from('{not-json\n'))
+
+    expect(errors).toHaveLength(1)
+    expect(socket.destroyed).toBe(true)
+  })
+})
--- a/src/utils/tests/teammateMailbox.test.ts
+++ b/src/utils/tests/teammateMailbox.test.ts
@@ -0,0 +1,490 @@
+import { afterEach, beforeEach, describe, expect, test } from 'bun:test'
+import { mkdir, readFile, rm, writeFile } from 'node:fs/promises'
+import { mkdtempSync } from 'node:fs'
+import { tmpdir } from 'node:os'
+import { dirname, join } from 'node:path'
+import type { Message } from 'src/types/message.js'
+import {
+  compactMailboxMessages,
+  getLastPeerDmSummary,
+  getInboxPath,
+  markMessageAsReadByIndex,
+  markMessageAsReadByIdentity,
+  markMessagesAsRead,
+  markMessagesAsReadByPredicate,
+  MAX_MAILBOX_MESSAGE_TEXT_BYTES,
+  MAX_MAILBOX_FILE_BYTES,
+  MAX_MAILBOX_MESSAGES,
+  MAX_READ_MAILBOX_MESSAGES,
+  MAX_UNREAD_PROTOCOL_MAILBOX_MESSAGES,
+  readMailbox,
+  type TeammateMessage,
+  writeToMailbox,
+} from 'src/utils/teammateMailbox.js'
+
+let tempHome = ''
+let previousConfigDir: string | undefined
+
+function message(
+  text: string,
+  read: boolean,
+  timestamp = new Date(0).toISOString(),
+): TeammateMessage {
+  return {
+    from: 'team-lead',
+    text,
+    timestamp,
+    read,
+  }
+}
+
+async function seedMailbox(
+  agentName: string,
+  teamName: string,
+  messages: TeammateMessage[],
+): Promise<void> {
+  const inboxPath = getInboxPath(agentName, teamName)
+  await mkdir(dirname(inboxPath), { recursive: true })
+  await writeFile(inboxPath, JSON.stringify(messages, null, 2), 'utf-8')
+}
+
+async function readRawMailbox(
+  agentName: string,
+  teamName: string,
+): Promise<TeammateMessage[]> {
+  const content = await readFile(getInboxPath(agentName, teamName), 'utf-8')
+  return JSON.parse(content) as TeammateMessage[]
+}
+
+describe('compactMailboxMessages', () => {
+  test('prioritizes unread messages and keeps only recent read history', () => {
+    const compacted = compactMailboxMessages(
+      [
+        message('read-1', true),
+        message('read-2', true),
+        message('unread-1', false),
+        message('read-3', true),
+        message('unread-2', false),
+        message('read-4', true),
+        message('read-5', true),
+        message('unread-3', false),
+      ],
+      { maxMessages: 5, maxReadMessages: 2 },
+    )
+
+    expect(compacted.map(m => m.text)).toEqual([
+      'unread-1',
+      'unread-2',
+      'read-4',
+      'read-5',
+      'unread-3',
+    ])
+  })
+
+  test('retains unread protocol messages separately from regular cap', () => {
+    const protocol = message(
+      JSON.stringify({ type: 'permission_response', request_id: 'req-1' }),
+      false,
+    )
+    const compacted = compactMailboxMessages(
+      [
+        protocol,
+        ...Array.from({ length: 5 }, (_value, index) =>
+          message(`regular-${index}`, false),
+        ),
+      ],
+      {
+        maxMessages: 2,
+        maxReadMessages: 0,
+        maxUnreadProtocolMessages: 1,
+      },
+    )
+
+    expect(compacted.map(m => m.text)).toEqual([
+      protocol.text,
+      'regular-3',
+      'regular-4',
+    ])
+  })
+
+  test('does not prioritize malformed JSON-like unread messages as protocol', () => {
+    const compacted = compactMailboxMessages(
+      [
+        message('{not-json', false),
+        message('regular-1', false),
+        message('regular-2', false),
+      ],
+      {
+        maxMessages: 1,
+        maxReadMessages: 0,
+        maxUnreadProtocolMessages: 10,
+      },
+    )
+
+    expect(compacted.map(m => m.text)).toEqual(['regular-2'])
+  })
+
+  test('caps unread protocol messages with an independent bound', () => {
+    const compacted = compactMailboxMessages(
+      Array.from(
+        { length: MAX_UNREAD_PROTOCOL_MAILBOX_MESSAGES + 1 },
+        (_value, index) =>
+          message(
+            JSON.stringify({
+              type: 'permission_response',
+              request_id: `req-${index}`,
+            }),
+            false,
+          ),
+      ),
+    )
+
+    expect(compacted).toHaveLength(MAX_UNREAD_PROTOCOL_MAILBOX_MESSAGES)
+    expect(compacted[0]?.text).toContain('req-1')
+  })
+
+  test('keeps retained mailbox bytes under an explicit budget', () => {
+    const compacted = compactMailboxMessages(
+      Array.from({ length: 20 }, (_value, index) =>
+        message(`msg-${index}-${'x'.repeat(200)}`, false),
+      ),
+      {
+        maxMessages: 20,
+        maxReadMessages: 0,
+        maxRetainedBytes: 1_000,
+      },
+    )
+
+    expect(
+      Buffer.byteLength(JSON.stringify(compacted), 'utf8'),
+    ).toBeLessThanOrEqual(1_000)
+    expect(compacted.length).toBeLessThan(20)
+    expect(compacted.at(-1)?.text).toContain('msg-19')
+  })
+
+  test('returns an empty mailbox when even one message exceeds retained budget', () => {
+    const compacted = compactMailboxMessages([message('too-large', false)], {
+      maxMessages: 10,
+      maxReadMessages: 0,
+      maxRetainedBytes: 1,
+    })
+
+    expect(compacted).toEqual([])
+  })
+
+  test('returns an empty mailbox when all retention lanes are disabled', () => {
+    const compacted = compactMailboxMessages([message('unread', false)], {
+      maxMessages: 0,
+      maxReadMessages: 0,
+      maxUnreadProtocolMessages: 0,
+      maxRetainedBytes: 1_000,
+    })
+
+    expect(compacted).toEqual([])
+  })
+})
+
+describe('teammate mailbox retention', () => {
+  beforeEach(() => {
+    previousConfigDir = process.env.CLAUDE_CONFIG_DIR
+    tempHome = mkdtempSync(join(tmpdir(), 'teammate-mailbox-'))
+    process.env.CLAUDE_CONFIG_DIR = tempHome
+  })
+
+  afterEach(async () => {
+    if (previousConfigDir === undefined) {
+      delete process.env.CLAUDE_CONFIG_DIR
+    } else {
+      process.env.CLAUDE_CONFIG_DIR = previousConfigDir
+    }
+    await rm(tempHome, { recursive: true, force: true })
+    tempHome = ''
+  })
+
+  test('writeToMailbox compacts oversized unread inbox files', async () => {
+    const existing = Array.from(
+      { length: MAX_MAILBOX_MESSAGES + 20 },
+      (_value, index) => message(`old-${index}`, false),
+    )
+    await seedMailbox('worker', 'alpha', existing)
+
+    await writeToMailbox(
+      'worker',
+      {
+        from: 'team-lead',
+        text: 'newest',
+        timestamp: new Date(1).toISOString(),
+      },
+      'alpha',
+    )
+
+    const after = await readMailbox('worker', 'alpha')
+    expect(after).toHaveLength(MAX_MAILBOX_MESSAGES)
+    expect(after[0]?.text).toBe('old-21')
+    expect(after.at(-1)?.text).toBe('newest')
+  })
+
+  test('markMessagesAsRead compacts read history after consumption', async () => {
+    const existing = Array.from(
+      { length: MAX_MAILBOX_MESSAGES + 20 },
+      (_value, index) => message(`msg-${index}`, false),
+    )
+    await seedMailbox('worker', 'alpha', existing)
+
+    await markMessagesAsRead('worker', 'alpha')
+
+    const after = await readRawMailbox('worker', 'alpha')
+    expect(after).toHaveLength(MAX_READ_MAILBOX_MESSAGES)
+    expect(after.every(m => m.read)).toBe(true)
+    expect(after[0]?.text).toBe(
+      `msg-${MAX_MAILBOX_MESSAGES + 20 - MAX_READ_MAILBOX_MESSAGES}`,
+    )
+  })
+
+  test('markMessagesAsReadByPredicate leaves structured messages unread', async () => {
+    await seedMailbox('worker', 'alpha', [
+      message('plain', false),
+      message(JSON.stringify({ type: 'permission_request' }), false),
+    ])
+
+    await markMessagesAsReadByPredicate(
+      'worker',
+      m => !m.text.includes('permission_request'),
+      'alpha',
+    )
+
+    const after = await readRawMailbox('worker', 'alpha')
+    expect(after.map(m => m.read)).toEqual([true, false])
+  })
+
+  test('markMessageAsReadByIdentity survives compaction shifting indexes', async () => {
+    const permissionResponse = message(
+      JSON.stringify({ type: 'permission_response', request_id: 'req-1' }),
+      false,
+    )
+    await seedMailbox('worker', 'alpha', [
+      permissionResponse,
+      ...Array.from({ length: MAX_MAILBOX_MESSAGES + 20 }, (_value, index) =>
+        message(`regular-${index}`, false),
+      ),
+    ])
+
+    await writeToMailbox(
+      'worker',
+      {
+        from: 'team-lead',
+        text: 'newest',
+        timestamp: new Date(2).toISOString(),
+      },
+      'alpha',
+    )
+    const marked = await markMessageAsReadByIdentity(
+      'worker',
+      'alpha',
+      permissionResponse,
+    )
+
+    const after = await readRawMailbox('worker', 'alpha')
+    expect(marked).toBe(true)
+    expect(after.some(m => m.text === permissionResponse.text && !m.read)).toBe(
+      false,
+    )
+  })
+
+  test('markMessageAsReadByIndex also compacts through the compatibility path', async () => {
+    const existing = Array.from(
+      { length: MAX_MAILBOX_MESSAGES + 10 },
+      (_value, index) => message(`msg-${index}`, false),
+    )
+    await seedMailbox('worker', 'alpha', existing)
+
+    await markMessageAsReadByIndex('worker', 'alpha', existing.length - 1)
+
+    const after = await readRawMailbox('worker', 'alpha')
+    expect(after).toHaveLength(MAX_MAILBOX_MESSAGES)
+    expect(after.some(m => m.text === `msg-${existing.length - 1}`)).toBe(false)
+    expect(after.at(-1)?.text).toBe(`msg-${existing.length - 2}`)
+  })
+
+  test('writeToMailbox rejects oversized message text instead of storing it', async () => {
+    await expect(
+      writeToMailbox(
+        'worker',
+        {
+          from: 'team-lead',
+          text: 'x'.repeat(MAX_MAILBOX_MESSAGE_TEXT_BYTES + 1),
+          timestamp: new Date(3).toISOString(),
+        },
+        'alpha',
+      ),
+    ).rejects.toThrow('Mailbox message text exceeds')
+
+    expect(await readRawMailbox('worker', 'alpha')).toEqual([])
+  })
+
+  test('writeToMailbox fails closed when an existing mailbox is corrupt', async () => {
+    const inboxPath = getInboxPath('worker', 'alpha')
+    await mkdir(dirname(inboxPath), { recursive: true })
+    await writeFile(inboxPath, '{not-json', 'utf-8')
+
+    await expect(
+      writeToMailbox(
+        'worker',
+        {
+          from: 'team-lead',
+          text: 'new',
+          timestamp: new Date(4).toISOString(),
+        },
+        'alpha',
+      ),
+    ).rejects.toThrow()
+
+    expect(await readFile(inboxPath, 'utf-8')).toBe('{not-json')
+  })
+
+  test('writeToMailbox rejects when the inbox path is already a directory', async () => {
+    const inboxPath = getInboxPath('worker', 'alpha')
+    await mkdir(inboxPath, { recursive: true })
+
+    await expect(
+      writeToMailbox(
+        'worker',
+        {
+          from: 'team-lead',
+          text: 'new',
+          timestamp: new Date(5).toISOString(),
+        },
+        'alpha',
+      ),
+    ).rejects.toThrow()
+  })
+
+  test('readMailbox fails closed on corrupt mailbox content', async () => {
+    const inboxPath = getInboxPath('worker', 'alpha')
+    await mkdir(dirname(inboxPath), { recursive: true })
+    await writeFile(inboxPath, '{not-json', 'utf-8')
+
+    await expect(readMailbox('worker', 'alpha')).rejects.toThrow()
+  })
+
+  test('readMailbox rejects non-array mailbox files', async () => {
+    const inboxPath = getInboxPath('worker', 'alpha')
+    await mkdir(dirname(inboxPath), { recursive: true })
+    await writeFile(inboxPath, JSON.stringify({ text: 'not an array' }), 'utf-8')
+
+    await expect(readMailbox('worker', 'alpha')).rejects.toThrow(
+      'expected message array',
+    )
+  })
+
+  test('readMailbox rejects malformed stored message shapes', async () => {
+    const inboxPath = getInboxPath('worker', 'alpha')
+    await mkdir(dirname(inboxPath), { recursive: true })
+    await writeFile(
+      inboxPath,
+      JSON.stringify([{ from: 'lead', text: 'missing timestamp' }]),
+      'utf-8',
+    )
+
+    await expect(readMailbox('worker', 'alpha')).rejects.toThrow(
+      'Invalid mailbox message shape',
+    )
+  })
+
+  test('readMailbox rejects non-object stored messages', async () => {
+    const inboxPath = getInboxPath('worker', 'alpha')
+    await mkdir(dirname(inboxPath), { recursive: true })
+    await writeFile(inboxPath, JSON.stringify(['not an object']), 'utf-8')
+
+    await expect(readMailbox('worker', 'alpha')).rejects.toThrow(
+      'expected object',
+    )
+  })
+
+  test('readMailbox rejects oversized mailbox files before parsing', async () => {
+    const inboxPath = getInboxPath('worker', 'alpha')
+    await mkdir(dirname(inboxPath), { recursive: true })
+    await writeFile(inboxPath, `[${' '.repeat(MAX_MAILBOX_FILE_BYTES)}]`, 'utf-8')
+
+    await expect(readMailbox('worker', 'alpha')).rejects.toThrow(
+      'Mailbox file exceeds',
+    )
+  })
+
+  test('markMessageAsReadByIdentity returns false for missing mailbox files', async () => {
+    await expect(
+      markMessageAsReadByIdentity('worker', 'alpha', message('absent', false)),
+    ).resolves.toBe(false)
+  })
+
+  test('markMessageAsReadByIdentity returns false when the expected message moved out', async () => {
+    await seedMailbox('worker', 'alpha', [message('other', false)])
+
+    await expect(
+      markMessageAsReadByIdentity('worker', 'alpha', message('missing', false)),
+    ).resolves.toBe(false)
+
+    expect((await readRawMailbox('worker', 'alpha'))[0]?.read).toBe(false)
+  })
+
+  test('markMessageAsReadByIdentity returns false on corrupt mailbox content', async () => {
+    const inboxPath = getInboxPath('worker', 'alpha')
+    await mkdir(dirname(inboxPath), { recursive: true })
+    await writeFile(inboxPath, '{not-json', 'utf-8')
+
+    await expect(
+      markMessageAsReadByIdentity('worker', 'alpha', message('missing', false)),
+    ).resolves.toBe(false)
+  })
+})
+
+describe('getLastPeerDmSummary', () => {
+  test('extracts the final peer direct-message summary from assistant tool use', () => {
+    const messages = [
+      { type: 'user', message: { content: 'wake up' } },
+      {
+        type: 'assistant',
+        message: {
+          content: [
+            {
+              type: 'tool_use',
+              name: 'SendMessage',
+              input: {
+                to: 'worker-1',
+                message: 'please check the UDS bounds',
+                summary: 'Checking UDS bounds',
+              },
+            },
+          ],
+        },
+      },
+    ] as unknown as Message[]
+
+    expect(getLastPeerDmSummary(messages)).toBe(
+      '[to worker-1] Checking UDS bounds',
+    )
+  })
+
+  test('stops peer direct-message summary search at the wake-up boundary', () => {
+    const messages = [
+      {
+        type: 'assistant',
+        message: {
+          content: [
+            {
+              type: 'tool_use',
+              name: 'SendMessage',
+              input: {
+                to: 'worker-1',
+                message: 'old message',
+              },
+            },
+          ],
+        },
+      },
+      { type: 'user', message: { content: 'new prompt' } },
+    ] as unknown as Message[]
+
+    expect(getLastPeerDmSummary(messages)).toBeUndefined()
+  })
+})
--- a/src/utils/tests/udsMessaging.test.ts
+++ b/src/utils/tests/udsMessaging.test.ts
@@ -0,0 +1,631 @@
+import { afterEach, beforeEach, describe, expect, test } from 'bun:test'
+import {
+  chmod,
+  mkdir,
+  mkdtemp,
+  readdir,
+  rm,
+  stat,
+  symlink,
+  unlink,
+  writeFile,
+} from 'node:fs/promises'
+import { createHash } from 'node:crypto'
+import { createConnection, createServer } from 'node:net'
+import { dirname, join } from 'node:path'
+import { tmpdir } from 'node:os'
+import {
+  drainInbox,
+  getDefaultUdsSocketPath,
+  MAX_UDS_INBOX_ENTRIES,
+  MAX_UDS_INBOX_BYTES,
+  MAX_UDS_FRAME_BYTES,
+  MAX_UDS_CLIENTS,
+  formatUdsAddress,
+  parseUdsTarget,
+  sendUdsMessage,
+  setOnEnqueue,
+  startUdsMessaging,
+  stopUdsMessaging,
+  UDS_AUTH_TIMEOUT_MS,
+} from '../udsMessaging.js'
+
+let previousConfigDir: string | undefined
+let tempConfigDir = ''
+
+function socketPath(label: string): string {
+  const suffix = `${process.pid}-${Date.now()}-${Math.random().toString(16).slice(2)}-${label}`
+  if (process.platform === 'win32') {
+    return `\\\\.\\pipe\\claude-code-test-${suffix}`
+  }
+  return join(tmpdir(), 'claude-code-test', `${suffix}.sock`)
+}
+
+function sleep(ms: number): Promise<void> {
+  return new Promise(resolve => setTimeout(resolve, ms))
+}
+
+async function waitForEnqueues(
+  expected: number,
+  sendMessages: () => Promise<void>,
+): Promise<void> {
+  let count = 0
+  let resolveDone: (() => void) | undefined
+  const done = new Promise<void>(resolve => {
+    resolveDone = resolve
+  })
+
+  setOnEnqueue(() => {
+    count++
+    if (count >= expected) resolveDone?.()
+  })
+
+  await sendMessages()
+  await Promise.race([
+    done,
+    sleep(5_000).then(() => {
+      throw new Error(`Timed out waiting for ${expected} UDS enqueues`)
+    }),
+  ])
+  setOnEnqueue(null)
+}
+
+beforeEach(async () => {
+  previousConfigDir = process.env.CLAUDE_CONFIG_DIR
+  tempConfigDir = await mkdtemp(join(tmpdir(), 'uds-messaging-home-'))
+  process.env.CLAUDE_CONFIG_DIR = tempConfigDir
+})
+
+afterEach(async () => {
+  setOnEnqueue(null)
+  drainInbox()
+  await stopUdsMessaging()
+  if (previousConfigDir === undefined) {
+    delete process.env.CLAUDE_CONFIG_DIR
+  } else {
+    process.env.CLAUDE_CONFIG_DIR = previousConfigDir
+  }
+  if (tempConfigDir) {
+    await rm(tempConfigDir, { recursive: true, force: true })
+    tempConfigDir = ''
+  }
+})
+
+async function closeServer(server: ReturnType<typeof createServer>): Promise<void> {
+  await new Promise<void>(resolve => {
+    server.close(() => resolve())
+  })
+}
+
+describe('UDS inbox retention', () => {
+  test('drainInbox returns each pending socket message once', async () => {
+    const path = socketPath('drain')
+    await startUdsMessaging(path, { isExplicit: true })
+    expect(process.env.CLAUDE_CODE_MESSAGING_TOKEN).toBeUndefined()
+
+    await waitForEnqueues(2, async () => {
+      await sendUdsMessage(path, { type: 'text', data: 'one' })
+      await sendUdsMessage(path, { type: 'text', data: 'two' })
+    })
+
+    const drained = drainInbox()
+    expect(drained.map(entry => entry.message.data)).toEqual(['one', 'two'])
+    expect(drained.every(entry => entry.status === 'processed')).toBe(true)
+    expect(drainInbox()).toEqual([])
+  })
+
+  test('inbox is capped when messages arrive faster than they are drained', async () => {
+    const path = socketPath('cap')
+    await startUdsMessaging(path, { isExplicit: true })
+
+    await waitForEnqueues(MAX_UDS_INBOX_ENTRIES, async () => {
+      for (let i = 0; i < MAX_UDS_INBOX_ENTRIES; i++) {
+        await sendUdsMessage(path, { type: 'text', data: String(i) })
+      }
+    })
+    await expect(
+      sendUdsMessage(path, { type: 'text', data: 'overflow' }),
+    ).rejects.toThrow('inbox full')
+
+    const drained = drainInbox()
+    expect(drained).toHaveLength(MAX_UDS_INBOX_ENTRIES)
+    expect(drained[0]?.message.data).toBe('0')
+    expect(drained.at(-1)?.message.data).toBe(String(MAX_UDS_INBOX_ENTRIES - 1))
+  })
+
+  test('inbox is capped by retained bytes before entry count', async () => {
+    const path = socketPath('byte-cap')
+    await startUdsMessaging(path, { isExplicit: true })
+
+    const payload = 'x'.repeat(32 * 1024)
+    let accepted = 0
+    for (;;) {
+      try {
+        await sendUdsMessage(path, { type: 'text', data: payload })
+        accepted++
+        if (accepted > MAX_UDS_INBOX_BYTES / payload.length + 20) {
+          throw new Error('byte cap was not enforced')
+        }
+      } catch (error) {
+        expect(error).toBeInstanceOf(Error)
+        expect((error as Error).message).toContain('inbox full')
+        break
+      }
+    }
+
+    const drained = drainInbox()
+    expect(drained.length).toBe(accepted)
+    expect(drained.length).toBeLessThan(MAX_UDS_INBOX_ENTRIES)
+  })
+
+  test('ping replies with pong without enqueueing inbox work', async () => {
+    const path = socketPath('ping')
+    await startUdsMessaging(path, { isExplicit: true })
+
+    await sendUdsMessage(path, { type: 'ping' })
+    expect(drainInbox()).toEqual([])
+  })
+
+  test('udsClient helpers authenticate through the capability file', async () => {
+    const path = socketPath('uds-client')
+    await startUdsMessaging(path, { isExplicit: true })
+    const { isPeerAlive, sendToUdsSocket } = await import('../udsClient.js')
+
+    expect(await isPeerAlive(path)).toBe(true)
+    await waitForEnqueues(1, async () => {
+      await sendToUdsSocket(path, 'hello from client')
+    })
+
+    const drained = drainInbox()
+    expect(drained).toHaveLength(1)
+    expect(drained[0]?.message.data).toBe('hello from client')
+    expect(drained[0]?.message.meta).toBeUndefined()
+  })
+
+  test('udsClient peer probe fails closed on oversized pong frames', async () => {
+    const path = socketPath('uds-client-oversized-pong')
+    if (process.platform !== 'win32') {
+      await mkdir(dirname(path), { recursive: true })
+    }
+    const receiver = createServer(socket => {
+      socket.on('data', () => {
+        socket.write('x'.repeat(MAX_UDS_FRAME_BYTES + 1))
+      })
+    })
+    await new Promise<void>((resolve, reject) => {
+      receiver.on('error', reject)
+      receiver.listen(path, () => resolve())
+    })
+
+    try {
+      const { isPeerAlive } = await import('../udsClient.js')
+      expect(await isPeerAlive(path, 3_000, 'test-token')).toBe(false)
+    } finally {
+      await closeServer(receiver)
+      if (process.platform !== 'win32') {
+        await unlink(path).catch(() => undefined)
+      }
+    }
+  })
+
+  test('udsClient send fails closed when no capability token exists', async () => {
+    const path = socketPath('uds-client-no-token')
+    const { sendToUdsSocket } = await import('../udsClient.js')
+
+    await expect(sendToUdsSocket(path, 'hello')).rejects.toThrow(
+      'No auth token found',
+    )
+  })
+
+  test('udsClient send reports connection failures without leaking token state', async () => {
+    const path = socketPath('uds-client-connect-error')
+    const capabilityDir = join(tempConfigDir, 'messaging-capabilities')
+    const capabilityName = `${createHash('sha256').update(path).digest('hex')}.json`
+    await mkdir(capabilityDir, { recursive: true, mode: 0o700 })
+    await writeFile(
+      join(capabilityDir, capabilityName),
+      JSON.stringify({ socketPath: path, authToken: 'test-token' }),
+      'utf-8',
+    )
+    const { sendToUdsSocket } = await import('../udsClient.js')
+
+    await expect(sendToUdsSocket(path, 'hello')).rejects.toThrow(
+      'Failed to connect to peer',
+    )
+  })
+
+  test('sendUdsMessage fails closed before connecting without an auth token', async () => {
+    await expect(
+      sendUdsMessage(socketPath('no-auth-token'), { type: 'text', data: 'x' }),
+    ).rejects.toThrow('without auth token')
+  })
+
+  test('drained entries never expose the UDS auth token', async () => {
+    const path = socketPath('strip-token')
+    await startUdsMessaging(path, { isExplicit: true })
+
+    await waitForEnqueues(1, async () => {
+      await sendUdsMessage(path, {
+        type: 'notification',
+        meta: { keep: 'visible' },
+      })
+    })
+
+    const drained = drainInbox()
+    expect(drained).toHaveLength(1)
+    expect(drained[0]?.message.meta).toEqual({ keep: 'visible' })
+    expect(drained[0]?.message.meta).not.toHaveProperty('authToken')
+  })
+
+  test('rejects unauthenticated socket messages', async () => {
+    const path = socketPath('auth')
+    await startUdsMessaging(path, { isExplicit: true })
+
+    const response = await new Promise<string>((resolve, reject) => {
+      let responseText = ''
+      const conn = createConnection(path, () => {
+        conn.write(`${JSON.stringify({ type: 'text', data: 'bad' })}\n`)
+      })
+      conn.setTimeout(5_000, () => {
+        conn.destroy()
+        reject(new Error('Timed out waiting for auth rejection'))
+      })
+      conn.on('data', chunk => {
+        const text = chunk.toString('utf-8')
+        if (text.includes('\n')) {
+          responseText = text
+        }
+      })
+      conn.on('close', () => resolve(responseText))
+      conn.on('error', reject)
+    })
+
+    expect(JSON.parse(response).type).toBe('error')
+    expect(drainInbox()).toEqual([])
+  })
+
+  test('disconnects malformed JSON clients without enqueueing inbox work', async () => {
+    const path = socketPath('malformed-client')
+    await startUdsMessaging(path, { isExplicit: true })
+
+    const response = await new Promise<string>((resolve, reject) => {
+      let responseText = ''
+      const conn = createConnection(path, () => {
+        conn.write('{not-json\n')
+      })
+      conn.setTimeout(5_000, () => {
+        conn.destroy()
+        reject(new Error('Timed out waiting for malformed frame close'))
+      })
+      conn.on('data', chunk => {
+        responseText += chunk.toString('utf-8')
+      })
+      conn.on('close', () => resolve(responseText))
+      conn.on('error', reject)
+    })
+
+    const parsed = JSON.parse(response)
+    expect(parsed.type).toBe('error')
+    expect(parsed.data).toBe('invalid frame')
+    expect(drainInbox()).toEqual([])
+  })
+
+  test('disconnects idle unauthenticated clients', async () => {
+    const path = socketPath('idle-client')
+    await startUdsMessaging(path, { isExplicit: true })
+
+    const response = await new Promise<string>((resolve, reject) => {
+      let responseText = ''
+      const conn = createConnection(path)
+      conn.setTimeout(UDS_AUTH_TIMEOUT_MS + 2_000, () => {
+        conn.destroy()
+        reject(new Error('Timed out waiting for auth timeout close'))
+      })
+      conn.on('data', chunk => {
+        responseText += chunk.toString('utf-8')
+      })
+      conn.on('close', () => resolve(responseText))
+      conn.on('error', reject)
+    })
+
+    const parsed = JSON.parse(response)
+    expect(parsed.type).toBe('error')
+    expect(parsed.data).toBe('authentication timeout')
+    expect(drainInbox()).toEqual([])
+  })
+
+  test('destroys oversized frames before enqueueing inbox work', async () => {
+    const path = socketPath('oversized')
+    await startUdsMessaging(path, { isExplicit: true })
+
+    await new Promise<void>((resolve, reject) => {
+      const conn = createConnection(path, () => {
+        conn.write('x'.repeat(MAX_UDS_FRAME_BYTES + 1))
+      })
+      conn.setTimeout(5_000, () => {
+        conn.destroy()
+        reject(new Error('Timed out waiting for oversized frame close'))
+      })
+      conn.on('close', () => resolve())
+      conn.on('error', () => resolve())
+    })
+
+    expect(drainInbox()).toEqual([])
+  })
+
+  test('default socket path is regenerated after stop', async () => {
+    const firstPath = getDefaultUdsSocketPath()
+    await startUdsMessaging(firstPath)
+    await stopUdsMessaging()
+
+    expect(getDefaultUdsSocketPath()).not.toBe(firstPath)
+  })
+
+  test('rejects oversized receiver responses before retaining them', async () => {
+    const path = socketPath('oversized-response')
+    if (process.platform !== 'win32') {
+      await mkdir(dirname(path), { recursive: true })
+    }
+    const receiver = createServer(socket => {
+      socket.on('data', () => {
+        socket.write('x'.repeat(MAX_UDS_FRAME_BYTES + 1))
+      })
+    })
+    await new Promise<void>((resolve, reject) => {
+      receiver.on('error', reject)
+      receiver.listen(path, () => resolve())
+    })
+
+    try {
+      await expect(
+        sendUdsMessage(
+          path,
+          { type: 'text', data: 'hello' },
+          { authToken: 'test-token' },
+        ),
+      ).rejects.toThrow('UDS response frame exceeded size limit')
+    } finally {
+      await closeServer(receiver)
+      if (process.platform !== 'win32') {
+        await unlink(path).catch(() => undefined)
+      }
+    }
+  })
+
+  test('rejects closed receiver responses without waiting for timeout', async () => {
+    const path = socketPath('closed-response')
+    if (process.platform !== 'win32') {
+      await mkdir(dirname(path), { recursive: true })
+    }
+    const receiver = createServer(socket => {
+      socket.end()
+    })
+    await new Promise<void>((resolve, reject) => {
+      receiver.on('error', reject)
+      receiver.listen(path, () => resolve())
+    })
+
+    try {
+      await expect(
+        sendUdsMessage(
+          path,
+          { type: 'text', data: 'hello' },
+          { authToken: 'test-token' },
+        ),
+      ).rejects.toThrow('before response')
+    } finally {
+      await closeServer(receiver)
+      if (process.platform !== 'win32') {
+        await unlink(path).catch(() => undefined)
+      }
+    }
+  })
+
+  test('rejects malformed receiver responses without waiting for timeout', async () => {
+    const path = socketPath('malformed-response')
+    if (process.platform !== 'win32') {
+      await mkdir(dirname(path), { recursive: true })
+    }
+    const receiver = createServer(socket => {
+      socket.on('data', () => {
+        socket.write('{not-json\n')
+      })
+    })
+    await new Promise<void>((resolve, reject) => {
+      receiver.on('error', reject)
+      receiver.listen(path, () => resolve())
+    })
+
+    try {
+      await expect(
+        sendUdsMessage(
+          path,
+          { type: 'text', data: 'hello' },
+          { authToken: 'test-token' },
+        ),
+      ).rejects.toThrow('Invalid UDS response frame')
+    } finally {
+      await closeServer(receiver)
+      if (process.platform !== 'win32') {
+        await unlink(path).catch(() => undefined)
+      }
+    }
+  })
+
+  test('rejects inline auth token UDS targets instead of parsing them', async () => {
+    const path = socketPath('inline-token')
+
+    expect(formatUdsAddress(path)).toBe(`uds:${path}`)
+
+    const targetWithToken = `${path}#token=secret`
+    expect(() => parseUdsTarget(targetWithToken)).toThrow('inline auth token')
+    try {
+      parseUdsTarget(targetWithToken)
+    } catch (error) {
+      expect((error as Error).message).not.toContain('secret')
+    }
+
+    const { sendToUdsSocket } = await import('../udsClient.js')
+    await expect(sendToUdsSocket(targetWithToken, 'hello')).rejects.toThrow(
+      'inline auth token',
+    )
+  })
+
+  test('fails closed and cleans temp files when capability target is occupied', async () => {
+    const path = socketPath('capability-target-dir')
+    const capabilityDir = join(tempConfigDir, 'messaging-capabilities')
+    const capabilityName = `${createHash('sha256').update(path).digest('hex')}.json`
+    await mkdir(join(capabilityDir, capabilityName), {
+      recursive: true,
+      mode: 0o700,
+    })
+
+    await expect(
+      startUdsMessaging(path, { isExplicit: true }),
+    ).rejects.toThrow()
+
+    expect(process.env.CLAUDE_CODE_MESSAGING_SOCKET).toBeUndefined()
+    expect(await readdir(capabilityDir)).toEqual([capabilityName])
+  })
+
+  if (process.platform !== 'win32') {
+    test('creates the listening socket with owner-only permissions', async () => {
+      const path = socketPath('socket-mode')
+      await startUdsMessaging(path, { isExplicit: true })
+
+      const mode = (await stat(path)).mode & 0o777
+      expect(mode).toBe(0o600)
+    })
+
+    test('fails closed when the capability directory is not private', async () => {
+      const previousConfigDir = process.env.CLAUDE_CONFIG_DIR
+      const tempHome = join(
+        tmpdir(),
+        `uds-capability-${process.pid}-${Date.now()}-${Math.random().toString(16).slice(2)}`,
+      )
+      process.env.CLAUDE_CONFIG_DIR = tempHome
+      const capabilityDir = join(tempHome, 'messaging-capabilities')
+      await mkdir(capabilityDir, { recursive: true, mode: 0o755 })
+      await chmod(capabilityDir, 0o755)
+
+      try {
+        const path = socketPath('broad-capdir')
+        await expect(
+          startUdsMessaging(path, { isExplicit: true }),
+        ).rejects.toThrow('permissions are too broad')
+        await expect(stat(path)).rejects.toThrow()
+      } finally {
+        if (previousConfigDir === undefined) {
+          delete process.env.CLAUDE_CONFIG_DIR
+        } else {
+          process.env.CLAUDE_CONFIG_DIR = previousConfigDir
+        }
+        await rm(tempHome, { recursive: true, force: true })
+      }
+    })
+
+    test('fails closed when the capability directory is a symlink', async () => {
+      const previousConfigDir = process.env.CLAUDE_CONFIG_DIR
+      const tempHome = join(
+        tmpdir(),
+        `uds-capability-link-${process.pid}-${Date.now()}-${Math.random().toString(16).slice(2)}`,
+      )
+      const target = join(tempHome, 'target')
+      process.env.CLAUDE_CONFIG_DIR = tempHome
+      await mkdir(target, { recursive: true, mode: 0o700 })
+      await symlink(target, join(tempHome, 'messaging-capabilities'), 'dir')
+
+      try {
+        await expect(
+          startUdsMessaging(socketPath('symlink-capdir'), { isExplicit: true }),
+        ).rejects.toThrow('not a private directory')
+      } finally {
+        if (previousConfigDir === undefined) {
+          delete process.env.CLAUDE_CONFIG_DIR
+        } else {
+          process.env.CLAUDE_CONFIG_DIR = previousConfigDir
+        }
+        await rm(tempHome, { recursive: true, force: true })
+      }
+    })
+
+    test('fails closed when an explicit socket parent is not private', async () => {
+      const parent = join(
+        tmpdir(),
+        `uds-socket-parent-${process.pid}-${Date.now()}-${Math.random().toString(16).slice(2)}`,
+      )
+      await mkdir(parent, { recursive: true, mode: 0o755 })
+      await chmod(parent, 0o755)
+
+      try {
+        await expect(
+          startUdsMessaging(join(parent, 'messaging.sock'), {
+            isExplicit: true,
+          }),
+        ).rejects.toThrow('socket parent permissions are too broad')
+      } finally {
+        await rm(parent, { recursive: true, force: true })
+      }
+    })
+
+    test('fails closed when an explicit socket parent is a file', async () => {
+      const parentFile = join(
+        tmpdir(),
+        `uds-socket-parent-file-${process.pid}-${Date.now()}-${Math.random().toString(16).slice(2)}`,
+      )
+      await writeFile(parentFile, 'not a directory', 'utf-8')
+
+      try {
+        await expect(
+          startUdsMessaging(join(parentFile, 'messaging.sock'), {
+            isExplicit: true,
+          }),
+        ).rejects.toThrow('socket parent is not a directory')
+      } finally {
+        await rm(parentFile, { force: true })
+      }
+    })
+
+    test('stop tolerates an already removed socket path', async () => {
+      const path = socketPath('already-removed')
+      await startUdsMessaging(path, { isExplicit: true })
+      await unlink(path)
+
+      await stopUdsMessaging()
+
+      expect(process.env.CLAUDE_CODE_MESSAGING_SOCKET).toBeUndefined()
+    })
+
+    test('rejects clients over the configured connection cap', async () => {
+      const path = socketPath('client-cap')
+      await startUdsMessaging(path, { isExplicit: true })
+      const sockets: ReturnType<typeof createConnection>[] = []
+
+      try {
+        for (let i = 0; i < MAX_UDS_CLIENTS; i++) {
+          const socket = await new Promise<ReturnType<typeof createConnection>>(
+            (resolve, reject) => {
+              const conn = createConnection(path, () => resolve(conn))
+              conn.on('error', reject)
+            },
+          )
+          sockets.push(socket)
+        }
+
+        await new Promise<void>((resolve, reject) => {
+          const extra = createConnection(path)
+          extra.on('close', () => resolve())
+          extra.on('error', reject)
+          extra.setTimeout(5_000, () => {
+            extra.destroy()
+            reject(new Error('Timed out waiting for client cap close'))
+          })
+        })
+      } finally {
+        for (const socket of sockets) {
+          socket.destroy()
+        }
+      }
+    })
+  }
+})
--- a/src/utils/tests/udsResponseReader.test.ts
+++ b/src/utils/tests/udsResponseReader.test.ts
@@ -0,0 +1,218 @@
+import { describe, expect, test } from 'bun:test'
+import { EventEmitter } from 'node:events'
+import type { Socket } from 'node:net'
+import { attachUdsResponseReader } from '../udsResponseReader.js'
+
+class FakeSocket extends EventEmitter {
+  destroyed = false
+  ended = false
+
+  destroy(): this {
+    this.destroyed = true
+    this.emit('close', true)
+    return this
+  }
+
+  end(): this {
+    this.ended = true
+    this.emit('close', false)
+    return this
+  }
+
+  emitData(chunk: Buffer): void {
+    this.emit('data', chunk)
+  }
+}
+
+function asSocket(socket: FakeSocket): Socket {
+  return socket as unknown as Socket
+}
+
+describe('attachUdsResponseReader', () => {
+  test('tracks byte limits across split multibyte response chunks', () => {
+    const socket = new FakeSocket()
+    let settled = false
+    let settledError: Error | undefined
+
+    attachUdsResponseReader(asSocket(socket), {
+      maxFrameBytes: 128,
+      onSettled: error => {
+        settled = true
+        settledError = error
+      },
+    })
+
+    const multibyte = String.fromCodePoint(0x20ac)
+    const frame = Buffer.from(
+      JSON.stringify({ type: 'response', data: `ok ${multibyte}` }) + '\n',
+      'utf8',
+    )
+    const multibyteStart = frame.indexOf(Buffer.from(multibyte, 'utf8')[0])
+
+    socket.emitData(frame.subarray(0, multibyteStart + 1))
+    expect(settled).toBe(false)
+
+    socket.emitData(frame.subarray(multibyteStart + 1))
+    expect(settled).toBe(true)
+    expect(settledError).toBeUndefined()
+    expect(socket.ended).toBe(true)
+  })
+
+  test('rejects malformed response frames immediately', () => {
+    const socket = new FakeSocket()
+    let settledError: Error | undefined
+
+    attachUdsResponseReader(asSocket(socket), {
+      maxFrameBytes: 128,
+      onSettled: error => {
+        settledError = error
+      },
+    })
+
+    socket.emitData(Buffer.from('{bad-json}\n'))
+
+    expect(settledError?.message).toBe('Invalid UDS response frame')
+    expect(socket.destroyed).toBe(true)
+  })
+
+  test('skips blank frames before a valid response', () => {
+    const socket = new FakeSocket()
+    let settled = false
+    let settledError: Error | undefined
+
+    attachUdsResponseReader(asSocket(socket), {
+      maxFrameBytes: 128,
+      onSettled: error => {
+        settled = true
+        settledError = error
+      },
+    })
+
+    socket.emitData(Buffer.from('\n \n'))
+    expect(settled).toBe(false)
+
+    socket.emitData(Buffer.from(`${JSON.stringify({ type: 'response' })}\n`))
+    expect(settled).toBe(true)
+    expect(settledError).toBeUndefined()
+    expect(socket.ended).toBe(true)
+  })
+
+  test('continues scanning when blank and valid frames share one chunk', () => {
+    const socket = new FakeSocket()
+    let settled = false
+    let settledError: Error | undefined
+
+    attachUdsResponseReader(asSocket(socket), {
+      maxFrameBytes: 128,
+      onSettled: error => {
+        settled = true
+        settledError = error
+      },
+    })
+
+    socket.emitData(
+      Buffer.from(`\n${JSON.stringify({ type: 'response' })}\n`),
+    )
+
+    expect(settled).toBe(true)
+    expect(settledError).toBeUndefined()
+    expect(socket.ended).toBe(true)
+  })
+
+  test('rejects receiver error frames', () => {
+    const socket = new FakeSocket()
+    let settledError: Error | undefined
+
+    attachUdsResponseReader(asSocket(socket), {
+      maxFrameBytes: 128,
+      onSettled: error => {
+        settledError = error
+      },
+    })
+
+    socket.emitData(
+      Buffer.from(`${JSON.stringify({ type: 'error', data: 'denied' })}\n`),
+    )
+
+    expect(settledError?.message).toBe('denied')
+    expect(socket.destroyed).toBe(true)
+  })
+
+  test('ignores unrelated receiver frames until a terminal response arrives', () => {
+    const socket = new FakeSocket()
+    let settled = false
+    let settledError: Error | undefined
+
+    attachUdsResponseReader(asSocket(socket), {
+      maxFrameBytes: 128,
+      onSettled: error => {
+        settled = true
+        settledError = error
+      },
+    })
+
+    socket.emitData(
+      Buffer.from(
+        `${JSON.stringify({ type: 'notification', data: 'queued' })}\n`,
+      ),
+    )
+    expect(settled).toBe(false)
+
+    socket.emitData(Buffer.from(`${JSON.stringify({ type: 'response' })}\n`))
+    expect(settled).toBe(true)
+    expect(settledError).toBeUndefined()
+  })
+
+  test('uses custom socket error formatting', () => {
+    const socket = new FakeSocket()
+    let settledError: Error | undefined
+
+    attachUdsResponseReader(asSocket(socket), {
+      maxFrameBytes: 128,
+      onSettled: error => {
+        settledError = error
+      },
+      formatSocketError: error =>
+        new Error(`wrapped:${(error as Error).message}`),
+    })
+
+    socket.emit('error', new Error('connect failed'))
+
+    expect(settledError?.message).toBe('wrapped:connect failed')
+    expect(socket.destroyed).toBe(true)
+  })
+
+  test('rejects socket end before response', () => {
+    const socket = new FakeSocket()
+    let settledError: Error | undefined
+
+    attachUdsResponseReader(asSocket(socket), {
+      maxFrameBytes: 128,
+      onSettled: error => {
+        settledError = error
+      },
+    })
+
+    socket.emit('end')
+
+    expect(settledError?.message).toBe('UDS socket ended before response')
+    expect(socket.destroyed).toBe(true)
+  })
+
+  test('rejects clean socket close before response', () => {
+    const socket = new FakeSocket()
+    let settledError: Error | undefined
+
+    attachUdsResponseReader(asSocket(socket), {
+      maxFrameBytes: 128,
+      onSettled: error => {
+        settledError = error
+      },
+    })
+
+    socket.emit('close', false)
+
+    expect(settledError?.message).toBe('UDS socket closed before response')
+    expect(socket.destroyed).toBe(true)
+  })
+})
--- a/src/utils/auth.ts
+++ b/src/utils/auth.ts
@@ -117,12 +117,9 @@ export function isAnthropicAuthEnabled(): boolean {
    isEnvTruthy(process.env.CLAUDE_CODE_USE_BEDROCK) ||
    isEnvTruthy(process.env.CLAUDE_CODE_USE_VERTEX) ||
    isEnvTruthy(process.env.CLAUDE_CODE_USE_FOUNDRY) ||
-    isEnvTruthy(process.env.CLAUDE_CODE_USE_CODEX) ||
    (settings as any).modelType === 'openai' ||
-    (settings as any).modelType === 'codex' ||
    (settings as any).modelType === 'gemini' ||
    !!process.env.OPENAI_BASE_URL ||
-    !!process.env.CODEX_BASE_URL ||
    !!process.env.GEMINI_BASE_URL
  const apiKeyHelper = settings.apiKeyHelper
  const hasExternalAuthToken =
--- a/src/utils/managedEnvConstants.ts
+++ b/src/utils/managedEnvConstants.ts
@@ -22,7 +22,6 @@ const PROVIDER_MANAGED_ENV_VARS = new Set([
  'CLAUDE_CODE_USE_BEDROCK',
  'CLAUDE_CODE_USE_VERTEX',
  'CLAUDE_CODE_USE_FOUNDRY',
-  'CLAUDE_CODE_USE_CODEX',
  'CLAUDE_CODE_USE_GEMINI',
  // Endpoint config (base URLs, project/resource identifiers)
  'ANTHROPIC_BASE_URL',
@@ -31,7 +30,6 @@ const PROVIDER_MANAGED_ENV_VARS = new Set([
  'ANTHROPIC_FOUNDRY_BASE_URL',
  'ANTHROPIC_FOUNDRY_RESOURCE',
  'ANTHROPIC_VERTEX_PROJECT_ID',
-  'CODEX_BASE_URL',
  'GEMINI_BASE_URL',
  // Region routing (per-model VERTEX_REGION_CLAUDE_* handled by prefix below)
  'CLOUD_ML_REGION',
@@ -44,11 +42,6 @@ const PROVIDER_MANAGED_ENV_VARS = new Set([
  'CLAUDE_CODE_SKIP_BEDROCK_AUTH',
  'CLAUDE_CODE_SKIP_VERTEX_AUTH',
  'CLAUDE_CODE_SKIP_FOUNDRY_AUTH',
-  'CODEX_API_KEY',
-  'CODEX_LOGIN_METHOD',
-  'CODEX_IMGBB_API_KEY',
-  'CODEX_IMAGE_UPLOAD_TIMEOUT_MS',
-  'CODEX_IMAGE_URL_TIMEOUT_MS',
  'GEMINI_API_KEY',
  // Model defaults — often set to provider-specific ID formats
  'ANTHROPIC_MODEL',
@@ -81,23 +74,7 @@ const PROVIDER_MANAGED_ENV_VARS = new Set([
  'OPENAI_DEFAULT_SONNET_MODEL_NAME',
  'OPENAI_DEFAULT_SONNET_MODEL_SUPPORTED_CAPABILITIES',
  'OPENAI_SMALL_FAST_MODEL',
-  'CODEX_MODEL',
-  'CODEX_DEFAULT_HAIKU_MODEL',
-  'CODEX_DEFAULT_HAIKU_MODEL_DESCRIPTION',
-  'CODEX_DEFAULT_HAIKU_MODEL_NAME',
-  'CODEX_DEFAULT_HAIKU_MODEL_SUPPORTED_CAPABILITIES',
-  'CODEX_DEFAULT_OPUS_MODEL',
-  'CODEX_DEFAULT_OPUS_MODEL_DESCRIPTION',
-  'CODEX_DEFAULT_OPUS_MODEL_NAME',
-  'CODEX_DEFAULT_OPUS_MODEL_SUPPORTED_CAPABILITIES',
-  'CODEX_DEFAULT_SONNET_MODEL',
-  'CODEX_DEFAULT_SONNET_MODEL_DESCRIPTION',
-  'CODEX_DEFAULT_SONNET_MODEL_NAME',
-  'CODEX_DEFAULT_SONNET_MODEL_SUPPORTED_CAPABILITIES',
-  'CODEX_SMALL_FAST_MODEL',
  'ANTHROPIC_SMALL_FAST_MODEL',
-  'CODEX_IMAGE_UPLOAD_TIMEOUT_MS',
-  'CODEX_IMAGE_URL_TIMEOUT_MS',
  'ANTHROPIC_SMALL_FAST_MODEL_AWS_REGION',
  'CLAUDE_CODE_SUBAGENT_MODEL',
  'GEMINI_MODEL',
@@ -197,20 +174,6 @@ export const SAFE_ENV_VARS = new Set([
  'OPENAI_DEFAULT_SONNET_MODEL_DESCRIPTION',
  'OPENAI_DEFAULT_SONNET_MODEL_NAME',
  'OPENAI_DEFAULT_SONNET_MODEL_SUPPORTED_CAPABILITIES',
-  'CODEX_MODEL',
-  'CODEX_SMALL_FAST_MODEL',
-  'CODEX_DEFAULT_HAIKU_MODEL',
-  'CODEX_DEFAULT_HAIKU_MODEL_DESCRIPTION',
-  'CODEX_DEFAULT_HAIKU_MODEL_NAME',
-  'CODEX_DEFAULT_HAIKU_MODEL_SUPPORTED_CAPABILITIES',
-  'CODEX_DEFAULT_OPUS_MODEL',
-  'CODEX_DEFAULT_OPUS_MODEL_DESCRIPTION',
-  'CODEX_DEFAULT_OPUS_MODEL_NAME',
-  'CODEX_DEFAULT_OPUS_MODEL_SUPPORTED_CAPABILITIES',
-  'CODEX_DEFAULT_SONNET_MODEL',
-  'CODEX_DEFAULT_SONNET_MODEL_DESCRIPTION',
-  'CODEX_DEFAULT_SONNET_MODEL_NAME',
-  'CODEX_DEFAULT_SONNET_MODEL_SUPPORTED_CAPABILITIES',
  'ANTHROPIC_FOUNDRY_API_KEY',
  'ANTHROPIC_MODEL',
  'ANTHROPIC_SMALL_FAST_MODEL_AWS_REGION',
@@ -236,7 +199,6 @@ export const SAFE_ENV_VARS = new Set([
  'CLAUDE_CODE_SUBAGENT_MODEL',
  'CLAUDE_CODE_USE_BEDROCK',
  'CLAUDE_CODE_USE_FOUNDRY',
-  'CLAUDE_CODE_USE_CODEX',
  'CLAUDE_CODE_USE_GEMINI',
  'CLAUDE_CODE_USE_VERTEX',
  'GEMINI_MODEL',
--- a/src/utils/model/tests/providers.test.ts
+++ b/src/utils/model/tests/providers.test.ts
@@ -1,7 +1,7 @@
 import { describe, expect, test, beforeEach, afterEach } from "bun:test";
 import { mock } from "bun:test";

-let mockedModelType: "gemini" | "codex" | undefined;
+let mockedModelType: "gemini" | undefined;

 mock.module("../../settings/settings.js", () => ({
  getInitialSettings: () =>
@@ -18,7 +18,6 @@ describe("getAPIProvider", () => {
    "CLAUDE_CODE_USE_VERTEX",
    "CLAUDE_CODE_USE_FOUNDRY",
    "CLAUDE_CODE_USE_OPENAI",
-    "CLAUDE_CODE_USE_CODEX",
  ] as const;
  const savedEnv: Record<string, string | undefined> = {};

@@ -53,11 +52,6 @@ describe("getAPIProvider", () => {
    expect(getAPIProvider()).toBe("gemini");
  });

-  test('returns "codex" when modelType is codex', () => {
-    mockedModelType = "codex";
-    expect(getAPIProvider()).toBe("codex");
-  });
-
  test("modelType takes precedence over environment variables", () => {
    mockedModelType = "gemini";
    process.env.CLAUDE_CODE_USE_BEDROCK = "1";
@@ -69,11 +63,6 @@ describe("getAPIProvider", () => {
    expect(getAPIProvider()).toBe("gemini");
  });

-  test('returns "codex" when CLAUDE_CODE_USE_CODEX is set', () => {
-    process.env.CLAUDE_CODE_USE_CODEX = "1";
-    expect(getAPIProvider()).toBe("codex");
-  });
-
  test('returns "bedrock" when CLAUDE_CODE_USE_BEDROCK is set', () => {
    process.env.CLAUDE_CODE_USE_BEDROCK = "1";
    expect(getAPIProvider()).toBe("bedrock");
--- a/src/utils/model/configs.ts
+++ b/src/utils/model/configs.ts
@@ -12,7 +12,6 @@ export const CLAUDE_3_7_SONNET_CONFIG = {
  vertex: 'claude-3-7-sonnet@20250219',
  foundry: 'claude-3-7-sonnet',
  openai: 'claude-3-7-sonnet-20250219',
-  'codex': 'claude-3-7-sonnet-20250219',
  gemini: 'claude-3-7-sonnet-20250219',
  grok: 'claude-3-7-sonnet-20250219',
 } as const satisfies ModelConfig
@@ -23,7 +22,6 @@ export const CLAUDE_3_5_V2_SONNET_CONFIG = {
  vertex: 'claude-3-5-sonnet-v2@20241022',
  foundry: 'claude-3-5-sonnet',
  openai: 'claude-3-5-sonnet-20241022',
-  'codex': 'claude-3-5-sonnet-20241022',
  gemini: 'claude-3-5-sonnet-20241022',
  grok: 'claude-3-5-sonnet-20241022',
 } as const satisfies ModelConfig
@@ -34,7 +32,6 @@ export const CLAUDE_3_5_HAIKU_CONFIG = {
  vertex: 'claude-3-5-haiku@20241022',
  foundry: 'claude-3-5-haiku',
  openai: 'claude-3-5-haiku-20241022',
-  'codex': 'claude-3-5-haiku-20241022',
  gemini: 'claude-3-5-haiku-20241022',
  grok: 'claude-3-5-haiku-20241022',
 } as const satisfies ModelConfig
@@ -45,7 +42,6 @@ export const CLAUDE_HAIKU_4_5_CONFIG = {
  vertex: 'claude-haiku-4-5@20251001',
  foundry: 'claude-haiku-4-5',
  openai: 'claude-haiku-4-5-20251001',
-  'codex': 'claude-haiku-4-5-20251001',
  gemini: 'claude-haiku-4-5-20251001',
  grok: 'claude-haiku-4-5-20251001',
 } as const satisfies ModelConfig
@@ -56,7 +52,6 @@ export const CLAUDE_SONNET_4_CONFIG = {
  vertex: 'claude-sonnet-4@20250514',
  foundry: 'claude-sonnet-4',
  openai: 'claude-sonnet-4-20250514',
-  'codex': 'claude-sonnet-4-20250514',
  gemini: 'claude-sonnet-4-20250514',
  grok: 'claude-sonnet-4-20250514',
 } as const satisfies ModelConfig
@@ -67,7 +62,6 @@ export const CLAUDE_SONNET_4_5_CONFIG = {
  vertex: 'claude-sonnet-4-5@20250929',
  foundry: 'claude-sonnet-4-5',
  openai: 'claude-sonnet-4-5-20250929',
-  'codex': 'claude-sonnet-4-5-20250929',
  gemini: 'claude-sonnet-4-5-20250929',
  grok: 'claude-sonnet-4-5-20250929',
 } as const satisfies ModelConfig
@@ -78,7 +72,6 @@ export const CLAUDE_OPUS_4_CONFIG = {
  vertex: 'claude-opus-4@20250514',
  foundry: 'claude-opus-4',
  openai: 'claude-opus-4-20250514',
-  'codex': 'claude-opus-4-20250514',
  gemini: 'claude-opus-4-20250514',
  grok: 'claude-opus-4-20250514',
 } as const satisfies ModelConfig
@@ -89,7 +82,6 @@ export const CLAUDE_OPUS_4_1_CONFIG = {
  vertex: 'claude-opus-4-1@20250805',
  foundry: 'claude-opus-4-1',
  openai: 'claude-opus-4-1-20250805',
-  'codex': 'claude-opus-4-1-20250805',
  gemini: 'claude-opus-4-1-20250805',
  grok: 'claude-opus-4-1-20250805',
 } as const satisfies ModelConfig
@@ -100,7 +92,6 @@ export const CLAUDE_OPUS_4_5_CONFIG = {
  vertex: 'claude-opus-4-5@20251101',
  foundry: 'claude-opus-4-5',
  openai: 'claude-opus-4-5-20251101',
-  'codex': 'claude-opus-4-5-20251101',
  gemini: 'claude-opus-4-5-20251101',
  grok: 'claude-opus-4-5-20251101',
 } as const satisfies ModelConfig
@@ -111,7 +102,6 @@ export const CLAUDE_OPUS_4_6_CONFIG = {
  vertex: 'claude-opus-4-6',
  foundry: 'claude-opus-4-6',
  openai: 'claude-opus-4-6',
-  'codex': 'claude-opus-4-6',
  gemini: 'claude-opus-4-6',
  grok: 'claude-opus-4-6',
 } as const satisfies ModelConfig
@@ -122,7 +112,6 @@ export const CLAUDE_OPUS_4_7_CONFIG = {
  vertex: 'claude-opus-4-7',
  foundry: 'claude-opus-4-7',
  openai: 'claude-opus-4-7',
-  'codex': 'claude-opus-4-7',
  gemini: 'claude-opus-4-7',
  grok: 'claude-opus-4-7',
 } as const satisfies ModelConfig
@@ -133,7 +122,6 @@ export const CLAUDE_SONNET_4_6_CONFIG = {
  vertex: 'claude-sonnet-4-6',
  foundry: 'claude-sonnet-4-6',
  openai: 'claude-sonnet-4-6',
-  'codex': 'claude-sonnet-4-6',
  gemini: 'claude-sonnet-4-6',
  grok: 'claude-sonnet-4-6',
 } as const satisfies ModelConfig
--- a/src/utils/model/providers.ts
+++ b/src/utils/model/providers.ts
@@ -8,14 +8,12 @@ export type APIProvider =
  | 'vertex'
  | 'foundry'
  | 'openai'
-  | 'codex'
  | 'gemini'
  | 'grok'

 export function getAPIProvider(): APIProvider {
  const modelType = getInitialSettings().modelType
  if (modelType === 'openai') return 'openai'
-  if (modelType === 'codex') return 'codex'
  if (modelType === 'gemini') return 'gemini'
  if (modelType === 'grok') return 'grok'

@@ -24,7 +22,6 @@ export function getAPIProvider(): APIProvider {
  if (isEnvTruthy(process.env.CLAUDE_CODE_USE_FOUNDRY)) return 'foundry'

  if (isEnvTruthy(process.env.CLAUDE_CODE_USE_OPENAI)) return 'openai'
-  if (isEnvTruthy(process.env.CLAUDE_CODE_USE_CODEX)) return 'codex'
  if (isEnvTruthy(process.env.CLAUDE_CODE_USE_GEMINI)) return 'gemini'
  if (isEnvTruthy(process.env.CLAUDE_CODE_USE_GROK)) return 'grok'

--- a/src/utils/ndjsonFramer.ts
+++ b/src/utils/ndjsonFramer.ts
@@ -7,9 +7,18 @@
 */
 import type { Socket } from 'net'

+export type NdjsonFramerOptions = {
+  maxFrameBytes?: number
+  onFrameError?: (error: Error) => void
+  destroyOnFrameError?: boolean
+  onInvalidFrame?: (error: Error) => void
+  destroyOnInvalidFrame?: boolean
+}
+
 /**
 * Attach an NDJSON framer to a socket. Calls `onMessage` for each
- * complete JSON line received. Malformed lines are silently skipped.
+ * complete JSON line received. Malformed lines are skipped by default;
+ * callers may opt into error callbacks or socket destruction.
 *
 * @param parse - Optional custom JSON parser (defaults to JSON.parse).
 *                Useful when the caller uses a wrapped parser like jsonParse
@@ -19,21 +28,73 @@ export function attachNdjsonFramer<T = unknown>(
  socket: Socket,
  onMessage: (msg: T) => void,
  parse: (text: string) => T = text => JSON.parse(text) as T,
+  options: NdjsonFramerOptions = {},
 ): void {
  let buffer = ''
+  let bufferBytes = 0
+  const maxFrameBytes = options.maxFrameBytes ?? Number.POSITIVE_INFINITY
+
+  const rejectOversizedFrame = (bytes: number): void => {
+    const error = new Error(
+      `NDJSON frame exceeded ${maxFrameBytes} bytes (${bytes})`,
+    )
+    options.onFrameError?.(error)
+    if (options.destroyOnFrameError ?? true) {
+      socket.destroy(error)
+    }
+  }
+
+  const rejectInvalidFrame = (error: unknown): void => {
+    const frameError =
+      error instanceof Error ? error : new Error('Invalid NDJSON frame')
+    options.onInvalidFrame?.(frameError)
+    if (options.destroyOnInvalidFrame ?? false) {
+      socket.destroy(frameError)
+    }
+  }
+
+  const emitLine = (line: string): void => {
+    if (!line.trim()) return
+    try {
+      onMessage(parse(line))
+    } catch (error) {
+      rejectInvalidFrame(error)
+    }
+  }

  socket.on('data', (chunk: Buffer) => {
-    buffer += chunk.toString()
-    const lines = buffer.split('\n')
-    buffer = lines.pop() ?? ''
+    let start = 0
+    for (let index = 0; index < chunk.length; index++) {
+      if (chunk[index] !== 0x0a) continue

-    for (const line of lines) {
-      if (!line.trim()) continue
-      try {
-        onMessage(parse(line))
-      } catch {
-        // Malformed JSON — skip
+      const segmentBytes = index - start
+      if (
+        Number.isFinite(maxFrameBytes) &&
+        bufferBytes + segmentBytes > maxFrameBytes
+      ) {
+        rejectOversizedFrame(bufferBytes + segmentBytes)
+        return
      }
+
+      buffer += chunk.subarray(start, index).toString('utf8')
+      emitLine(buffer)
+      buffer = ''
+      bufferBytes = 0
+      start = index + 1
+    }
+
+    const tailBytes = chunk.length - start
+    if (
+      Number.isFinite(maxFrameBytes) &&
+      bufferBytes + tailBytes > maxFrameBytes
+    ) {
+      rejectOversizedFrame(bufferBytes + tailBytes)
+      return
+    }
+
+    if (tailBytes > 0) {
+      buffer += chunk.subarray(start).toString('utf8')
+      bufferBytes += tailBytes
    }
  })
 }
--- a/src/utils/settings/tests/config.test.ts
+++ b/src/utils/settings/tests/config.test.ts
@@ -481,10 +481,3 @@ describe("gemini settings", () => {
    expect(result.success).toBe(true);
  });
 });
-
-describe("codex settings", () => {
-  test("accepts codex modelType", () => {
-    const result = SettingsSchema().safeParse({ modelType: "codex" });
-    expect(result.success).toBe(true);
-  });
-});
--- a/src/utils/settings/types.ts
+++ b/src/utils/settings/types.ts
@@ -369,11 +369,11 @@ export const SettingsSchema = lazySchema(() =>
        .optional()
        .describe('Tool usage permissions configuration'),
      modelType: z
-        .enum(['anthropic', 'openai', 'codex', 'gemini', 'grok'])
+        .enum(['anthropic', 'openai', 'gemini', 'grok'])
        .optional()
        .describe(
-          'API provider type. "anthropic" uses the Anthropic API (default), "openai" uses the OpenAI Chat Completions API, "codex" uses the OpenAI Responses API, "gemini" uses the Gemini API, and "grok" uses the xAI Grok API (OpenAI-compatible). ' +
-            'When set to "openai", configure OPENAI_API_KEY, OPENAI_BASE_URL, and OPENAI_MODEL. When set to "codex", configure CODEX_API_KEY, CODEX_BASE_URL, and CODEX_MODEL. When set to "gemini", configure GEMINI_API_KEY and optional GEMINI_BASE_URL. When set to "grok", configure GROK_API_KEY (or XAI_API_KEY), optional GROK_BASE_URL, GROK_MODEL, and GROK_MODEL_MAP.',
+          'API provider type. "anthropic" uses the Anthropic API (default), "openai" uses the OpenAI Chat Completions API, "gemini" uses the Gemini API, and "grok" uses the xAI Grok API (OpenAI-compatible). ' +
+            'When set to "openai", configure OPENAI_API_KEY, OPENAI_BASE_URL, and OPENAI_MODEL. When set to "gemini", configure GEMINI_API_KEY and optional GEMINI_BASE_URL. When set to "grok", configure GROK_API_KEY (or XAI_API_KEY), optional GROK_BASE_URL, GROK_MODEL, and GROK_MODEL_MAP.',
        ),
      model: z
        .string()
--- a/src/utils/status.tsx
+++ b/src/utils/status.tsx
@@ -342,7 +342,6 @@ export function buildAPIProviderProperties(): Property[] {
      gemini: 'Gemini API',
      grok: 'Grok API',
      openai: 'OpenAI API',
-      'codex': 'OpenAI Responses API',
    }[apiProvider]
    properties.push({
      label: 'API provider',
@@ -445,18 +444,6 @@ export function buildAPIProviderProperties(): Property[] {
      label: 'OpenAI base URL',
      value: openaiBaseUrl,
    })
-  } else if (apiProvider === 'codex') {
-    const codexBaseUrl = process.env.CODEX_BASE_URL
-    properties.push({
-      label: 'OpenAI Responses base URL',
-      value: codexBaseUrl,
-    })
-    properties.push({
-      label: 'Codex image upload',
-      value: process.env.CODEX_IMGBB_API_KEY
-        ? 'ImgBB'
-        : 'Not configured',
-    })
  }

  const proxyUrl = getProxyUrl()
--- a/src/utils/swarm/inProcessRunner.ts
+++ b/src/utils/swarm/inProcessRunner.ts
@@ -97,7 +97,7 @@ import {
  getLastPeerDmSummary,
  isPermissionResponse,
  isShutdownRequest,
-  markMessageAsReadByIndex,
+  markMessageAsReadByIdentity,
  readMailbox,
  writeToMailbox,
 } from '../teammateMailbox.js'
@@ -405,10 +405,10 @@ function createInProcessCanUseTool(
            if (msg && !msg.read) {
              const parsed = isPermissionResponse(msg.text)
              if (parsed && parsed.request_id === request.id) {
-                await markMessageAsReadByIndex(
+                await markMessageAsReadByIdentity(
                  identity.agentName,
                  identity.teamName,
-                  i,
+                  msg,
                )
                if (parsed.subtype === 'success') {
                  processMailboxPermissionResponse({
@@ -801,10 +801,10 @@ async function waitForNextPromptOrShutdown(
        logForDebugging(
          `[inProcessRunner] ${identity.agentName} received shutdown request from ${shutdownParsed?.from} (prioritized over ${skippedUnread} unread messages)`,
        )
-        await markMessageAsReadByIndex(
+        await markMessageAsReadByIdentity(
          identity.agentName,
          identity.teamName,
-          shutdownIndex,
+          msg,
        )
        return {
          type: 'shutdown_request',
@@ -839,10 +839,10 @@ async function waitForNextPromptOrShutdown(
          logForDebugging(
            `[inProcessRunner] ${identity.agentName} received new message from ${msg.from} (index ${selectedIndex})`,
          )
-          await markMessageAsReadByIndex(
+          await markMessageAsReadByIdentity(
            identity.agentName,
            identity.teamName,
-            selectedIndex,
+            msg,
          )
          return {
            type: 'new_message',
--- a/src/utils/teammateMailbox.ts
+++ b/src/utils/teammateMailbox.ts
@@ -7,7 +7,8 @@
 * Note: Inboxes are keyed by agent name within a team.
 */

-import { mkdir, readFile, writeFile } from 'fs/promises'
+import { randomBytes } from 'crypto'
+import { mkdir, readFile, rename, stat, unlink, writeFile } from 'fs/promises'
 import { join } from 'path'
 import { z } from 'zod/v4'
 import { TEAMMATE_MESSAGE_TAG } from '../constants/xml.js'
@@ -40,6 +41,13 @@ const LOCK_OPTIONS = {
  },
 }

+export const MAX_MAILBOX_MESSAGES = 1_000
+export const MAX_READ_MAILBOX_MESSAGES = 200
+export const MAX_UNREAD_PROTOCOL_MAILBOX_MESSAGES = 2_000
+export const MAX_MAILBOX_MESSAGE_TEXT_BYTES = 64 * 1024
+export const MAX_MAILBOX_RETAINED_BYTES = 2 * 1024 * 1024
+export const MAX_MAILBOX_FILE_BYTES = 4 * 1024 * 1024
+
 export type TeammateMessage = {
  from: string
  text: string
@@ -49,6 +57,223 @@ export type TeammateMessage = {
  summary?: string // 5-10 word summary shown as preview in the UI
 }

+function isJsonLikeMessage(text: string): boolean {
+  const trimmed = text.trimStart()
+  return trimmed.startsWith('{') || trimmed.startsWith('[')
+}
+
+function shouldRetainUnreadAsProtocolMessage(
+  message: TeammateMessage,
+): boolean {
+  if (message.read) return false
+  if (isStructuredProtocolMessage(message.text)) return true
+  if (!isJsonLikeMessage(message.text)) return false
+
+  try {
+    const parsed = jsonParse(message.text)
+    return Boolean(
+      parsed &&
+        typeof parsed === 'object' &&
+        'type' in (parsed as Record<string, unknown>),
+    )
+  } catch {
+    return false
+  }
+}
+
+function sameMailboxMessage(a: TeammateMessage, b: TeammateMessage): boolean {
+  return a.from === b.from && a.timestamp === b.timestamp && a.text === b.text
+}
+
+function mailboxMessageStorageBytes(message: TeammateMessage): number {
+  return Buffer.byteLength(jsonStringify(message), 'utf8')
+}
+
+function assertMailboxMessageSize(message: TeammateMessage): void {
+  const textBytes = Buffer.byteLength(message.text, 'utf8')
+  if (textBytes > MAX_MAILBOX_MESSAGE_TEXT_BYTES) {
+    throw new Error(
+      `Mailbox message text exceeds ${MAX_MAILBOX_MESSAGE_TEXT_BYTES} bytes`,
+    )
+  }
+}
+
+function toMailboxMessage(value: unknown): TeammateMessage {
+  if (!value || typeof value !== 'object') {
+    throw new Error('Invalid mailbox message: expected object')
+  }
+  const record = value as Record<string, unknown>
+  if (
+    typeof record.from !== 'string' ||
+    typeof record.text !== 'string' ||
+    typeof record.timestamp !== 'string' ||
+    typeof record.read !== 'boolean'
+  ) {
+    throw new Error('Invalid mailbox message shape')
+  }
+  const message: TeammateMessage = {
+    from: record.from,
+    text: record.text,
+    timestamp: record.timestamp,
+    read: record.read,
+    ...(typeof record.color === 'string' ? { color: record.color } : {}),
+    ...(typeof record.summary === 'string' ? { summary: record.summary } : {}),
+  }
+  assertMailboxMessageSize(message)
+  return message
+}
+
+function parseMailboxMessages(content: string): TeammateMessage[] {
+  const parsed = jsonParse(content)
+  if (!Array.isArray(parsed)) {
+    throw new Error('Invalid mailbox file: expected message array')
+  }
+  return parsed.map(toMailboxMessage)
+}
+
+async function readMailboxFile(inboxPath: string): Promise<string> {
+  const info = await stat(inboxPath)
+  if (info.size > MAX_MAILBOX_FILE_BYTES) {
+    throw new Error(
+      `Mailbox file exceeds ${MAX_MAILBOX_FILE_BYTES} bytes: ${inboxPath}`,
+    )
+  }
+  return readFile(inboxPath, 'utf-8')
+}
+
+async function readMailboxForMutation(
+  agentName: string,
+  teamName?: string,
+): Promise<TeammateMessage[]> {
+  const inboxPath = getInboxPath(agentName, teamName)
+  return parseMailboxMessages(await readMailboxFile(inboxPath))
+}
+
+async function writeMailboxAtomic(
+  inboxPath: string,
+  content: string,
+): Promise<void> {
+  const bytes = Buffer.byteLength(content, 'utf8')
+  if (bytes > MAX_MAILBOX_FILE_BYTES) {
+    throw new Error(
+      `Compacted mailbox still exceeds ${MAX_MAILBOX_FILE_BYTES} bytes`,
+    )
+  }
+  const tempPath = `${inboxPath}.${process.pid}.${randomBytes(8).toString('hex')}.tmp`
+  try {
+    await writeFile(tempPath, content, 'utf-8')
+    await rename(tempPath, inboxPath)
+  } catch (error) {
+    await unlink(tempPath).catch(() => undefined)
+    throw error
+  }
+}
+
+export function compactMailboxMessages(
+  messages: TeammateMessage[],
+  limits: {
+    maxMessages?: number
+    maxReadMessages?: number
+    maxUnreadProtocolMessages?: number
+    maxRetainedBytes?: number
+  } = {},
+): TeammateMessage[] {
+  const maxMessages = limits.maxMessages ?? MAX_MAILBOX_MESSAGES
+  const maxReadMessages = limits.maxReadMessages ?? MAX_READ_MAILBOX_MESSAGES
+  const maxUnreadProtocolMessages =
+    limits.maxUnreadProtocolMessages ?? MAX_UNREAD_PROTOCOL_MAILBOX_MESSAGES
+  const maxRetainedBytes = limits.maxRetainedBytes ?? MAX_MAILBOX_RETAINED_BYTES
+
+  if (
+    maxRetainedBytes <= 0 ||
+    (maxMessages <= 0 && maxUnreadProtocolMessages <= 0)
+  ) {
+    return []
+  }
+
+  const keepIndexes = new Set<number>()
+  let retainedBytes = 0
+  let keptUnreadProtocolMessages = 0
+  const tryKeep = (index: number): boolean => {
+    if (keepIndexes.has(index)) return true
+    const message = messages[index]
+    if (!message) return false
+    const bytes = mailboxMessageStorageBytes(message)
+    if (bytes > maxRetainedBytes || retainedBytes + bytes > maxRetainedBytes) {
+      return false
+    }
+    keepIndexes.add(index)
+    retainedBytes += bytes
+    return true
+  }
+
+  for (let i = messages.length - 1; i >= 0; i--) {
+    const message = messages[i]
+    if (!message || !shouldRetainUnreadAsProtocolMessage(message)) continue
+    if (keptUnreadProtocolMessages >= maxUnreadProtocolMessages) continue
+    if (tryKeep(i)) keptUnreadProtocolMessages++
+  }
+
+  let keptNonProtocolMessages = 0
+  for (let i = messages.length - 1; i >= 0; i--) {
+    if (keptNonProtocolMessages >= maxMessages) break
+    const message = messages[i]
+    if (
+      message &&
+      !message.read &&
+      !shouldRetainUnreadAsProtocolMessage(message)
+    ) {
+      if (tryKeep(i)) keptNonProtocolMessages++
+    }
+  }
+
+  let keptReadMessages = 0
+  for (let i = messages.length - 1; i >= 0; i--) {
+    if (keptNonProtocolMessages >= maxMessages) break
+    if (keptReadMessages >= maxReadMessages) break
+    const message = messages[i]
+    if (message?.read) {
+      if (tryKeep(i)) {
+        keptReadMessages++
+        keptNonProtocolMessages++
+      }
+    }
+  }
+
+  return messages.filter((_message, index) => keepIndexes.has(index))
+}
+
+function logUnreadMailboxEvictions(
+  original: TeammateMessage[],
+  compacted: TeammateMessage[],
+  context: string,
+): void {
+  const kept = new Set(compacted)
+  const unreadEvicted = original.filter(message => {
+    return !message.read && !kept.has(message)
+  })
+  if (unreadEvicted.length === 0) return
+
+  const protocolEvicted = count(unreadEvicted, message =>
+    shouldRetainUnreadAsProtocolMessage(message),
+  )
+  logError(
+    new Error(
+      `[TeammateMailbox] Compacted ${unreadEvicted.length} unread message(s) in ${context}; protocol_or_unknown=${protocolEvicted}`,
+    ),
+  )
+}
+
+async function writeCompactedMailbox(
+  inboxPath: string,
+  messages: TeammateMessage[],
+  context: string,
+): Promise<void> {
+  const compacted = compactMailboxMessages(messages)
+  logUnreadMailboxEvictions(messages, compacted, context)
+  await writeMailboxAtomic(inboxPath, jsonStringify(compacted, null, 2))
+}
+
 /**
 * Get the path to a teammate's inbox file
 * Structure: ~/.claude/teams/{team_name}/inboxes/{agent_name}.json
@@ -89,8 +314,7 @@ export async function readMailbox(
  logForDebugging(`[TeammateMailbox] readMailbox: path=${inboxPath}`)

  try {
-    const content = await readFile(inboxPath, 'utf-8')
-    const messages = jsonParse(content) as TeammateMessage[]
+    const messages = parseMailboxMessages(await readMailboxFile(inboxPath))
    logForDebugging(
      `[TeammateMailbox] readMailbox: read ${messages.length} message(s)`,
    )
@@ -103,7 +327,7 @@ export async function readMailbox(
    }
    logForDebugging(`Failed to read inbox for ${agentName}: ${error}`)
    logError(error)
-    return []
+    throw error
  }
 }

@@ -156,7 +380,7 @@ export async function writeToMailbox(
        `[TeammateMailbox] writeToMailbox: failed to create inbox file: ${error}`,
      )
      logError(error)
-      return
+      throw error
    }
  }

@@ -168,22 +392,23 @@ export async function writeToMailbox(
    })

    // Re-read messages after acquiring lock to get the latest state
-    const messages = await readMailbox(recipientName, teamName)
+    const messages = await readMailboxForMutation(recipientName, teamName)

-    const newMessage: TeammateMessage = {
+    const newMessage = toMailboxMessage({
      ...message,
      read: false,
-    }
+    })

    messages.push(newMessage)

-    await writeFile(inboxPath, jsonStringify(messages, null, 2), 'utf-8')
+    await writeCompactedMailbox(inboxPath, messages, 'writeToMailbox')
    logForDebugging(
      `[TeammateMailbox] Wrote message to ${recipientName}'s inbox from ${message.from}`,
    )
  } catch (error) {
    logForDebugging(`Failed to write to inbox for ${recipientName}: ${error}`)
    logError(error)
+    throw error
  } finally {
    if (release) {
      await release()
@@ -222,7 +447,7 @@ export async function markMessageAsReadByIndex(
    logForDebugging(`[TeammateMailbox] markMessageAsReadByIndex: lock acquired`)

    // Re-read messages after acquiring lock to get the latest state
-    const messages = await readMailbox(agentName, teamName)
+    const messages = await readMailboxForMutation(agentName, teamName)
    logForDebugging(
      `[TeammateMailbox] markMessageAsReadByIndex: read ${messages.length} messages after lock`,
    )
@@ -244,7 +469,7 @@ export async function markMessageAsReadByIndex(

    messages[messageIndex] = { ...message, read: true }

-    await writeFile(inboxPath, jsonStringify(messages, null, 2), 'utf-8')
+    await writeCompactedMailbox(inboxPath, messages, 'markMessageAsReadByIndex')
    logForDebugging(
      `[TeammateMailbox] markMessageAsReadByIndex: marked message at index ${messageIndex} as read`,
    )
@@ -270,6 +495,46 @@ export async function markMessageAsReadByIndex(
  }
 }

+export async function markMessageAsReadByIdentity(
+  agentName: string,
+  teamName: string | undefined,
+  expectedMessage: TeammateMessage,
+): Promise<boolean> {
+  const inboxPath = getInboxPath(agentName, teamName)
+  const lockFilePath = `${inboxPath}.lock`
+
+  let release: (() => Promise<void>) | undefined
+  try {
+    release = await lockfile.lock(inboxPath, {
+      lockfilePath: lockFilePath,
+      ...LOCK_OPTIONS,
+    })
+
+    const messages = await readMailboxForMutation(agentName, teamName)
+    const messageIndex = messages.findIndex(message => {
+      return !message.read && sameMailboxMessage(message, expectedMessage)
+    })
+    if (messageIndex < 0) return false
+
+    messages[messageIndex] = { ...messages[messageIndex]!, read: true }
+    await writeCompactedMailbox(
+      inboxPath,
+      messages,
+      'markMessageAsReadByIdentity',
+    )
+    return true
+  } catch (error) {
+    const code = getErrnoCode(error)
+    if (code === 'ENOENT') return false
+    logError(error)
+    return false
+  } finally {
+    if (release) {
+      await release()
+    }
+  }
+}
+
 /**
 * Mark all messages in a teammate's inbox as read
 * Uses file locking to prevent race conditions
@@ -297,7 +562,7 @@ export async function markMessagesAsRead(
    logForDebugging(`[TeammateMailbox] markMessagesAsRead: lock acquired`)

    // Re-read messages after acquiring lock to get the latest state
-    const messages = await readMailbox(agentName, teamName)
+    const messages = await readMailboxForMutation(agentName, teamName)
    logForDebugging(
      `[TeammateMailbox] markMessagesAsRead: read ${messages.length} messages after lock`,
    )
@@ -317,7 +582,7 @@ export async function markMessagesAsRead(
    // messages comes from jsonParse — fresh, unshared objects safe to mutate
    for (const m of messages) m.read = true

-    await writeFile(inboxPath, jsonStringify(messages, null, 2), 'utf-8')
+    await writeCompactedMailbox(inboxPath, messages, 'markMessagesAsRead')
    logForDebugging(
      `[TeammateMailbox] markMessagesAsRead: WROTE ${unreadCount} message(s) as read to ${inboxPath}`,
    )
@@ -1114,7 +1379,7 @@ export async function markMessagesAsReadByPredicate(
      ...LOCK_OPTIONS,
    })

-    const messages = await readMailbox(agentName, teamName)
+    const messages = await readMailboxForMutation(agentName, teamName)
    if (messages.length === 0) {
      return
    }
@@ -1123,7 +1388,11 @@ export async function markMessagesAsReadByPredicate(
      !m.read && predicate(m) ? { ...m, read: true } : m,
    )

-    await writeFile(inboxPath, jsonStringify(updatedMessages, null, 2), 'utf-8')
+    await writeCompactedMailbox(
+      inboxPath,
+      updatedMessages,
+      'markMessagesAsReadByPredicate',
+    )
  } catch (error) {
    const code = getErrnoCode(error)
    if (code === 'ENOENT') {
@@ -1161,7 +1430,12 @@ export function getLastPeerDmSummary(messages: Message[]): string | undefined {
    if (!Array.isArray(content)) continue
    for (const block of content) {
      if (typeof block === 'string') continue
-      const b = block as unknown as { type: string; name?: string; input?: Record<string, unknown>; [key: string]: unknown }
+      const b = block as unknown as {
+        type: string
+        name?: string
+        input?: Record<string, unknown>
+        [key: string]: unknown
+      }
      if (
        b.type === 'tool_use' &&
        b.name === SEND_MESSAGE_TOOL_NAME &&
@@ -1177,7 +1451,7 @@ export function getLastPeerDmSummary(messages: Message[]): string | undefined {
        const to = b.input.to as string
        const summary =
          'summary' in b.input && typeof b.input.summary === 'string'
-            ? b.input.summary as string
+            ? (b.input.summary as string)
            : (b.input.message as string).slice(0, 80)
        return `[to ${to}] ${summary}`
      }
--- a/src/utils/udsClient.ts
+++ b/src/utils/udsClient.ts
@@ -16,7 +16,8 @@ import { errorMessage, isFsInaccessible } from './errors.js'
 import { isProcessRunning } from './genericProcessUtils.js'
 import { jsonParse, jsonStringify } from './slowOperations.js'
 import type { SessionKind } from './concurrentSessions.js'
-import type { UdsMessage } from './udsMessaging.js'
+import { MAX_UDS_FRAME_BYTES, type UdsMessage } from './udsMessaging.js'
+import { attachUdsResponseReader, getChunkBytes } from './udsResponseReader.js'

 // ---------------------------------------------------------------------------
 // Types
@@ -104,9 +105,14 @@ export async function listAllLiveSessions(): Promise<PeerSession[]> {
 */
 export async function listPeers(): Promise<PeerSession[]> {
  const all = await listAllLiveSessions()
-  return all.filter(
-    s => s.pid !== process.pid && s.messagingSocketPath != null,
-  )
+  return all.filter(s => s.pid !== process.pid && s.messagingSocketPath != null)
+}
+
+async function findAuthTokenForSocketPath(
+  socketPath: string,
+): Promise<string | undefined> {
+  const { readUdsCapabilityToken } = await import('./udsMessaging.js')
+  return readUdsCapabilityToken(socketPath)
 }

 // ---------------------------------------------------------------------------
@@ -117,10 +123,21 @@ export async function listPeers(): Promise<PeerSession[]> {
 * Probe a UDS socket to check if a server is listening (ping/pong).
 * Returns true if the peer responds within the timeout.
 */
-export async function isPeerAlive(socketPath: string, timeoutMs = 3000): Promise<boolean> {
-  return new Promise<boolean>((resolve) => {
+export async function isPeerAlive(
+  socketPath: string,
+  timeoutMs = 3000,
+  authToken?: string,
+): Promise<boolean> {
+  const token = authToken ?? (await findAuthTokenForSocketPath(socketPath))
+  if (!token) return false
+
+  return new Promise<boolean>(resolve => {
    const conn = createConnection(socketPath, () => {
-      const ping: UdsMessage = { type: 'ping', ts: new Date().toISOString() }
+      const ping: UdsMessage = {
+        type: 'ping',
+        ts: new Date().toISOString(),
+        meta: { authToken: token },
+      }
      conn.write(jsonStringify(ping) + '\n')
    })

@@ -135,7 +152,19 @@ export async function isPeerAlive(socketPath: string, timeoutMs = 3000): Promise
    }, timeoutMs)

    let buffer = ''
-    conn.on('data', (chunk) => {
+    conn.on('data', chunk => {
+      if (
+        Buffer.byteLength(buffer, 'utf8') + getChunkBytes(chunk) >
+        MAX_UDS_FRAME_BYTES
+      ) {
+        if (!resolved) {
+          resolved = true
+          clearTimeout(timer)
+          conn.destroy()
+          resolve(false)
+        }
+        return
+      }
      buffer += chunk.toString()
      if (buffer.includes('"pong"')) {
        if (!resolved) {
@@ -165,6 +194,13 @@ export async function sendToUdsSocket(
  targetSocketPath: string,
  message: string | Record<string, unknown>,
 ): Promise<void> {
+  const { parseUdsTarget } = await import('./udsMessaging.js')
+  const target = parseUdsTarget(targetSocketPath)
+  const authToken = await findAuthTokenForSocketPath(target.socketPath)
+  if (!authToken) {
+    throw new Error(`No auth token found for peer at ${target.socketPath}`)
+  }
+
  const data = typeof message === 'string' ? message : jsonStringify(message)
  const udsMsg: UdsMessage = {
    type: 'text',
@@ -177,18 +213,36 @@ export async function sendToUdsSocket(
  udsMsg.from = getUdsMessagingSocketPath()

  return new Promise<void>((resolve, reject) => {
-    const conn = createConnection(targetSocketPath, () => {
-      conn.write(jsonStringify(udsMsg) + '\n', (err) => {
+    let settled = false
+    let conn: ReturnType<typeof createConnection>
+    const finish = (error?: Error): void => {
+      if (settled) return
+      settled = true
+      if (error) {
+        conn.destroy(error)
+        reject(error)
+      } else {
        conn.end()
-        if (err) reject(err)
-        else resolve()
+        resolve()
+      }
+    }
+
+    conn = createConnection(target.socketPath, () => {
+      udsMsg.meta = { ...udsMsg.meta, authToken }
+      conn.write(jsonStringify(udsMsg) + '\n', err => {
+        if (err) finish(err)
      })
    })
-    conn.on('error', (err) => {
-      reject(new Error(`Failed to connect to peer at ${targetSocketPath}: ${errorMessage(err)}`))
+    attachUdsResponseReader(conn, {
+      maxFrameBytes: MAX_UDS_FRAME_BYTES,
+      onSettled: finish,
+      formatSocketError: err =>
+        new Error(
+          `Failed to connect to peer at ${target.socketPath}: ${errorMessage(err)}`,
+        ),
    })
    conn.setTimeout(5000, () => {
-      conn.destroy(new Error('Connection timed out'))
+      finish(new Error('Connection timed out'))
    })
  })
 }
--- a/src/utils/udsMessaging.ts
+++ b/src/utils/udsMessaging.ts
@@ -8,14 +8,26 @@
 * but can be overridden via --messaging-socket-path.
 */

+import { createHash, randomBytes, timingSafeEqual } from 'crypto'
 import { createServer, type Server, type Socket } from 'net'
-import { mkdir, unlink } from 'fs/promises'
+import {
+  chmod,
+  lstat,
+  mkdir,
+  open,
+  readFile,
+  rename,
+  unlink,
+} from 'fs/promises'
 import { dirname, join } from 'path'
 import { tmpdir } from 'os'
 import { registerCleanup } from './cleanupRegistry.js'
 import { logForDebugging } from './debug.js'
 import { errorMessage } from './errors.js'
+import { getClaudeConfigHomeDir } from './envUtils.js'
 import { attachNdjsonFramer } from './ndjsonFramer.js'
+import { attachUdsResponseReader } from './udsResponseReader.js'
+import { logError } from './log.js'
 import { jsonParse, jsonStringify } from './slowOperations.js'

 // ---------------------------------------------------------------------------
@@ -27,6 +39,7 @@ export type UdsMessageType =
  | 'notification'
  | 'query'
  | 'response'
+  | 'error'
  | 'ping'
  | 'pong'

@@ -60,6 +73,17 @@ let onEnqueueCb: (() => void) | null = null
 const clients = new Set<Socket>()
 const inbox: UdsInboxEntry[] = []
 let nextId = 1
+let defaultSocketPath: string | null = null
+let authToken: string | null = null
+let capabilityFilePath: string | null = null
+let inboxBytes = 0
+
+export const MAX_UDS_INBOX_ENTRIES = 1_000
+export const MAX_UDS_FRAME_BYTES = 64 * 1024
+export const MAX_UDS_INBOX_BYTES = 2 * 1024 * 1024
+export const MAX_UDS_CLIENTS = 128
+export const UDS_AUTH_TIMEOUT_MS = 2_000
+export const UDS_IDLE_TIMEOUT_MS = 30_000

 // ---------------------------------------------------------------------------
 // Public API — socket path helpers
@@ -74,10 +98,19 @@ let nextId = 1
 * transparently, but we use the pipe format on Windows for Node.js compat.
 */
 export function getDefaultUdsSocketPath(): string {
+  if (defaultSocketPath) return defaultSocketPath
+  const nonce = randomBytes(16).toString('hex')
  if (process.platform === 'win32') {
-    return `\\\\.\\pipe\\claude-code-${process.pid}`
+    defaultSocketPath = `\\\\.\\pipe\\claude-code-${process.pid}-${nonce}`
+    return defaultSocketPath
  }
-  return join(tmpdir(), 'claude-code-socks', `${process.pid}.sock`)
+  defaultSocketPath = join(
+    tmpdir(),
+    'claude-code-socks',
+    `${process.pid}-${nonce}`,
+    'messaging.sock',
+  )
+  return defaultSocketPath
 }

 /**
@@ -88,6 +121,153 @@ export function getUdsMessagingSocketPath(): string | undefined {
  return socketPath ?? undefined
 }

+export function formatUdsAddress(socket: string): string {
+  return `uds:${socket}`
+}
+
+export function parseUdsTarget(target: string): {
+  socketPath: string
+} {
+  if (target.includes('#token=')) {
+    throw new Error(
+      'UDS target must not include an inline auth token; use the ListPeers address',
+    )
+  }
+  return { socketPath: target }
+}
+
+function getCapabilityDir(): string {
+  return join(getClaudeConfigHomeDir(), 'messaging-capabilities')
+}
+
+function getCapabilityPath(socket: string): string {
+  const digest = createHash('sha256').update(socket).digest('hex')
+  return join(getCapabilityDir(), `${digest}.json`)
+}
+
+function isNotFound(error: unknown): boolean {
+  return (
+    typeof error === 'object' &&
+    error !== null &&
+    (error as NodeJS.ErrnoException).code === 'ENOENT'
+  )
+}
+
+async function assertPrivateCapabilityDir(dir: string): Promise<void> {
+  let stat: Awaited<ReturnType<typeof lstat>>
+  try {
+    stat = await lstat(dir)
+  } catch (error) {
+    if (!isNotFound(error)) throw error
+    await mkdir(dir, { recursive: true, mode: 0o700 })
+    stat = await lstat(dir)
+  }
+
+  assertPrivateDirectory(stat, dir, 'capability directory')
+  await chmod(dir, 0o700)
+}
+
+function assertPrivateDirectory(
+  stat: Awaited<ReturnType<typeof lstat>>,
+  dir: string,
+  label: string,
+): void {
+  if (!stat.isDirectory() || stat.isSymbolicLink()) {
+    throw new Error(
+      `[udsMessaging] ${label} is not a private directory: ${dir}`,
+    )
+  }
+  if (process.platform !== 'win32') {
+    const broadMode = Number(stat.mode) & 0o077
+    if (broadMode !== 0) {
+      throw new Error(
+        `[udsMessaging] ${label} permissions are too broad: ${dir}`,
+      )
+    }
+    if (
+      typeof process.getuid === 'function' &&
+      Number(stat.uid) !== process.getuid()
+    ) {
+      throw new Error(
+        `[udsMessaging] ${label} owner does not match current user: ${dir}`,
+      )
+    }
+  }
+}
+
+async function writePrivateFileExclusive(
+  path: string,
+  content: string,
+): Promise<void> {
+  const handle = await open(path, 'wx', 0o600)
+  try {
+    await handle.writeFile(content, 'utf-8')
+  } finally {
+    await handle.close()
+  }
+  await chmod(path, 0o600)
+}
+
+async function ensureSocketParent(path: string): Promise<void> {
+  const dir = dirname(path)
+  try {
+    const stat = await lstat(dir)
+    if (!stat.isDirectory() || stat.isSymbolicLink()) {
+      throw new Error(
+        `[udsMessaging] socket parent is not a directory: ${dir}`,
+      )
+    }
+    assertPrivateDirectory(stat, dir, 'socket parent')
+    return
+  } catch (error) {
+    if (!isNotFound(error)) throw error
+  }
+
+  await mkdir(dir, { recursive: true, mode: 0o700 })
+  await chmod(dir, 0o700)
+}
+
+async function writeCapabilityFile(
+  socket: string,
+  token: string,
+): Promise<void> {
+  const dir = getCapabilityDir()
+  await assertPrivateCapabilityDir(dir)
+  const target = getCapabilityPath(socket)
+  const temp = `${target}.${process.pid}.${randomBytes(8).toString('hex')}.tmp`
+  try {
+    await writePrivateFileExclusive(
+      temp,
+      jsonStringify({ socketPath: socket, authToken: token }),
+    )
+    await rename(temp, target)
+  } catch (error) {
+    try {
+      await unlink(temp)
+    } catch {
+      // Temp file may not exist if exclusive creation failed.
+    }
+    throw error
+  }
+  capabilityFilePath = target
+}
+
+export async function readUdsCapabilityToken(
+  socket: string,
+): Promise<string | undefined> {
+  try {
+    const parsed = jsonParse(
+      await readFile(getCapabilityPath(socket), 'utf-8'),
+    ) as Record<string, unknown>
+    if (parsed.socketPath === socket && typeof parsed.authToken === 'string') {
+      return parsed.authToken
+    }
+  } catch {
+    // Missing or unreadable capability file means the peer is not addressable.
+  }
+  return undefined
+}
+
 // ---------------------------------------------------------------------------
 // Inbox
 // ---------------------------------------------------------------------------
@@ -101,16 +281,121 @@ export function setOnEnqueue(cb: (() => void) | null): void {
 }

 /**
- * Drain all pending inbox messages, marking them processed.
+ * Drain all pending inbox messages and release retained history.
 */
 export function drainInbox(): UdsInboxEntry[] {
-  const pending = inbox.filter(e => e.status === 'pending')
+  const pending = inbox.splice(0, inbox.length)
+  inboxBytes = 0
  for (const entry of pending) {
    entry.status = 'processed'
  }
  return pending
 }

+function getMessageBytes(message: UdsMessage): number {
+  return Buffer.byteLength(jsonStringify(message), 'utf8')
+}
+
+function enqueueInboxEntry(entry: UdsInboxEntry): boolean {
+  const entryBytes = getMessageBytes(entry.message)
+  if (
+    entryBytes > MAX_UDS_FRAME_BYTES ||
+    inbox.length >= MAX_UDS_INBOX_ENTRIES ||
+    inboxBytes + entryBytes > MAX_UDS_INBOX_BYTES
+  ) {
+    logError(
+      new Error(
+        `[udsMessaging] inbox full (${inbox.length}/${MAX_UDS_INBOX_ENTRIES}, ${inboxBytes}/${MAX_UDS_INBOX_BYTES} bytes); dropping message type=${entry.message.type}`,
+      ),
+    )
+    return false
+  }
+  inbox.push(entry)
+  inboxBytes += entryBytes
+  return true
+}
+
+function ensureAuthToken(): string {
+  if (!authToken) {
+    authToken = randomBytes(32).toString('hex')
+  }
+  return authToken
+}
+
+function getMessageAuthToken(message: UdsMessage): string | undefined {
+  const token = message.meta?.authToken
+  return typeof token === 'string' ? token : undefined
+}
+
+function isAuthorizedMessage(message: UdsMessage): boolean {
+  const provided = getMessageAuthToken(message)
+  if (!provided || !authToken) return false
+  const providedBuffer = Buffer.from(provided, 'utf8')
+  const expectedBuffer = Buffer.from(authToken, 'utf8')
+  if (providedBuffer.length !== expectedBuffer.length) return false
+  return timingSafeEqual(providedBuffer, expectedBuffer)
+}
+
+function writeSocketMessage(socket: Socket, message: UdsMessage): void {
+  if (socket.destroyed) return
+  socket.write(jsonStringify(message) + '\n')
+}
+
+function writeSocketMessageAndDestroy(socket: Socket, message: UdsMessage): void {
+  if (socket.destroyed) return
+  socket.write(jsonStringify(message) + '\n', () => {
+    if (!socket.destroyed) socket.destroy()
+  })
+}
+
+function writeSocketErrorAndDestroy(socket: Socket, data: string): void {
+  writeSocketMessageAndDestroy(socket, {
+    type: 'error',
+    data,
+    ts: new Date().toISOString(),
+  })
+}
+
+function unrefTimer(timer: ReturnType<typeof setTimeout>): void {
+  const maybeUnref = (timer as { unref?: () => void }).unref
+  if (typeof maybeUnref === 'function') {
+    maybeUnref.call(timer)
+  }
+}
+
+async function closeServer(serverToClose: Server): Promise<void> {
+  await new Promise<void>(resolve => {
+    serverToClose.close(() => resolve())
+  })
+}
+
+async function removeSocketPath(path: string): Promise<void> {
+  if (process.platform === 'win32') return
+  try {
+    await unlink(path)
+  } catch {
+    // Already gone.
+  }
+}
+
+function stripAuthToken(message: UdsMessage): UdsMessage {
+  const { authToken: _authToken, ...metaWithoutAuth } = message.meta ?? {}
+  return {
+    ...message,
+    meta: Object.keys(metaWithoutAuth).length > 0 ? metaWithoutAuth : undefined,
+  }
+}
+
+function withRequestAuthToken(message: UdsMessage, token: string): UdsMessage {
+  return {
+    ...message,
+    meta: {
+      ...message.meta,
+      authToken: token,
+    },
+  }
+}
+
 // ---------------------------------------------------------------------------
 // Server
 // ---------------------------------------------------------------------------
@@ -132,7 +417,7 @@ export async function startUdsMessaging(

  // Ensure parent directory exists (skip on Windows — pipe paths aren't files)
  if (process.platform !== 'win32') {
-    await mkdir(dirname(path), { recursive: true })
+    await ensureSocketParent(path)
  }

  // Clean up stale socket file (skip on Windows — pipe paths aren't files)
@@ -144,69 +429,195 @@ export async function startUdsMessaging(
    }
  }

-  socketPath = path
-
-  await new Promise<void>((resolve, reject) => {
-    const srv = createServer(socket => {
-      clients.add(socket)
-      logForDebugging(
-        `[udsMessaging] client connected (total: ${clients.size})`,
-      )
-
-      attachNdjsonFramer<UdsMessage>(
-        socket,
-        msg => {
-          // Handle ping with automatic pong
-          if (msg.type === 'ping') {
-            const pong: UdsMessage = {
-              type: 'pong',
-              from: socketPath ?? undefined,
-              ts: new Date().toISOString(),
-            }
-            if (!socket.destroyed) {
-              socket.write(jsonStringify(pong) + '\n')
-            }
-            return
-          }
-
-          // Enqueue into inbox
-          const entry: UdsInboxEntry = {
-            id: `uds-${nextId++}`,
-            message: msg,
-            receivedAt: Date.now(),
-            status: 'pending',
-          }
-          inbox.push(entry)
+  const token = ensureAuthToken()
+  let startedServer: Server | null = null
+  let exportedSocketEnv = false
+  try {
+    await new Promise<void>((resolve, reject) => {
+      const srv = createServer(socket => {
+        if (clients.size >= MAX_UDS_CLIENTS) {
          logForDebugging(
-            `[udsMessaging] enqueued message type=${msg.type} from=${msg.from ?? 'unknown'}`,
+            `[udsMessaging] rejected client: ${clients.size}/${MAX_UDS_CLIENTS} clients already connected`,
          )
-          onEnqueueCb?.()
-        },
-        text => jsonParse(text) as UdsMessage,
-      )
+          socket.destroy()
+          return
+        }
+        clients.add(socket)
+        logForDebugging(
+          `[udsMessaging] client connected (total: ${clients.size})`,
+        )
+        let authenticated = false
+        let closing = false
+        const closeWithError = (data: string): void => {
+          if (closing || socket.destroyed) return
+          closing = true
+          socket.pause()
+          writeSocketErrorAndDestroy(socket, data)
+        }
+        const authTimer = setTimeout(() => {
+          if (authenticated || socket.destroyed) return
+          logForDebugging('[udsMessaging] closing unauthenticated idle client')
+          closeWithError('authentication timeout')
+        }, UDS_AUTH_TIMEOUT_MS)
+        unrefTimer(authTimer)
+        socket.setTimeout(UDS_IDLE_TIMEOUT_MS, () => {
+          logForDebugging('[udsMessaging] closing idle client')
+          closeWithError('idle timeout')
+        })

-      socket.on('close', () => {
-        clients.delete(socket)
+        attachNdjsonFramer<UdsMessage>(
+          socket,
+          msg => {
+            if (!isAuthorizedMessage(msg)) {
+              logForDebugging(
+                `[udsMessaging] rejected unauthenticated message type=${msg.type}`,
+              )
+              closeWithError('unauthorized')
+              return
+            }
+            if (!authenticated) {
+              authenticated = true
+              clearTimeout(authTimer)
+            }
+
+            // Handle ping with automatic pong
+            if (msg.type === 'ping') {
+              writeSocketMessage(socket, {
+                type: 'pong',
+                from: socketPath ?? undefined,
+                ts: new Date().toISOString(),
+              })
+              return
+            }
+
+            // Enqueue into inbox
+            const sanitizedMessage = stripAuthToken(msg)
+            const entry: UdsInboxEntry = {
+              id: `uds-${nextId++}`,
+              message: sanitizedMessage,
+              receivedAt: Date.now(),
+              status: 'pending',
+            }
+            if (!enqueueInboxEntry(entry)) {
+              closeWithError('inbox full')
+              return
+            }
+            logForDebugging(
+              `[udsMessaging] enqueued message type=${msg.type} from=${msg.from ?? 'unknown'}`,
+            )
+            writeSocketMessage(socket, {
+              type: 'response',
+              data: 'ok',
+              ts: new Date().toISOString(),
+              meta: { id: entry.id },
+            })
+            onEnqueueCb?.()
+          },
+          text => jsonParse(text) as UdsMessage,
+          {
+            maxFrameBytes: MAX_UDS_FRAME_BYTES,
+            onFrameError: error => {
+              logForDebugging(`[udsMessaging] ${error.message}`)
+              closeWithError(error.message)
+            },
+            onInvalidFrame: error => {
+              logForDebugging(
+                `[udsMessaging] invalid client frame: ${errorMessage(error)}`,
+              )
+              closeWithError('invalid frame')
+            },
+            destroyOnFrameError: false,
+          },
+        )
+
+        socket.on('close', () => {
+          clearTimeout(authTimer)
+          clients.delete(socket)
+        })
+
+        socket.on('error', err => {
+          clearTimeout(authTimer)
+          clients.delete(socket)
+          logForDebugging(`[udsMessaging] client error: ${errorMessage(err)}`)
+        })
      })

-      socket.on('error', err => {
-        clients.delete(socket)
-        logForDebugging(`[udsMessaging] client error: ${errorMessage(err)}`)
+      const rejectBeforeListen = (error: Error): void => {
+        reject(error)
+      }
+      const logRuntimeError = (error: Error): void => {
+        logForDebugging(
+          `[udsMessaging] server error on ${path}${opts?.isExplicit ? ' (explicit)' : ''}: ${errorMessage(error)}`,
+        )
+      }
+
+      srv.once('error', rejectBeforeListen)
+
+      srv.listen(path, () => {
+        void (async () => {
+          try {
+            if (process.platform !== 'win32') {
+              await chmod(path, 0o600)
+            }
+            srv.off('error', rejectBeforeListen)
+            srv.on('error', logRuntimeError)
+            server = srv
+            startedServer = srv
+            resolve()
+          } catch (error) {
+            srv.off('error', rejectBeforeListen)
+            const closeError =
+              error instanceof Error ? error : new Error(errorMessage(error))
+            let rejected = false
+            const rejectOnce = (): void => {
+              if (rejected) return
+              rejected = true
+              reject(closeError)
+            }
+            const fallback = setTimeout(rejectOnce, 1_000)
+            unrefTimer(fallback)
+            srv.close(() => {
+              clearTimeout(fallback)
+              rejectOnce()
+            })
+          }
+        })()
      })
    })

-    srv.on('error', reject)
-
-    srv.listen(path, () => {
-      server = srv
-      // Export so child processes can discover the socket
-      process.env.CLAUDE_CODE_MESSAGING_SOCKET = path
-      logForDebugging(
-        `[udsMessaging] server listening on ${path}${opts?.isExplicit ? ' (explicit)' : ''}`,
-      )
-      resolve()
-    })
-  })
+    await writeCapabilityFile(path, token)
+    socketPath = path
+    // Export so child processes can discover the socket only after the
+    // capability file exists and the listener is ready.
+    process.env.CLAUDE_CODE_MESSAGING_SOCKET = path
+    exportedSocketEnv = true
+    logForDebugging(
+      `[udsMessaging] server listening on ${path}${opts?.isExplicit ? ' (explicit)' : ''}`,
+    )
+  } catch (error) {
+    if (capabilityFilePath) {
+      try {
+        await unlink(capabilityFilePath)
+      } catch {
+        // Already gone.
+      }
+      capabilityFilePath = null
+    }
+    if (startedServer) {
+      await closeServer(startedServer)
+    }
+    if (server === startedServer) {
+      server = null
+    }
+    await removeSocketPath(path)
+    if (exportedSocketEnv) {
+      delete process.env.CLAUDE_CODE_MESSAGING_SOCKET
+    }
+    socketPath = null
+    defaultSocketPath = null
+    authToken = null
+    throw error
+  }

  // Register cleanup so the socket file is removed on exit
  registerCleanup(async () => {
@@ -218,6 +629,7 @@ export async function startUdsMessaging(
 * Stop the UDS messaging server and clean up the socket file.
 */
 export async function stopUdsMessaging(): Promise<void> {
+  defaultSocketPath = null
  if (!server) return

  // Close all connected clients
@@ -230,21 +642,27 @@ export async function stopUdsMessaging(): Promise<void> {
    server!.close(() => resolve())
  })
  server = null
+  inbox.length = 0
+  inboxBytes = 0
+  onEnqueueCb = null

  // Remove socket file (skip on Windows — pipe paths aren't files)
  if (socketPath) {
-    if (process.platform !== 'win32') {
-      try {
-        await unlink(socketPath)
-      } catch {
-        // Already gone
-      }
-    }
+    await removeSocketPath(socketPath)
    delete process.env.CLAUDE_CODE_MESSAGING_SOCKET
    logForDebugging(
      `[udsMessaging] server stopped, socket removed: ${socketPath}`,
    )
    socketPath = null
+    authToken = null
+  }
+  if (capabilityFilePath) {
+    try {
+      await unlink(capabilityFilePath)
+    } catch {
+      // Already gone
+    }
+    capabilityFilePath = null
  }
 }

@@ -255,23 +673,50 @@ export async function stopUdsMessaging(): Promise<void> {
 export async function sendUdsMessage(
  targetSocketPath: string,
  message: UdsMessage,
+  opts: { authToken?: string } = {},
 ): Promise<void> {
  const { createConnection } = await import('net')
-  message.from = message.from ?? socketPath ?? undefined
-  message.ts = message.ts ?? new Date().toISOString()
+  const token = opts.authToken ?? authToken
+  if (!token) {
+    throw new Error('Cannot send UDS message without auth token')
+  }
+  const outbound = withRequestAuthToken(
+    {
+      ...message,
+      from: message.from ?? socketPath ?? undefined,
+      ts: message.ts ?? new Date().toISOString(),
+    },
+    token,
+  )

  return new Promise<void>((resolve, reject) => {
-    const conn = createConnection(targetSocketPath, () => {
-      conn.write(jsonStringify(message) + '\n', err => {
+    let settled = false
+    let conn: ReturnType<typeof createConnection>
+    const finish = (error?: Error): void => {
+      if (settled) return
+      settled = true
+      if (error) {
+        conn.destroy(error)
+        reject(error)
+      } else {
        conn.end()
-        if (err) reject(err)
-        else resolve()
+        resolve()
+      }
+    }
+
+    conn = createConnection(targetSocketPath, () => {
+      conn.write(jsonStringify(outbound) + '\n', err => {
+        if (err) finish(err)
      })
    })
-    conn.on('error', reject)
+    attachUdsResponseReader(conn, {
+      maxFrameBytes: MAX_UDS_FRAME_BYTES,
+      acceptPong: true,
+      onSettled: finish,
+    })
    // Timeout so we don't hang on unreachable sockets
    conn.setTimeout(5000, () => {
-      conn.destroy(new Error('Connection timed out'))
+      finish(new Error('Connection timed out'))
    })
  })
 }
--- a/src/utils/udsResponseReader.ts
+++ b/src/utils/udsResponseReader.ts
@@ -0,0 +1,120 @@
+import type { Socket } from 'net'
+import { StringDecoder } from 'node:string_decoder'
+import { errorMessage } from './errors.js'
+import { jsonParse } from './slowOperations.js'
+import type { UdsMessage } from './udsMessaging.js'
+
+type UdsResponseReaderOptions = {
+  maxFrameBytes: number
+  acceptPong?: boolean
+  onSettled: (error?: Error) => void
+  formatSocketError?: (error: unknown) => Error
+}
+
+export function getChunkBytes(chunk: string | Buffer): number {
+  return typeof chunk === 'string'
+    ? Buffer.byteLength(chunk, 'utf8')
+    : chunk.byteLength
+}
+
+function parseResponseLine(line: string): UdsMessage {
+  try {
+    return jsonParse(line) as UdsMessage
+  } catch {
+    throw new Error('Invalid UDS response frame')
+  }
+}
+
+export function attachUdsResponseReader(
+  socket: Socket,
+  options: UdsResponseReaderOptions,
+): void {
+  let buffer = ''
+  let bufferBytes = 0
+  let settled = false
+  const decoder = new StringDecoder('utf8')
+
+  function cleanupListeners(): void {
+    socket.off('data', onData)
+    socket.off('error', onError)
+    socket.off('end', onEnd)
+    socket.off('close', onClose)
+  }
+
+  function finish(error?: Error): void {
+    if (settled) return
+    settled = true
+    buffer = ''
+    bufferBytes = 0
+    cleanupListeners()
+    if (error) {
+      socket.destroy()
+    } else {
+      socket.end()
+    }
+    options.onSettled(error)
+  }
+
+  function onData(chunk: Buffer): void {
+    const decoded = decoder.write(chunk)
+    const decodedBytes = Buffer.byteLength(decoded, 'utf8')
+    if (bufferBytes + decodedBytes > options.maxFrameBytes) {
+      finish(new Error('UDS response frame exceeded size limit'))
+      return
+    }
+
+    buffer += decoded
+    bufferBytes += decodedBytes
+    let newlineIndex = buffer.indexOf('\n')
+    while (newlineIndex !== -1) {
+      const line = buffer.slice(0, newlineIndex)
+      const consumed = buffer.slice(0, newlineIndex + 1)
+      buffer = buffer.slice(newlineIndex + 1)
+      bufferBytes -= Buffer.byteLength(consumed, 'utf8')
+      if (!line.trim()) {
+        newlineIndex = buffer.indexOf('\n')
+        continue
+      }
+      let response: UdsMessage
+      try {
+        response = parseResponseLine(line)
+      } catch (error) {
+        finish(error instanceof Error ? error : new Error(errorMessage(error)))
+        return
+      }
+      if (
+        response.type === 'response' ||
+        (options.acceptPong === true && response.type === 'pong')
+      ) {
+        finish()
+        return
+      }
+      if (response.type === 'error') {
+        finish(new Error(response.data ?? 'UDS receiver rejected message'))
+        return
+      }
+      newlineIndex = buffer.indexOf('\n')
+    }
+  }
+
+  function onError(error: Error): void {
+    finish(
+      options.formatSocketError?.(error) ??
+        (error instanceof Error ? error : new Error(errorMessage(error))),
+    )
+  }
+
+  function onEnd(): void {
+    finish(new Error('UDS socket ended before response'))
+  }
+
+  function onClose(hadError: boolean): void {
+    if (hadError) return
+    finish(new Error('UDS socket closed before response'))
+  }
+
+  socket.on('data', onData)
+  socket.on('error', onError)
+  socket.on('end', onEnd)
+  socket.on('close', onClose)
+}