diff --git a/docs/specs/agent-tooling-v2/spec.md b/docs/specs/agent-tooling-v2/spec.md
index b07a71863..39290552c 100644
--- a/docs/specs/agent-tooling-v2/spec.md
+++ b/docs/specs/agent-tooling-v2/spec.md
@@ -75,7 +75,7 @@
 
 | 工具 | 必填参数 | 可选参数 | 说明 |
 |---|---|---|---|
-| `exec` | `command: string` | `cwd?: string`, `timeoutMs?: number`, `background?: boolean`, `yieldMs?: number` | 命令执行；长任务建议后台。 |
+| `exec` | `command: string` | `cwd?: string`, `timeoutMs?: number`, `background?: boolean`, `yieldMs?: number` | 命令执行；前台最多等待 `yieldMs`（缺省为默认 yield 窗口），窗口结束时命令仍在运行则自动转入后台并返回 `sessionId`。 |
 | `process` | `action: enum` | `sessionId?: string`, `offset?: number`, `limit?: number`, `data?: string`, `eof?: boolean` | 后台会话管理（list/poll/log/write/kill/clear/remove）。 |
 
 约束：
diff --git a/docs/specs/process-tool/spec.md b/docs/specs/process-tool/spec.md
index c4895d1f2..db4e7d2ce 100644
--- a/docs/specs/process-tool/spec.md
+++ b/docs/specs/process-tool/spec.md
@@ -14,6 +14,15 @@ As an AI agent, I want to start a command in the background so that I can run lo
 - Command returns immediately with a `sessionId` and `status: "running"`
 - Process continues running after tool returns
 
+### US-1.1: Foreground Yield To Background
+As an AI agent, I want a foreground `exec` call to yield into a background session when it runs too long, so that the loop can continue without restarting the command.
+
+**Acceptance Criteria:**
+- Foreground `exec` waits only until `yieldMs` (or the default yield window)
+- If the command finishes within that window, it returns the normal foreground result
+- If the command is still running after that window, the same process is kept alive and `exec` returns `status: "running"` with a `sessionId`
+- The yielded session is manageable through `process`
+
 ### US-2: Monitor Background Output
 As an AI agent, I want to poll the output of a background command so that I can monitor its progress.
 
diff --git a/electron.vite.config.ts b/electron.vite.config.ts
index 4dee57b91..d8955694c 100644
--- a/electron.vite.config.ts
+++ b/electron.vite.config.ts
@@ -56,6 +56,7 @@ export default defineConfig({
       )
     },
     optimizeDeps: {
+      exclude: ['markstream-vue', 'stream-monaco'],
       include: [
         'monaco-editor',
         'axios'
diff --git a/src/main/events.ts b/src/main/events.ts
index fdf231ba1..130c392e2 100644
--- a/src/main/events.ts
+++ b/src/main/events.ts
@@ -78,7 +78,8 @@ export const SESSION_EVENTS = {
   ACTIVATED: 'session:activated',
   DEACTIVATED: 'session:deactivated',
   STATUS_CHANGED: 'session:status-changed',
-  COMPACTION_UPDATED: 'session:compaction-updated'
+  COMPACTION_UPDATED: 'session:compaction-updated',
+  PENDING_INPUTS_UPDATED: 'session:pending-inputs-updated'
 }
 
 // 系统相关事件
diff --git a/src/main/lib/agentRuntime/backgroundExecSessionManager.ts b/src/main/lib/agentRuntime/backgroundExecSessionManager.ts
index 9c8eec4e6..dc3c99227 100644
--- a/src/main/lib/agentRuntime/backgroundExecSessionManager.ts
+++ b/src/main/lib/agentRuntime/backgroundExecSessionManager.ts
@@ -4,10 +4,13 @@ import path from 'path'
 import { nanoid } from 'nanoid'
 import logger from '@shared/logger'
 import { getShellEnvironment, getUserShell } from './shellEnvHelper'
+import { terminateProcessTree } from './processTree'
 import { resolveSessionDir } from './sessionPaths'
 
 // Configuration with environment variable support
-const getConfig = () => ({
+const FOREGROUND_PREVIEW_CHARS = 12000
+
+export const getBackgroundExecConfig = () => ({
   backgroundMs: parseInt(process.env.PI_BASH_YIELD_MS || '10000', 10),
   timeoutSec: parseInt(process.env.PI_BASH_TIMEOUT_SEC || '1800', 10),
   cleanupMs: parseInt(process.env.PI_BASH_JOB_TTL_MS || '1800000', 10),
@@ -21,6 +24,8 @@ const getConfig = () => ({
   offloadThresholdChars: 10000 // Offload to file when output exceeds this
 })
 
+const getConfig = getBackgroundExecConfig
+
 export interface SessionMeta {
   sessionId: string
   command: string
@@ -31,8 +36,22 @@ export interface SessionMeta {
   exitCode?: number
   outputLength: number
   offloaded: boolean
+  timedOut?: boolean
+}
+
+export interface SessionCompletionResult { // final snapshot of a session, as built by buildCompletionResult
+  status: 'done' | 'error' | 'killed' // a session still marked 'running' is reported as 'killed'
+  output: string // recent output, requested with the caller's previewChars
+  exitCode: number | null // null when the session has no exit code recorded
+  offloaded: boolean // result of hasPersistedOutput for the session
+  outputFilePath?: string
+  timedOut: boolean // set when the session was killed with reason 'timeout'
 }
 
+export type WaitForCompletionOrYieldResult =
+  | { kind: 'running'; sessionId: string } // still running when the yield window elapsed
+  | { kind: 'completed'; result: SessionCompletionResult } // no longer running; final result attached
+
 interface BackgroundSession {
   sessionId: string
   conversationId: string
@@ -54,6 +73,7 @@ interface BackgroundSession {
   resolveClose: () => void
   closeSettled: boolean
   killTimeoutId?: NodeJS.Timeout
+  timedOut: boolean
 }
 
 interface StartSessionResult {
@@ -67,6 +87,7 @@ interface PollResult {
   exitCode?: number
   offloaded?: boolean
   outputFilePath?: string
+  timedOut?: boolean
 }
 
 interface LogResult {
@@ -76,6 +97,7 @@ interface LogResult {
   exitCode?: number
   offloaded?: boolean
   outputFilePath?: string
+  timedOut?: boolean
 }
 
 export class BackgroundExecSessionManager {
@@ -93,6 +115,7 @@ export class BackgroundExecSessionManager {
     options?: {
       timeout?: number
       env?: Record<string, string>
+      outputPrefix?: string
     }
   ): Promise<StartSessionResult> {
     const config = getConfig()
@@ -105,7 +128,9 @@ export class BackgroundExecSessionManager {
       fs.mkdirSync(sessionDir, { recursive: true })
     }
 
-    const outputFilePath = sessionDir ? path.join(sessionDir, `bgexec_${sessionId}.log`) : null
+    const outputFilePath = sessionDir
+      ? this.createOutputFilePath(sessionDir, sessionId, options?.outputPrefix)
+      : null
 
     const child = spawn(shell, [...args, command], {
       cwd,
@@ -114,6 +139,7 @@ export class BackgroundExecSessionManager {
         ...shellEnv,
         ...options?.env
       },
+      detached: process.platform !== 'win32',
       stdio: ['pipe', 'pipe', 'pipe']
     })
 
@@ -140,7 +166,8 @@ export class BackgroundExecSessionManager {
       stderrEof: false,
       closePromise,
       resolveClose,
-      closeSettled: false
+      closeSettled: false,
+      timedOut: false
     }
 
     this.setupOutputHandling(session, config)
@@ -176,7 +203,8 @@ export class BackgroundExecSessionManager {
       pid: session.child.pid,
       exitCode: session.exitCode,
       outputLength: session.totalOutputLength,
-      offloaded: this.hasPersistedOutput(session, getConfig())
+      offloaded: this.hasPersistedOutput(session, getConfig()),
+      timedOut: session.timedOut
     }))
   }
 
@@ -195,7 +223,8 @@ export class BackgroundExecSessionManager {
         output,
         exitCode: session.exitCode,
         offloaded: true,
-        outputFilePath: session.outputFilePath
+        outputFilePath: session.outputFilePath,
+        timedOut: session.timedOut
       }
     }
 
@@ -204,7 +233,8 @@ export class BackgroundExecSessionManager {
       status: session.status,
       output,
       exitCode: session.exitCode,
-      offloaded: false
+      offloaded: false,
+      timedOut: session.timedOut
     }
   }
 
@@ -234,10 +264,65 @@ export class BackgroundExecSessionManager {
       totalLength: session.totalOutputLength,
       exitCode: session.exitCode,
       offloaded: isOffloaded,
-      outputFilePath: session.outputFilePath || undefined
+      outputFilePath: session.outputFilePath || undefined,
+      timedOut: session.timedOut
+    }
+  }
+
+  /**
+   * Waits for a session to finish, but no longer than the yield window.
+   *
+   * @param conversationId - Conversation that owns the session.
+   * @param sessionId - Session to wait on.
+   * @param yieldMs - Window in milliseconds (negative values count as 0); defaults to the
+   *   configured `backgroundMs`.
+   * @returns `completed` with the final result when the session is not running before or
+   *   at the end of the window, otherwise `running` with the same `sessionId`.
+   */
+  async waitForCompletionOrYield(
+    conversationId: string,
+    sessionId: string,
+    yieldMs = getConfig().backgroundMs
+  ): Promise<WaitForCompletionOrYieldResult> {
+    const session = this.getSession(conversationId, sessionId)
+    session.lastAccessedAt = Date.now()
+
+    const finished = async (): Promise<WaitForCompletionOrYieldResult> => ({
+      kind: 'completed',
+      result: await this.getCompletionResult(conversationId, sessionId)
+    })
+    if (session.status !== 'running') {
+      return finished()
+    }
+
+    // Race the session's close promise against the yield timer; the timer is always cleared.
+    let windowTimer: NodeJS.Timeout | null = null
+    const windowElapsed = new Promise((resolve) => {
+      windowTimer = setTimeout(resolve, Math.max(0, yieldMs))
+    })
+    try {
+      await Promise.race([session.closePromise, windowElapsed])
+    } finally {
+      if (windowTimer) clearTimeout(windowTimer)
+    }
+    if (session.status !== 'running') return finished()
+    return {
+      kind: 'running',
+      sessionId
     }
   }
 
+  async getCompletionResult( // Final result of a session: waits for the drain step, then snapshots it.
+    conversationId: string,
+    sessionId: string,
+    previewChars = FOREGROUND_PREVIEW_CHARS // forwarded to buildCompletionResult for the output preview
+  ): Promise<SessionCompletionResult> {
+    const session = this.getSession(conversationId, sessionId)
+    session.lastAccessedAt = Date.now() // record this access on the session
+    await this.waitForSessionDrain(session) // NOTE(review): presumably lets pending output settle first — confirm
+    return this.buildCompletionResult(session, previewChars)
+  }
+
   write(conversationId: string, sessionId: string, data: string, eof = false): void {
     const session = this.getSession(conversationId, sessionId)
 
@@ -446,31 +531,15 @@ export class BackgroundExecSessionManager {
       clearTimeout(session.killTimeoutId)
     }
 
-    const gracefulKill = new Promise<void>((resolve) => {
-      const timeout = setTimeout(() => {
-        resolve()
-      }, 2000)
-
-      session.child.once('close', () => {
-        clearTimeout(timeout)
-        resolve()
-      })
-
-      try {
-        session.child.kill('SIGTERM')
-      } catch {
-        resolve()
-      }
-    })
-
-    await gracefulKill
+    if (reason === 'timeout') {
+      session.timedOut = true
+    }
+    session.status = 'killed'
 
-    if (session.status === 'running') {
-      try {
-        session.child.kill('SIGKILL')
-      } catch (error) {
-        logger.warn(`[BackgroundExec] Failed to force kill session ${session.sessionId}:`, error)
-      }
+    const closed = await terminateProcessTree(session.child, { graceMs: 2000 })
+    if (!closed && !session.closeSettled) {
+      session.exitCode = undefined
+      await this.finalizeSession(session, null, 'SIGKILL')
     }
 
     await session.closePromise
@@ -682,6 +751,37 @@ export class BackgroundExecSessionManager {
     )
   }
 
+  /** Builds the completion snapshot; a status still `running` is reported as `killed`. */
+  private buildCompletionResult(
+    session: BackgroundSession,
+    previewChars: number
+  ): SessionCompletionResult {
+    const offloaded = this.hasPersistedOutput(session, getConfig())
+    const output =
+      offloaded && session.outputFilePath
+        ? this.getRecentOutputFromSession(session, previewChars)
+        : this.getRecentOutput(session.outputBuffer, previewChars)
+    const { status, exitCode, outputFilePath, timedOut } = session
+    return {
+      status: status === 'running' ? 'killed' : status,
+      output,
+      exitCode: exitCode ?? null,
+      offloaded,
+      outputFilePath: outputFilePath || undefined,
+      timedOut
+    }
+  }
+
+  // Path `<prefix>_<sessionId>.log`; empty prefix -> 'bgexec', chars outside [a-zA-Z0-9_-] -> '_'.
+  private createOutputFilePath(
+    sessionDir: string,
+    sessionId: string,
+    outputPrefix?: string
+  ): string {
+    const prefix = (outputPrefix?.trim() || 'bgexec').replace(/[^a-zA-Z0-9_-]/g, '_')
+    return path.join(sessionDir, `${prefix}_${sessionId}.log`)
+  }
+
   private resolveUtf8ByteRange(
     fd: number,
     fileSize: number,
diff --git a/src/main/lib/agentRuntime/processTree.ts b/src/main/lib/agentRuntime/processTree.ts
new file mode 100644
index 000000000..df9716041
--- /dev/null
+++ b/src/main/lib/agentRuntime/processTree.ts
@@ -0,0 +1,165 @@
+import { spawn, type ChildProcess } from 'child_process'
+
+const FORCE_KILL_SETTLE_MS = 500
+
+// True once Node has recorded either an exit code or a terminating signal for the child.
+const hasExited = (child: ChildProcess): boolean =>
+  !(child.exitCode === null && child.signalCode === null)
+
+/**
+ * Waits for the child's `close` event, giving up after `timeoutMs`.
+ *
+ * @param child - Process to observe.
+ * @param timeoutMs - Maximum time to wait, in milliseconds.
+ * @returns `true` when the child had already exited or emitted `close` in time, `false` when
+ *   the timer elapsed first.
+ */
+function waitForClose(child: ChildProcess, timeoutMs: number): Promise<boolean> {
+  if (hasExited(child)) {
+    return Promise.resolve(true)
+  }
+
+  return new Promise((resolve) => {
+    let finished = false
+    let timer: NodeJS.Timeout | null = null
+
+    // Settles at most once and detaches both the listener and the timer.
+    const finish = (closedInTime: boolean) => {
+      if (finished) return
+      finished = true
+      child.removeListener('close', handleClose)
+      if (timer) {
+        clearTimeout(timer)
+        timer = null
+      }
+      resolve(closedInTime)
+    }
+    const handleClose = () => finish(true)
+    child.once('close', handleClose)
+    timer = setTimeout(() => finish(false), timeoutMs)
+  })
+}
+
+/** Runs a helper command with stdio ignored; resolves on `close`, `error`, or a spawn throw. */
+function spawnAndWait(command: string, args: string[]): Promise<void> {
+  return new Promise<void>((done) => {
+    const finish = (): void => done()
+    try {
+      spawn(command, args, { stdio: 'ignore' }).on('error', finish).on('close', finish)
+    } catch {
+      finish()
+    }
+  })
+}
+
+/**
+ * Runs a helper command and resolves with its stdout text; spawn failures resolve with ''.
+ */
+function spawnAndCapture(command: string, args: string[]): Promise<string> {
+  return new Promise<string>((done) => {
+    const pieces: string[] = []
+    try {
+      const proc = spawn(command, args, { stdio: ['ignore', 'pipe', 'ignore'] })
+      proc.stdout?.on('data', (chunk: Buffer | string) => pieces.push(chunk.toString()))
+      proc.on('error', () => done(''))
+      proc.on('close', () => done(pieces.join('')))
+    } catch {
+      done('')
+    }
+  })
+}
+
+/** Lists the direct children of `pid` as reported by `pgrep -P`, one PID per output line. */
+async function listChildPids(pid: number): Promise<number[]> {
+  const lines = (await spawnAndCapture('pgrep', ['-P', `${pid}`])).split(/\r?\n/)
+  const parsed = lines.map((line) => Number.parseInt(line.trim(), 10))
+  // Blank lines parse to NaN and are dropped together with non-positive values.
+  return parsed.filter((value) => Number.isInteger(value) && value > 0)
+}
+
+/**
+ * Walks the process tree below `pid` and returns every descendant PID found.
+ *
+ * Children are looked up with `listChildPids`; each PID is recorded once, in discovery
+ * order, and then queued so its own children are visited too. `pid` is not seeded into it.
+ */
+async function collectDescendantPids(pid: number): Promise<number[]> {
+  const found: number[] = []
+  const visited = new Set<number>()
+  const stack: number[] = [pid]
+
+  while (stack.length > 0) {
+    const parentPid = stack.pop()
+    if (!parentPid) continue
+
+    for (const childPid of await listChildPids(parentPid)) {
+      if (visited.has(childPid)) continue
+      visited.add(childPid)
+      found.push(childPid)
+      stack.push(childPid)
+    }
+  }
+
+  return found
+}
+
+/** Sends `childSignal` via `kill` to every descendant of `pid`, last-discovered first. */
+async function signalDescendantsRecursively(
+  pid: number,
+  childSignal: '-TERM' | '-KILL'
+): Promise<void> {
+  for (const target of (await collectDescendantPids(pid)).reverse()) {
+    await spawnAndWait('kill', [childSignal, `${target}`])
+  }
+}
+
+// Delivers `signal` to `pid` and its descendants.
+// Windows: runs `taskkill /PID <pid> /T /F`; `signal` is not consulted on that path.
+// Elsewhere: signals the negative PID; if that throws, each descendant, then `pid` itself.
+async function signalProcessTree(pid: number, signal: 'SIGTERM' | 'SIGKILL'): Promise<void> {
+  if (process.platform === 'win32') {
+    return spawnAndWait('taskkill', ['/PID', `${pid}`, '/T', '/F'])
+  }
+  try {
+    process.kill(-pid, signal)
+    return
+  } catch {
+    await signalDescendantsRecursively(pid, signal === 'SIGKILL' ? '-KILL' : '-TERM')
+  }
+  try {
+    process.kill(pid, signal)
+  } catch {
+    // Process may have already exited.
+  }
+}
+
+/**
+ * Stops `child` and its descendants: SIGTERM first, SIGKILL if it has not closed in time.
+ *
+ * @param child - Process to terminate.
+ * @param options - `graceMs`: wait after SIGTERM in milliseconds (default 2000, floored at 0).
+ * @returns `true` if the child had already exited or closed within the waits, else `false`.
+ */
+export async function terminateProcessTree(
+  child: ChildProcess,
+  options: {
+    graceMs?: number
+  } = {}
+): Promise<boolean> {
+  if (hasExited(child)) return true
+
+  const termWaitMs = Math.max(0, options.graceMs ?? 2000)
+  const { pid } = child
+  if (pid) {
+    await signalProcessTree(pid, 'SIGTERM')
+    if (await waitForClose(child, termWaitMs)) return true
+    await signalProcessTree(pid, 'SIGKILL')
+    return waitForClose(child, FORCE_KILL_SETTLE_MS)
+  }
+  try {
+    child.kill('SIGTERM') // No PID to address a tree with; signal the handle directly.
+  } catch {
+    // Ignore missing pid failures.
+  }
+  return waitForClose(child, termWaitMs)
+}
diff --git a/src/main/lib/agentRuntime/systemEnvPromptBuilder.ts b/src/main/lib/agentRuntime/systemEnvPromptBuilder.ts
index 8d27af6ce..1579b1196 100644
--- a/src/main/lib/agentRuntime/systemEnvPromptBuilder.ts
+++ b/src/main/lib/agentRuntime/systemEnvPromptBuilder.ts
@@ -105,7 +105,9 @@ export function buildRuntimeCapabilitiesPrompt(
     lines.push('- YoBrowser tools are available for browser automation when needed.')
   }
   if (options.hasExec) {
-    lines.push('- Use exec(background: true) to start long-running terminal commands.')
+    lines.push(
+      '- Use exec(background: true) to explicitly detach long-running terminal commands; foreground exec may also return a running session after its yield window.'
+    )
   }
   if (options.hasProcess) {
     lines.push(
diff --git a/src/main/presenter/agentPresenter/acp/agentBashHandler.ts b/src/main/presenter/agentPresenter/acp/agentBashHandler.ts
index 883306cee..22c37b210 100644
--- a/src/main/presenter/agentPresenter/acp/agentBashHandler.ts
+++ b/src/main/presenter/agentPresenter/acp/agentBashHandler.ts
@@ -5,6 +5,8 @@ import os from 'os'
 import { z } from 'zod'
 import logger from '@shared/logger'
 import type { IConfigPresenter } from '@shared/presenter'
+import { getBackgroundExecConfig } from '@/lib/agentRuntime/backgroundExecSessionManager'
+import { terminateProcessTree } from '@/lib/agentRuntime/processTree'
 import { rtkRuntimeService } from '@/lib/agentRuntime/rtkRuntimeService'
 
 // Consider moving to a shared handlers location in future refactoring
@@ -47,6 +49,22 @@ interface PreparedCommand {
   rtkFallbackReason?: string
 }
 
+interface CompletedShellProcessResult { // a foreground command whose result is final
+  kind: 'completed'
+  output: string // output preview text
+  exitCode: number | null // null when no exit code is available
+  timedOut: boolean
+  offloaded: boolean // output was offloaded to a file (see outputFilePath)
+  outputFilePath?: string
+}
+
+interface RunningShellProcessResult { // command still running after the foreground yield window
+  kind: 'running'
+  sessionId: string // background session that keeps running the command
+}
+
+type ShellProcessResult = CompletedShellProcessResult | RunningShellProcessResult // discriminated by `kind`
+
 export class AgentBashHandler {
   private allowedDirectories: string[]
   private readonly commandPermissionHandler?: CommandPermissionService
@@ -81,7 +99,7 @@ export class AgentBashHandler {
       throw new Error(`Invalid arguments: ${parsed.error}`)
     }
 
-    const { command, timeout, background, cwd: requestedCwd } = parsed.data
+    const { command, timeout, background, cwd: requestedCwd, yieldMs } = parsed.data
     const cwd = this.resolveWorkingDirectory(requestedCwd)
 
     // Handle background execution
@@ -111,13 +129,7 @@ export class AgentBashHandler {
       }
     }
 
-    let result: {
-      output: string
-      exitCode: number | null
-      timedOut: boolean
-      offloaded: boolean
-      outputFilePath?: string
-    }
+    let result: ShellProcessResult
 
     const prepared = await this.prepareCommand(command, options.env)
 
@@ -127,10 +139,20 @@ export class AgentBashHandler {
       timeout ?? COMMAND_DEFAULT_TIMEOUT_MS,
       {
         ...options,
-        env: prepared.env
+        env: prepared.env,
+        yieldMs
       }
     )
 
+    if (result.kind === 'running') {
+      return {
+        output: { status: 'running', sessionId: result.sessionId },
+        rtkApplied: prepared.rtkApplied,
+        rtkMode: prepared.rtkMode,
+        rtkFallbackReason: prepared.rtkFallbackReason
+      }
+    }
+
     const fallbackReason = this.getRtkCapabilityFallbackReason(result.output)
     if (
       prepared.rewritten &&
@@ -155,28 +177,27 @@ export class AgentBashHandler {
         timeout ?? COMMAND_DEFAULT_TIMEOUT_MS,
         {
           ...options,
-          env: prepared.env
+          env: prepared.env,
+          yieldMs
         }
       )
 
       prepared.rtkApplied = false
       prepared.rtkMode = 'bypass'
       prepared.rtkFallbackReason = fallbackReason
-    }
 
-    const responseLines: string[] = []
-    if (result.output) {
-      responseLines.push(result.output.trimEnd())
-    }
-    responseLines.push(`Exit Code: ${result.exitCode ?? 'null'}`)
-    if (result.timedOut) {
-      responseLines.push('Timed out')
-    }
-    if (result.offloaded && result.outputFilePath) {
-      responseLines.push(`Output offloaded: ${result.outputFilePath}`)
+      if (result.kind === 'running') {
+        return {
+          output: { status: 'running', sessionId: result.sessionId },
+          rtkApplied: prepared.rtkApplied,
+          rtkMode: prepared.rtkMode,
+          rtkFallbackReason: prepared.rtkFallbackReason
+        }
+      }
     }
+
     return {
-      output: responseLines.join('\n'),
+      output: this.formatCompletedResult(result),
       rtkApplied: prepared.rtkApplied,
       rtkMode: prepared.rtkMode,
       rtkFallbackReason: prepared.rtkFallbackReason
@@ -228,17 +249,79 @@ export class AgentBashHandler {
   }
 
   private async runShellProcess(
+    command: string,
+    cwd: string,
+    timeout: number,
+    options: ExecuteCommandOptions & { yieldMs?: number }
+  ): Promise<ShellProcessResult> {
+    if (options.conversationId) {
+      return await this.runManagedShellProcess(command, cwd, timeout, options)
+    }
+
+    return await this.runDetachedShellProcess(command, cwd, timeout, options)
+  }
+
+  /**
+   * Runs a foreground command through the background session manager so that a command
+   * outliving the yield window can keep running as a session.
+   *
+   * Stdin is written (empty when none was supplied) with `eof` set right after start. A
+   * session that completes in time is removed here unless its output was offloaded;
+   * removal failures are logged and do not affect the returned result.
+   *
+   * @param command - Shell command to start.
+   * @param timeout - Timeout forwarded to the session manager's `start`.
+   * @param options - `conversationId` is required; `yieldMs` overrides `backgroundMs`.
+   * @returns `running` plus the session ID after the window, else the completed result.
+   * @throws Error when `options.conversationId` is missing.
+   */
+  private async runManagedShellProcess(
+    command: string,
+    cwd: string,
+    timeout: number,
+    options: ExecuteCommandOptions & { yieldMs?: number }
+  ): Promise<ShellProcessResult> {
+    const { conversationId, env, outputPrefix, stdin, yieldMs } = options
+    if (!conversationId) {
+      throw new Error('Managed shell process requires a conversation ID')
+    }
+
+    const manager = backgroundExecSessionManager
+    const { sessionId } = await manager.start(conversationId, command, cwd, {
+      timeout,
+      env,
+      outputPrefix
+    })
+    manager.write(conversationId, sessionId, stdin ?? '', true)
+
+    const outcome = await manager.waitForCompletionOrYield(
+      conversationId,
+      sessionId,
+      yieldMs ?? getBackgroundExecConfig().backgroundMs
+    )
+    if (outcome.kind === 'running') {
+      return outcome
+    }
+
+    const { output, exitCode, timedOut, offloaded, outputFilePath } = outcome.result
+    if (!offloaded) {
+      await manager.remove(conversationId, sessionId).catch((error) => {
+        logger.warn('[AgentBashHandler] Failed to cleanup completed foreground exec session', {
+          conversationId,
+          sessionId,
+          error
+        })
+      })
+    }
+    return { kind: 'completed', output, exitCode, timedOut, offloaded, outputFilePath }
+  }
+
+  private async runDetachedShellProcess(
     command: string,
     cwd: string,
     timeout: number,
     options: ExecuteCommandOptions
-  ): Promise<{
-    output: string
-    exitCode: number | null
-    timedOut: boolean
-    offloaded: boolean
-    outputFilePath?: string
-  }> {
+  ): Promise<CompletedShellProcessResult> {
     const { shell, args } = getUserShell()
     const shellEnv = await getShellEnvironment()
     const outputFilePath = this.createOutputFilePath(options.conversationId, options.outputPrefix)
@@ -251,17 +334,38 @@ export class AgentBashHandler {
           ...shellEnv,
           ...options.env
         },
+        detached: process.platform !== 'win32',
         stdio: ['pipe', 'pipe', 'pipe']
       })
 
+      let settled = false
       let output = ''
       let totalOutputLength = 0
       let offloaded = false
       let timedOut = false
-      let exitCode: number | null = null
       let outputWriteQueue = Promise.resolve()
       let timeoutId: NodeJS.Timeout | null = null
-      let killTimeoutId: NodeJS.Timeout | null = null
+
+      const cleanupTimeout = () => { // cancels the pending command-timeout timer, if one is set
+        if (timeoutId) {
+          clearTimeout(timeoutId)
+          timeoutId = null
+        }
+      }
+
+      // Resolves once. The offloaded preview is re-read after queued writes flush, because
+      // callers capture `output` before the flush and could otherwise miss the final chunks.
+      const settle = async (payload: CompletedShellProcessResult) => {
+        if (settled) return
+        settled = true
+        cleanupTimeout()
+        await outputWriteQueue.catch(() => undefined) // Already logged when flushing output.
+        const filePath = payload.offloaded ? payload.outputFilePath : undefined
+        const finalOutput = filePath
+          ? this.readLastCharsFromFile(filePath, COMMAND_PREVIEW_CHARS)
+          : payload.output
+        resolve({ ...payload, output: finalOutput })
+      }
 
       const appendOutput = (chunk: string) => {
         totalOutputLength += chunk.length
@@ -308,50 +412,42 @@ export class AgentBashHandler {
 
       timeoutId = setTimeout(() => {
         timedOut = true
-        try {
-          child.kill('SIGTERM')
-        } catch {
-          // ignore kill errors
-        }
-        killTimeoutId = setTimeout(() => {
-          try {
-            child.kill('SIGKILL')
-          } catch {
-            // ignore kill errors
+        void terminateProcessTree(child, { graceMs: COMMAND_KILL_GRACE_MS }).then((closed) => {
+          if (closed || settled) {
+            return
           }
-        }, COMMAND_KILL_GRACE_MS)
+
+          const preview =
+            offloaded && outputFilePath
+              ? this.readLastCharsFromFile(outputFilePath, COMMAND_PREVIEW_CHARS)
+              : output
+
+          void settle({
+            kind: 'completed',
+            output: preview,
+            exitCode: null,
+            timedOut: true,
+            offloaded,
+            outputFilePath: outputFilePath ?? undefined
+          })
+        })
       }, timeout)
 
       child.on('error', (error) => {
-        if (timeoutId) clearTimeout(timeoutId)
-        if (killTimeoutId) clearTimeout(killTimeoutId)
+        cleanupTimeout()
         reject(error)
       })
 
       child.on('close', async (code, signal) => {
-        if (timeoutId) clearTimeout(timeoutId)
-        if (killTimeoutId) clearTimeout(killTimeoutId)
-
-        try {
-          await outputWriteQueue
-        } catch {
-          // Already logged when flushing output.
-        }
-
-        if (signal && timedOut) {
-          exitCode = null
-        } else {
-          exitCode = code ?? null
-        }
-
         const preview =
           offloaded && outputFilePath
             ? this.readLastCharsFromFile(outputFilePath, COMMAND_PREVIEW_CHARS)
             : output
 
-        resolve({
+        void settle({
+          kind: 'completed',
           output: preview,
-          exitCode,
+          exitCode: signal && timedOut ? null : (code ?? null),
           timedOut,
           offloaded,
           outputFilePath: outputFilePath ?? undefined
@@ -360,6 +456,21 @@ export class AgentBashHandler {
     })
   }
 
+  /**
+   * Renders a completed result as newline-joined text: right-trimmed output (when non-empty),
+   * `Exit Code: <code|null>`, `Timed out` if applicable, and the offload path if one exists.
+   */
+  private formatCompletedResult(result: CompletedShellProcessResult): string {
+    const { output, exitCode, timedOut, offloaded, outputFilePath } = result
+    const parts: Array<string | null> = [
+      output ? output.trimEnd() : null,
+      `Exit Code: ${exitCode ?? 'null'}`,
+      timedOut ? 'Timed out' : null,
+      offloaded && outputFilePath ? `Output offloaded: ${outputFilePath}` : null
+    ]
+    return parts.filter((part): part is string => part !== null).join('\n')
+  }
+
   private createOutputFilePath(
     conversationId?: string,
     outputPrefix: string = 'exec'
@@ -458,9 +569,14 @@ export class AgentBashHandler {
 
     const result = await backgroundExecSessionManager.start(conversationId, prepared.command, cwd, {
       timeout: timeout ?? COMMAND_DEFAULT_TIMEOUT_MS,
-      env: prepared.env
+      env: prepared.env,
+      outputPrefix: options.outputPrefix
     })
 
+    if (options.stdin !== undefined) {
+      backgroundExecSessionManager.write(conversationId, result.sessionId, options.stdin, true)
+    }
+
     return {
       output: { status: 'running', sessionId: result.sessionId },
       rtkApplied: prepared.rtkApplied,
diff --git a/src/main/presenter/agentPresenter/acp/agentToolManager.ts b/src/main/presenter/agentPresenter/acp/agentToolManager.ts
index ee2b20704..082dbfb14 100644
--- a/src/main/presenter/agentPresenter/acp/agentToolManager.ts
+++ b/src/main/presenter/agentPresenter/acp/agentToolManager.ts
@@ -178,7 +178,7 @@ export class AgentToolManager {
         .min(100)
         .optional()
         .describe(
-          'Maximum time in milliseconds to wait for command output in foreground mode (default 120s). Ignored when background is true.'
+          'Foreground grace window in milliseconds before auto-backgrounding the command and returning a sessionId (defaults to PI_BASH_YIELD_MS or 10000). Ignored when background is true.'
         )
     }),
     process: z.object({
@@ -487,7 +487,7 @@ export class AgentToolManager {
         function: {
           name: 'exec',
           description:
-            'Execute a shell command in the workspace directory. For long-running commands (builds, tests, servers, installations), use background: true to run asynchronously and get a session ID. Then use the process tool to poll output, send input, or manage the session.',
+            'Execute a shell command in the workspace directory. Use background: true when you know the command should detach immediately. Otherwise foreground exec waits briefly, and long-running commands may auto-background and return a session ID for use with the process tool.',
           parameters: zodToJsonSchema(schemas.exec) as {
             type: string
             properties: Record<string, unknown>
@@ -505,7 +505,7 @@ export class AgentToolManager {
         function: {
           name: 'process',
           description:
-            'Manage background exec sessions created by exec with background: true. Use poll to check output and status, log to get full output with pagination, write to send input to stdin, kill to terminate, and remove to clean up completed sessions.',
+            'Manage background exec sessions created by explicit background exec calls or by long-running foreground exec calls that yielded a sessionId. Use poll to check output and status, log to get full output with pagination, write to send input to stdin, kill to terminate, and remove to clean up completed sessions.',
           parameters: zodToJsonSchema(schemas.process) as {
             type: string
             properties: Record<string, unknown>
diff --git a/src/main/presenter/deepchatAgentPresenter/contextBuilder.ts b/src/main/presenter/deepchatAgentPresenter/contextBuilder.ts
index c75b7a651..e5ffce3f0 100644
--- a/src/main/presenter/deepchatAgentPresenter/contextBuilder.ts
+++ b/src/main/presenter/deepchatAgentPresenter/contextBuilder.ts
@@ -17,6 +17,11 @@ export type ContextBuildOptions = {
   fallbackProtectedTurnCount?: number
 }
 
+type TokenizedTurn = { // minimal turn shape accepted by flattenTurns and selectTurnHistory
+  messages: ChatMessage[] // messages that belong to the turn, in order
+  tokens: number // token estimate for `messages` (estimateMessagesTokens in buildChatMessageTurns)
+}
+
 export type HistoryTurn = {
   records: ChatMessageRecord[]
   messages: ChatMessage[]
@@ -314,10 +319,39 @@ export function buildHistoryTurns(
   })
 }
 
-function flattenTurns(turns: HistoryTurn[]): ChatMessage[] {
+function flattenTurns(turns: TokenizedTurn[]): ChatMessage[] { // concatenates each turn's messages, in turn order
   return turns.flatMap((turn) => turn.messages)
 }
 
+/**
+ * Groups a flat message list into turns and attaches a token estimate to each turn.
+ *
+ * A turn is opened by the first message and by every later `user` message; all other
+ * messages are appended to the turn that is currently open. Messages that precede the
+ * first `user` message therefore form a leading turn of their own.
+ *
+ * @param messages - Messages in conversation order.
+ * @returns One entry per turn, with `tokens` taken from `estimateMessagesTokens`.
+ */
+function buildChatMessageTurns(messages: ChatMessage[]): TokenizedTurn[] {
+  const grouped = messages.reduce<ChatMessage[][]>((turns, message) => {
+    // `openTurn` is undefined only for the very first message.
+    const openTurn = turns[turns.length - 1]
+    if (openTurn === undefined || message.role === 'user') {
+      turns.push([message])
+    } else {
+      openTurn.push(message)
+    }
+    return turns
+  }, [])
+
+  // Token counts are estimated once per turn.
+  return grouped.map((turnMessages) => ({
+    messages: turnMessages,
+    tokens: estimateMessagesTokens(turnMessages)
+  }))
+}
+
 /**
  * Emergency fallback that drops full turns first and only then falls back to
  * message-level truncation to keep the prompt valid.
@@ -355,7 +389,7 @@ export function truncateContext(history: ChatMessage[], availableTokens: number)
 }
 
 function selectTurnHistory(
-  turns: HistoryTurn[],
+  turns: TokenizedTurn[],
   availableTokens: number,
   fallbackProtectedTurnCount: number
 ): ChatMessage[] {
@@ -427,6 +461,47 @@ export function buildContext(
   return messages
 }
 
+export function fitMessagesToContextWindow(
+  messages: ChatMessage[],
+  contextLength: number,
+  reserveTokens: number,
+  protectedTailCount: number = 0
+): ChatMessage[] {
+  if (messages.length === 0) {
+    return []
+  }
+  // A leading system message and the last protectedTailCount messages are always kept.
+  const leadingSystemMessage = messages[0]?.role === 'system' ? messages[0] : null
+  const conversationMessages = leadingSystemMessage ? messages.slice(1) : [...messages]
+  const clampedProtectedTailCount = Math.max(
+    0,
+    Math.min(protectedTailCount, conversationMessages.length)
+  )
+  const protectedTail = // The > 0 guard matters: slice(-0) would return the whole array.
+    clampedProtectedTailCount > 0 ? conversationMessages.slice(-clampedProtectedTailCount) : []
+  const historyPrefix =
+    clampedProtectedTailCount > 0
+      ? conversationMessages.slice(0, -clampedProtectedTailCount)
+      : conversationMessages
+  // Budget left for older history after the system message, protected tail and reserve.
+  const systemTokens = leadingSystemMessage ? estimateMessagesTokens([leadingSystemMessage]) : 0
+  const protectedTailTokens = protectedTail.length > 0 ? estimateMessagesTokens(protectedTail) : 0
+  const availableHistoryTokens = contextLength - systemTokens - protectedTailTokens - reserveTokens
+  const selectedHistory = selectTurnHistory(
+    buildChatMessageTurns(historyPrefix),
+    availableHistoryTokens,
+    0
+  )
+  // Reassemble in original order: system message, selected history, protected tail.
+  const result: ChatMessage[] = []
+  if (leadingSystemMessage) {
+    result.push(leadingSystemMessage)
+  }
+  result.push(...selectedHistory)
+  result.push(...protectedTail)
+  return result
+}
+
 export function buildResumeContext(
   sessionId: string,
   assistantMessageId: string,
diff --git a/src/main/presenter/deepchatAgentPresenter/index.ts b/src/main/presenter/deepchatAgentPresenter/index.ts
index 903adc205..21e1fd233 100644
--- a/src/main/presenter/deepchatAgentPresenter/index.ts
+++ b/src/main/presenter/deepchatAgentPresenter/index.ts
@@ -4,6 +4,7 @@ import type {
   DeepChatSessionState,
   IAgentImplementation,
   MessageFile,
+  PendingSessionInputRecord,
   PermissionMode,
   SendMessageInput,
   SessionCompactionState,
@@ -18,6 +19,12 @@ import type { IConfigPresenter, ILlmProviderPresenter, ModelConfig } from '@shar
 import type { MCPToolDefinition } from '@shared/types/core/mcp'
 import type { IToolPresenter } from '@shared/types/presenters/tool.presenter'
 import type { ReasoningPortrait } from '@shared/types/model-db'
+import {
+  normalizeLegacyThinkingBudgetValue,
+  parseFiniteNumericValue,
+  toValidNonNegativeInteger,
+  validateGenerationNumericField
+} from '@shared/utils/generationSettingsValidation'
 import { nanoid } from 'nanoid'
 import type { SQLitePresenter } from '../sqlitePresenter'
 import { eventBus, SendTarget } from '@/eventbus'
@@ -27,10 +34,17 @@ import {
   buildSystemEnvPrompt
 } from '@/lib/agentRuntime/systemEnvPromptBuilder'
 import { presenter } from '@/presenter'
-import { buildContext, buildResumeContext } from './contextBuilder'
+import {
+  buildContext,
+  buildResumeContext,
+  createUserChatMessage,
+  fitMessagesToContextWindow
+} from './contextBuilder'
 import { appendSummarySection, CompactionService, type CompactionIntent } from './compactionService'
 import { buildPersistableMessageTracePayload } from './messageTracePayload'
 import { DeepChatMessageStore } from './messageStore'
+import { PendingInputCoordinator } from './pendingInputCoordinator'
+import { DeepChatPendingInputStore } from './pendingInputStore'
 import { processStream } from './process'
 import { DeepChatSessionStore, type SessionSummaryState } from './sessionStore'
 import type { PendingToolInteraction, ProcessResult } from './types'
@@ -79,11 +93,6 @@ type SystemPromptCacheEntry = {
   fingerprint: string
 }
 
-const TEMPERATURE_MIN = 0
-const TEMPERATURE_MAX = 2
-const CONTEXT_LENGTH_MIN = 2048
-const MAX_TOKENS_MIN = 128
-
 const isReasoningEffort = (value: unknown): value is 'minimal' | 'low' | 'medium' | 'high' =>
   value === 'minimal' || value === 'low' || value === 'medium' || value === 'high'
 
@@ -97,6 +106,8 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
   private readonly toolPresenter: IToolPresenter | null
   private readonly sessionStore: DeepChatSessionStore
   private readonly messageStore: DeepChatMessageStore
+  private readonly pendingInputStore: DeepChatPendingInputStore
+  private readonly pendingInputCoordinator: PendingInputCoordinator
   private readonly runtimeState: Map<string, DeepChatSessionState> = new Map()
   private readonly sessionGenerationSettings: Map<string, SessionGenerationSettings> = new Map()
   private readonly abortControllers: Map<string, AbortController> = new Map()
@@ -106,6 +117,7 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
   private readonly sessionCompactionStates: Map<string, SessionCompactionState> = new Map()
   private readonly interactionLocks: Set<string> = new Set()
   private readonly resumingMessages: Set<string> = new Set()
+  private readonly drainingPendingQueues: Set<string> = new Set()
   private readonly compactionService: CompactionService
   private readonly toolOutputGuard: ToolOutputGuard
   private readonly hooksBridge?: NewSessionHooksBridge
@@ -123,6 +135,8 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     this.toolPresenter = toolPresenter ?? null
     this.sessionStore = new DeepChatSessionStore(sqlitePresenter)
     this.messageStore = new DeepChatMessageStore(sqlitePresenter)
+    this.pendingInputStore = new DeepChatPendingInputStore(sqlitePresenter)
+    this.pendingInputCoordinator = new PendingInputCoordinator(this.pendingInputStore)
     this.compactionService = new CompactionService(
       this.sessionStore,
       this.messageStore,
@@ -136,6 +150,13 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     if (recovered > 0) {
       console.log(`DeepChatAgent: recovered ${recovered} pending messages to error status`)
     }
+
+    const recoveredPendingInputs = this.pendingInputCoordinator.recoverClaimedInputsAfterRestart()
+    if (recoveredPendingInputs > 0) {
+      console.log(
+        `DeepChatAgent: recovered ${recoveredPendingInputs} sessions with claimed pending inputs`
+      )
+    }
   }
 
   async initSession(
@@ -190,6 +211,7 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
       this.abortControllers.delete(sessionId)
     }
 
+    this.pendingInputCoordinator.deleteBySession(sessionId)
     this.messageStore.deleteBySession(sessionId)
     this.sessionStore.delete(sessionId)
     this.runtimeState.delete(sessionId)
@@ -198,6 +220,7 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     this.sessionProjectDirs.delete(sessionId)
     this.systemPromptCache.delete(sessionId)
     this.sessionCompactionStates.delete(sessionId)
+    this.drainingPendingQueues.delete(sessionId)
   }
 
   async getSessionState(sessionId: string): Promise<DeepChatSessionState | null> {
@@ -226,10 +249,84 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     return { ...rebuilt }
   }
 
+  async listPendingInputs(sessionId: string): Promise<PendingSessionInputRecord[]> {
+    return this.pendingInputCoordinator.listPendingInputs(sessionId) // coordinator reads the store
+  }
+
+  async queuePendingInput(
+    sessionId: string,
+    content: string | SendMessageInput
+  ): Promise<PendingSessionInputRecord> {
+    const state = await this.getSessionState(sessionId)
+    if (!state) {
+      throw new Error(`Session ${sessionId} not found`)
+    }
+    // Queue the input; if a tool question awaits its follow-up, claim and process it right away.
+    const record = this.pendingInputCoordinator.queuePendingInput(sessionId, content)
+    if (this.isAwaitingToolQuestionFollowUp(sessionId)) {
+      const claimedFollowUp = this.pendingInputCoordinator.claimQueuedInput(sessionId, record.id)
+      void this.processMessage(sessionId, claimedFollowUp.payload, {
+        projectDir: this.resolveProjectDir(sessionId),
+        pendingQueueItemId: claimedFollowUp.id
+      })
+      return claimedFollowUp
+    }
+    // Otherwise kick off a drain attempt without awaiting it and return the queued record.
+    void this.drainPendingQueueIfPossible(sessionId, 'enqueue')
+    return record
+  }
+
+  async updateQueuedInput(
+    sessionId: string,
+    itemId: string,
+    content: string | SendMessageInput
+  ): Promise<PendingSessionInputRecord> {
+    await this.ensureSessionReadyForPendingInputMutation(sessionId) // throws if session is unknown
+    return this.pendingInputCoordinator.updateQueuedInput(sessionId, itemId, content)
+  }
+
+  async moveQueuedInput(
+    sessionId: string,
+    itemId: string,
+    toIndex: number
+  ): Promise<PendingSessionInputRecord[]> {
+    await this.ensureSessionReadyForPendingInputMutation(sessionId) // throws if session is unknown
+    return this.pendingInputCoordinator.moveQueuedInput(sessionId, itemId, toIndex)
+  }
+
+  async convertPendingInputToSteer(
+    sessionId: string,
+    itemId: string
+  ): Promise<PendingSessionInputRecord> {
+    await this.ensureSessionReadyForPendingInputMutation(sessionId) // throws if session is unknown
+    return this.pendingInputCoordinator.convertPendingInputToSteer(sessionId, itemId)
+  }
+
+  async deletePendingInput(sessionId: string, itemId: string): Promise<void> {
+    await this.ensureSessionReadyForPendingInputMutation(sessionId) // throws if session is unknown
+    this.pendingInputCoordinator.deletePendingInput(sessionId, itemId)
+  }
+
+  async resumePendingQueue(sessionId: string): Promise<void> {
+    const state = await this.getSessionState(sessionId)
+    if (!state) {
+      throw new Error(`Session ${sessionId} not found`)
+    }
+    if (this.isAwaitingToolQuestionFollowUp(sessionId)) { // nothing is drained in that state
+      return
+    }
+    // Fire-and-forget: this method resolves without waiting for the drain to finish.
+    void this.drainPendingQueueIfPossible(sessionId, 'resume')
+  }
+
   async processMessage(
     sessionId: string,
     content: string | SendMessageInput,
-    context?: { projectDir?: string | null; emitRefreshBeforeStream?: boolean }
+    context?: {
+      projectDir?: string | null
+      emitRefreshBeforeStream?: boolean
+      pendingQueueItemId?: string
+    }
   ): Promise<void> {
     const state = this.runtimeState.get(sessionId)
     if (!state) throw new Error(`Session ${sessionId} not found`)
@@ -245,6 +342,7 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     )
 
     this.setSessionStatus(sessionId, 'generating')
+    let consumedPendingQueueItem = false
 
     try {
       const generationSettings = await this.getEffectiveSessionGenerationSettings(sessionId)
@@ -340,6 +438,11 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
         assistantOrderSeq
       )
 
+      if (context?.pendingQueueItemId) {
+        this.pendingInputCoordinator.consumeQueuedInput(sessionId, context.pendingQueueItemId)
+        consumedPendingQueueItem = true
+      }
+
       if (context?.emitRefreshBeforeStream) {
         this.emitMessageRefresh(sessionId, assistantMessageId || userMessageId)
       }
@@ -353,8 +456,21 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
         tools
       })
       this.applyProcessResultStatus(sessionId, result)
+      if (result?.status === 'completed') {
+        void this.drainPendingQueueIfPossible(sessionId, 'completed')
+      }
     } catch (err) {
       console.error('[DeepChatAgent] processMessage error:', err)
+      if (context?.pendingQueueItemId && !consumedPendingQueueItem) {
+        try {
+          this.pendingInputCoordinator.releaseClaimedQueueInput(
+            sessionId,
+            context.pendingQueueItemId
+          )
+        } catch (releaseError) {
+          console.warn('[DeepChatAgent] failed to release claimed queue input:', releaseError)
+        }
+      }
       const errorMessage = err instanceof Error ? err.message : String(err)
       this.dispatchHook('Stop', {
         sessionId,
@@ -884,6 +1000,7 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     }
 
     await this.cancelGeneration(sessionId)
+    this.pendingInputCoordinator.deleteBySession(sessionId)
     this.messageStore.deleteBySession(sessionId)
     this.resetSummaryState(sessionId)
     this.setSessionStatus(sessionId, 'idle')
@@ -900,6 +1017,7 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     if (this.hasPendingInteractions(sessionId)) {
       throw new Error('Please resolve pending tool interactions before retrying.')
     }
+    this.assertNoActivePendingInputs(sessionId)
 
     const target = await this.messageStore.getMessage(messageId)
     if (!target) {
@@ -931,6 +1049,7 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
   }
 
   async deleteMessage(sessionId: string, messageId: string): Promise<void> {
+    this.assertNoActivePendingInputs(sessionId)
     const target = await this.messageStore.getMessage(messageId)
     if (!target) {
       throw new Error(`Message ${messageId} not found`)
@@ -950,6 +1069,7 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     messageId: string,
     text: string
   ): Promise<ChatMessageRecord> {
+    this.assertNoActivePendingInputs(sessionId)
     const target = await this.messageStore.getMessage(messageId)
     if (!target) {
       throw new Error(`Message ${messageId} not found`)
@@ -1045,6 +1165,9 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     }
 
     const traceEnabled = this.configPresenter.getSetting<boolean>('traceDebugEnabled') === true
+    const pendingInputCoordinator = this.pendingInputCoordinator
+    const injectSteerInputsIntoRequest = this.injectSteerInputsIntoRequest.bind(this)
+    const persistMessageTrace = this.persistMessageTrace.bind(this)
     if (traceEnabled) {
       const traceAwareConfig = modelConfig as ModelConfig & {
         requestTraceContext?: {
@@ -1055,7 +1178,7 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
       traceAwareConfig.requestTraceContext = {
         enabled: true,
         persist: async (payload: ProviderRequestTracePayload) => {
-          this.persistMessageTrace({
+          persistMessageTrace({
             sessionId,
             messageId,
             providerId: state.providerId,
@@ -1070,6 +1193,7 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     const maxTokens = generationSettings.maxTokens
 
     const tools = providedTools ?? (await this.loadToolDefinitionsForSession(sessionId, projectDir))
+    const supportsVision = this.supportsVision(state.providerId, state.modelId)
 
     const abortController = new AbortController()
     this.abortControllers.set(sessionId, abortController)
@@ -1088,7 +1212,51 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
         messages,
         tools,
         toolPresenter: this.toolPresenter,
-        coreStream: provider.coreStream.bind(provider),
+        coreStream: async function* (
+          requestMessages,
+          requestModelId,
+          requestModelConfig,
+          requestTemperature,
+          requestMaxTokens,
+          requestTools
+        ) {
+          const claimedSteerBatch = pendingInputCoordinator.claimSteerBatchForNextLoop(sessionId)
+          const injectedMessages = injectSteerInputsIntoRequest(
+            requestMessages,
+            claimedSteerBatch,
+            supportsVision,
+            requestModelConfig.contextLength,
+            requestMaxTokens
+          )
+
+          let didConsumeSteerBatch = false
+
+          try {
+            for await (const event of provider.coreStream(
+              injectedMessages,
+              requestModelId,
+              requestModelConfig,
+              requestTemperature,
+              requestMaxTokens,
+              requestTools
+            )) {
+              if (!didConsumeSteerBatch && claimedSteerBatch.length > 0) {
+                pendingInputCoordinator.consumeClaimedSteerBatch(sessionId)
+                didConsumeSteerBatch = true
+              }
+              yield event
+            }
+
+            if (!didConsumeSteerBatch && claimedSteerBatch.length > 0) {
+              pendingInputCoordinator.consumeClaimedSteerBatch(sessionId)
+            }
+          } catch (error) {
+            if (!didConsumeSteerBatch && claimedSteerBatch.length > 0) {
+              pendingInputCoordinator.releaseClaimedInputs(sessionId)
+            }
+            throw error
+          }
+        },
         providerId: state.providerId,
         modelId: state.modelId,
         modelConfig,
@@ -1155,6 +1323,97 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     }
   }
 
+  private injectSteerInputsIntoRequest(
+    messages: ChatMessage[],
+    steerInputs: PendingSessionInputRecord[],
+    supportsVision: boolean,
+    contextLength: number,
+    reserveTokens: number
+  ): ChatMessage[] {
+    if (steerInputs.length === 0) {
+      return messages
+    }
+    // Build one message per steer input; they go before a trailing user message, else at the end.
+    const steerMessages = steerInputs.map((input) =>
+      createUserChatMessage(input.payload, supportsVision)
+    )
+    const clonedMessages = [...messages]
+    const lastMessage = clonedMessages[clonedMessages.length - 1]
+    const trailingUserCount = lastMessage?.role === 'user' ? 1 : 0
+    const injectedMessages =
+      trailingUserCount > 0
+        ? [...clonedMessages.slice(0, -1), ...steerMessages, lastMessage]
+        : [...clonedMessages, ...steerMessages]
+    // Protect the injected steer messages (and that trailing user message) from trimming.
+    return fitMessagesToContextWindow(
+      injectedMessages,
+      contextLength,
+      reserveTokens,
+      steerMessages.length + trailingUserCount
+    )
+  }
+
+  private async drainPendingQueueIfPossible(
+    sessionId: string,
+    reason: 'enqueue' | 'resume' | 'completed'
+  ): Promise<boolean> {
+    if (this.drainingPendingQueues.has(sessionId)) {
+      return false
+    }
+    // Resolves true after a claimed input went through processMessage; false otherwise.
+    const state = await this.getSessionState(sessionId)
+    if (!state || !this.canDrainPendingQueueFromStatus(state.status, reason)) {
+      return false
+    }
+    if (this.isAwaitingToolQuestionFollowUp(sessionId)) {
+      return false
+    }
+    if (this.hasPendingInteractions(sessionId)) {
+      return false
+    }
+    // Re-check the guard: another drain may have started while getSessionState was awaited.
+    const nextQueuedInput = this.pendingInputCoordinator.getNextQueuedInput(sessionId)
+    if (!nextQueuedInput || this.drainingPendingQueues.has(sessionId)) {
+      return false
+    }
+    // No await sits between the re-check above and this add, so overlapping calls cannot both pass.
+    this.drainingPendingQueues.add(sessionId)
+    try {
+      const claimedInput = this.pendingInputCoordinator.claimQueuedInput(
+        sessionId,
+        nextQueuedInput.id
+      )
+      await this.processMessage(sessionId, claimedInput.payload, {
+        projectDir: this.resolveProjectDir(sessionId),
+        pendingQueueItemId: claimedInput.id
+      })
+      return true
+    } catch (error) {
+      console.error('[DeepChatAgent] drainPendingQueueIfPossible error:', error)
+      return false
+    } finally { // Release the guard, then chain the next queued input if the session is idle.
+      this.drainingPendingQueues.delete(sessionId)
+      if (
+        this.pendingInputCoordinator.getNextQueuedInput(sessionId) &&
+        (await this.getSessionState(sessionId))?.status === 'idle' &&
+        !this.hasPendingInteractions(sessionId)
+      ) {
+        void this.drainPendingQueueIfPossible(sessionId, 'completed')
+      }
+    }
+  }
+
+  private canDrainPendingQueueFromStatus(
+    status: DeepChatSessionState['status'],
+    reason: 'enqueue' | 'resume' | 'completed'
+  ): boolean {
+    if (status === 'idle') { // an idle session may drain for any reason
+      return true
+    }
+    // From 'error', only an enqueue or resume may restart draining, not a 'completed' chain.
+    return (reason === 'enqueue' || reason === 'resume') && status === 'error'
+  }
+
   private applyProcessResultStatus(
     sessionId: string,
     result: ProcessResult | null | undefined
@@ -1278,6 +1537,9 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
         initialBlocks
       })
       this.applyProcessResultStatus(sessionId, result)
+      if (result?.status === 'completed') {
+        void this.drainPendingQueueIfPossible(sessionId, 'completed')
+      }
       return true
     } catch (error) {
       console.error('[DeepChatAgent] resumeAssistantMessage error:', error)
@@ -1633,7 +1895,7 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
       patch.maxTokens = sessionRow.max_tokens
     }
     if (sessionRow.thinking_budget !== null) {
-      patch.thinkingBudget = sessionRow.thinking_budget
+      patch.thinkingBudget = normalizeLegacyThinkingBudgetValue(sessionRow.thinking_budget)
     }
     if (sessionRow.reasoning_effort !== null) {
       patch.reasoningEffort = sessionRow.reasoning_effort
@@ -1651,45 +1913,29 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
   ): Promise<SessionGenerationSettings> {
     const modelConfig = this.configPresenter.getModelConfig(modelId, providerId)
     const defaultSystemPrompt = await this.configPresenter.getDefaultSystemPrompt()
-    const contextLengthLimit = this.getContextLengthLimit(modelConfig)
-    const maxTokensLimit = this.getMaxTokensLimit(modelConfig)
+    const contextLengthDefault = toValidNonNegativeInteger(modelConfig.contextLength) ?? 32000
+    const maxTokensDefault =
+      toValidNonNegativeInteger(modelConfig.maxTokens) ?? Math.min(4096, contextLengthDefault)
 
     const defaults: SessionGenerationSettings = {
       systemPrompt: defaultSystemPrompt ?? '',
-      temperature: this.clampNumber(
-        modelConfig.temperature ?? 0.7,
-        TEMPERATURE_MIN,
-        TEMPERATURE_MAX
-      ),
-      contextLength: this.clampInteger(
-        modelConfig.contextLength ?? contextLengthLimit,
-        CONTEXT_LENGTH_MIN,
-        contextLengthLimit
-      ),
-      maxTokens: this.clampInteger(
-        modelConfig.maxTokens ?? Math.min(4096, maxTokensLimit),
-        MAX_TOKENS_MIN,
-        maxTokensLimit
-      )
+      temperature: parseFiniteNumericValue(modelConfig.temperature) ?? 0.7,
+      contextLength: contextLengthDefault,
+      maxTokens:
+        maxTokensDefault <= contextLengthDefault
+          ? maxTokensDefault
+          : Math.min(4096, contextLengthDefault)
     }
 
-    defaults.maxTokens = Math.min(defaults.maxTokens, defaults.contextLength)
-
     const supportsReasoning =
       this.configPresenter.supportsReasoningCapability?.(providerId, modelId) === true
     if (supportsReasoning) {
-      const budgetRange = this.configPresenter.getThinkingBudgetRange?.(providerId, modelId) ?? {}
-      const defaultBudget = this.toFiniteNumber(
-        modelConfig.thinkingBudget ?? budgetRange.default ?? undefined
+      const defaultBudget = normalizeLegacyThinkingBudgetValue(
+        modelConfig.thinkingBudget ??
+          this.configPresenter.getThinkingBudgetRange?.(providerId, modelId)?.default
       )
       if (defaultBudget !== undefined) {
-        defaults.thinkingBudget = this.normalizeThinkingBudget(
-          providerId,
-          modelId,
-          Math.round(defaultBudget),
-          budgetRange.min,
-          budgetRange.max
-        )
+        defaults.thinkingBudget = defaultBudget
       }
     }
 
@@ -1728,10 +1974,6 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     const base = baseSettings
       ? { ...baseSettings }
       : await this.buildDefaultGenerationSettings(providerId, modelId)
-    const modelConfig = this.configPresenter.getModelConfig(modelId, providerId)
-    const contextLengthLimit = this.getContextLengthLimit(modelConfig)
-    const maxTokensLimit = this.getMaxTokensLimit(modelConfig)
-
     const next: SessionGenerationSettings = { ...base }
 
     if (Object.prototype.hasOwnProperty.call(patch, 'systemPrompt')) {
@@ -1740,67 +1982,58 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     }
 
     if (Object.prototype.hasOwnProperty.call(patch, 'temperature')) {
-      const numeric = this.toFiniteNumber(patch.temperature)
-      next.temperature = this.clampNumber(
-        numeric ?? base.temperature,
-        TEMPERATURE_MIN,
-        TEMPERATURE_MAX
-      )
+      const numeric = parseFiniteNumericValue(patch.temperature)
+      if (numeric !== undefined) {
+        next.temperature = numeric
+      }
     }
 
+    const parsedContextLength = parseFiniteNumericValue(patch.contextLength)
+    const parsedMaxTokens = parseFiniteNumericValue(patch.maxTokens)
+    const nextContextReference =
+      Object.prototype.hasOwnProperty.call(patch, 'contextLength') &&
+      toValidNonNegativeInteger(parsedContextLength) !== undefined
+        ? toValidNonNegativeInteger(parsedContextLength)
+        : next.contextLength
+    const nextMaxTokensReference =
+      Object.prototype.hasOwnProperty.call(patch, 'maxTokens') &&
+      toValidNonNegativeInteger(parsedMaxTokens) !== undefined
+        ? toValidNonNegativeInteger(parsedMaxTokens)
+        : next.maxTokens
+
     if (Object.prototype.hasOwnProperty.call(patch, 'contextLength')) {
-      const numeric = this.toFiniteNumber(patch.contextLength)
-      next.contextLength = this.clampInteger(
-        Math.round(numeric ?? base.contextLength),
-        CONTEXT_LENGTH_MIN,
-        contextLengthLimit
-      )
-    } else {
-      next.contextLength = this.clampInteger(
-        next.contextLength,
-        CONTEXT_LENGTH_MIN,
-        contextLengthLimit
-      )
+      const error = validateGenerationNumericField('contextLength', patch.contextLength, {
+        maxTokens: nextMaxTokensReference
+      })
+      const numeric = toValidNonNegativeInteger(parsedContextLength)
+      if (!error && numeric !== undefined) {
+        next.contextLength = numeric
+      }
     }
 
     if (Object.prototype.hasOwnProperty.call(patch, 'maxTokens')) {
-      const numeric = this.toFiniteNumber(patch.maxTokens)
-      next.maxTokens = this.clampInteger(
-        Math.round(numeric ?? base.maxTokens),
-        MAX_TOKENS_MIN,
-        maxTokensLimit
-      )
-    } else {
-      next.maxTokens = this.clampInteger(next.maxTokens, MAX_TOKENS_MIN, maxTokensLimit)
+      const error = validateGenerationNumericField('maxTokens', patch.maxTokens, {
+        contextLength: nextContextReference
+      })
+      const numeric = toValidNonNegativeInteger(parsedMaxTokens)
+      if (!error && numeric !== undefined) {
+        next.maxTokens = numeric
+      }
     }
-    next.maxTokens = Math.min(next.maxTokens, next.contextLength)
 
     const supportsReasoning =
       this.configPresenter.supportsReasoningCapability?.(providerId, modelId) === true
     if (supportsReasoning) {
-      const budgetRange = this.configPresenter.getThinkingBudgetRange?.(providerId, modelId) ?? {}
       if (Object.prototype.hasOwnProperty.call(patch, 'thinkingBudget')) {
         const raw = patch.thinkingBudget
-        const numeric = this.toFiniteNumber(raw)
-        if (numeric === undefined) {
+        if (raw === undefined) {
           delete next.thinkingBudget
-        } else {
-          next.thinkingBudget = this.normalizeThinkingBudget(
-            providerId,
-            modelId,
-            Math.round(numeric),
-            budgetRange.min,
-            budgetRange.max
-          )
+        } else if (!validateGenerationNumericField('thinkingBudget', raw)) {
+          const numeric = toValidNonNegativeInteger(raw)
+          if (numeric !== undefined) {
+            next.thinkingBudget = numeric
+          }
         }
-      } else if (next.thinkingBudget !== undefined) {
-        next.thinkingBudget = this.normalizeThinkingBudget(
-          providerId,
-          modelId,
-          Math.round(next.thinkingBudget),
-          budgetRange.min,
-          budgetRange.max
-        )
       }
     } else {
       delete next.thinkingBudget
@@ -1911,70 +2144,18 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     return this.configPresenter.getReasoningPortrait?.(providerId, modelId) ?? null
   }
 
-  private normalizeThinkingBudget(
-    providerId: string,
-    modelId: string,
-    value: number,
-    min?: number,
-    max?: number
-  ): number {
-    const roundedValue = Math.round(value)
-    const budget = this.getReasoningPortrait(providerId, modelId)?.budget
-    const sentinelValues = new Set<number>()
-
-    if (typeof budget?.default === 'number') sentinelValues.add(Math.round(budget.default))
-    if (typeof budget?.auto === 'number') sentinelValues.add(Math.round(budget.auto))
-    if (typeof budget?.off === 'number') sentinelValues.add(Math.round(budget.off))
-
-    if (sentinelValues.has(roundedValue)) {
-      return roundedValue
-    }
-
-    return this.clampNumberWithOptionalRange(roundedValue, min, max)
-  }
-
-  private toFiniteNumber(value: unknown): number | undefined {
-    if (typeof value !== 'number' || Number.isNaN(value) || !Number.isFinite(value)) {
-      return undefined
-    }
-    return value
-  }
-
-  private clampNumber(value: number, min: number, max: number): number {
-    if (value < min) return min
-    if (value > max) return max
-    return value
-  }
-
-  private clampInteger(value: number, min: number, max: number): number {
-    return Math.round(this.clampNumber(value, min, max))
-  }
-
-  private clampNumberWithOptionalRange(value: number, min?: number, max?: number): number {
-    let next = value
-    if (typeof min === 'number' && Number.isFinite(min)) {
-      next = Math.max(next, Math.round(min))
-    }
-    if (typeof max === 'number' && Number.isFinite(max)) {
-      next = Math.min(next, Math.round(max))
-    }
-    return next
-  }
-
-  private getContextLengthLimit(modelConfig: ModelConfig): number {
-    const configured = this.toFiniteNumber(modelConfig.contextLength)
-    if (configured === undefined) {
-      return 32000
+  private async ensureSessionReadyForPendingInputMutation(sessionId: string): Promise<void> {
+    const state = await this.getSessionState(sessionId)
+    if (!state) {
+      throw new Error(`Session ${sessionId} not found`)
     }
-    return Math.max(CONTEXT_LENGTH_MIN, Math.round(configured))
   }
 
-  private getMaxTokensLimit(modelConfig: ModelConfig): number {
-    const configured = this.toFiniteNumber(modelConfig.maxTokens)
-    if (configured === undefined) {
-      return 4096
+  private assertNoActivePendingInputs(sessionId: string): void {
+    if (!this.pendingInputCoordinator.hasActiveInputs(sessionId)) {
+      return
     }
-    return Math.max(MAX_TOKENS_MIN, Math.round(configured))
+    throw new Error('Please clear the waiting lane before mutating chat history.')
   }
 
   private parseAssistantBlocks(rawContent: string): AssistantMessageBlock[] {
@@ -2520,6 +2701,33 @@ export class DeepChatAgentPresenter implements IAgentImplementation {
     return false
   }
 
+  private isAwaitingToolQuestionFollowUp(sessionId: string): boolean {
+    const messages = this.messageStore.getMessages(sessionId)
+    let latestUserOrderSeq = 0
+    // Find the orderSeq of the most recent user message (stays 0 when there is none).
+    for (const message of messages) {
+      if (message.role === 'user') {
+        latestUserOrderSeq = Math.max(latestUserOrderSeq, message.orderSeq)
+      }
+    }
+    // Only assistant messages ordered after that user message are inspected.
+    return messages.some((message) => {
+      if (message.role !== 'assistant' || message.orderSeq <= latestUserOrderSeq) {
+        return false
+      }
+      // Match a successful question_request marked 'replied' whose extra has no string answerText.
+      return this.parseAssistantBlocks(message.content).some(
+        (block) =>
+          block.type === 'action' &&
+          block.action_type === 'question_request' &&
+          block.status === 'success' &&
+          block.extra?.needsUserAction === false &&
+          block.extra?.questionResolution === 'replied' &&
+          typeof block.extra?.answerText !== 'string'
+      )
+    })
+  }
+
   private async resolveCompactionStateForResumeTurn(params: {
     sessionId: string
     messageId: string
diff --git a/src/main/presenter/deepchatAgentPresenter/pendingInputCoordinator.ts b/src/main/presenter/deepchatAgentPresenter/pendingInputCoordinator.ts
new file mode 100644
index 000000000..29ec7a56e
--- /dev/null
+++ b/src/main/presenter/deepchatAgentPresenter/pendingInputCoordinator.ts
@@ -0,0 +1,206 @@
+import { eventBus, SendTarget } from '@/eventbus'
+import { SESSION_EVENTS } from '@/events'
+import type { PendingSessionInputRecord, SendMessageInput } from '@shared/types/agent-interface'
+import { DeepChatPendingInputStore } from './pendingInputStore'
+
+/** Maximum number of active pending inputs a session may hold at once. */
+const MAX_ACTIVE_PENDING_INPUTS = 5
+
+/**
+ * Coerces a raw string or loosely shaped object into a `SendMessageInput`.
+ * A non-string `text` becomes `''`, a non-array `files` becomes `[]`, and falsy file entries
+ * are dropped.
+ */
+function normalizeInput(input: string | SendMessageInput): SendMessageInput {
+  if (typeof input === 'string') {
+    return { text: input, files: [] }
+  }
+
+  const text = typeof input?.text === 'string' ? input.text : ''
+  const files = Array.isArray(input?.files) ? input.files.filter(Boolean) : []
+  return { text, files }
+}
+
+/**
+ * Front door for pending-input mutations: delegates persistence to `DeepChatPendingInputStore`
+ * and emits `SESSION_EVENTS.PENDING_INPUTS_UPDATED` to all windows after changes.
+ */
+export class PendingInputCoordinator {
+  private readonly store: DeepChatPendingInputStore
+
+  constructor(store: DeepChatPendingInputStore) {
+    this.store = store
+  }
+
+  /** Returns the session's pending inputs exactly as the store lists them. */
+  listPendingInputs(sessionId: string): PendingSessionInputRecord[] {
+    return this.store.listPendingInputs(sessionId)
+  }
+
+  /**
+   * Creates a new queue item for the session and notifies listeners.
+   *
+   * @throws Error when the session is already at `MAX_ACTIVE_PENDING_INPUTS`.
+   */
+  queuePendingInput(
+    sessionId: string,
+    input: string | SendMessageInput
+  ): PendingSessionInputRecord {
+    this.ensureWithinLimit(sessionId)
+    const created = this.store.createQueueInput(sessionId, normalizeInput(input))
+    return this.notifyAndReturn(sessionId, created)
+  }
+
+  /**
+   * Replaces the payload of a listed queue item and notifies listeners.
+   *
+   * @throws Error when the item is not listed for the session or is not in `queue` mode.
+   */
+  updateQueuedInput(
+    sessionId: string,
+    itemId: string,
+    input: string | SendMessageInput
+  ): PendingSessionInputRecord {
+    this.assertQueueInput(sessionId, itemId)
+    const updated = this.store.updateQueueInput(itemId, normalizeInput(input))
+    return this.notifyAndReturn(sessionId, updated)
+  }
+
+  /** Moves a listed queue item to `toIndex`; returns whatever listing the store reports. */
+  moveQueuedInput(sessionId: string, itemId: string, toIndex: number): PendingSessionInputRecord[] {
+    this.assertQueueInput(sessionId, itemId)
+    const reordered = this.store.moveQueueInput(sessionId, itemId, toIndex)
+    return this.notifyAndReturn(sessionId, reordered)
+  }
+
+  /** Converts a listed queue item to `steer` mode and notifies listeners. */
+  convertPendingInputToSteer(sessionId: string, itemId: string): PendingSessionInputRecord {
+    this.assertQueueInput(sessionId, itemId)
+    const converted = this.store.convertQueueInputToSteer(itemId)
+    return this.notifyAndReturn(sessionId, converted)
+  }
+
+  /** Deletes a listed queue item; items in `steer` mode are rejected by the guard. */
+  deletePendingInput(sessionId: string, itemId: string): void {
+    this.assertQueueInput(sessionId, itemId)
+    this.store.deleteInput(itemId)
+    this.emitUpdated(sessionId)
+  }
+
+  /** Returns the store's next pending queue item, or `null` when none is waiting. */
+  getNextQueuedInput(sessionId: string): PendingSessionInputRecord | null {
+    return this.store.getNextPendingQueueInput(sessionId)
+  }
+
+  /** Claims a listed queue item and notifies listeners. */
+  claimQueuedInput(sessionId: string, itemId: string): PendingSessionInputRecord {
+    this.assertQueueInput(sessionId, itemId)
+    const claimed = this.store.claimQueueInput(itemId)
+    return this.notifyAndReturn(sessionId, claimed)
+  }
+
+  /**
+   * Asks the store to release a claimed queue item and notifies listeners.
+   *
+   * NOTE(review): `sessionId` is only used for the notification; the store resolves the row by
+   * `itemId` alone, so session ownership is not checked on this path.
+   */
+  releaseClaimedQueueInput(sessionId: string, itemId: string): PendingSessionInputRecord {
+    const released = this.store.releaseClaimedQueueInput(itemId)
+    return this.notifyAndReturn(sessionId, released)
+  }
+
+  /** Consumes a queue item via the store; `sessionId` is only used for the notification. */
+  consumeQueuedInput(sessionId: string, itemId: string): void {
+    this.store.consumeQueueInput(itemId)
+    this.emitUpdated(sessionId)
+  }
+
+  /** Claims the session's steer batch; notifies only when something was claimed. */
+  claimSteerBatchForNextLoop(sessionId: string): PendingSessionInputRecord[] {
+    const batch = this.store.claimSteerBatch(sessionId)
+    if (batch.length > 0) {
+      this.emitUpdated(sessionId)
+    }
+    return batch
+  }
+
+  /** Releases claimed inputs of the session and returns how many the store reported. */
+  releaseClaimedInputs(sessionId: string): number {
+    return this.notifyWhenPositive(sessionId, this.store.releaseClaimedInputs(sessionId))
+  }
+
+  /** Consumes the claimed steer batch and returns how many the store reported. */
+  consumeClaimedSteerBatch(sessionId: string): number {
+    return this.notifyWhenPositive(sessionId, this.store.consumeClaimedSteerBatch(sessionId))
+  }
+
+  /**
+   * Delegates to the store's `recoverClaimedInputs` and notifies every session id it returns.
+   *
+   * @returns The number of sessions notified (not the number of recovered rows).
+   */
+  recoverClaimedInputsAfterRestart(): number {
+    const sessionIds = this.store.recoverClaimedInputs()
+    sessionIds.forEach((sessionId) => this.emitUpdated(sessionId))
+    return sessionIds.length
+  }
+
+  /** True when the store counts at least one active input for the session. */
+  hasActiveInputs(sessionId: string): boolean {
+    return this.store.countActive(sessionId) > 0
+  }
+
+  /** True when the session's active count has reached `MAX_ACTIVE_PENDING_INPUTS`. */
+  isAtCapacity(sessionId: string): boolean {
+    return this.store.countActive(sessionId) >= MAX_ACTIVE_PENDING_INPUTS
+  }
+
+  /** Removes every pending input of the session and notifies listeners unconditionally. */
+  deleteBySession(sessionId: string): void {
+    this.store.deleteBySession(sessionId)
+    this.emitUpdated(sessionId)
+  }
+
+  /** Throws when the session cannot accept another pending input. */
+  private ensureWithinLimit(sessionId: string): void {
+    if (this.isAtCapacity(sessionId)) {
+      throw new Error('Pending input limit reached for this session.')
+    }
+  }
+
+  /**
+   * Guards item-level mutations: the item must appear in the session's listing and be in
+   * `queue` mode.
+   */
+  private assertQueueInput(sessionId: string, itemId: string): void {
+    const match = this.store.listPendingInputs(sessionId).find((item) => item.id === itemId)
+    if (!match) {
+      throw new Error(`Pending input not found: ${itemId}`)
+    }
+    if (match.mode !== 'queue') {
+      throw new Error('Steer inputs are locked and cannot be modified.')
+    }
+  }
+
+  /** Emits the update event for the session, then returns `result` unchanged. */
+  private notifyAndReturn<T>(sessionId: string, result: T): T {
+    this.emitUpdated(sessionId)
+    return result
+  }
+
+  /** Emits the update event only when `count` is positive; always returns `count`. */
+  private notifyWhenPositive(sessionId: string, count: number): number {
+    if (count > 0) {
+      this.emitUpdated(sessionId)
+    }
+    return count
+  }
+
+  /** Broadcasts `PENDING_INPUTS_UPDATED` for the session to all renderer windows. */
+  private emitUpdated(sessionId: string): void {
+    eventBus.sendToRenderer(SESSION_EVENTS.PENDING_INPUTS_UPDATED, SendTarget.ALL_WINDOWS, {
+      sessionId
+    })
+  }
+}
diff --git a/src/main/presenter/deepchatAgentPresenter/pendingInputStore.ts b/src/main/presenter/deepchatAgentPresenter/pendingInputStore.ts
new file mode 100644
index 000000000..b4d2d114d
--- /dev/null
+++ b/src/main/presenter/deepchatAgentPresenter/pendingInputStore.ts
@@ -0,0 +1,383 @@
+import { nanoid } from 'nanoid'
+import type {
+  PendingSessionInputRecord,
+  PendingSessionInputState,
+  SendMessageInput
+} from '@shared/types/agent-interface'
+import type { SQLitePresenter } from '../sqlitePresenter'
+import type { DeepChatPendingInputRow } from '../sqlitePresenter/tables/deepchatPendingInputs'
+
+/**
+ * Coerces a raw string or loosely shaped object into a `SendMessageInput`.
+ * A non-string `text` becomes `''`, a non-array `files` becomes `[]`, and falsy file entries
+ * are dropped.
+ */
+function normalizeInput(input: string | SendMessageInput): SendMessageInput {
+  if (typeof input === 'string') {
+    return { text: input, files: [] }
+  }
+
+  return {
+    text: typeof input?.text === 'string' ? input.text : '',
+    files: Array.isArray(input?.files) ? input.files.filter(Boolean) : []
+  }
+}
+
+/**
+ * Persistence layer for per-session pending inputs, backed by
+ * `SQLitePresenter.deepchatPendingInputsTable`.
+ *
+ * Rows have a mode (`queue` or `steer`) and a state (`pending`, `claimed`, `consumed`).
+ */
+export class DeepChatPendingInputStore {
+  private readonly sqlitePresenter: SQLitePresenter
+
+  constructor(sqlitePresenter: SQLitePresenter) {
+    this.sqlitePresenter = sqlitePresenter
+  }
+
+  /** Lists the session's active rows, hiding queue items that are currently claimed. */
+  listPendingInputs(sessionId: string): PendingSessionInputRecord[] {
+    return this.sqlitePresenter.deepchatPendingInputsTable
+      .listActiveBySession(sessionId)
+      .filter((row) => !(row.mode === 'queue' && row.state === 'claimed'))
+      .map((row) => this.toRecord(row))
+  }
+
+  /** Returns the table's active-row count for the session. */
+  countActive(sessionId: string): number {
+    return this.sqlitePresenter.deepchatPendingInputsTable.countActiveBySession(sessionId)
+  }
+
+  /**
+   * Inserts a new pending queue item at the end of the session's pending queue.
+   *
+   * @throws Error when the inserted row cannot be read back.
+   */
+  createQueueInput(sessionId: string, input: string | SendMessageInput): PendingSessionInputRecord {
+    const normalized = normalizeInput(input)
+    const id = nanoid()
+    const nextQueueOrder = this.getNextQueueOrder(sessionId)
+    this.sqlitePresenter.deepchatPendingInputsTable.insert({
+      id,
+      sessionId,
+      mode: 'queue',
+      state: 'pending',
+      payloadJson: JSON.stringify(normalized),
+      queueOrder: nextQueueOrder
+    })
+    const row = this.sqlitePresenter.deepchatPendingInputsTable.get(id)
+    if (!row) {
+      throw new Error(`Failed to create pending input ${id}`)
+    }
+    return this.toRecord(row)
+  }
+
+  /**
+   * Overwrites the stored payload of an existing row.
+   *
+   * @throws Error when the row does not exist.
+   */
+  updateQueueInput(itemId: string, input: string | SendMessageInput): PendingSessionInputRecord {
+    const row = this.requireRow(itemId)
+    this.sqlitePresenter.deepchatPendingInputsTable.update(itemId, {
+      payload_json: JSON.stringify(normalizeInput(input))
+    })
+    return this.toRecord(this.requireRow(itemId, row.session_id))
+  }
+
+  /**
+   * Moves a pending queue item to `toIndex` within the session's pending queue.
+   *
+   * `toIndex` is truncated to an integer and clamped to the queue bounds. A `NaN` index is
+   * treated as "keep the current position" instead of silently moving the item to the front.
+   *
+   * @returns The session's refreshed listing.
+   * @throws Error when the item is not a pending queue item of the session.
+   */
+  moveQueueInput(sessionId: string, itemId: string, toIndex: number): PendingSessionInputRecord[] {
+    const queueRows = this.getPendingQueueRows(sessionId)
+    const fromIndex = queueRows.findIndex((row) => row.id === itemId)
+    if (fromIndex === -1) {
+      throw new Error(`Pending queue item not found: ${itemId}`)
+    }
+
+    // NaN (or a missing index) keeps the item where it is; fractions are truncated.
+    const truncatedIndex = Math.trunc(toIndex)
+    const requestedIndex = Number.isNaN(truncatedIndex) ? fromIndex : truncatedIndex
+    const clampedIndex = Math.max(0, Math.min(requestedIndex, queueRows.length - 1))
+    if (fromIndex === clampedIndex) {
+      return this.listPendingInputs(sessionId)
+    }
+
+    const [moved] = queueRows.splice(fromIndex, 1)
+    queueRows.splice(clampedIndex, 0, moved)
+    this.resequenceQueueRows(queueRows)
+
+    return this.listPendingInputs(sessionId)
+  }
+
+  /**
+   * Converts a pending queue item into a steer input and renumbers the remaining queue.
+   *
+   * @throws Error when the row does not exist, is not a queue item, or is not pending.
+   */
+  convertQueueInputToSteer(itemId: string): PendingSessionInputRecord {
+    const row = this.requireRow(itemId)
+    // Same guards as `claimQueueInput`: only pending queue items may change lanes.
+    if (row.mode !== 'queue') {
+      throw new Error(`Pending input ${itemId} is not a queue item.`)
+    }
+    if (row.state !== 'pending') {
+      throw new Error(`Pending queue item ${itemId} is not convertible.`)
+    }
+
+    this.sqlitePresenter.deepchatPendingInputsTable.update(itemId, {
+      mode: 'steer',
+      queue_order: null
+    })
+    this.resequenceQueue(row.session_id)
+    return this.toRecord(this.requireRow(itemId, row.session_id))
+  }
+
+  /** Deletes a row; when it was a queue item the remaining pending queue is renumbered. */
+  deleteInput(itemId: string): void {
+    const row = this.requireRow(itemId)
+    this.sqlitePresenter.deepchatPendingInputsTable.delete(itemId)
+    if (row.mode === 'queue') {
+      this.resequenceQueue(row.session_id)
+    }
+  }
+
+  /** First pending queue item of the session, or `null` when there is none. */
+  getNextPendingQueueInput(sessionId: string): PendingSessionInputRecord | null {
+    const row = this.getPendingQueueRows(sessionId)[0]
+    return row ? this.toRecord(row) : null
+  }
+
+  /**
+   * Marks a pending queue item as claimed and stamps `claimed_at`.
+   *
+   * @throws Error when the row does not exist, is not a queue item, or is not pending.
+   */
+  claimQueueInput(itemId: string): PendingSessionInputRecord {
+    const row = this.requireRow(itemId)
+    if (row.mode !== 'queue') {
+      throw new Error(`Pending input ${itemId} is not a queue item.`)
+    }
+    if (row.state !== 'pending') {
+      throw new Error(`Pending queue item ${itemId} is not claimable.`)
+    }
+
+    this.sqlitePresenter.deepchatPendingInputsTable.update(itemId, {
+      state: 'claimed',
+      claimed_at: Date.now()
+    })
+    return this.toRecord(this.requireRow(itemId, row.session_id))
+  }
+
+  /**
+   * Returns a claimed queue item to the pending state; rows in any other state are returned
+   * unchanged.
+   *
+   * @throws Error when the row does not exist or is not a queue item.
+   */
+  releaseClaimedQueueInput(itemId: string): PendingSessionInputRecord {
+    const row = this.requireRow(itemId)
+    if (row.mode !== 'queue') {
+      throw new Error(`Pending input ${itemId} is not a queue item.`)
+    }
+    if (row.state !== 'claimed') {
+      return this.toRecord(row)
+    }
+
+    this.sqlitePresenter.deepchatPendingInputsTable.update(itemId, {
+      state: 'pending',
+      claimed_at: null
+    })
+    return this.toRecord(this.requireRow(itemId, row.session_id))
+  }
+
+  /** Consuming a queue item simply deletes its row. */
+  consumeQueueInput(itemId: string): void {
+    this.deleteInput(itemId)
+  }
+
+  /**
+   * Claims every pending steer row of the session with a shared timestamp.
+   *
+   * @returns All steer rows that are claimed afterwards (including rows claimed earlier), or
+   *   an empty array when nothing was pending.
+   */
+  claimSteerBatch(sessionId: string): PendingSessionInputRecord[] {
+    const now = Date.now()
+    const steerRows = this.getSteerRows(sessionId).filter((row) => row.state === 'pending')
+    if (steerRows.length === 0) {
+      return []
+    }
+
+    for (const row of steerRows) {
+      this.sqlitePresenter.deepchatPendingInputsTable.update(row.id, {
+        state: 'claimed',
+        claimed_at: now
+      })
+    }
+
+    return this.getSteerRows(sessionId)
+      .filter((row) => row.state === 'claimed')
+      .map((row) => this.toRecord(row))
+  }
+
+  /** Resets the session's claimed active rows to pending; returns how many were reset. */
+  releaseClaimedInputs(sessionId: string): number {
+    const claimedRows = this.sqlitePresenter.deepchatPendingInputsTable
+      .listActiveBySession(sessionId)
+      .filter((row) => row.state === 'claimed')
+    for (const row of claimedRows) {
+      this.sqlitePresenter.deepchatPendingInputsTable.update(row.id, {
+        state: 'pending',
+        claimed_at: null
+      })
+    }
+    return claimedRows.length
+  }
+
+  /**
+   * Resets claimed rows across all sessions to pending, skipping rows whose session no longer
+   * exists in `deepchatSessionsTable`.
+   *
+   * @returns The distinct session ids that had at least one row reset.
+   */
+  recoverClaimedInputs(): string[] {
+    const rows = this.listClaimedRows()
+    const recoveredSessionIds = new Set<string>()
+
+    for (const row of rows) {
+      if (!this.sqlitePresenter.deepchatSessionsTable.get(row.session_id)) {
+        continue
+      }
+
+      this.sqlitePresenter.deepchatPendingInputsTable.update(row.id, {
+        state: 'pending',
+        claimed_at: null
+      })
+      recoveredSessionIds.add(row.session_id)
+    }
+
+    return Array.from(recoveredSessionIds)
+  }
+
+  /** Marks the session's claimed steer rows as consumed; returns how many were marked. */
+  consumeClaimedSteerBatch(sessionId: string): number {
+    const claimedSteerRows = this.getSteerRows(sessionId).filter((row) => row.state === 'claimed')
+    if (claimedSteerRows.length === 0) {
+      return 0
+    }
+
+    const now = Date.now()
+    for (const row of claimedSteerRows) {
+      this.sqlitePresenter.deepchatPendingInputsTable.update(row.id, {
+        state: 'consumed',
+        consumed_at: now
+      })
+    }
+    return claimedSteerRows.length
+  }
+
+  /** Deletes every pending-input row of the session. */
+  deleteBySession(sessionId: string): void {
+    this.sqlitePresenter.deepchatPendingInputsTable.deleteBySession(sessionId)
+  }
+
+  /** Next `queue_order`: one past the last pending queue row, or 1 for an empty queue. */
+  private getNextQueueOrder(sessionId: string): number {
+    const queueRows = this.getPendingQueueRows(sessionId)
+    if (queueRows.length === 0) {
+      return 1
+    }
+    return (queueRows[queueRows.length - 1].queue_order ?? 0) + 1
+  }
+
+  /** Pending queue rows of the session, ordered by ascending `queue_order`. */
+  private getPendingQueueRows(sessionId: string): DeepChatPendingInputRow[] {
+    return this.sqlitePresenter.deepchatPendingInputsTable
+      .listActiveBySession(sessionId)
+      .filter((row) => row.mode === 'queue' && row.state === 'pending')
+      .sort((left, right) => (left.queue_order ?? 0) - (right.queue_order ?? 0))
+  }
+
+  /** Active steer rows of the session, ordered by ascending `created_at`. */
+  private getSteerRows(sessionId: string): DeepChatPendingInputRow[] {
+    return this.sqlitePresenter.deepchatPendingInputsTable
+      .listActiveBySession(sessionId)
+      .filter((row) => row.mode === 'steer')
+      .sort((left, right) => left.created_at - right.created_at)
+  }
+
+  /** Claimed rows across all sessions, as reported by the table. */
+  private listClaimedRows(): DeepChatPendingInputRow[] {
+    return this.sqlitePresenter.deepchatPendingInputsTable.listClaimed()
+  }
+
+  /** Renumbers the session's pending queue rows to 1..n. */
+  private resequenceQueue(sessionId: string): void {
+    this.resequenceQueueRows(this.getPendingQueueRows(sessionId))
+  }
+
+  /**
+   * Writes `queue_order = position + 1` for each row in the given order. Rows that already
+   * hold the right value are skipped to avoid redundant writes.
+   */
+  private resequenceQueueRows(rows: DeepChatPendingInputRow[]): void {
+    rows.forEach((row, index) => {
+      const nextOrder = index + 1
+      if (row.queue_order === nextOrder) {
+        return
+      }
+      this.sqlitePresenter.deepchatPendingInputsTable.update(row.id, {
+        queue_order: nextOrder
+      })
+    })
+  }
+
+  /**
+   * Loads a row by id.
+   *
+   * @throws Error when the row is missing or owned by a session other than the expected one.
+   */
+  private requireRow(itemId: string, expectedSessionId?: string): DeepChatPendingInputRow {
+    const row = this.sqlitePresenter.deepchatPendingInputsTable.get(itemId)
+    if (!row) {
+      throw new Error(`Pending input not found: ${itemId}`)
+    }
+    if (expectedSessionId && row.session_id !== expectedSessionId) {
+      throw new Error(`Pending input ${itemId} does not belong to session ${expectedSessionId}`)
+    }
+    return row
+  }
+
+  /** Maps a table row to the camel-cased record shape shared with callers. */
+  private toRecord(row: DeepChatPendingInputRow): PendingSessionInputRecord {
+    return {
+      id: row.id,
+      sessionId: row.session_id,
+      mode: row.mode,
+      state: row.state as PendingSessionInputState,
+      payload: this.parsePayload(row.payload_json),
+      queueOrder: row.queue_order,
+      claimedAt: row.claimed_at,
+      consumedAt: row.consumed_at,
+      createdAt: row.created_at,
+      updatedAt: row.updated_at
+    }
+  }
+
+  /** Parses a stored payload; text that is not valid JSON is kept as the message text. */
+  private parsePayload(raw: string): SendMessageInput {
+    try {
+      return normalizeInput(JSON.parse(raw) as SendMessageInput)
+    } catch {
+      return normalizeInput(raw)
+    }
+  }
+}
diff --git a/src/main/presenter/newAgentPresenter/index.ts b/src/main/presenter/newAgentPresenter/index.ts
index 8afefb149..cecdadf74 100644
--- a/src/main/presenter/newAgentPresenter/index.ts
+++ b/src/main/presenter/newAgentPresenter/index.ts
@@ -181,11 +181,19 @@ export class NewAgentPresenter {
       modelId: state?.modelId ?? modelId
     }
 
-    // Process the first message (non-blocking) after returning session ID
-    console.log(`[NewAgentPresenter] firing processMessage (non-blocking)`)
-    agent.processMessage(sessionId, normalizedInput, { projectDir }).catch((err) => {
-      console.error('[NewAgentPresenter] processMessage failed:', err)
-    })
+    // Queue the first message (non-blocking) after returning session ID
+    if (normalizedInput.text.trim() || (normalizedInput.files?.length ?? 0) > 0) {
+      console.log(`[NewAgentPresenter] firing queuePendingInput (non-blocking)`)
+      if (agent.queuePendingInput) {
+        agent.queuePendingInput(sessionId, normalizedInput).catch((err) => {
+          console.error('[NewAgentPresenter] queuePendingInput failed:', err)
+        })
+      } else {
+        agent.processMessage(sessionId, normalizedInput, { projectDir }).catch((err) => {
+          console.error('[NewAgentPresenter] processMessage failed:', err)
+        })
+      }
+    }
     void this.generateSessionTitle(sessionId, title, providerId, modelId)
 
     return sessionResult
@@ -272,11 +280,166 @@ export class NewAgentPresenter {
       }
     }
     this.assertAcpSessionHasWorkdir(providerId, session.projectDir ?? null)
+    if (agent.queuePendingInput) {
+      await agent.queuePendingInput(sessionId, normalizedInput)
+      return
+    }
     await agent.processMessage(sessionId, normalizedInput, {
       projectDir: session.projectDir ?? null
     })
   }
 
+  /**
+   * Lists the session's pending inputs, or an empty array when the agent has no such capability.
+   *
+   * @throws Error when the session does not exist.
+   */
+  async listPendingInputs(sessionId: string) {
+    const session = this.sessionManager.get(sessionId)
+    if (!session) {
+      throw new Error(`Session not found: ${sessionId}`)
+    }
+    const agent = await this.resolveAgentImplementation(session.agentId)
+    return agent.listPendingInputs ? await agent.listPendingInputs(sessionId) : []
+  }
+
+  /**
+   * Queues an input on the session, first promoting a draft session to a regular one
+   * (title = first 50 characters of the trimmed text, or `New Chat`).
+   *
+   * NOTE(review): the draft is promoted before agent support and the ACP workdir are
+   * validated, so a failed validation leaves the session promoted — confirm this is intended.
+   *
+   * @throws Error when the session does not exist or the agent cannot queue pending inputs.
+   */
+  async queuePendingInput(sessionId: string, content: string | SendMessageInput) {
+    const session = this.sessionManager.get(sessionId)
+    if (!session) {
+      throw new Error(`Session not found: ${sessionId}`)
+    }
+
+    let currentSession = session
+    const normalizedInput = this.normalizeSendMessageInput(content)
+    if (currentSession.isDraft) {
+      const trimmedText = normalizedInput.text.trim()
+      this.sessionManager.update(sessionId, {
+        isDraft: false,
+        title: trimmedText.slice(0, 50) || 'New Chat'
+      })
+      this.emitSessionListUpdated()
+      currentSession = this.sessionManager.get(sessionId) ?? currentSession
+    }
+
+    const agent = await this.resolveAgentImplementation(currentSession.agentId)
+    if (!agent.queuePendingInput) {
+      throw new Error(`Agent ${currentSession.agentId} does not support pending inputs.`)
+    }
+
+    // Use 'acp' as the provider id when the state reports none and the agent is an ACP agent.
+    const sessionState = await agent.getSessionState(sessionId)
+    let providerId = sessionState?.providerId ?? ''
+    if (!providerId) {
+      const acpAgents = await this.configPresenter.getAcpAgents()
+      const isAcpAgent = acpAgents.some((candidate) => candidate.id === currentSession.agentId)
+      if (isAcpAgent) {
+        providerId = 'acp'
+      }
+    }
+    this.assertAcpSessionHasWorkdir(providerId, currentSession.projectDir ?? null)
+    return await agent.queuePendingInput(sessionId, normalizedInput)
+  }
+
+  /**
+   * Forwards an edit of a queued input to the session's agent.
+   *
+   * @throws Error when the session does not exist or the agent does not support edits.
+   */
+  async updateQueuedInput(sessionId: string, itemId: string, content: string | SendMessageInput) {
+    const session = this.sessionManager.get(sessionId)
+    if (!session) {
+      throw new Error(`Session not found: ${sessionId}`)
+    }
+    const { agentId } = session
+    const agent = await this.resolveAgentImplementation(agentId)
+    if (!agent.updateQueuedInput) {
+      throw new Error(`Agent ${agentId} does not support pending input edits.`)
+    }
+    const normalizedInput = this.normalizeSendMessageInput(content)
+    return await agent.updateQueuedInput(sessionId, itemId, normalizedInput)
+  }
+
+  /**
+   * Forwards a reorder of a queued input to the session's agent.
+   *
+   * @throws Error when the session does not exist or the agent does not support sorting.
+   */
+  async moveQueuedInput(sessionId: string, itemId: string, toIndex: number) {
+    const session = this.sessionManager.get(sessionId)
+    if (!session) {
+      throw new Error(`Session not found: ${sessionId}`)
+    }
+    const { agentId } = session
+    const agent = await this.resolveAgentImplementation(agentId)
+    if (!agent.moveQueuedInput) {
+      throw new Error(`Agent ${agentId} does not support pending input sorting.`)
+    }
+    return await agent.moveQueuedInput(sessionId, itemId, toIndex)
+  }
+
+  /**
+   * Forwards a queue-to-steer conversion to the session's agent.
+   *
+   * @throws Error when the session does not exist or the agent does not support conversion.
+   */
+  async convertPendingInputToSteer(sessionId: string, itemId: string) {
+    const session = this.sessionManager.get(sessionId)
+    if (!session) {
+      throw new Error(`Session not found: ${sessionId}`)
+    }
+    const { agentId } = session
+    const agent = await this.resolveAgentImplementation(agentId)
+    if (!agent.convertPendingInputToSteer) {
+      throw new Error(`Agent ${agentId} does not support steer conversion.`)
+    }
+    return await agent.convertPendingInputToSteer(sessionId, itemId)
+  }
+
+  /**
+   * Forwards the deletion of a pending input to the session's agent.
+   *
+   * @throws Error when the session does not exist or the agent does not support deletion.
+   */
+  async deletePendingInput(sessionId: string, itemId: string): Promise<void> {
+    const session = this.sessionManager.get(sessionId)
+    if (!session) {
+      throw new Error(`Session not found: ${sessionId}`)
+    }
+    const { agentId } = session
+    const agent = await this.resolveAgentImplementation(agentId)
+    if (!agent.deletePendingInput) {
+      throw new Error(`Agent ${agentId} does not support pending input deletion.`)
+    }
+    await agent.deletePendingInput(sessionId, itemId)
+  }
+
+  /**
+   * Asks the session's agent to resume its pending queue.
+   *
+   * @throws Error when the session does not exist or the agent does not support resuming.
+   */
+  async resumePendingQueue(sessionId: string): Promise<void> {
+    const session = this.sessionManager.get(sessionId)
+    if (!session) {
+      throw new Error(`Session not found: ${sessionId}`)
+    }
+    const { agentId } = session
+    const agent = await this.resolveAgentImplementation(agentId)
+    if (!agent.resumePendingQueue) {
+      throw new Error(`Agent ${agentId} does not support pending queue resume.`)
+    }
+    await agent.resumePendingQueue(sessionId)
+  }
+
   async retryMessage(sessionId: string, messageId: string): Promise<void> {
     const session = this.sessionManager.get(sessionId)
     if (!session) {
diff --git a/src/main/presenter/sqlitePresenter/index.ts b/src/main/presenter/sqlitePresenter/index.ts
index 2e36219d5..3591c8b14 100644
--- a/src/main/presenter/sqlitePresenter/index.ts
+++ b/src/main/presenter/sqlitePresenter/index.ts
@@ -20,6 +20,7 @@ import { DeepChatSessionsTable } from './tables/deepchatSessions'
 import { DeepChatMessagesTable } from './tables/deepchatMessages'
 import { DeepChatMessageTracesTable } from './tables/deepchatMessageTraces'
 import { DeepChatMessageSearchResultsTable } from './tables/deepchatMessageSearchResults'
+import { DeepChatPendingInputsTable } from './tables/deepchatPendingInputs'
 import { DeepChatUsageStatsTable } from './tables/deepchatUsageStats'
 import { LegacyImportStatusTable } from './tables/legacyImportStatus'
 
@@ -44,6 +45,7 @@ export class SQLitePresenter implements ISQLitePresenter {
   public deepchatMessagesTable!: DeepChatMessagesTable
   public deepchatMessageTracesTable!: DeepChatMessageTracesTable
   public deepchatMessageSearchResultsTable!: DeepChatMessageSearchResultsTable
+  public deepchatPendingInputsTable!: DeepChatPendingInputsTable
   public deepchatUsageStatsTable!: DeepChatUsageStatsTable
   public legacyImportStatusTable!: LegacyImportStatusTable
   private currentVersion: number = 0
@@ -163,6 +165,7 @@ export class SQLitePresenter implements ISQLitePresenter {
     this.deepchatMessagesTable = new DeepChatMessagesTable(this.db)
     this.deepchatMessageTracesTable = new DeepChatMessageTracesTable(this.db)
     this.deepchatMessageSearchResultsTable = new DeepChatMessageSearchResultsTable(this.db)
+    this.deepchatPendingInputsTable = new DeepChatPendingInputsTable(this.db)
     this.deepchatUsageStatsTable = new DeepChatUsageStatsTable(this.db)
     this.legacyImportStatusTable = new LegacyImportStatusTable(this.db)
 
@@ -175,6 +178,7 @@ export class SQLitePresenter implements ISQLitePresenter {
     this.deepchatMessagesTable.createTable()
     this.deepchatMessageTracesTable.createTable()
     this.deepchatMessageSearchResultsTable.createTable()
+    this.deepchatPendingInputsTable.createTable()
     this.deepchatUsageStatsTable.createTable()
     this.legacyImportStatusTable.createTable()
   }
@@ -206,6 +210,7 @@ export class SQLitePresenter implements ISQLitePresenter {
       this.deepchatMessagesTable,
       this.deepchatMessageTracesTable,
       this.deepchatMessageSearchResultsTable,
+      this.deepchatPendingInputsTable,
       this.deepchatUsageStatsTable,
       this.legacyImportStatusTable
     ]
diff --git a/src/main/presenter/sqlitePresenter/tables/deepchatPendingInputs.ts b/src/main/presenter/sqlitePresenter/tables/deepchatPendingInputs.ts
new file mode 100644
index 000000000..336c337d6
--- /dev/null
+++ b/src/main/presenter/sqlitePresenter/tables/deepchatPendingInputs.ts
@@ -0,0 +1,227 @@
+import Database from 'better-sqlite3-multiple-ciphers'
+import { BaseTable } from './baseTable'
+
+/** Raw row shape of the `deepchat_pending_inputs` table (snake_case column names). */
+export interface DeepChatPendingInputRow {
+  id: string
+  session_id: string
+  mode: 'queue' | 'steer'
+  state: 'pending' | 'claimed' | 'consumed'
+  payload_json: string
+  queue_order: number | null
+  claimed_at: number | null
+  consumed_at: number | null
+  created_at: number
+  updated_at: number
+}
+
+/** Data-access object for the `deepchat_pending_inputs` table. */
+export class DeepChatPendingInputsTable extends BaseTable {
+  constructor(db: Database.Database) {
+    super(db, 'deepchat_pending_inputs')
+  }
+
+  /** DDL for the table and its session lookup index; both statements use `IF NOT EXISTS`. */
+  getCreateTableSQL(): string {
+    return `
+      CREATE TABLE IF NOT EXISTS deepchat_pending_inputs (
+        id TEXT PRIMARY KEY,
+        session_id TEXT NOT NULL,
+        mode TEXT NOT NULL,
+        state TEXT NOT NULL DEFAULT 'pending',
+        payload_json TEXT NOT NULL,
+        queue_order INTEGER,
+        claimed_at INTEGER,
+        consumed_at INTEGER,
+        created_at INTEGER NOT NULL,
+        updated_at INTEGER NOT NULL
+      );
+      CREATE INDEX IF NOT EXISTS idx_deepchat_pending_inputs_session
+        ON deepchat_pending_inputs(session_id, state, mode, queue_order, created_at);
+    `
+  }
+
+  /** Returns the create-table SQL for schema version 17 and `null` for every other version. */
+  getMigrationSQL(version: number): string | null {
+    return version === 17 ? this.getCreateTableSQL() : null
+  }
+
+  /** Latest schema version this table reports. */
+  getLatestVersion(): number {
+    return 17
+  }
+
+  /**
+   * Inserts a row. `state` defaults to `pending`, nullable columns to `null`, `createdAt` to
+   * the current time, and `updatedAt` to `createdAt`.
+   */
+  insert(row: {
+    id: string
+    sessionId: string
+    mode: 'queue' | 'steer'
+    state?: 'pending' | 'claimed' | 'consumed'
+    payloadJson: string
+    queueOrder?: number | null
+    claimedAt?: number | null
+    consumedAt?: number | null
+    createdAt?: number
+    updatedAt?: number
+  }): void {
+    const createdAt = row.createdAt ?? Date.now()
+    const updatedAt = row.updatedAt ?? createdAt
+    this.db
+      .prepare(
+        `INSERT INTO deepchat_pending_inputs (
+          id,
+          session_id,
+          mode,
+          state,
+          payload_json,
+          queue_order,
+          claimed_at,
+          consumed_at,
+          created_at,
+          updated_at
+        ) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?)`
+      )
+      .run(
+        row.id,
+        row.sessionId,
+        row.mode,
+        row.state ?? 'pending',
+        row.payloadJson,
+        row.queueOrder ?? null,
+        row.claimedAt ?? null,
+        row.consumedAt ?? null,
+        createdAt,
+        updatedAt
+      )
+  }
+
+  /** Fetches a single row by primary key, or `undefined` when it does not exist. */
+  get(id: string): DeepChatPendingInputRow | undefined {
+    return this.db.prepare('SELECT * FROM deepchat_pending_inputs WHERE id = ?').get(id) as
+      | DeepChatPendingInputRow
+      | undefined
+  }
+
+  /**
+   * Lists every row of the session, consumed ones included. Steer rows come first (by
+   * `created_at`), then queue rows by `queue_order` with `created_at` as the tie-breaker.
+   */
+  listBySession(sessionId: string): DeepChatPendingInputRow[] {
+    return this.db
+      .prepare(
+        `SELECT *
+         FROM deepchat_pending_inputs
+         WHERE session_id = ?
+         ORDER BY
+           CASE mode WHEN 'steer' THEN 0 ELSE 1 END ASC,
+           CASE
+             WHEN mode = 'queue' THEN COALESCE(queue_order, 2147483647)
+             ELSE created_at
+           END ASC,
+           created_at ASC`
+      )
+      .all(sessionId) as DeepChatPendingInputRow[]
+  }
+
+  /** Lists rows in the `claimed` state across all sessions, ordered by session then age. */
+  listClaimed(): DeepChatPendingInputRow[] {
+    return this.db
+      .prepare(
+        `SELECT *
+         FROM deepchat_pending_inputs
+         WHERE state = 'claimed'
+         ORDER BY session_id ASC, created_at ASC`
+      )
+      .all() as DeepChatPendingInputRow[]
+  }
+
+  /** Same ordering as `listBySession`, restricted to rows whose state is not `consumed`. */
+  listActiveBySession(sessionId: string): DeepChatPendingInputRow[] {
+    return this.db
+      .prepare(
+        `SELECT *
+         FROM deepchat_pending_inputs
+         WHERE session_id = ?
+           AND state != 'consumed'
+         ORDER BY
+           CASE mode WHEN 'steer' THEN 0 ELSE 1 END ASC,
+           CASE
+             WHEN mode = 'queue' THEN COALESCE(queue_order, 2147483647)
+             ELSE created_at
+           END ASC,
+           created_at ASC`
+      )
+      .all(sessionId) as DeepChatPendingInputRow[]
+  }
+
+  /** Counts the session's rows that are neither consumed nor claimed queue items. */
+  countActiveBySession(sessionId: string): number {
+    const row = this.db
+      .prepare(
+        `SELECT COUNT(*) AS total
+         FROM deepchat_pending_inputs
+         WHERE session_id = ?
+           AND state != 'consumed'
+           AND NOT (mode = 'queue' AND state = 'claimed')`
+      )
+      .get(sessionId) as { total: number }
+    return row.total
+  }
+
+  /**
+   * Updates the provided columns of a row and refreshes `updated_at`. Keys left `undefined`
+   * are not touched (`null` is written as a value); with nothing to change no statement runs.
+   */
+  update(
+    id: string,
+    fields: Partial<
+      Pick<
+        DeepChatPendingInputRow,
+        'mode' | 'state' | 'payload_json' | 'queue_order' | 'claimed_at' | 'consumed_at'
+      >
+    >
+  ): void {
+    const updatableColumns = [
+      'mode',
+      'state',
+      'payload_json',
+      'queue_order',
+      'claimed_at',
+      'consumed_at'
+    ] as const
+    const assignments: string[] = []
+    const values: unknown[] = []
+
+    for (const column of updatableColumns) {
+      const value = fields[column]
+      if (value !== undefined) {
+        assignments.push(`${column} = ?`)
+        values.push(value)
+      }
+    }
+
+    if (assignments.length === 0) {
+      return
+    }
+
+    assignments.push('updated_at = ?')
+    values.push(Date.now(), id)
+
+    this.db
+      .prepare(`UPDATE deepchat_pending_inputs SET ${assignments.join(', ')} WHERE id = ?`)
+      .run(...values)
+  }
+
+  /** Deletes a single row by primary key. */
+  delete(id: string): void {
+    this.db.prepare('DELETE FROM deepchat_pending_inputs WHERE id = ?').run(id)
+  }
+
+  /** Deletes every row that belongs to the session. */
+  deleteBySession(sessionId: string): void {
+    this.db.prepare('DELETE FROM deepchat_pending_inputs WHERE session_id = ?').run(sessionId)
+  }
+}
diff --git a/src/main/presenter/toolPresenter/index.ts b/src/main/presenter/toolPresenter/index.ts
index 09c99bdc6..6fb77b450 100644
--- a/src/main/presenter/toolPresenter/index.ts
+++ b/src/main/presenter/toolPresenter/index.ts
@@ -373,6 +373,9 @@ export class ToolPresenter implements IToolPresenter {
       lines.push(
         'Prefer shell patterns like `rg -n`, `rg --files`, `find . -name ...`, `ls`, and `tree` inside `exec`.'
       )
+      lines.push(
+        'Use `background: true` when you know a command should detach immediately; otherwise a foreground `exec` may yield a running `sessionId` after `yieldMs`.'
+      )
     }
     if (toolNames.has('exec') && toolNames.has('read') && toolNames.has('edit')) {
       lines.push(
@@ -381,7 +384,7 @@ export class ToolPresenter implements IToolPresenter {
     }
     if (toolNames.has('process')) {
       lines.push(
-        'Use `process` to monitor, write to, or terminate long-running background `exec` tasks.'
+        'Use `process` to monitor, write to, or terminate long-running `exec` tasks that returned a running `sessionId`.'
       )
     }
 
diff --git a/src/renderer/src/components/chat/ChatInputToolbar.vue b/src/renderer/src/components/chat/ChatInputToolbar.vue
index fd9bf38e2..c1dc241f2 100644
--- a/src/renderer/src/components/chat/ChatInputToolbar.vue
+++ b/src/renderer/src/components/chat/ChatInputToolbar.vue
@@ -37,42 +37,54 @@
       </Tooltip>
 
       <!-- Send button -->
-      <Button
-        v-if="!isGenerating"
-        size="icon"
-        class="h-7 w-7 rounded-full"
-        :disabled="sendDisabled"
-        @click="$emit('send')"
-      >
-        <Icon icon="lucide:arrow-up" class="w-4 h-4" />
-      </Button>
-      <Button
-        v-else
-        variant="outline"
-        size="icon"
-        class="h-7 w-7 rounded-full"
-        @click="$emit('stop')"
-      >
-        <Icon icon="lucide:square" class="w-4 h-4 text-red-500" />
-      </Button>
+      <Tooltip v-if="isGenerating && !hasActiveInput">
+        <TooltipTrigger as-child>
+          <Button variant="outline" size="icon" class="h-7 w-7 rounded-full" @click="$emit('stop')">
+            <Icon icon="lucide:square" class="w-4 h-4 text-red-500" />
+          </Button>
+        </TooltipTrigger>
+        <TooltipContent>
+          <p>{{ t('chat.input.stop') }}</p>
+        </TooltipContent>
+      </Tooltip>
+      <Tooltip v-else>
+        <TooltipTrigger as-child>
+          <Button
+            size="icon"
+            class="h-7 w-7 rounded-full"
+            :disabled="sendDisabled"
+            @click="$emit('send')"
+          >
+            <Icon icon="lucide:arrow-up" class="w-4 h-4" />
+          </Button>
+        </TooltipTrigger>
+        <TooltipContent v-if="isGenerating"><!-- queue hint applies only while a reply is generating; a plain send shows no tooltip -->
+          <p>{{ t('chat.input.queue') }}</p>
+        </TooltipContent>
+      </Tooltip>
     </div>
   </div>
 </template>
 
 <script setup lang="ts">
+import { computed } from 'vue'
 import { Button } from '@shadcn/components/ui/button'
 import { Tooltip, TooltipContent, TooltipTrigger } from '@shadcn/components/ui/tooltip'
 import { Icon } from '@iconify/vue'
 import { useI18n } from 'vue-i18n'
 
-withDefaults(
+const props = withDefaults(
   defineProps<{
     isGenerating?: boolean
+    hasInput?: boolean
+    hasText?: boolean
     sendDisabled?: boolean
     showVoiceInput?: boolean
   }>(),
   {
     isGenerating: false,
+    hasInput: false,
+    hasText: false,
     sendDisabled: false,
     showVoiceInput: false
   }
@@ -85,4 +97,5 @@ defineEmits<{
 }>()
 
 const { t } = useI18n()
+const hasActiveInput = computed(() => props.hasInput || props.hasText) // truthy when either prop is set; the template then shows the send button even while generating
 </script>
diff --git a/src/renderer/src/components/chat/ChatStatusBar.vue b/src/renderer/src/components/chat/ChatStatusBar.vue
index d277c046c..6a30b2f37 100644
--- a/src/renderer/src/components/chat/ChatStatusBar.vue
+++ b/src/renderer/src/components/chat/ChatStatusBar.vue
@@ -221,75 +221,191 @@
 
                   <div v-else-if="localSettings" class="space-y-4">
                     <div class="space-y-1.5">
-                      <div class="flex items-center justify-between gap-2">
-                        <label class="text-xs font-medium">{{
-                          t('chat.advancedSettings.temperature')
-                        }}</label>
+                      <label class="text-xs font-medium">{{
+                        t('chat.advancedSettings.temperature')
+                      }}</label>
+                      <div class="flex items-center gap-2">
+                        <Button
+                          variant="outline"
+                          size="icon"
+                          class="h-8 w-8 shrink-0"
+                          data-setting-control="temperature"
+                          data-setting-action="decrement"
+                          :aria-label="
+                            t('chat.advancedSettings.decreaseValue', {
+                              label: t('chat.advancedSettings.temperature')
+                            })
+                          "
+                          :disabled="hasNumericInputError('temperature')"
+                          @click="stepTemperature(-1)"
+                        >
+                          <Icon icon="lucide:minus" class="h-3 w-3" />
+                        </Button>
                         <Input
-                          class="h-7 w-20 text-xs tabular-nums"
+                          :class="[
+                            'h-8 flex-1 text-xs tabular-nums',
+                            hasNumericInputError('temperature') ? 'border-destructive' : ''
+                          ]"
+                          data-setting-control="temperature"
                           type="number"
-                          :min="TEMPERATURE_MIN"
-                          :max="TEMPERATURE_MAX"
-                          step="0.1"
-                          :model-value="localSettings.temperature.toFixed(1)"
+                          :step="TEMPERATURE_STEP"
+                          :aria-invalid="hasNumericInputError('temperature')"
+                          :model-value="temperatureInputValue"
+                          @focus="startNumericInputEdit('temperature')"
                           @update:model-value="onTemperatureInput"
+                          @blur="commitTemperatureInput"
+                          @keydown.enter.prevent="commitTemperatureInput"
                         />
+                        <Button
+                          variant="outline"
+                          size="icon"
+                          class="h-8 w-8 shrink-0"
+                          data-setting-control="temperature"
+                          data-setting-action="increment"
+                          :aria-label="
+                            t('chat.advancedSettings.increaseValue', {
+                              label: t('chat.advancedSettings.temperature')
+                            })
+                          "
+                          :disabled="hasNumericInputError('temperature')"
+                          @click="stepTemperature(1)"
+                        >
+                          <Icon icon="lucide:plus" class="h-3 w-3" />
+                        </Button>
                       </div>
-                      <Slider
-                        :model-value="[localSettings.temperature]"
-                        :min="TEMPERATURE_MIN"
-                        :max="TEMPERATURE_MAX"
-                        :step="0.1"
-                        @update:model-value="onTemperatureSlider"
-                      />
+                      <p
+                        v-if="getNumericInputErrorMessage('temperature')"
+                        class="text-[11px] text-destructive"
+                      >
+                        {{ getNumericInputErrorMessage('temperature') }}
+                      </p>
                     </div>
 
                     <div class="space-y-1.5">
-                      <div class="flex items-center justify-between gap-2">
-                        <label class="text-xs font-medium">{{
-                          t('chat.advancedSettings.contextLength')
-                        }}</label>
+                      <label class="text-xs font-medium">{{
+                        t('chat.advancedSettings.contextLength')
+                      }}</label>
+                      <div class="flex items-center gap-2">
+                        <Button
+                          variant="outline"
+                          size="icon"
+                          class="h-8 w-8 shrink-0"
+                          data-setting-control="contextLength"
+                          data-setting-action="decrement"
+                          :aria-label="
+                            t('chat.advancedSettings.decreaseValue', {
+                              label: t('chat.advancedSettings.contextLength')
+                            })
+                          "
+                          :disabled="
+                            hasNumericInputError('contextLength') ||
+                            localSettings.contextLength <= 0
+                          "
+                          @click="stepContextLength(-1)"
+                        >
+                          <Icon icon="lucide:minus" class="h-3 w-3" />
+                        </Button>
                         <Input
-                          class="h-7 w-24 text-xs tabular-nums"
+                          :class="[
+                            'h-8 flex-1 text-xs tabular-nums',
+                            hasNumericInputError('contextLength') ? 'border-destructive' : ''
+                          ]"
+                          data-setting-control="contextLength"
                           type="number"
-                          :min="CONTEXT_LENGTH_MIN"
-                          :max="contextLengthLimit"
-                          :step="1024"
-                          :model-value="localSettings.contextLength.toString()"
+                          :step="CONTEXT_LENGTH_STEP"
+                          :aria-invalid="hasNumericInputError('contextLength')"
+                          :model-value="contextLengthInputValue"
+                          @focus="startNumericInputEdit('contextLength')"
                           @update:model-value="onContextLengthInput"
+                          @blur="commitContextLengthInput"
+                          @keydown.enter.prevent="commitContextLengthInput"
                         />
+                        <Button
+                          variant="outline"
+                          size="icon"
+                          class="h-8 w-8 shrink-0"
+                          data-setting-control="contextLength"
+                          data-setting-action="increment"
+                          :aria-label="
+                            t('chat.advancedSettings.increaseValue', {
+                              label: t('chat.advancedSettings.contextLength')
+                            })
+                          "
+                          :disabled="hasNumericInputError('contextLength')"
+                          @click="stepContextLength(1)"
+                        >
+                          <Icon icon="lucide:plus" class="h-3 w-3" />
+                        </Button>
                       </div>
-                      <Slider
-                        :model-value="[localSettings.contextLength]"
-                        :min="CONTEXT_LENGTH_MIN"
-                        :max="contextLengthLimit"
-                        :step="1024"
-                        @update:model-value="onContextLengthSlider"
-                      />
+                      <p
+                        v-if="getNumericInputErrorMessage('contextLength')"
+                        class="text-[11px] text-destructive"
+                      >
+                        {{ getNumericInputErrorMessage('contextLength') }}
+                      </p>
                     </div>
 
                     <div class="space-y-1.5">
-                      <div class="flex items-center justify-between gap-2">
-                        <label class="text-xs font-medium">{{
-                          t('chat.advancedSettings.maxTokens')
-                        }}</label>
+                      <label class="text-xs font-medium">{{
+                        t('chat.advancedSettings.maxTokens')
+                      }}</label>
+                      <div class="flex items-center gap-2">
+                        <Button
+                          variant="outline"
+                          size="icon"
+                          class="h-8 w-8 shrink-0"
+                          data-setting-control="maxTokens"
+                          data-setting-action="decrement"
+                          :aria-label="
+                            t('chat.advancedSettings.decreaseValue', {
+                              label: t('chat.advancedSettings.maxTokens')
+                            })
+                          "
+                          :disabled="
+                            hasNumericInputError('maxTokens') || localSettings.maxTokens <= 0
+                          "
+                          @click="stepMaxTokens(-1)"
+                        >
+                          <Icon icon="lucide:minus" class="h-3 w-3" />
+                        </Button>
                         <Input
-                          class="h-7 w-24 text-xs tabular-nums"
+                          :class="[
+                            'h-8 flex-1 text-xs tabular-nums',
+                            hasNumericInputError('maxTokens') ? 'border-destructive' : ''
+                          ]"
+                          data-setting-control="maxTokens"
                           type="number"
-                          :min="MAX_TOKENS_MIN"
-                          :max="maxTokensSliderLimit"
-                          :step="128"
-                          :model-value="localSettings.maxTokens.toString()"
+                          :step="MAX_TOKENS_STEP"
+                          :aria-invalid="hasNumericInputError('maxTokens')"
+                          :model-value="maxTokensInputValue"
+                          @focus="startNumericInputEdit('maxTokens')"
                           @update:model-value="onMaxTokensInput"
+                          @blur="commitMaxTokensInput"
+                          @keydown.enter.prevent="commitMaxTokensInput"
                         />
+                        <Button
+                          variant="outline"
+                          size="icon"
+                          class="h-8 w-8 shrink-0"
+                          data-setting-control="maxTokens"
+                          data-setting-action="increment"
+                          :aria-label="
+                            t('chat.advancedSettings.increaseValue', {
+                              label: t('chat.advancedSettings.maxTokens')
+                            })
+                          "
+                          :disabled="hasNumericInputError('maxTokens')"
+                          @click="stepMaxTokens(1)"
+                        >
+                          <Icon icon="lucide:plus" class="h-3 w-3" />
+                        </Button>
                       </div>
-                      <Slider
-                        :model-value="[localSettings.maxTokens]"
-                        :min="MAX_TOKENS_MIN"
-                        :max="maxTokensSliderLimit"
-                        :step="128"
-                        @update:model-value="onMaxTokensSlider"
-                      />
+                      <p
+                        v-if="getNumericInputErrorMessage('maxTokens')"
+                        class="text-[11px] text-destructive"
+                      >
+                        {{ getNumericInputErrorMessage('maxTokens') }}
+                      </p>
                     </div>
 
                     <div v-if="showReasoningEffort" class="space-y-1.5">
@@ -349,19 +465,80 @@
                         <label class="text-xs font-medium">{{
                           t('chat.advancedSettings.thinkingBudget')
                         }}</label>
-                        <span class="text-[11px] text-muted-foreground">
-                          {{ thinkingBudgetHint }}
-                        </span>
+                        <div class="flex items-center gap-2">
+                          <span v-if="thinkingBudgetHint" class="text-[11px] text-muted-foreground">
+                            {{ thinkingBudgetHint }}
+                          </span>
+                          <Switch
+                            data-setting-control="thinkingBudget-toggle"
+                            :model-value="isThinkingBudgetEnabled"
+                            :aria-label="
+                              t('chat.advancedSettings.toggleValue', {
+                                label: t('chat.advancedSettings.thinkingBudget')
+                              })
+                            "
+                            @update:model-value="onThinkingBudgetToggle(Boolean($event))"
+                          />
+                        </div>
                       </div>
-                      <Input
-                        class="h-8 text-xs"
-                        type="number"
-                        :min="budgetRange?.min"
-                        :max="budgetRange?.max"
-                        :step="128"
-                        :model-value="localSettings.thinkingBudget?.toString() ?? ''"
-                        @update:model-value="onThinkingBudgetInput"
-                      />
+                      <div v-if="isThinkingBudgetEnabled" class="flex items-center gap-2">
+                        <Button
+                          variant="outline"
+                          size="icon"
+                          class="h-8 w-8 shrink-0"
+                          data-setting-control="thinkingBudget"
+                          data-setting-action="decrement"
+                          :aria-label="
+                            t('chat.advancedSettings.decreaseValue', {
+                              label: t('chat.advancedSettings.thinkingBudget')
+                            })
+                          "
+                          :disabled="
+                            hasNumericInputError('thinkingBudget') ||
+                            (localSettings.thinkingBudget ?? 0) <= 0
+                          "
+                          @click="stepThinkingBudget(-1)"
+                        >
+                          <Icon icon="lucide:minus" class="h-3 w-3" />
+                        </Button>
+                        <Input
+                          :class="[
+                            'h-8 flex-1 text-xs tabular-nums',
+                            hasNumericInputError('thinkingBudget') ? 'border-destructive' : ''
+                          ]"
+                          data-setting-control="thinkingBudget"
+                          type="number"
+                          :step="THINKING_BUDGET_STEP"
+                          :aria-invalid="hasNumericInputError('thinkingBudget')"
+                          :model-value="thinkingBudgetInputValue"
+                          @focus="startNumericInputEdit('thinkingBudget')"
+                          @update:model-value="onThinkingBudgetInput"
+                          @blur="commitThinkingBudgetInput"
+                          @keydown.enter.prevent="commitThinkingBudgetInput"
+                        />
+                        <Button
+                          variant="outline"
+                          size="icon"
+                          class="h-8 w-8 shrink-0"
+                          data-setting-control="thinkingBudget"
+                          data-setting-action="increment"
+                          :aria-label="
+                            t('chat.advancedSettings.increaseValue', {
+                              label: t('chat.advancedSettings.thinkingBudget')
+                            })
+                          "
+                          :disabled="hasNumericInputError('thinkingBudget')"
+                          @click="stepThinkingBudget(1)"
+                        >
+                          <Icon icon="lucide:plus" class="h-3 w-3" />
+                        </Button>
+                      </div>
+                      <p
+                        v-if="getNumericInputErrorMessage('thinkingBudget')"
+                        class="text-[11px] text-destructive"
+                      >
+                        {{ getNumericInputErrorMessage('thinkingBudget') }}
+                      </p>
                     </div>
                   </div>
                 </div>
@@ -522,7 +699,7 @@ import {
   SelectTrigger,
   SelectValue
 } from '@shadcn/components/ui/select'
-import { Slider } from '@shadcn/components/ui/slider'
+import { Switch } from '@shadcn/components/ui/switch'
 import type {
   AcpConfigOption,
   AcpConfigState,
@@ -531,6 +708,14 @@ import type {
 } from '@shared/presenter'
 import type { PermissionMode, SessionGenerationSettings } from '@shared/types/agent-interface'
 import type { ReasoningPortrait } from '@shared/types/model-db'
+import {
+  normalizeLegacyThinkingBudgetValue,
+  parseFiniteNumericValue,
+  toValidNonNegativeInteger,
+  type GenerationNumericField,
+  type GenerationNumericValidationCode,
+  validateGenerationNumericField
+} from '@shared/utils/generationSettingsValidation'
 import McpIndicator from '@/components/chat-input/McpIndicator.vue'
 import ModelIcon from '@/components/icons/ModelIcon.vue'
 import { usePresenter } from '@/composables/usePresenter'
@@ -572,10 +757,10 @@ type GroupedModelList = {
   models: RENDERER_MODEL_META[]
 }
 
-const TEMPERATURE_MIN = 0
-const TEMPERATURE_MAX = 2
-const CONTEXT_LENGTH_MIN = 2048
-const MAX_TOKENS_MIN = 128
+const TEMPERATURE_STEP = 0.1
+const CONTEXT_LENGTH_STEP = 1024
+const MAX_TOKENS_STEP = 128
+const THINKING_BUDGET_STEP = 128
 const ACP_INLINE_OPTION_LIMIT = 3
 const DEFAULT_REASONING_EFFORT_OPTIONS: SessionGenerationSettings['reasoningEffort'][] = [
   'minimal',
@@ -616,12 +801,24 @@ const acpConfigLoadingRequestKey = ref<string | null>(null)
 const acpInlineOpenOptionId = ref<string | null>(null)
 const acpOptionSavingIds = ref<string[]>([])
 const acpConfigCacheByAgent = new Map<string, AcpConfigState>()
+const activeNumericInput = ref<GenerationNumericField | null>(null) // field currently being edited, or null
+const numericInputDrafts = ref<Record<GenerationNumericField, string>>({ // raw text drafts, one per numeric field
+  temperature: '',
+  contextLength: '',
+  maxTokens: '',
+  thinkingBudget: ''
+})
+const numericInputErrors = ref< // validation code per field; null means no recorded error
+  Record<GenerationNumericField, GenerationNumericValidationCode | null>
+>({
+  temperature: null,
+  contextLength: null,
+  maxTokens: null,
+  thinkingBudget: null
+})
 
 const capabilitySupportsReasoning = ref<boolean | null>(null)
 const capabilityReasoningPortrait = ref<ReasoningPortrait | null>(null)
-const capabilityBudgetRange = ref<{ min?: number; max?: number; default?: number } | null>(null)
-const capabilitySupportsEffort = ref<boolean | null>(null)
-const capabilitySupportsVerbosity = ref<boolean | null>(null)
 
 let draftModelSyncToken = 0
 let permissionSyncToken = 0
@@ -630,6 +827,7 @@ let acpConfigSyncToken = 0
 let generationPersistTimer: ReturnType<typeof setTimeout> | null = null
 let pendingGenerationPatch: Partial<SessionGenerationSettings> = {}
 let generationPersistRequestToken = 0
+let generationLocalRevision = 0
 
 const hasActiveSession = computed(() => sessionStore.hasActiveSession)
 
@@ -924,29 +1122,104 @@ const isReasoningEffort = (value: unknown): value is 'minimal' | 'low' | 'medium
 const isVerbosity = (value: unknown): value is 'low' | 'medium' | 'high' =>
   value === 'low' || value === 'medium' || value === 'high'
 
-const clamp = (value: number, min: number, max: number): number => {
-  if (value < min) return min
-  if (value > max) return max
-  return value
+const getCommittedNumericInputValue = (field: GenerationNumericField): string => { // Text form of the field's value in localSettings.
+  if (!localSettings.value) { // localSettings is unset: return an empty string
+    return ''
+  }
+
+  switch (field) {
+    case 'temperature':
+      return String(localSettings.value.temperature)
+    case 'contextLength':
+      return String(localSettings.value.contextLength)
+    case 'maxTokens':
+      return String(localSettings.value.maxTokens)
+    case 'thinkingBudget': {
+      const value = localSettings.value.thinkingBudget
+      return value === undefined ? '' : String(value) // an undefined budget is rendered as an empty string
+    }
+  }
 }
 
-const toFiniteNumber = (value: unknown): number | undefined => {
-  if (typeof value !== 'number' || Number.isNaN(value) || !Number.isFinite(value)) {
-    return undefined
+const syncNumericInputDraft = (field: GenerationNumericField): void => { // Overwrite the field's draft with its committed value text.
+  numericInputDrafts.value[field] = getCommittedNumericInputValue(field)
+}
+
+const clearNumericInputError = (field: GenerationNumericField): void => { // Drop any recorded validation code for the field.
+  numericInputErrors.value[field] = null
+}
+
+const setNumericInputError = ( // Record a validation code for the field.
+  field: GenerationNumericField,
+  code: GenerationNumericValidationCode
+): void => {
+  numericInputErrors.value[field] = code
+}
+
+const resetNumericInputFieldState = (field: GenerationNumericField): void => { // Clear the field's error and reload its draft from the committed value.
+  clearNumericInputError(field)
+  syncNumericInputDraft(field)
+}
+
+const resetNumericInputState = (): void => { // Leave edit mode and reset error + draft for all four numeric fields.
+  activeNumericInput.value = null
+  resetNumericInputFieldState('temperature')
+  resetNumericInputFieldState('contextLength')
+  resetNumericInputFieldState('maxTokens')
+  resetNumericInputFieldState('thinkingBudget')
+}
+
+const hasNumericInputError = (field: GenerationNumericField): boolean =>
+  numericInputErrors.value[field] !== null // true while a validation code is recorded for the field
+
+const startNumericInputEdit = (field: GenerationNumericField): void => { // Mark the field as the one being edited.
+  activeNumericInput.value = field
+  if (!hasNumericInputError(field)) { // a draft with a recorded error is kept as typed; otherwise it is reloaded from the committed value
+    syncNumericInputDraft(field)
   }
-  return value
 }
 
-const parseNumericInput = (value: string | number): number | undefined => {
-  const normalized = typeof value === 'string' ? value.trim() : String(value)
-  if (!normalized) {
-    return undefined
+const setNumericInputDraft = (field: GenerationNumericField, value: string | number): void => { // Store new draft text for the field and clear its error.
+  if (activeNumericInput.value !== field) { // make this field the active one if it is not already
+    activeNumericInput.value = field
   }
-  const numeric = Number(normalized)
-  if (!Number.isFinite(numeric)) {
-    return undefined
+  const nextValue = typeof value === 'string' ? value : String(value)
+  if (numericInputDrafts.value[field] !== nextValue) { // bump the local revision counter only when the draft text actually changes
+    generationLocalRevision += 1 // NOTE(review): readers of this counter are outside this hunk - confirm intent there
+  }
+  numericInputDrafts.value[field] = nextValue
+  clearNumericInputError(field)
+}
+
+const stopNumericInputEdit = (field: GenerationNumericField): void => { // Leave edit mode, but only if this field is the active one.
+  if (activeNumericInput.value === field) {
+    activeNumericInput.value = null
+  }
+}
+
+const getNumericInputValue = (field: GenerationNumericField): string => { // Text to display in the field's input.
+  if (activeNumericInput.value === field || hasNumericInputError(field)) { // while editing or while an error is recorded, show the draft
+    return numericInputDrafts.value[field]
+  }
+  return getCommittedNumericInputValue(field) // otherwise show the committed value
+}
+
+const getNumericInputErrorMessage = (field: GenerationNumericField): string => { // Localized message for the field's recorded validation code.
+  const code = numericInputErrors.value[field]
+  if (!code) { // no recorded error: empty string, which the template's v-if treats as nothing to show
+    return ''
+  }
+
+  switch (code) { // each validation code maps to one i18n key
+    case 'finite_number':
+      return t('chat.advancedSettings.validation.finiteNumber')
+    case 'non_negative_integer':
+      return t('chat.advancedSettings.validation.nonNegativeInteger')
+    case 'context_length_below_max_tokens':
+      return t('chat.advancedSettings.validation.contextLengthAtLeastMaxTokens')
+    case 'max_tokens_exceed_context_length':
+      return t('chat.advancedSettings.validation.maxTokensWithinContextLength')
   }
-  return numeric
 }
 
 const isAcpConfigOptionValue = (
@@ -1118,35 +1391,6 @@ const normalizeVerbosity = (
     : undefined
 }
 
-const normalizeThinkingBudget = (
-  portrait: ReasoningPortrait | null | undefined,
-  value: number,
-  min?: number,
-  max?: number
-): number => {
-  const roundedValue = Math.round(value)
-  const sentinelValues = new Set<number>()
-
-  if (typeof portrait?.budget?.default === 'number')
-    sentinelValues.add(Math.round(portrait.budget.default))
-  if (typeof portrait?.budget?.auto === 'number')
-    sentinelValues.add(Math.round(portrait.budget.auto))
-  if (typeof portrait?.budget?.off === 'number') sentinelValues.add(Math.round(portrait.budget.off))
-
-  if (sentinelValues.has(roundedValue)) {
-    return roundedValue
-  }
-
-  let nextValue = roundedValue
-  if (typeof min === 'number') {
-    nextValue = Math.max(nextValue, Math.round(min))
-  }
-  if (typeof max === 'number') {
-    nextValue = Math.min(nextValue, Math.round(max))
-  }
-  return nextValue
-}
-
 const findEnabledModel = (providerId: string, modelId: string): ModelSelection | null => {
   const hit = findEnabledModelMeta(providerId, modelId)
   if (!hit) {
@@ -1202,43 +1446,21 @@ const clearPendingGenerationPersist = () => {
   pendingGenerationPatch = {}
 }
 
-const getCurrentLimits = () => {
-  const selection = effectiveModelSelection.value
-  if (!selection) {
-    return {
-      contextLengthLimit: 32000,
-      maxTokensLimit: 8192
-    }
-  }
-
-  const modelConfig = configPresenter.getModelConfig(selection.modelId, selection.providerId)
-  const contextLengthLimit = Math.max(
-    CONTEXT_LENGTH_MIN,
-    Math.round(toFiniteNumber(modelConfig.contextLength) ?? 32000)
-  )
-  const maxTokensLimit = Math.max(
-    MAX_TOKENS_MIN,
-    Math.round(toFiniteNumber(modelConfig.maxTokens) ?? 4096)
-  )
-  return { contextLengthLimit, maxTokensLimit }
+const invalidateGenerationPersistResponses = () => { // Advance the persist request token.
+  generationPersistRequestToken += 1 // NOTE(review): presumably responses carrying an older token are then ignored - verify at the comparison site
 }
 
-const contextLengthLimit = computed(() => getCurrentLimits().contextLengthLimit)
-
-const maxTokensSliderLimit = computed(() => {
-  const baseLimit = getCurrentLimits().maxTokensLimit
-  const contextLimit = localSettings.value?.contextLength ?? contextLengthLimit.value
-  return Math.max(MAX_TOKENS_MIN, Math.min(baseLimit, contextLimit))
-})
-
-const budgetRange = computed(() => capabilityBudgetRange.value)
+const temperatureInputValue = computed(() => getNumericInputValue('temperature')) // display text per numeric input (draft or committed)
+const contextLengthInputValue = computed(() => getNumericInputValue('contextLength'))
+const maxTokensInputValue = computed(() => getNumericInputValue('maxTokens'))
+const thinkingBudgetInputValue = computed(() => getNumericInputValue('thinkingBudget'))
+const isThinkingBudgetEnabled = computed(() => localSettings.value?.thinkingBudget !== undefined) // enabled means a thinkingBudget value is present in localSettings
 
 const thinkingBudgetHint = computed(() => {
-  const value = localSettings.value?.thinkingBudget
-  if (value === undefined) {
-    return t('chat.advancedSettings.useDefault')
+  if (!isThinkingBudgetEnabled.value) { // no thinkingBudget set: show the localized common.disabled label
+    return t('common.disabled')
   }
-  return String(value)
+  return '' // empty hint when enabled; the template hides the hint span via v-if
 })
 
 const showThinkingBudget = computed(() => {
@@ -1470,38 +1692,26 @@ const resolveDefaultGenerationSettings = async (
   const modelConfig = configPresenter.getModelConfig(modelId, providerId)
   const defaultSystemPrompt = await configPresenter.getDefaultSystemPrompt()
   const portrait = (await configPresenter.getReasoningPortrait?.(providerId, modelId)) ?? null
-  const limits = getCurrentLimits()
+  const contextLengthDefault = toValidNonNegativeInteger(modelConfig.contextLength) ?? 32000
+  const maxTokensDefault =
+    toValidNonNegativeInteger(modelConfig.maxTokens) ?? Math.min(4096, contextLengthDefault)
 
   const defaults: SessionGenerationSettings = {
     systemPrompt: defaultSystemPrompt ?? '',
-    temperature: clamp(
-      toFiniteNumber(modelConfig.temperature) ?? 0.7,
-      TEMPERATURE_MIN,
-      TEMPERATURE_MAX
-    ),
-    contextLength: clamp(
-      Math.round(toFiniteNumber(modelConfig.contextLength) ?? limits.contextLengthLimit),
-      CONTEXT_LENGTH_MIN,
-      limits.contextLengthLimit
-    ),
-    maxTokens: clamp(
-      Math.round(toFiniteNumber(modelConfig.maxTokens) ?? Math.min(4096, limits.maxTokensLimit)),
-      MAX_TOKENS_MIN,
-      limits.maxTokensLimit
-    )
+    temperature: parseFiniteNumericValue(modelConfig.temperature) ?? 0.7,
+    contextLength: contextLengthDefault,
+    maxTokens:
+      maxTokensDefault <= contextLengthDefault
+        ? maxTokensDefault
+        : Math.min(4096, contextLengthDefault)
   }
-  defaults.maxTokens = Math.min(defaults.maxTokens, defaults.contextLength)
 
   if (portrait?.supported === true && hasThinkingBudgetSupport(portrait)) {
-    const range = portrait.budget ?? {}
-    const defaultBudget = toFiniteNumber(modelConfig.thinkingBudget ?? range.default)
+    const defaultBudget = normalizeLegacyThinkingBudgetValue(
+      modelConfig.thinkingBudget ?? portrait.budget?.default
+    )
     if (defaultBudget !== undefined) {
-      defaults.thinkingBudget = normalizeThinkingBudget(
-        portrait,
-        Math.round(defaultBudget),
-        range.min,
-        range.max
-      )
+      defaults.thinkingBudget = defaultBudget
     }
   }
 
@@ -1525,60 +1735,6 @@ const resolveDefaultGenerationSettings = async (
   return defaults
 }
 
-const mergeDraftOverrides = (
-  defaults: SessionGenerationSettings,
-  portrait: ReasoningPortrait | null
-): SessionGenerationSettings => {
-  const next: SessionGenerationSettings = {
-    ...defaults,
-    ...(draftStore.systemPrompt !== undefined ? { systemPrompt: draftStore.systemPrompt } : {}),
-    ...(draftStore.temperature !== undefined ? { temperature: draftStore.temperature } : {}),
-    ...(draftStore.contextLength !== undefined ? { contextLength: draftStore.contextLength } : {}),
-    ...(draftStore.maxTokens !== undefined ? { maxTokens: draftStore.maxTokens } : {}),
-    ...(draftStore.thinkingBudget !== undefined
-      ? { thinkingBudget: draftStore.thinkingBudget }
-      : {}),
-    ...(draftStore.reasoningEffort !== undefined
-      ? {
-          reasoningEffort: normalizeReasoningEffort(portrait, draftStore.reasoningEffort)
-        }
-      : {}),
-    ...(draftStore.verbosity !== undefined ? { verbosity: draftStore.verbosity } : {})
-  }
-
-  const limits = getCurrentLimits()
-  next.temperature = clamp(next.temperature, TEMPERATURE_MIN, TEMPERATURE_MAX)
-  next.contextLength = clamp(
-    Math.round(next.contextLength),
-    CONTEXT_LENGTH_MIN,
-    limits.contextLengthLimit
-  )
-  next.maxTokens = clamp(
-    Math.round(next.maxTokens),
-    MAX_TOKENS_MIN,
-    Math.min(limits.maxTokensLimit, next.contextLength)
-  )
-
-  if (next.thinkingBudget !== undefined) {
-    next.thinkingBudget = normalizeThinkingBudget(
-      portrait,
-      next.thinkingBudget,
-      portrait?.budget?.min,
-      portrait?.budget?.max
-    )
-  }
-
-  if (next.reasoningEffort !== undefined) {
-    next.reasoningEffort = normalizeReasoningEffort(portrait, next.reasoningEffort)
-  }
-
-  if (next.verbosity !== undefined) {
-    next.verbosity = normalizeVerbosity(portrait, next.verbosity)
-  }
-
-  return next
-}
-
 const fetchCapabilities = async (providerId: string, modelId: string): Promise<void> => {
   try {
     const portrait = (await configPresenter.getReasoningPortrait?.(providerId, modelId)) ?? null
@@ -1586,24 +1742,10 @@ const fetchCapabilities = async (providerId: string, modelId: string): Promise<v
     capabilityReasoningPortrait.value = portrait
     capabilitySupportsReasoning.value =
       typeof portrait?.supported === 'boolean' ? portrait.supported : null
-    capabilityBudgetRange.value = portrait?.budget
-      ? {
-          ...(typeof portrait.budget.min === 'number' ? { min: portrait.budget.min } : {}),
-          ...(typeof portrait.budget.max === 'number' ? { max: portrait.budget.max } : {}),
-          ...(typeof portrait.budget.default === 'number'
-            ? { default: portrait.budget.default }
-            : {})
-        }
-      : null
-    capabilitySupportsEffort.value = supportsReasoningEffort(portrait)
-    capabilitySupportsVerbosity.value = supportsVerbosity(portrait)
   } catch (error) {
     console.warn('[ChatStatusBar] Failed to fetch model capabilities:', error)
     capabilitySupportsReasoning.value = null
     capabilityReasoningPortrait.value = null
-    capabilityBudgetRange.value = null
-    capabilitySupportsEffort.value = null
-    capabilitySupportsVerbosity.value = null
   }
 }
 
@@ -1623,25 +1765,29 @@ const flushGenerationPatch = async () => {
   }
 
   const requestToken = ++generationPersistRequestToken
+  const localRevisionAtRequest = generationLocalRevision
   try {
     const updated = await newAgentPresenter.updateSessionGenerationSettings(sessionId, patch)
     if (requestToken !== generationPersistRequestToken) {
       return
     }
-    if (!localSettings.value) {
-      localSettings.value = { ...updated }
+    if (localRevisionAtRequest !== generationLocalRevision) {
       return
     }
-    localSettings.value = {
-      ...localSettings.value,
-      ...updated
-    }
+    localSettings.value = { ...updated }
+    resetNumericInputState()
   } catch (error) {
     console.warn('[ChatStatusBar] Failed to update generation settings:', error)
   }
 }
 
 const scheduleGenerationPersist = (patch: Partial<SessionGenerationSettings>) => {
+  if (!sessionStore.activeSessionId) {
+    clearPendingGenerationPersist()
+    draftStore.updateGenerationSettings(patch)
+    return
+  }
+
   pendingGenerationPatch = { ...pendingGenerationPatch, ...patch }
   if (generationPersistTimer) {
     clearTimeout(generationPersistTimer)
@@ -1656,25 +1802,13 @@ const updateLocalGenerationSettings = (patch: Partial<SessionGenerationSettings>
     return
   }
   generationSyncToken += 1
+  generationLocalRevision += 1
 
-  const limits = getCurrentLimits()
   const next: SessionGenerationSettings = {
     ...localSettings.value,
     ...patch
   }
 
-  next.temperature = clamp(next.temperature, TEMPERATURE_MIN, TEMPERATURE_MAX)
-  next.contextLength = clamp(
-    Math.round(next.contextLength),
-    CONTEXT_LENGTH_MIN,
-    limits.contextLengthLimit
-  )
-  next.maxTokens = clamp(
-    Math.round(next.maxTokens),
-    MAX_TOKENS_MIN,
-    Math.min(limits.maxTokensLimit, next.contextLength)
-  )
-
   localSettings.value = next
 
   const normalizedPatch: Partial<SessionGenerationSettings> = {}
@@ -1706,6 +1840,8 @@ const updateLocalGenerationSettings = (patch: Partial<SessionGenerationSettings>
 const syncGenerationSettings = async () => {
   const token = ++generationSyncToken
   clearPendingGenerationPersist()
+  invalidateGenerationPersistResponses()
+  resetNumericInputState()
   loadedSettingsSelection.value = null
 
   if (isAcpAgent.value) {
@@ -1713,9 +1849,6 @@ const syncGenerationSettings = async () => {
     loadedSettingsSelection.value = null
     capabilitySupportsReasoning.value = null
     capabilityReasoningPortrait.value = null
-    capabilityBudgetRange.value = null
-    capabilitySupportsEffort.value = null
-    capabilitySupportsVerbosity.value = null
     return
   }
 
@@ -1725,9 +1858,6 @@ const syncGenerationSettings = async () => {
     loadedSettingsSelection.value = null
     capabilityReasoningPortrait.value = null
     capabilitySupportsReasoning.value = null
-    capabilityBudgetRange.value = null
-    capabilitySupportsEffort.value = null
-    capabilitySupportsVerbosity.value = null
     return
   }
 
@@ -1767,7 +1897,7 @@ const syncGenerationSettings = async () => {
   if (token !== generationSyncToken) {
     return
   }
-  localSettings.value = mergeDraftOverrides(defaults, capabilityReasoningPortrait.value)
+  localSettings.value = defaults
   loadedSettingsSelection.value = { ...selection }
 }
 
@@ -2040,6 +2170,7 @@ watch(isModelPanelOpen, (open) => {
 
 onBeforeUnmount(() => {
   clearPendingGenerationPersist()
+  invalidateGenerationPersistResponses()
   window.electron?.ipcRenderer?.removeListener?.(
     ACP_WORKSPACE_EVENTS.SESSION_CONFIG_OPTIONS_READY,
     handleAcpConfigOptionsReady
@@ -2089,8 +2220,27 @@ async function changeModelSelection(providerId: string, modelId: string): Promis
   const previousDraftSelection = draftModelSelection.value ? { ...draftModelSelection.value } : null
   const previousDraftProviderId = draftStore.providerId
   const previousDraftModelId = draftStore.modelId
+  const previousDraftGenerationSettings = {
+    systemPrompt: draftStore.systemPrompt,
+    temperature: draftStore.temperature,
+    contextLength: draftStore.contextLength,
+    maxTokens: draftStore.maxTokens,
+    thinkingBudget: draftStore.thinkingBudget,
+    reasoningEffort: draftStore.reasoningEffort,
+    verbosity: draftStore.verbosity
+  } as Partial<SessionGenerationSettings>
+  const clearedDraftModelOverrides = {
+    temperature: undefined,
+    contextLength: undefined,
+    maxTokens: undefined,
+    thinkingBudget: undefined,
+    reasoningEffort: undefined,
+    verbosity: undefined
+  } as Partial<SessionGenerationSettings>
 
   try {
+    clearPendingGenerationPersist()
+    draftStore.updateGenerationSettings(clearedDraftModelOverrides)
     draftModelSelection.value = { providerId, modelId }
     draftStore.providerId = providerId
     draftStore.modelId = modelId
@@ -2100,6 +2250,7 @@ async function changeModelSelection(providerId: string, modelId: string): Promis
     draftModelSelection.value = previousDraftSelection
     draftStore.providerId = previousDraftProviderId
     draftStore.modelId = previousDraftModelId
+    draftStore.updateGenerationSettings(previousDraftGenerationSettings)
     console.warn('[ChatStatusBar] Failed to switch draft model:', error)
     return false
   }
@@ -2150,89 +2301,179 @@ function onSystemPromptSelect(optionId: string) {
   updateLocalGenerationSettings({ systemPrompt: option.content })
 }
 
-function onTemperatureSlider(values: number[]) {
-  const next = values[0]
-  if (!localSettings.value || typeof next !== 'number') {
-    return
+// Cross-field context passed to validateGenerationNumericField: the contextLength and
+// maxTokens currently held in localSettings, each falling back to 0 when unavailable.
+// The result does not depend on the field; `_field` is kept so call sites stay unchanged.
+const getNumericValidationContext = (
+  _field: GenerationNumericField
+): Pick<SessionGenerationSettings, 'contextLength' | 'maxTokens'> => {
+  const current = localSettings.value
+  return {
+    contextLength: current?.contextLength ?? 0,
+    maxTokens: current?.maxTokens ?? 0
+  }
+}
+
+const commitNumericField = (
+  field: GenerationNumericField,
+  rawValue: string | number
+): number | undefined => {
+  if (!localSettings.value) {
+    stopNumericInputEdit(field)
+    resetNumericInputFieldState(field)
+    return undefined
+  }
+
+  const error = validateGenerationNumericField(field, rawValue, getNumericValidationContext(field))
+  if (error) {
+    stopNumericInputEdit(field)
+    setNumericInputError(field, error)
+    return undefined
   }
-  updateLocalGenerationSettings({ temperature: Number(next.toFixed(1)) })
+
+  const numeric = parseFiniteNumericValue(rawValue)
+  if (numeric === undefined) {
+    stopNumericInputEdit(field)
+    setNumericInputError(field, field === 'temperature' ? 'finite_number' : 'non_negative_integer')
+    return undefined
+  }
+
+  stopNumericInputEdit(field)
+  clearNumericInputError(field)
+  return numeric
 }
 
-function onTemperatureInput(value: string | number) {
+const roundTemperatureStepValue = (value: number): number => Number(value.toFixed(10))
+
+function stepTemperature(direction: -1 | 1) {
   if (!localSettings.value) {
     return
   }
-  const numeric = parseNumericInput(value)
-  if (numeric === undefined) {
+  if (hasNumericInputError('temperature')) {
     return
   }
-  const next = clamp(numeric, TEMPERATURE_MIN, TEMPERATURE_MAX)
-  updateLocalGenerationSettings({ temperature: Number(next.toFixed(1)) })
+  const next = roundTemperatureStepValue(
+    localSettings.value.temperature + direction * TEMPERATURE_STEP
+  )
+  updateLocalGenerationSettings({ temperature: next })
+  resetNumericInputFieldState('temperature')
 }
 
-function onContextLengthSlider(values: number[]) {
-  const next = values[0]
-  if (!localSettings.value || typeof next !== 'number') {
+function onTemperatureInput(value: string | number) {
+  setNumericInputDraft('temperature', value)
+}
+
+function commitTemperatureInput() {
+  const next = commitNumericField('temperature', numericInputDrafts.value.temperature)
+  if (next === undefined) {
     return
   }
-  updateLocalGenerationSettings({ contextLength: Math.round(next) })
+  updateLocalGenerationSettings({ temperature: next })
+  resetNumericInputFieldState('temperature')
 }
 
-function onContextLengthInput(value: string | number) {
+function stepContextLength(direction: -1 | 1) {
   if (!localSettings.value) {
     return
   }
-  const numeric = parseNumericInput(value)
-  if (numeric === undefined) {
+  if (hasNumericInputError('contextLength')) {
     return
   }
-  const next = clamp(Math.round(numeric), CONTEXT_LENGTH_MIN, contextLengthLimit.value)
-  updateLocalGenerationSettings({ contextLength: next })
+  const next = Math.max(0, localSettings.value.contextLength + direction * CONTEXT_LENGTH_STEP)
+  const committed = commitNumericField('contextLength', next)
+  if (committed === undefined) {
+    return
+  }
+  updateLocalGenerationSettings({ contextLength: committed })
+  resetNumericInputFieldState('contextLength')
+}
+
+function onContextLengthInput(value: string | number) {
+  setNumericInputDraft('contextLength', value)
 }
 
-function onMaxTokensSlider(values: number[]) {
-  const next = values[0]
-  if (!localSettings.value || typeof next !== 'number') {
+function commitContextLengthInput() {
+  const next = commitNumericField('contextLength', numericInputDrafts.value.contextLength)
+  if (next === undefined) {
     return
   }
-  updateLocalGenerationSettings({ maxTokens: Math.round(next) })
+  updateLocalGenerationSettings({ contextLength: next })
+  resetNumericInputFieldState('contextLength')
 }
 
-function onMaxTokensInput(value: string | number) {
+function stepMaxTokens(direction: -1 | 1) {
   if (!localSettings.value) {
     return
   }
-  const numeric = parseNumericInput(value)
-  if (numeric === undefined) {
+  if (hasNumericInputError('maxTokens')) {
+    return
+  }
+  const next = Math.max(0, localSettings.value.maxTokens + direction * MAX_TOKENS_STEP)
+  const committed = commitNumericField('maxTokens', next)
+  if (committed === undefined) {
+    return
+  }
+  updateLocalGenerationSettings({ maxTokens: committed })
+  resetNumericInputFieldState('maxTokens')
+}
+
+function onMaxTokensInput(value: string | number) {
+  setNumericInputDraft('maxTokens', value)
+}
+
+function commitMaxTokensInput() {
+  const next = commitNumericField('maxTokens', numericInputDrafts.value.maxTokens)
+  if (next === undefined) {
     return
   }
-  const next = clamp(Math.round(numeric), MAX_TOKENS_MIN, maxTokensSliderLimit.value)
   updateLocalGenerationSettings({ maxTokens: next })
+  resetNumericInputFieldState('maxTokens')
 }
 
-function onThinkingBudgetInput(value: string | number) {
+function onThinkingBudgetToggle(enabled: boolean) {
   if (!localSettings.value) {
     return
   }
-  const normalized = typeof value === 'string' ? value.trim() : String(value)
-  if (!normalized) {
+  if (!enabled) {
+    stopNumericInputEdit('thinkingBudget')
+    resetNumericInputFieldState('thinkingBudget')
     updateLocalGenerationSettings({ thinkingBudget: undefined })
     return
   }
 
-  const numeric = Number(normalized)
-  if (!Number.isFinite(numeric)) {
+  const preferred = normalizeLegacyThinkingBudgetValue(localSettings.value.thinkingBudget) ?? 0
+  updateLocalGenerationSettings({ thinkingBudget: preferred })
+  resetNumericInputFieldState('thinkingBudget')
+}
+
+function stepThinkingBudget(direction: -1 | 1) {
+  if (!localSettings.value) {
     return
   }
+  if (hasNumericInputError('thinkingBudget')) {
+    return
+  }
+  const current = localSettings.value.thinkingBudget ?? 0
+  const next = Math.max(0, current + direction * THINKING_BUDGET_STEP)
+  const committed = commitNumericField('thinkingBudget', next)
+  if (committed === undefined) {
+    return
+  }
+  updateLocalGenerationSettings({ thinkingBudget: committed })
+  resetNumericInputFieldState('thinkingBudget')
+}
 
-  const range = budgetRange.value
-  const budget = normalizeThinkingBudget(
-    capabilityReasoningPortrait.value,
-    Math.round(numeric),
-    range?.min,
-    range?.max
-  )
-  updateLocalGenerationSettings({ thinkingBudget: budget })
+function onThinkingBudgetInput(value: string | number) {
+  setNumericInputDraft('thinkingBudget', value)
+}
+
+function commitThinkingBudgetInput() {
+  const next = commitNumericField('thinkingBudget', numericInputDrafts.value.thinkingBudget)
+  if (next === undefined) {
+    return
+  }
+  updateLocalGenerationSettings({ thinkingBudget: next })
+  resetNumericInputFieldState('thinkingBudget')
 }
 
 function onReasoningEffortSelect(value: string) {
@@ -2304,7 +2545,19 @@ defineExpose({
   permissionMode,
   showSystemPromptSection,
   showReasoningEffort,
-  onTemperatureSlider,
+  onTemperatureInput,
+  commitTemperatureInput,
+  onContextLengthInput,
+  commitContextLengthInput,
+  onMaxTokensInput,
+  commitMaxTokensInput,
+  onThinkingBudgetInput,
+  commitThinkingBudgetInput,
+  onThinkingBudgetToggle,
+  stepTemperature,
+  stepContextLength,
+  stepMaxTokens,
+  stepThinkingBudget,
   selectModel: changeModelSelection,
   openModelSettings,
   isModelSettingsExpanded,
diff --git a/src/renderer/src/components/chat/PendingInputLane.vue b/src/renderer/src/components/chat/PendingInputLane.vue
new file mode 100644
index 000000000..00e8cc45d
--- /dev/null
+++ b/src/renderer/src/components/chat/PendingInputLane.vue
@@ -0,0 +1,328 @@
+<template>
+  <div v-if="showLane" class="w-full max-w-4xl" data-testid="pending-rail">
+    <div
+      class="rounded-xl border border-border/70 bg-card/55 px-2.5 py-2 shadow-sm backdrop-blur-lg"
+    >
+      <div class="mb-1.5 flex items-center justify-between gap-2" data-testid="pending-rail-header">
+        <div class="flex min-w-0 flex-wrap items-center gap-1.5">
+          <span
+            v-if="steerItems.length > 0"
+            class="inline-flex items-center rounded-full border border-border/60 bg-background/70 px-2 py-0.5 text-[11px] font-medium text-muted-foreground"
+          >
+            {{ t('chat.pendingInput.steer') }} {{ steerItems.length }}
+          </span>
+          <span
+            v-if="queueItems.length > 0"
+            class="inline-flex items-center rounded-full border border-border/60 bg-background/70 px-2 py-0.5 text-[11px] font-medium text-muted-foreground"
+          >
+            {{ t('chat.pendingInput.queueCount', { count: queueItems.length, max: activeLimit }) }}
+          </span>
+        </div>
+        <Button
+          v-if="showResumeQueue"
+          variant="ghost"
+          size="sm"
+          class="h-6 shrink-0 rounded-full px-2.5 text-[11px] text-muted-foreground"
+          @click="emit('resume-queue')"
+        >
+          {{ t('chat.pendingInput.resumeQueue') }}
+        </Button>
+      </div>
+
+      <div
+        :class="[
+          'space-y-1',
+          isScrollable ? `${listMaxHeightClass} overflow-y-auto pr-1` : 'overflow-visible'
+        ]"
+        data-testid="pending-rail-list"
+        :data-scrollable="isScrollable ? 'true' : 'false'"
+      >
+        <div
+          v-for="item in steerItems"
+          :key="item.id"
+          data-testid="pending-row"
+          data-mode="steer"
+          class="group flex items-center gap-1.5 rounded-lg border border-border/50 bg-background/65 px-1.5 py-1 transition hover:border-border/80 hover:bg-background/80"
+        >
+          <Icon
+            icon="lucide:corner-down-right"
+            class="h-3.5 w-3.5 shrink-0 text-muted-foreground/80"
+          />
+          <div class="min-w-0 flex-1">
+            <div
+              class="truncate text-[13px] leading-5 text-foreground"
+              :title="formatPayloadTitle(item)"
+            >
+              {{ formatPayloadText(item) }}
+            </div>
+          </div>
+          <div class="flex shrink-0 items-center gap-1">
+            <span
+              v-if="(item.payload.files?.length ?? 0) > 0"
+              class="inline-flex items-center rounded-full border border-border/60 bg-muted/35 px-1.5 py-0.5 text-[11px] leading-none text-muted-foreground"
+            >
+              {{ t('chat.pendingInput.files', { count: item.payload.files?.length ?? 0 }) }}
+            </span>
+            <span
+              class="inline-flex items-center rounded-full border border-border/60 bg-muted/45 px-1.5 py-0.5 text-[11px] leading-none text-muted-foreground"
+            >
+              {{ t('chat.pendingInput.locked') }}
+            </span>
+          </div>
+        </div>
+
+        <draggable
+          :list="localQueueItems"
+          item-key="id"
+          handle=".pending-input-drag"
+          :animation="150"
+          :disabled="Boolean(editingItemId)"
+          ghost-class="pending-input-ghost"
+          class="space-y-1"
+          @end="onDragEnd"
+        >
+          <template #item="{ element }">
+            <div
+              data-testid="pending-row"
+              data-mode="queue"
+              :data-editing="editingItemId === element.id ? 'true' : 'false'"
+              :class="[
+                'group rounded-lg border border-border/50 bg-background/65 px-1.5 transition hover:border-border/80 hover:bg-background/80 focus-within:border-border/80 focus-within:bg-background/80',
+                editingItemId === element.id ? 'py-2' : 'py-1'
+              ]"
+            >
+              <div
+                :class="
+                  editingItemId === element.id
+                    ? 'flex items-start gap-1.5'
+                    : 'flex items-center gap-1.5'
+                "
+              >
+                <button
+                  type="button"
+                  class="pending-input-drag inline-flex h-6 w-5 shrink-0 items-center justify-center rounded-md text-muted-foreground transition hover:bg-muted/80 hover:text-foreground"
+                  :title="t('chat.pendingInput.reorder')"
+                  :disabled="Boolean(editingItemId)"
+                >
+                  <Icon icon="lucide:grip-vertical" class="h-3.5 w-3.5" />
+                </button>
+
+                <div class="min-w-0 flex-1">
+                  <template v-if="editingItemId === element.id">
+                    <textarea
+                      v-model="editingText"
+                      data-testid="pending-edit-textarea"
+                      class="min-h-[88px] w-full resize-y rounded-lg border border-border bg-background px-3 py-2 text-sm text-foreground outline-none ring-0"
+                      @click.stop
+                      @keydown.enter.exact.prevent="saveEdit"
+                      @keydown.esc.stop.prevent="cancelEdit"
+                    />
+                    <div class="mt-2 flex items-center justify-between gap-2">
+                      <div class="text-xs text-muted-foreground">
+                        <span v-if="(element.payload.files?.length ?? 0) > 0">
+                          {{
+                            t('chat.pendingInput.files', {
+                              count: element.payload.files?.length ?? 0
+                            })
+                          }}
+                        </span>
+                      </div>
+                      <div class="flex items-center gap-1">
+                        <Button
+                          variant="ghost"
+                          size="sm"
+                          class="h-7 rounded-full px-2 text-xs"
+                          @click.stop="cancelEdit"
+                        >
+                          {{ t('common.cancel') }}
+                        </Button>
+                        <Button
+                          size="sm"
+                          class="h-7 rounded-full px-2 text-xs"
+                          :disabled="!canSaveEdit"
+                          @click.stop="saveEdit"
+                        >
+                          {{ t('common.save') }}
+                        </Button>
+                      </div>
+                    </div>
+                  </template>
+
+                  <button
+                    v-else
+                    type="button"
+                    data-testid="pending-row-main"
+                    class="block w-full min-w-0 rounded-md px-1 py-0.5 text-left outline-none transition hover:bg-muted/35 focus-visible:bg-muted/35"
+                    :title="formatPayloadTitle(element)"
+                    @click="beginEdit(element)"
+                  >
+                    <span class="block truncate text-[13px] leading-5 text-foreground">
+                      {{ formatPayloadText(element) }}
+                    </span>
+                  </button>
+                </div>
+
+                <div
+                  v-if="editingItemId !== element.id"
+                  class="flex shrink-0 items-center gap-1 opacity-70 transition group-hover:opacity-100 group-focus-within:opacity-100"
+                >
+                  <span
+                    v-if="(element.payload.files?.length ?? 0) > 0"
+                    class="inline-flex items-center rounded-full border border-border/60 bg-muted/35 px-1.5 py-0.5 text-[11px] leading-none text-muted-foreground"
+                  >
+                    {{
+                      t('chat.pendingInput.files', { count: element.payload.files?.length ?? 0 })
+                    }}
+                  </span>
+                  <Button
+                    variant="ghost"
+                    size="sm"
+                    class="h-6 rounded-full px-2 text-[11px] text-muted-foreground"
+                    :disabled="disableSteerAction"
+                    @click.stop="emit('convert-queue-to-steer', element.id)"
+                  >
+                    {{ t('chat.pendingInput.toSteer') }}
+                  </Button>
+                  <Button
+                    variant="ghost"
+                    size="icon"
+                    class="h-6 w-6 rounded-full text-muted-foreground"
+                    @click.stop="emit('delete-queue', element.id)"
+                  >
+                    <Icon icon="lucide:x" class="h-3.5 w-3.5" />
+                  </Button>
+                </div>
+              </div>
+            </div>
+          </template>
+        </draggable>
+      </div>
+
+      <div v-if="disableSteerAction" class="mt-1.5 text-[11px] text-muted-foreground">
+        {{ t('chat.pendingInput.limitReached', { max: activeLimit }) }}
+      </div>
+    </div>
+  </div>
+</template>
+
+<script setup lang="ts">
+import { computed, ref, watch } from 'vue'
+import draggable from 'vuedraggable'
+import { Icon } from '@iconify/vue'
+import { Button } from '@shadcn/components/ui/button'
+import { useI18n } from 'vue-i18n'
+import type { PendingSessionInputRecord } from '@shared/types/agent-interface'
+
+const props = withDefaults(
+  defineProps<{
+    steerItems: PendingSessionInputRecord[] // shown first as read-only rows with a "locked" badge
+    queueItems: PendingSessionInputRecord[] // editable, draggable rows below the steer rows
+    activeLimit?: number // `max` value interpolated into the queue-count and limit-reached texts
+    disableSteerAction?: boolean // disables the "to steer" buttons and shows the limit notice
+    showResumeQueue?: boolean // shows the header button that emits 'resume-queue'
+  }>(),
+  {
+    activeLimit: 5,
+    disableSteerAction: false,
+    showResumeQueue: false
+  }
+)
+
+const emit = defineEmits<{
+  'update-queue': [payload: { itemId: string; text: string }] // saveEdit: trimmed edited text
+  'move-queue': [payload: { itemId: string; toIndex: number }] // onDragEnd: row's new index
+  'convert-queue-to-steer': [itemId: string] // click on a queue row's "to steer" button
+  'delete-queue': [itemId: string] // click on a queue row's remove (x) button
+  'resume-queue': [] // click on the header resume button
+}>()
+const { t } = useI18n()
+
+const localQueueItems = ref<PendingSessionInputRecord[]>([]) // copy bound to <draggable>
+const editingItemId = ref<string | null>(null) // id of the queue row in edit mode, or null
+const editingText = ref('') // textarea draft for that row (v-model)
+
+const showLane = computed(() => props.steerItems.length > 0 || props.queueItems.length > 0)
+const totalItems = computed(() => props.steerItems.length + props.queueItems.length)
+const isScrollable = computed(() => totalItems.value > 3 || Boolean(editingItemId.value))
+const listMaxHeightClass = computed(() => (editingItemId.value ? 'max-h-[220px]' : 'max-h-[116px]'))
+const editingQueueItem = computed(
+  () => props.queueItems.find((item) => item.id === editingItemId.value) ?? null
+)
+// True while a row is being edited and its draft has text or the edited item carries files.
+const canSaveEdit = computed(() => {
+  if (!editingItemId.value) {
+    return false
+  }
+  const draftHasText = editingText.value.trim().length > 0
+  return draftHasText || (editingQueueItem.value?.payload.files?.length ?? 0) > 0
+})
+
+// Keep the draggable's local list in sync with props; close the editor if its item vanished.
+watch(
+  () => props.queueItems,
+  (incoming) => {
+    localQueueItems.value = [...incoming]
+    if (editingItemId.value && incoming.every((item) => item.id !== editingItemId.value)) {
+      cancelEdit()
+    }
+  },
+  { deep: true, immediate: true }
+)
+
+// Row label: trimmed text if any, else an attachment-count label, else the empty placeholder.
+function formatPayloadText(item: PendingSessionInputRecord): string {
+  const trimmed = item.payload.text?.trim()
+  if (trimmed) {
+    return trimmed
+  }
+  const attachments = item.payload.files?.length ?? 0
+  return attachments > 0
+    ? t('chat.pendingInput.attachmentsOnly', { count: attachments })
+    : t('chat.pendingInput.empty')
+}
+
+function formatPayloadTitle(item: PendingSessionInputRecord): string {
+  return formatPayloadText(item) // tooltip repeats the (truncated) row label in full
+}
+
+function beginEdit(item: PendingSessionInputRecord): void {
+  editingItemId.value = item.id // this row now renders the textarea instead of its label
+  editingText.value = item.payload.text ?? '' // seed the draft with the row's text, '' if absent
+}
+
+function cancelEdit(): void {
+  editingItemId.value = null // leave edit mode; no row is being edited
+  editingText.value = '' // discard the draft
+}
+
+// Emits 'update-queue' with the trimmed draft, then closes the editor; no-op when the result
+// would be empty. Enter that merely confirms an IME composition must not submit the edit.
+function saveEdit(event?: Event): void {
+  const itemId = editingItemId.value
+  const composing = event instanceof KeyboardEvent && event.isComposing
+  if (!itemId || composing) {
+    return
+  }
+  const text = editingText.value.trim()
+  const hasFiles = (editingQueueItem.value?.payload.files?.length ?? 0) > 0
+  if (text || hasFiles) {
+    emit('update-queue', { itemId, text })
+    cancelEdit()
+  }
+}
+
+// Drag-end handler for the queue list. Emits 'move-queue' with the id of the row now at the
+// drop index; does nothing when an index is missing or negative, when the row did not change
+// position, or when localQueueItems has no row at the drop index.
+function onDragEnd(event: { oldIndex?: number; newIndex?: number }): void {
+  const from = typeof event.oldIndex === 'number' ? event.oldIndex : -1
+  const to = typeof event.newIndex === 'number' ? event.newIndex : -1
+  const skip = from < 0 || to < 0 || from === to
+
+  // Look the row up by its post-drop position in the local list.
+  const dropped = skip ? undefined : localQueueItems.value[to]
+  if (dropped) {
+    emit('move-queue', { itemId: dropped.id, toIndex: to })
+  }
+}
+</script>
diff --git a/src/renderer/src/events.ts b/src/renderer/src/events.ts
index 5f72daa9b..31a452996 100644
--- a/src/renderer/src/events.ts
+++ b/src/renderer/src/events.ts
@@ -223,7 +223,8 @@ export const SESSION_EVENTS = {
   ACTIVATED: 'session:activated',
   DEACTIVATED: 'session:deactivated',
   STATUS_CHANGED: 'session:status-changed',
-  COMPACTION_UPDATED: 'session:compaction-updated'
+  COMPACTION_UPDATED: 'session:compaction-updated',
+  PENDING_INPUTS_UPDATED: 'session:pending-inputs-updated'
 }
 
 // 系统相关事件
diff --git a/src/renderer/src/i18n/da-DK/chat.json b/src/renderer/src/i18n/da-DK/chat.json
index 34a3381ba..3339f8593 100644
--- a/src/renderer/src/i18n/da-DK/chat.json
+++ b/src/renderer/src/i18n/da-DK/chat.json
@@ -35,6 +35,8 @@
     "agentWorkspaceTooltip": "Indstil agentens arbejdsmappe",
     "attach": "Vedhæft",
     "voiceInput": "Stemmeinput",
+    "queue": "Læg i kø",
+    "stop": "Stop",
     "mcp": {
       "badge": "MCP {count}",
       "title": "Aktiverede MCP'er",
@@ -57,6 +59,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "Styring",
+    "queueCount": "Afventer {count}/{max}",
+    "resumeQueue": "Fortsæt afsendelse",
+    "toSteer": "Brug til styring",
+    "locked": "Låst",
+    "reorder": "Omarranger",
+    "files": "{count} filer",
+    "attachmentsOnly": "{count} vedhæftede filer",
+    "empty": "Tom besked",
+    "limitReached": "Venteområdet er fuldt (maks. {max})."
+  },
   "mcpUi": {
     "badge": "UI",
     "collapse": "Skjul",
@@ -126,7 +140,16 @@
     "verbosity": "Detaljegrad",
     "verbosityPlaceholder": "Vælg detaljegrad",
     "currentCustomPrompt": "Aktuel brugerdefineret",
-    "useDefault": "Brug standard"
+    "useDefault": "Brug standard",
+    "decreaseValue": "Reducer {label}",
+    "increaseValue": "Øg {label}",
+    "toggleValue": "Slå {label} til eller fra",
+    "validation": {
+      "finiteNumber": "Skal være et endeligt tal",
+      "nonNegativeInteger": "Skal være et ikke-negativt heltal",
+      "contextLengthAtLeastMaxTokens": "Skal være større end eller lig med maksimumtokens",
+      "maxTokensWithinContextLength": "Skal være mindre end eller lig med kontekstlængden"
+    }
   },
   "workspace": {
     "collapse": "tæt",
diff --git a/src/renderer/src/i18n/en-US/chat.json b/src/renderer/src/i18n/en-US/chat.json
index 32a50d727..ee74f6ef2 100644
--- a/src/renderer/src/i18n/en-US/chat.json
+++ b/src/renderer/src/i18n/en-US/chat.json
@@ -6,6 +6,8 @@
     "functionSwitch": "Function Switch",
     "attach": "Attach",
     "voiceInput": "Voice input",
+    "queue": "Queue",
+    "stop": "Stop",
     "fileSelect": "Select File",
     "pasteFiles": "Paste files from clipboard",
     "dropFiles": "Drop files here",
@@ -50,6 +52,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "Steer",
+    "queueCount": "Queued {count}/{max}",
+    "resumeQueue": "Resume sending",
+    "toSteer": "Steer",
+    "locked": "Locked",
+    "reorder": "Reorder",
+    "files": "{count} files",
+    "attachmentsOnly": "{count} attachments",
+    "empty": "Empty message",
+    "limitReached": "Waiting lane is full (max {max})."
+  },
   "features": {
     "webSearch": "Web Search",
     "thoughtForSeconds": "Thought for {seconds}s",
@@ -130,7 +144,16 @@
     "verbosity": "Verbosity",
     "verbosityPlaceholder": "Select verbosity",
     "currentCustomPrompt": "Current custom",
-    "useDefault": "Use default"
+    "useDefault": "Use default",
+    "decreaseValue": "Decrease {label}",
+    "increaseValue": "Increase {label}",
+    "toggleValue": "Toggle {label}",
+    "validation": {
+      "finiteNumber": "Must be a finite number",
+      "nonNegativeInteger": "Must be a non-negative integer",
+      "contextLengthAtLeastMaxTokens": "Must be greater than or equal to Max Tokens",
+      "maxTokensWithinContextLength": "Must be less than or equal to Context Length"
+    }
   },
   "modelPicker": {
     "empty": "No models found"
diff --git a/src/renderer/src/i18n/fa-IR/chat.json b/src/renderer/src/i18n/fa-IR/chat.json
index 2f3a19056..5a2099a36 100644
--- a/src/renderer/src/i18n/fa-IR/chat.json
+++ b/src/renderer/src/i18n/fa-IR/chat.json
@@ -28,6 +28,8 @@
     "agentWorkspaceTooltip": "دایرکتوری کاری عامل را تنظیم کنید",
     "attach": "پیوست",
     "voiceInput": "ورودی صوتی",
+    "queue": "افزودن به صف",
+    "stop": "توقف",
     "mcp": {
       "badge": "MCP {count}",
       "title": "MCPهای فعال",
@@ -50,6 +52,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "هدایت",
+    "queueCount": "در انتظار ارسال {count}/{max}",
+    "resumeQueue": "ادامه ارسال",
+    "toSteer": "تبدیل به هدایت",
+    "locked": "قفل‌شده",
+    "reorder": "تغییر ترتیب",
+    "files": "{count} فایل",
+    "attachmentsOnly": "{count} پیوست",
+    "empty": "پیام خالی",
+    "limitReached": "بخش انتظار پر است (حداکثر {max})."
+  },
   "features": {
     "webSearch": "جستجوی وب",
     "artifactThinking": "تفکر مصنوعی",
@@ -126,7 +140,16 @@
     "verbosity": "میزان جزئیات پاسخ",
     "verbosityPlaceholder": "سطح جزئیات را انتخاب کنید",
     "currentCustomPrompt": "سفارشی فعلی",
-    "useDefault": "استفاده از پیش‌فرض"
+    "useDefault": "استفاده از پیش‌فرض",
+    "decreaseValue": "کاهش {label}",
+    "increaseValue": "افزایش {label}",
+    "toggleValue": "روشن یا خاموش کردن {label}",
+    "validation": {
+      "finiteNumber": "باید یک عدد متناهی باشد",
+      "nonNegativeInteger": "باید یک عدد صحیح نامنفی باشد",
+      "contextLengthAtLeastMaxTokens": "باید بزرگ‌تر یا مساوی حداکثر توکن‌ها باشد",
+      "maxTokensWithinContextLength": "باید کوچک‌تر یا مساوی طول زمینه باشد"
+    }
   },
   "workspace": {
     "collapse": "بستن",
diff --git a/src/renderer/src/i18n/fr-FR/chat.json b/src/renderer/src/i18n/fr-FR/chat.json
index ce30a2d5d..824fc2e00 100644
--- a/src/renderer/src/i18n/fr-FR/chat.json
+++ b/src/renderer/src/i18n/fr-FR/chat.json
@@ -28,6 +28,8 @@
     "agentWorkspaceTooltip": "Définir le répertoire de travail de l'agent",
     "attach": "Joindre",
     "voiceInput": "Saisie vocale",
+    "queue": "Ajouter à la file",
+    "stop": "Arrêter",
     "mcp": {
       "badge": "MCP {count}",
       "title": "MCP activés",
@@ -50,6 +52,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "Guidage",
+    "queueCount": "En attente {count}/{max}",
+    "resumeQueue": "Reprendre l'envoi",
+    "toSteer": "Guider",
+    "locked": "Verrouillé",
+    "reorder": "Réorganiser",
+    "files": "{count} fichiers",
+    "attachmentsOnly": "{count} pièces jointes",
+    "empty": "Message vide",
+    "limitReached": "La zone d'attente est pleine (max. {max})."
+  },
   "features": {
     "webSearch": "Recherche web",
     "artifactThinking": "Réflexion sur les artefacts",
@@ -126,7 +140,16 @@
     "verbosity": "Niveau de détail",
     "verbosityPlaceholder": "Sélectionner un niveau de détail",
     "currentCustomPrompt": "Personnalisé actuel",
-    "useDefault": "Utiliser la valeur par défaut"
+    "useDefault": "Utiliser la valeur par défaut",
+    "decreaseValue": "Réduire {label}",
+    "increaseValue": "Augmenter {label}",
+    "toggleValue": "Activer ou désactiver {label}",
+    "validation": {
+      "finiteNumber": "Doit être un nombre fini",
+      "nonNegativeInteger": "Doit être un entier positif ou nul",
+      "contextLengthAtLeastMaxTokens": "Doit être supérieur ou égal au nombre maximal de tokens",
+      "maxTokensWithinContextLength": "Doit être inférieur ou égal à la longueur de contexte"
+    }
   },
   "workspace": {
     "collapse": "fermer",
diff --git a/src/renderer/src/i18n/he-IL/chat.json b/src/renderer/src/i18n/he-IL/chat.json
index 137784adb..4d6f59c12 100644
--- a/src/renderer/src/i18n/he-IL/chat.json
+++ b/src/renderer/src/i18n/he-IL/chat.json
@@ -28,6 +28,8 @@
     "agentWorkspaceTooltip": "הגדר את ספריית העבודה של הסוכן",
     "attach": "צרף",
     "voiceInput": "קלט קולי",
+    "queue": "הוסף לתור",
+    "stop": "עצור",
     "mcp": {
       "badge": "MCP {count}",
       "title": "MCP פעילים",
@@ -50,6 +52,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "הכוונה",
+    "queueCount": "ממתין לשליחה {count}/{max}",
+    "resumeQueue": "המשך שליחה",
+    "toSteer": "הפוך להכוונה",
+    "locked": "נעול",
+    "reorder": "שנה סדר",
+    "files": "{count} קבצים",
+    "attachmentsOnly": "{count} קבצים מצורפים",
+    "empty": "הודעה ריקה",
+    "limitReached": "אזור ההמתנה מלא (מקסימום {max})."
+  },
   "features": {
     "webSearch": "חיפוש אינטרנט",
     "thoughtForSeconds": "חשב במשך {seconds} שניות",
@@ -126,7 +140,16 @@
     "verbosity": "רמת פירוט",
     "verbosityPlaceholder": "בחר רמת פירוט",
     "currentCustomPrompt": "מותאם נוכחי",
-    "useDefault": "השתמש בברירת מחדל"
+    "useDefault": "השתמש בברירת מחדל",
+    "decreaseValue": "הקטן את {label}",
+    "increaseValue": "הגדל את {label}",
+    "toggleValue": "הפעל או כבה את {label}",
+    "validation": {
+      "finiteNumber": "חייב להיות מספר סופי",
+      "nonNegativeInteger": "חייב להיות מספר שלם לא שלילי",
+      "contextLengthAtLeastMaxTokens": "חייב להיות גדול או שווה למספר הטוקנים המרבי",
+      "maxTokensWithinContextLength": "חייב להיות קטן או שווה לאורך ההקשר"
+    }
   },
   "workspace": {
     "collapse": "לִסְגוֹר",
diff --git a/src/renderer/src/i18n/ja-JP/chat.json b/src/renderer/src/i18n/ja-JP/chat.json
index df73ec1af..365283938 100644
--- a/src/renderer/src/i18n/ja-JP/chat.json
+++ b/src/renderer/src/i18n/ja-JP/chat.json
@@ -28,6 +28,8 @@
     "agentWorkspaceTooltip": "エージェントの作業ディレクトリを設定する",
     "attach": "添付",
     "voiceInput": "音声入力",
+    "queue": "キューに追加",
+    "stop": "停止",
     "mcp": {
       "badge": "MCP {count}",
       "title": "有効な MCP",
@@ -50,6 +52,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "誘導",
+    "queueCount": "送信待ち {count}/{max}",
+    "resumeQueue": "送信を再開",
+    "toSteer": "誘導にする",
+    "locked": "ロック済み",
+    "reorder": "並べ替え",
+    "files": "{count} 件のファイル",
+    "attachmentsOnly": "{count} 件の添付ファイル",
+    "empty": "空のメッセージ",
+    "limitReached": "待機レーンがいっぱいです（最大{max}件）。"
+  },
   "features": {
     "webSearch": "ウェブ検索",
     "artifactThinking": "アーティファクト思考",
@@ -126,7 +140,16 @@
     "verbosity": "回答の詳しさ",
     "verbosityPlaceholder": "詳しさを選択",
     "currentCustomPrompt": "現在のカスタム",
-    "useDefault": "デフォルトを使用"
+    "useDefault": "デフォルトを使用",
+    "decreaseValue": "{label}を減らす",
+    "increaseValue": "{label}を増やす",
+    "toggleValue": "{label}のオン・オフを切り替える",
+    "validation": {
+      "finiteNumber": "有限の数値である必要があります",
+      "nonNegativeInteger": "0以上の整数である必要があります",
+      "contextLengthAtLeastMaxTokens": "最大トークン数以上である必要があります",
+      "maxTokensWithinContextLength": "コンテキスト長以下である必要があります"
+    }
   },
   "workspace": {
     "collapse": "近い",
diff --git a/src/renderer/src/i18n/ko-KR/chat.json b/src/renderer/src/i18n/ko-KR/chat.json
index 1cd8082dc..4b63d96ba 100644
--- a/src/renderer/src/i18n/ko-KR/chat.json
+++ b/src/renderer/src/i18n/ko-KR/chat.json
@@ -28,6 +28,8 @@
     "agentWorkspaceTooltip": "에이전트 작업 디렉터리 설정",
     "attach": "첨부",
     "voiceInput": "음성 입력",
+    "queue": "대기열에 추가",
+    "stop": "중지",
     "mcp": {
       "badge": "MCP {count}",
       "title": "활성화된 MCP",
@@ -50,6 +52,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "유도",
+    "queueCount": "전송 대기 {count}/{max}",
+    "resumeQueue": "전송 계속",
+    "toSteer": "유도로 전환",
+    "locked": "잠금됨",
+    "reorder": "순서 변경",
+    "files": "파일 {count}개",
+    "attachmentsOnly": "첨부 {count}개",
+    "empty": "빈 메시지",
+    "limitReached": "대기 영역이 가득 찼습니다 (최대 {max}개)."
+  },
   "features": {
     "webSearch": "웹 검색",
     "artifactThinking": "아티팩트 추론",
@@ -126,7 +140,16 @@
     "verbosity": "응답 상세도",
     "verbosityPlaceholder": "상세도 선택",
     "currentCustomPrompt": "현재 사용자 지정",
-    "useDefault": "기본값 사용"
+    "useDefault": "기본값 사용",
+    "decreaseValue": "{label} 줄이기",
+    "increaseValue": "{label} 늘리기",
+    "toggleValue": "{label} 켜기 또는 끄기",
+    "validation": {
+      "finiteNumber": "유한한 숫자여야 합니다",
+      "nonNegativeInteger": "0 이상의 정수여야 합니다",
+      "contextLengthAtLeastMaxTokens": "최대 출력 이상이어야 합니다",
+      "maxTokensWithinContextLength": "컨텍스트 길이 이하여야 합니다"
+    }
   },
   "workspace": {
     "collapse": "닫다",
diff --git a/src/renderer/src/i18n/pt-BR/chat.json b/src/renderer/src/i18n/pt-BR/chat.json
index 79302df78..f3b12b31e 100644
--- a/src/renderer/src/i18n/pt-BR/chat.json
+++ b/src/renderer/src/i18n/pt-BR/chat.json
@@ -28,6 +28,8 @@
     "agentWorkspaceTooltip": "Definir diretório de trabalho do agente",
     "attach": "Anexar",
     "voiceInput": "Entrada de voz",
+    "queue": "Enfileirar",
+    "stop": "Parar",
     "mcp": {
       "badge": "MCP {count}",
       "title": "MCPs habilitados",
@@ -50,6 +52,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "Direcionamento",
+    "queueCount": "Pendentes {count}/{max}",
+    "resumeQueue": "Retomar envio",
+    "toSteer": "Direcionar",
+    "locked": "Bloqueado",
+    "reorder": "Reordenar",
+    "files": "{count} arquivos",
+    "attachmentsOnly": "{count} anexos",
+    "empty": "Mensagem vazia",
+    "limitReached": "A área de espera está cheia (máx. {max})."
+  },
   "features": {
     "webSearch": "Busca na Web",
     "thoughtForSeconds": "Pensou por {seconds}s",
@@ -126,7 +140,16 @@
     "verbosity": "Nível de detalhe",
     "verbosityPlaceholder": "Selecione o nível de detalhe",
     "currentCustomPrompt": "Personalização atual",
-    "useDefault": "Usar padrão"
+    "useDefault": "Usar padrão",
+    "decreaseValue": "Diminuir {label}",
+    "increaseValue": "Aumentar {label}",
+    "toggleValue": "Ativar ou desativar {label}",
+    "validation": {
+      "finiteNumber": "Deve ser um número finito",
+      "nonNegativeInteger": "Deve ser um inteiro não negativo",
+      "contextLengthAtLeastMaxTokens": "Deve ser maior ou igual ao Máximo de saída",
+      "maxTokensWithinContextLength": "Deve ser menor ou igual ao Tamanho de contexto"
+    }
   },
   "workspace": {
     "collapse": "fechar",
diff --git a/src/renderer/src/i18n/ru-RU/chat.json b/src/renderer/src/i18n/ru-RU/chat.json
index 565806c7c..f58097653 100644
--- a/src/renderer/src/i18n/ru-RU/chat.json
+++ b/src/renderer/src/i18n/ru-RU/chat.json
@@ -28,6 +28,8 @@
     "agentWorkspaceTooltip": "Установить рабочий каталог агента",
     "attach": "Прикрепить",
     "voiceInput": "Голосовой ввод",
+    "queue": "В очередь",
+    "stop": "Стоп",
     "mcp": {
       "badge": "MCP {count}",
       "title": "Включённые MCP",
@@ -50,6 +52,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "Направление",
+    "queueCount": "В ожидании {count}/{max}",
+    "resumeQueue": "Продолжить отправку",
+    "toSteer": "Направить",
+    "locked": "Зафиксировано",
+    "reorder": "Изменить порядок",
+    "files": "{count} файлов",
+    "attachmentsOnly": "{count} вложений",
+    "empty": "Пустое сообщение",
+    "limitReached": "Область ожидания заполнена (макс. {max})."
+  },
   "features": {
     "webSearch": "Поиск в интернете",
     "artifactThinking": "Артефакт мышление",
@@ -126,7 +140,16 @@
     "verbosity": "Детализация ответа",
     "verbosityPlaceholder": "Выберите уровень детализации",
     "currentCustomPrompt": "Текущий пользовательский",
-    "useDefault": "Использовать по умолчанию"
+    "useDefault": "Использовать по умолчанию",
+    "decreaseValue": "Уменьшить {label}",
+    "increaseValue": "Увеличить {label}",
+    "toggleValue": "Включить или выключить {label}",
+    "validation": {
+      "finiteNumber": "Должно быть конечным числом",
+      "nonNegativeInteger": "Должно быть неотрицательным целым числом",
+      "contextLengthAtLeastMaxTokens": "Должно быть больше или равно максимальному числу токенов",
+      "maxTokensWithinContextLength": "Должно быть меньше или равно длине контекста"
+    }
   },
   "workspace": {
     "collapse": "закрывать",
diff --git a/src/renderer/src/i18n/zh-CN/chat.json b/src/renderer/src/i18n/zh-CN/chat.json
index 989c3b5e1..d138acdee 100644
--- a/src/renderer/src/i18n/zh-CN/chat.json
+++ b/src/renderer/src/i18n/zh-CN/chat.json
@@ -6,6 +6,8 @@
     "functionSwitch": "功能开关",
     "attach": "添加附件",
     "voiceInput": "语音输入",
+    "queue": "加入队列",
+    "stop": "停止",
     "fileSelect": "选择文件",
     "pasteFiles": "支持复制粘贴文件",
     "dropFiles": "拖拽文件到此处",
@@ -50,6 +52,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "引导",
+    "queueCount": "待发 {count}/{max}",
+    "resumeQueue": "继续发送",
+    "toSteer": "转为引导",
+    "locked": "已锁定",
+    "reorder": "调整顺序",
+    "files": "{count} 个文件",
+    "attachmentsOnly": "{count} 个附件",
+    "empty": "空消息",
+    "limitReached": "等待区已满（最多 {max} 条）。"
+  },
   "features": {
     "webSearch": "联网搜索",
     "thoughtForSeconds": "思考了 {seconds} 秒",
@@ -130,7 +144,16 @@
     "verbosity": "回答详略",
     "verbosityPlaceholder": "选择详略级别",
     "currentCustomPrompt": "当前自定义",
-    "useDefault": "使用默认值"
+    "useDefault": "使用默认值",
+    "decreaseValue": "减少 {label}",
+    "increaseValue": "增加 {label}",
+    "toggleValue": "切换 {label}",
+    "validation": {
+      "finiteNumber": "必须是有限数字",
+      "nonNegativeInteger": "必须是非负整数",
+      "contextLengthAtLeastMaxTokens": "必须大于或等于最大输出",
+      "maxTokensWithinContextLength": "必须小于或等于上下文长度"
+    }
   },
   "modelPicker": {
     "empty": "未找到模型"
diff --git a/src/renderer/src/i18n/zh-HK/chat.json b/src/renderer/src/i18n/zh-HK/chat.json
index 340f9c78c..272795609 100644
--- a/src/renderer/src/i18n/zh-HK/chat.json
+++ b/src/renderer/src/i18n/zh-HK/chat.json
@@ -28,6 +28,8 @@
     "agentWorkspaceTooltip": "設置 Agent 工作目錄",
     "attach": "添加附件",
     "voiceInput": "語音輸入",
+    "queue": "加入佇列",
+    "stop": "停止",
     "mcp": {
       "badge": "MCP {count}",
       "title": "已啟用 MCP",
@@ -50,6 +52,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "引導",
+    "queueCount": "待發 {count}/{max}",
+    "resumeQueue": "繼續發送",
+    "toSteer": "轉為引導",
+    "locked": "已鎖定",
+    "reorder": "調整順序",
+    "files": "{count} 個文件",
+    "attachmentsOnly": "{count} 個附件",
+    "empty": "空訊息",
+    "limitReached": "等待區已滿（最多 {max} 條）。"
+  },
   "features": {
     "webSearch": "網絡搜索",
     "artifactThinking": "artifact 思考",
@@ -130,7 +144,16 @@
     "verbosity": "回答詳略",
     "verbosityPlaceholder": "選擇詳略等級",
     "currentCustomPrompt": "目前自訂",
-    "useDefault": "使用預設值"
+    "useDefault": "使用預設值",
+    "decreaseValue": "減少 {label}",
+    "increaseValue": "增加 {label}",
+    "toggleValue": "切換 {label}",
+    "validation": {
+      "finiteNumber": "必須是有限數字",
+      "nonNegativeInteger": "必須是非負整數",
+      "contextLengthAtLeastMaxTokens": "必須大於或等於最大輸出",
+      "maxTokensWithinContextLength": "必須小於或等於上下文長度"
+    }
   },
   "workspace": {
     "collapse": "收起",
diff --git a/src/renderer/src/i18n/zh-TW/chat.json b/src/renderer/src/i18n/zh-TW/chat.json
index 00974b715..7526e84d5 100644
--- a/src/renderer/src/i18n/zh-TW/chat.json
+++ b/src/renderer/src/i18n/zh-TW/chat.json
@@ -28,6 +28,8 @@
     "agentWorkspaceTooltip": "設置 Agent 工作目錄",
     "attach": "新增附件",
     "voiceInput": "語音輸入",
+    "queue": "加入佇列",
+    "stop": "停止",
     "mcp": {
       "badge": "MCP {count}",
       "title": "已啟用 MCP",
@@ -50,6 +52,18 @@
       }
     }
   },
+  "pendingInput": {
+    "steer": "引導",
+    "queueCount": "待發 {count}/{max}",
+    "resumeQueue": "繼續發送",
+    "toSteer": "轉為引導",
+    "locked": "已鎖定",
+    "reorder": "調整順序",
+    "files": "{count} 個檔案",
+    "attachmentsOnly": "{count} 個附件",
+    "empty": "空訊息",
+    "limitReached": "等待區已滿（最多 {max} 條）。"
+  },
   "features": {
     "webSearch": "網路搜尋",
     "artifactThinking": "Artifact 思考",
@@ -130,7 +144,16 @@
     "verbosity": "回答詳略",
     "verbosityPlaceholder": "選擇詳略等級",
     "currentCustomPrompt": "目前自訂",
-    "useDefault": "使用預設值"
+    "useDefault": "使用預設值",
+    "decreaseValue": "減少 {label}",
+    "increaseValue": "增加 {label}",
+    "toggleValue": "切換 {label}",
+    "validation": {
+      "finiteNumber": "必須是有限數字",
+      "nonNegativeInteger": "必須是非負整數",
+      "contextLengthAtLeastMaxTokens": "必須大於或等於最大輸出",
+      "maxTokensWithinContextLength": "必須小於或等於上下文長度"
+    }
   },
   "workspace": {
     "collapse": "收起",
diff --git a/src/renderer/src/pages/ChatPage.vue b/src/renderer/src/pages/ChatPage.vue
index 0d5fee63f..1c50d8a76 100644
--- a/src/renderer/src/pages/ChatPage.vue
+++ b/src/renderer/src/pages/ChatPage.vue
@@ -33,7 +33,19 @@
             :processing="isHandlingInteraction"
             @respond="onToolInteractionRespond"
           />
-          <template v-else>
+          <PendingInputLane
+            :steer-items="pendingInputStore.steerItems"
+            :queue-items="pendingInputStore.queueItems"
+            :disable-steer-action="pendingInputStore.isAtCapacity"
+            :show-resume-queue="showResumePendingQueue"
+            class="mb-1.5"
+            @update-queue="onPendingInputUpdate"
+            @move-queue="onPendingInputMove"
+            @convert-queue-to-steer="onPendingInputConvert"
+            @delete-queue="onPendingInputDelete"
+            @resume-queue="onResumePendingQueue"
+          />
+          <template v-if="!activePendingInteraction">
             <ChatInputBox
               ref="chatInputRef"
               v-model="message"
@@ -50,7 +62,8 @@
               <template #toolbar>
                 <ChatInputToolbar
                   :is-generating="isGenerating"
-                  :send-disabled="isAcpWorkdirMissing || !message.trim()"
+                  :has-input="hasDraftInput"
+                  :send-disabled="isQueueSubmitDisabled"
                   @attach="onAttach"
                   @send="onSubmit"
                   @stop="onStop"
@@ -79,11 +92,13 @@ import type {
 } from '@/components/chat/messageListItems'
 import ChatInputBox from '@/components/chat/ChatInputBox.vue'
 import ChatInputToolbar from '@/components/chat/ChatInputToolbar.vue'
+import PendingInputLane from '@/components/chat/PendingInputLane.vue'
 import ChatStatusBar from '@/components/chat/ChatStatusBar.vue'
 import ChatToolInteractionOverlay from '@/components/chat/ChatToolInteractionOverlay.vue'
 import TraceDialog from '@/components/trace/TraceDialog.vue'
 import { useSessionStore } from '@/stores/ui/session'
 import { useMessageStore } from '@/stores/ui/message'
+import { usePendingInputStore } from '@/stores/ui/pendingInput'
 import { useModelStore } from '@/stores/modelStore'
 import { usePresenter } from '@/composables/usePresenter'
 import type {
@@ -100,6 +115,7 @@ const props = defineProps<{
 
 const sessionStore = useSessionStore()
 const messageStore = useMessageStore()
+const pendingInputStore = usePendingInputStore()
 const modelStore = useModelStore()
 const newAgentPresenter = usePresenter('newAgentPresenter')
 const { t } = useI18n()
@@ -116,7 +132,6 @@ const isAcpWorkdirMissing = computed(() => {
   }
   return !activeSession.projectDir?.trim()
 })
-const isInputSubmitDisabled = computed(() => isAcpWorkdirMissing.value || isGenerating.value)
 
 // --- Auto-scroll ---
 const scrollContainer = ref<HTMLDivElement>()
@@ -143,10 +158,12 @@ watch(
   () => props.sessionId,
   async (id) => {
     if (id) {
-      await messageStore.loadMessages(id)
+      await Promise.all([messageStore.loadMessages(id), pendingInputStore.loadPendingInputs(id)])
       await nextTick()
       scrollToBottom()
+      return
     }
+    pendingInputStore.clear()
   },
   { immediate: true }
 )
@@ -391,31 +408,97 @@ const pendingInteractions = computed<PendingInteractionView[]>(() => {
 })
 
 const activePendingInteraction = computed(() => pendingInteractions.value[0] ?? null)
+// True when an assistant message newer than the latest user message holds a
+// question_request block that is marked as replied but carries no string answerText.
+const isAwaitingToolQuestionFollowUp = computed(() => {
+  let latestUserOrderSeq = 0
+
+  for (const message of messageStore.messages) {
+    if (message.role === 'user') {
+      latestUserOrderSeq = Math.max(latestUserOrderSeq, message.orderSeq)
+    }
+  }
+
+  return messageStore.messages.some((message) => {
+    if (message.role !== 'assistant' || message.orderSeq <= latestUserOrderSeq) {
+      return false
+    }
+
+    return parseAssistantBlocks(message.content).some(
+      (block) =>
+        block.type === 'action' &&
+        block.action_type === 'question_request' &&
+        block.status === 'success' &&
+        block.extra?.needsUserAction === false &&
+        block.extra?.questionResolution === 'replied' &&
+        typeof block.extra?.answerText !== 'string'
+    )
+  })
+})
+const hasInputText = computed(() => Boolean(message.value.trim()))
+const hasAttachments = computed(() => attachedFiles.value.length > 0)
+// A draft can be submitted when it has text or at least one attachment.
+const hasDraftInput = computed(() => hasInputText.value || hasAttachments.value)
+const isQueueSubmitDisabled = computed(
+  () =>
+    isAcpWorkdirMissing.value ||
+    !hasDraftInput.value ||
+    Boolean(activePendingInteraction.value) ||
+    isHandlingInteraction.value ||
+    pendingInputStore.isAtCapacity
+)
+// Evaluates the same conditions as isQueueSubmitDisabled.
+const isInputSubmitDisabled = computed(
+  () =>
+    isAcpWorkdirMissing.value ||
+    Boolean(activePendingInteraction.value) ||
+    isHandlingInteraction.value ||
+    pendingInputStore.isAtCapacity ||
+    !hasDraftInput.value
+)
+// Show the resume-queue control only while idle: nothing generating, no pending
+// interaction or question follow-up, and at least one queued item.
+const showResumePendingQueue = computed(
+  () =>
+    !isGenerating.value &&
+    !activePendingInteraction.value &&
+    !isAwaitingToolQuestionFollowUp.value &&
+    pendingInputStore.queueItems.length > 0
+)
+// True while a draft is being handed to the pending-input store; guards re-entrant submits.
+const isQueueingDraft = ref(false)
 
 async function onSubmit() {
-  if (isGenerating.value) return
   if (isAcpWorkdirMissing.value) return
   if (activePendingInteraction.value || isHandlingInteraction.value) return
+  // The draft stays in the input until queueing succeeds, so a second submit during the
+  // await would queue the same text and files again.
+  if (isQueueingDraft.value) return
   const text = message.value.trim()
-  if (!text) return
   const files = [...attachedFiles.value]
+  if (!text && files.length === 0) return
+  isQueueingDraft.value = true
+  try {
+    await pendingInputStore.queueInput(props.sessionId, { text, files })
+  } finally {
+    isQueueingDraft.value = false
+  }
   message.value = ''
   attachedFiles.value = []
-  messageStore.addOptimisticUserMessage(props.sessionId, text, files)
-  await sessionStore.sendMessage(props.sessionId, { text, files })
 }
 
 async function onCommandSubmit(command: string) {
-  if (isGenerating.value) return
   if (isAcpWorkdirMissing.value) return
   if (activePendingInteraction.value || isHandlingInteraction.value) return
+  if (isQueueingDraft.value) return
   const text = command.trim()
   if (!text) return
 
   const files = [...attachedFiles.value]
+  isQueueingDraft.value = true
+  try {
+    await pendingInputStore.queueInput(props.sessionId, { text, files })
+  } finally {
+    isQueueingDraft.value = false
+  }
   attachedFiles.value = []
-  messageStore.addOptimisticUserMessage(props.sessionId, text, files)
-  await sessionStore.sendMessage(props.sessionId, { text, files })
 }
 
 function onAttach() {
@@ -519,11 +583,40 @@ function onMessageTrace(messageId: string) {
   traceMessageId.value = messageId
 }
 
+async function onPendingInputUpdate(payload: { itemId: string; text: string }) {
+  const target = pendingInputStore.queueItems.find((item) => item.id === payload.itemId)
+  if (!target) {
+    return
+  }
+
+  await pendingInputStore.updateQueueInput(props.sessionId, payload.itemId, {
+    text: payload.text,
+    files: target.payload.files ?? []
+  })
+}
+
+async function onPendingInputMove(payload: { itemId: string; toIndex: number }) {
+  await pendingInputStore.moveQueueInput(props.sessionId, payload.itemId, payload.toIndex)
+}
+
+async function onPendingInputConvert(itemId: string) {
+  await pendingInputStore.convertToSteer(props.sessionId, itemId)
+}
+
+async function onPendingInputDelete(itemId: string) {
+  await pendingInputStore.deleteInput(props.sessionId, itemId)
+}
+
+async function onResumePendingQueue() {
+  await pendingInputStore.resumeQueue(props.sessionId)
+}
+
 onMounted(() => {
   window.addEventListener('context-menu-ask-ai', handleContextMenuAskAI)
 })
 
 onUnmounted(() => {
   window.removeEventListener('context-menu-ask-ai', handleContextMenuAskAI)
+  pendingInputStore.clear()
 })
 </script>
diff --git a/src/renderer/src/stores/ui/pendingInput.ts b/src/renderer/src/stores/ui/pendingInput.ts
new file mode 100644
index 000000000..342aaa4ba
--- /dev/null
+++ b/src/renderer/src/stores/ui/pendingInput.ts
@@ -0,0 +1,205 @@
+import { computed, onScopeDispose, ref } from 'vue'
+import { defineStore } from 'pinia'
+import { usePresenter } from '@/composables/usePresenter'
+import { SESSION_EVENTS } from '@/events'
+import type { PendingSessionInputRecord, SendMessageInput } from '@shared/types/agent-interface'
+
+/** Pending-input count (steer + queue) at which `isAtCapacity` becomes true. */
+const MAX_PENDING_INPUTS = 5
+
+/**
+ * Renderer store holding the pending inputs of the one session it currently tracks.
+ *
+ * All mutations are delegated to `newAgentPresenter`. Results are written into `items`
+ * only while the mutated session is still the tracked one, so a reply that arrives after
+ * a session switch cannot overwrite the list of the newly opened session. Mutating
+ * actions store a message in `error` and rethrow the failure.
+ */
+export const usePendingInputStore = defineStore('pendingInput', () => {
+  const newAgentPresenter = usePresenter('newAgentPresenter')
+
+  const currentSessionId = ref<string | null>(null)
+  const items = ref<PendingSessionInputRecord[]>([])
+  const loading = ref(false)
+  const error = ref<string | null>(null)
+
+  const steerItems = computed(() => items.value.filter((item) => item.mode === 'steer'))
+  // filter() yields a fresh array, so sorting it in place never mutates `items`.
+  // Entries without a queueOrder are ordered as if it were 0.
+  const queueItems = computed(() =>
+    items.value
+      .filter((item) => item.mode === 'queue')
+      .sort((left, right) => (left.queueOrder ?? 0) - (right.queueOrder ?? 0))
+  )
+  const activeCount = computed(() => items.value.length)
+  const isAtCapacity = computed(() => activeCount.value >= MAX_PENDING_INPUTS)
+
+  /** Whether `sessionId` is the session this store is currently tracking. */
+  function isCurrentSession(sessionId: string): boolean {
+    return currentSessionId.value === sessionId
+  }
+
+  /**
+   * Starts tracking `sessionId` and replaces `items` with its pending inputs.
+   * A result or failure that arrives after another session became current is ignored.
+   */
+  async function loadPendingInputs(sessionId: string): Promise<void> {
+    const requestedId = sessionId
+    currentSessionId.value = requestedId
+    loading.value = true
+    error.value = null
+    try {
+      const loadedItems = await newAgentPresenter.listPendingInputs(requestedId)
+      if (requestedId !== currentSessionId.value) {
+        return
+      }
+      items.value = loadedItems
+    } catch (e) {
+      if (requestedId !== currentSessionId.value) {
+        return
+      }
+      error.value = `Failed to load pending inputs: ${e}`
+    } finally {
+      if (requestedId === currentSessionId.value) {
+        loading.value = false
+      }
+    }
+  }
+
+  /** Queues `input` for `sessionId`, then reloads the list if that session is tracked. */
+  async function queueInput(sessionId: string, input: string | SendMessageInput): Promise<void> {
+    error.value = null
+    try {
+      await newAgentPresenter.queuePendingInput(sessionId, input)
+      if (isCurrentSession(sessionId)) {
+        await loadPendingInputs(sessionId)
+      }
+    } catch (e) {
+      error.value = `Failed to queue message: ${e}`
+      throw e
+    }
+  }
+
+  /** Replaces the content of a queued item and refreshes the tracked list. */
+  async function updateQueueInput(
+    sessionId: string,
+    itemId: string,
+    input: string | SendMessageInput
+  ): Promise<void> {
+    error.value = null
+    try {
+      const updated = await newAgentPresenter.updateQueuedInput(sessionId, itemId, input)
+      // The tracked session may have changed while awaiting; leave its list alone then.
+      if (!isCurrentSession(sessionId)) {
+        return
+      }
+      items.value = items.value.map((item) => (item.id === updated.id ? updated : item))
+      await loadPendingInputs(sessionId)
+    } catch (e) {
+      error.value = `Failed to update queued message: ${e}`
+      throw e
+    }
+  }
+
+  /** Moves a queued item to `toIndex` and adopts the list returned by the presenter. */
+  async function moveQueueInput(sessionId: string, itemId: string, toIndex: number): Promise<void> {
+    error.value = null
+    try {
+      const reordered = await newAgentPresenter.moveQueuedInput(sessionId, itemId, toIndex)
+      // Never install another session's list over the one currently displayed.
+      if (isCurrentSession(sessionId)) {
+        items.value = reordered
+      }
+    } catch (e) {
+      error.value = `Failed to reorder queued message: ${e}`
+      throw e
+    }
+  }
+
+  /** Converts a queued item into a steer item and refreshes the tracked list. */
+  async function convertToSteer(sessionId: string, itemId: string): Promise<void> {
+    error.value = null
+    try {
+      const updated = await newAgentPresenter.convertPendingInputToSteer(sessionId, itemId)
+      if (!isCurrentSession(sessionId)) {
+        return
+      }
+      items.value = items.value.map((item) => (item.id === updated.id ? updated : item))
+      await loadPendingInputs(sessionId)
+    } catch (e) {
+      error.value = `Failed to convert queued message to steer: ${e}`
+      throw e
+    }
+  }
+
+  /** Deletes a pending item and drops it from the tracked list. */
+  async function deleteInput(sessionId: string, itemId: string): Promise<void> {
+    error.value = null
+    try {
+      await newAgentPresenter.deletePendingInput(sessionId, itemId)
+      if (isCurrentSession(sessionId)) {
+        items.value = items.value.filter((item) => item.id !== itemId)
+      }
+    } catch (e) {
+      error.value = `Failed to delete queued message: ${e}`
+      throw e
+    }
+  }
+
+  /** Asks the presenter to resume the queue, then reloads the list if still tracked. */
+  async function resumeQueue(sessionId: string): Promise<void> {
+    error.value = null
+    try {
+      await newAgentPresenter.resumePendingQueue(sessionId)
+      if (isCurrentSession(sessionId)) {
+        await loadPendingInputs(sessionId)
+      }
+    } catch (e) {
+      error.value = `Failed to resume queue: ${e}`
+      throw e
+    }
+  }
+
+  /** Stops tracking any session and resets all state. */
+  function clear(): void {
+    currentSessionId.value = null
+    items.value = []
+    loading.value = false
+    error.value = null
+  }
+
+  // Reload only when the update event names the session currently being tracked.
+  const pendingInputsHandler = (_: unknown, msg: { sessionId: string }) => {
+    if (!msg?.sessionId || msg.sessionId !== currentSessionId.value) {
+      return
+    }
+    void loadPendingInputs(msg.sessionId)
+  }
+
+  window.electron.ipcRenderer.on(SESSION_EVENTS.PENDING_INPUTS_UPDATED, pendingInputsHandler)
+  onScopeDispose(() => {
+    window.electron.ipcRenderer.removeListener(
+      SESSION_EVENTS.PENDING_INPUTS_UPDATED,
+      pendingInputsHandler
+    )
+  })
+
+  return {
+    currentSessionId,
+    items,
+    loading,
+    error,
+    steerItems,
+    queueItems,
+    activeCount,
+    isAtCapacity,
+    loadPendingInputs,
+    queueInput,
+    updateQueueInput,
+    moveQueueInput,
+    convertToSteer,
+    deleteInput,
+    resumeQueue,
+    clear
+  }
+})
diff --git a/src/renderer/src/stores/ui/session.ts b/src/renderer/src/stores/ui/session.ts
index 0eacf4234..58cb56b91 100644
--- a/src/renderer/src/stores/ui/session.ts
+++ b/src/renderer/src/stores/ui/session.ts
@@ -6,7 +6,6 @@ import { SESSION_EVENTS } from '@/events'
 import type {
   SessionWithState,
   CreateSessionInput,
-  MessageFile,
   SendMessageInput
 } from '@shared/types/agent-interface'
 import { downloadBlob } from '@/lib/download'
@@ -202,14 +201,6 @@ export const useSessionStore = defineStore('session', () => {
       const session = await newAgentPresenter.createSession(input, webContentsId)
       activeSessionId.value = session.id
 
-      if (input.message?.trim()) {
-        messageStore.addOptimisticUserMessage(
-          session.id,
-          input.message,
-          (input.files ?? []) as MessageFile[]
-        )
-      }
-
       await fetchSessions()
       pageRouter.goToChat(session.id)
     } catch (e) {
diff --git a/src/shared/types/agent-interface.d.ts b/src/shared/types/agent-interface.d.ts
index a849ce5d1..3166b2919 100644
--- a/src/shared/types/agent-interface.d.ts
+++ b/src/shared/types/agent-interface.d.ts
@@ -59,6 +59,26 @@ export interface IAgentImplementation {
     context?: { projectDir?: string | null; emitRefreshBeforeStream?: boolean }
   ): Promise<void>
 
+  /** Manage waiting lane (pending) inputs; every member is optional, so check before calling. */
+  listPendingInputs?(sessionId: string): Promise<PendingSessionInputRecord[]>
+  queuePendingInput?(
+    sessionId: string,
+    content: string | SendMessageInput
+  ): Promise<PendingSessionInputRecord>
+  updateQueuedInput?(
+    sessionId: string,
+    itemId: string,
+    content: string | SendMessageInput
+  ): Promise<PendingSessionInputRecord>
+  moveQueuedInput?(
+    sessionId: string,
+    itemId: string,
+    toIndex: number
+  ): Promise<PendingSessionInputRecord[]>
+  convertPendingInputToSteer?(sessionId: string, itemId: string): Promise<PendingSessionInputRecord>
+  deletePendingInput?(sessionId: string, itemId: string): Promise<void>
+  resumePendingQueue?(sessionId: string): Promise<void>
+
   /** Cancel an in-progress generation */
   cancelGeneration(sessionId: string): Promise<void>
 
@@ -166,6 +186,22 @@ export interface SendMessageInput {
   files?: MessageFile[]
 }
 
+export type PendingSessionInputMode = 'queue' | 'steer' // lane the pending input belongs to
+export type PendingSessionInputState = 'pending' | 'claimed' | 'consumed' // lifecycle state
+/** One pending session input: its lane (mode), lifecycle state, message payload and timestamps. */
+export interface PendingSessionInputRecord {
+  id: string
+  sessionId: string
+  mode: PendingSessionInputMode
+  state: PendingSessionInputState
+  payload: SendMessageInput
+  queueOrder: number | null // NOTE(review): presumably null when the input has no queue position — confirm
+  claimedAt: number | null // NOTE(review): presumably a timestamp, null while unclaimed — confirm
+  consumedAt: number | null // NOTE(review): presumably a timestamp, null until consumed — confirm
+  createdAt: number
+  updatedAt: number
+}
+
 export type AssistantBlockType =
   | 'content'
   | 'search'
diff --git a/src/shared/types/presenters/new-agent.presenter.d.ts b/src/shared/types/presenters/new-agent.presenter.d.ts
index 3b96710ac..9e35bf0ba 100644
--- a/src/shared/types/presenters/new-agent.presenter.d.ts
+++ b/src/shared/types/presenters/new-agent.presenter.d.ts
@@ -8,6 +8,7 @@ import type {
   SessionGenerationSettings,
   SessionCompactionState,
   LegacyImportStatus,
+  PendingSessionInputRecord,
   SendMessageInput,
   ToolInteractionResponse,
   ToolInteractionResult,
@@ -23,6 +24,24 @@ export interface INewAgentPresenter {
     projectDir: string
     permissionMode?: PermissionMode
   }): Promise<SessionWithState>
+  listPendingInputs(sessionId: string): Promise<PendingSessionInputRecord[]> // pending-input API
+  queuePendingInput(
+    sessionId: string,
+    content: string | SendMessageInput
+  ): Promise<PendingSessionInputRecord>
+  updateQueuedInput(
+    sessionId: string,
+    itemId: string,
+    content: string | SendMessageInput
+  ): Promise<PendingSessionInputRecord>
+  moveQueuedInput(
+    sessionId: string,
+    itemId: string,
+    toIndex: number
+  ): Promise<PendingSessionInputRecord[]> // NOTE(review): presumably the reordered list — confirm
+  convertPendingInputToSteer(sessionId: string, itemId: string): Promise<PendingSessionInputRecord>
+  deletePendingInput(sessionId: string, itemId: string): Promise<void>
+  resumePendingQueue(sessionId: string): Promise<void>
   sendMessage(sessionId: string, content: string | SendMessageInput): Promise<void>
   retryMessage(sessionId: string, messageId: string): Promise<void>
   deleteMessage(sessionId: string, messageId: string): Promise<void>
diff --git a/src/shared/utils/generationSettingsValidation.ts b/src/shared/utils/generationSettingsValidation.ts
new file mode 100644
index 000000000..b1cd514d8
--- /dev/null
+++ b/src/shared/utils/generationSettingsValidation.ts
@@ -0,0 +1,76 @@
+import type { SessionGenerationSettings } from '../types/agent-interface'
+/** Names of the numeric generation settings that validateGenerationNumericField accepts. */
+export type GenerationNumericField =
+  | 'temperature'
+  | 'contextLength'
+  | 'maxTokens'
+  | 'thinkingBudget'
+/** Machine-readable reason returned when a numeric generation setting fails validation. */
+export type GenerationNumericValidationCode =
+  | 'finite_number'
+  | 'non_negative_integer'
+  | 'context_length_below_max_tokens'
+  | 'max_tokens_exceed_context_length'
+/** The two settings whose values are validated against each other. */
+type GenerationRelationContext = Pick<SessionGenerationSettings, 'contextLength' | 'maxTokens'>
+/** Returns `value` as a finite number (numbers and numeric strings only), otherwise undefined. */
+export const parseFiniteNumericValue = (value: unknown): number | undefined => {
+  if (typeof value === 'number') {
+    return Number.isFinite(value) ? value : undefined
+  }
+  // Anything that is neither a number nor a string is rejected outright.
+  if (typeof value !== 'string') {
+    return undefined
+  }
+  // Blank or whitespace-only strings are rejected; Number('') would otherwise yield 0.
+  const normalized = value.trim()
+  if (!normalized) {
+    return undefined
+  }
+  // Number() converts the whole string, so input such as '12px' becomes NaN and is rejected.
+  const numeric = Number(normalized)
+  return Number.isFinite(numeric) ? numeric : undefined
+}
+/** Type guard: true only for a number that is a finite integer greater than or equal to zero. */
+export const isNonNegativeInteger = (value: unknown): value is number =>
+  typeof value === 'number' && Number.isFinite(value) && Number.isInteger(value) && value >= 0
+/** Parses `value` with parseFiniteNumericValue and keeps it only if it is a non-negative integer. */
+export const toValidNonNegativeInteger = (value: unknown): number | undefined => {
+  const numeric = parseFiniteNumericValue(value)
+  return isNonNegativeInteger(numeric) ? numeric : undefined
+}
+/** Alias of toValidNonNegativeInteger for thinking-budget values; e.g. -1 becomes undefined. */
+export const normalizeLegacyThinkingBudgetValue = (value: unknown): number | undefined =>
+  toValidNonNegativeInteger(value)
+/** Validates one numeric setting; returns a failure code, or null when the value is acceptable. */
+export const validateGenerationNumericField = (
+  field: GenerationNumericField,
+  value: unknown,
+  context: Partial<GenerationRelationContext> = {}
+): GenerationNumericValidationCode | null => {
+  const numeric = parseFiniteNumericValue(value)
+  // Temperature only needs to be a finite number; it may be fractional or negative.
+  if (field === 'temperature') {
+    return numeric === undefined ? 'finite_number' : null
+  }
+  // Every other field must be a non-negative integer.
+  if (!isNonNegativeInteger(numeric)) {
+    return 'non_negative_integer'
+  }
+  // Cross-field rule, applied only when context.maxTokens is itself a non-negative integer.
+  if (field === 'contextLength') {
+    const maxTokens = context.maxTokens
+    if (isNonNegativeInteger(maxTokens) && numeric < maxTokens) {
+      return 'context_length_below_max_tokens'
+    }
+  }
+  // Mirror rule, applied only when context.contextLength is itself a non-negative integer.
+  if (field === 'maxTokens') {
+    const contextLength = context.contextLength
+    if (isNonNegativeInteger(contextLength) && numeric > contextLength) {
+      return 'max_tokens_exceed_context_length'
+    }
+  }
+  // No rule was violated.
+  return null
+}
diff --git a/test/main/lib/agentRuntime/processTree.test.ts b/test/main/lib/agentRuntime/processTree.test.ts
new file mode 100644
index 000000000..53a5bc7bb
--- /dev/null
+++ b/test/main/lib/agentRuntime/processTree.test.ts
@@ -0,0 +1,184 @@
+import { EventEmitter } from 'events'
+import { afterEach, describe, expect, it, vi } from 'vitest'
+// Replace child_process.spawn with a mock function so the tests control every spawned helper.
+vi.mock('child_process', () => ({
+  spawn: vi.fn()
+}))
+
+import { spawn } from 'child_process'
+import { terminateProcessTree } from '../../../../src/main/lib/agentRuntime/processTree'
+/** Fake spawned process: on the next microtask emits optional stdout data, then 'close'. */
+class MockSpawnedProcess extends EventEmitter {
+  stdout = new EventEmitter()
+  stderr = null
+  stdin = null
+  // Emission is deferred, presumably so listeners attached right after spawn() still see it.
+  constructor(stdoutData = '') {
+    super()
+    queueMicrotask(() => {
+      if (stdoutData) {
+        this.stdout.emit('data', Buffer.from(stdoutData, 'utf-8'))
+      }
+      this.emit('close')
+    })
+  }
+}
+/** Fake child process handed to terminateProcessTree: an EventEmitter with pid and exit fields. */
+class MockChildProcess extends EventEmitter {
+  pid: number
+  exitCode: number | null = null
+  signalCode: NodeJS.Signals | null = null
+  // The tests set signalCode and emit 'close' themselves to simulate the process exiting.
+  constructor(pid: number) {
+    super()
+    this.pid = pid
+  }
+}
+
+describe('terminateProcessTree', () => {
+  const originalPlatform = Object.getOwnPropertyDescriptor(process, 'platform')
+  const originalKill = process.kill
+  // Undo fake timers, mocks, and the process.platform / process.kill overrides after every test.
+  afterEach(() => {
+    vi.useRealTimers()
+    vi.restoreAllMocks()
+    if (originalPlatform) {
+      Object.defineProperty(process, 'platform', originalPlatform)
+    }
+    process.kill = originalKill
+  })
+  // Windows path: the tree is terminated with one `taskkill /PID <pid> /T /F` invocation.
+  it('uses taskkill /T /F on Windows', async () => {
+    Object.defineProperty(process, 'platform', {
+      configurable: true,
+      value: 'win32'
+    })
+
+    vi.mocked(spawn).mockImplementation(() => {
+      // MockSpawnedProcess already schedules its own 'close' event in the constructor, so the
+      // fake taskkill process does not need a second, manually queued emission.
+      return new MockSpawnedProcess() as never
+    })
+
+    const child = new MockChildProcess(321)
+    queueMicrotask(() => {
+      child.signalCode = 'SIGTERM'
+      child.emit('close', null, 'SIGTERM')
+    })
+
+    await expect(terminateProcessTree(child as never, { graceMs: 10 })).resolves.toBe(true)
+    expect(spawn).toHaveBeenCalledWith('taskkill', ['/PID', '321', '/T', '/F'], {
+      stdio: 'ignore'
+    })
+  })
+  // Unix happy path: SIGTERM goes to the process group (-pid), then SIGKILL once graceMs elapses.
+  it('kills Unix process groups before escalating to SIGKILL', async () => {
+    vi.useFakeTimers()
+    Object.defineProperty(process, 'platform', {
+      configurable: true,
+      value: 'linux'
+    })
+    // Fake process.kill: the target only "exits" after the group receives SIGKILL.
+    process.kill = vi.fn(((_pid: number, signal?: NodeJS.Signals) => {
+      if (_pid === -654 && signal === 'SIGKILL') {
+        queueMicrotask(() => {
+          target.signalCode = 'SIGKILL'
+          target.emit('close', null, 'SIGKILL')
+        })
+      }
+      return true
+    }) as typeof process.kill)
+    // `target` is declared after the mock above; that is safe because kill() runs only later.
+    const target = new MockChildProcess(654)
+    const termination = terminateProcessTree(target as never, { graceMs: 10 })
+    // Advance the fake clock by the 10 ms grace period so the SIGKILL escalation can happen.
+    await vi.advanceTimersByTimeAsync(10)
+    await expect(termination).resolves.toBe(true)
+
+    expect(spawn).not.toHaveBeenCalled()
+    expect(process.kill).toHaveBeenNthCalledWith(1, -654, 'SIGTERM')
+    expect(process.kill).toHaveBeenNthCalledWith(2, -654, 'SIGKILL')
+  })
+  // Fallback path: group signaling throws ESRCH, so descendants found via pgrep are killed singly.
+  it('falls back to recursively killing descendants when Unix process-group signaling fails', async () => {
+    vi.useFakeTimers()
+    Object.defineProperty(process, 'platform', {
+      configurable: true,
+      value: 'linux'
+    })
+    // Fake pgrep output describes the chain 777 -> 778 -> 779; 779 reports no children.
+    vi.mocked(spawn).mockImplementation((command, args) => {
+      if (command === 'pgrep') {
+        const parentPid = args[1]
+        if (parentPid === '777') {
+          return new MockSpawnedProcess('778\n') as never
+        }
+        if (parentPid === '778') {
+          return new MockSpawnedProcess('779\n') as never
+        }
+        return new MockSpawnedProcess() as never
+      }
+
+      return new MockSpawnedProcess() as never
+    })
+    // Signaling the group (-777) always throws; only SIGKILL on pid 777 itself closes the target.
+    process.kill = vi.fn(((pid: number, signal?: NodeJS.Signals) => {
+      if (pid === -777) {
+        const error = new Error('group not found') as NodeJS.ErrnoException
+        error.code = 'ESRCH'
+        throw error
+      }
+
+      if (pid === 777 && signal === 'SIGKILL') {
+        queueMicrotask(() => {
+          target.signalCode = 'SIGKILL'
+          target.emit('close', null, 'SIGKILL')
+        })
+      }
+
+      return true
+    }) as typeof process.kill)
+
+    const target = new MockChildProcess(777)
+    const termination = terminateProcessTree(target as never, { graceMs: 10 })
+
+    await vi.advanceTimersByTimeAsync(10)
+    await expect(termination).resolves.toBe(true)
+    // Each phase tries the group first, then signals the root pid directly.
+    expect(process.kill).toHaveBeenNthCalledWith(1, -777, 'SIGTERM')
+    expect(process.kill).toHaveBeenNthCalledWith(2, 777, 'SIGTERM')
+    expect(process.kill).toHaveBeenNthCalledWith(3, -777, 'SIGKILL')
+    expect(process.kill).toHaveBeenNthCalledWith(4, 777, 'SIGKILL')
+    // Descendants are discovered top-down with pgrep and killed deepest-first (779 before 778).
+    expect(spawn).toHaveBeenNthCalledWith(1, 'pgrep', ['-P', '777'], {
+      stdio: ['ignore', 'pipe', 'ignore']
+    })
+    expect(spawn).toHaveBeenNthCalledWith(2, 'pgrep', ['-P', '778'], {
+      stdio: ['ignore', 'pipe', 'ignore']
+    })
+    expect(spawn).toHaveBeenNthCalledWith(3, 'pgrep', ['-P', '779'], {
+      stdio: ['ignore', 'pipe', 'ignore']
+    })
+    expect(spawn).toHaveBeenNthCalledWith(4, 'kill', ['-TERM', '779'], {
+      stdio: 'ignore'
+    })
+    expect(spawn).toHaveBeenNthCalledWith(5, 'kill', ['-TERM', '778'], {
+      stdio: 'ignore'
+    })
+    expect(spawn).toHaveBeenNthCalledWith(6, 'pgrep', ['-P', '777'], {
+      stdio: ['ignore', 'pipe', 'ignore']
+    })
+    expect(spawn).toHaveBeenNthCalledWith(7, 'pgrep', ['-P', '778'], {
+      stdio: ['ignore', 'pipe', 'ignore']
+    })
+    expect(spawn).toHaveBeenNthCalledWith(8, 'pgrep', ['-P', '779'], {
+      stdio: ['ignore', 'pipe', 'ignore']
+    })
+    expect(spawn).toHaveBeenNthCalledWith(9, 'kill', ['-KILL', '779'], {
+      stdio: 'ignore'
+    })
+    expect(spawn).toHaveBeenNthCalledWith(10, 'kill', ['-KILL', '778'], {
+      stdio: 'ignore'
+    })
+  })
+})
diff --git a/test/main/presenter/agentPresenter/acp/agentBashHandler.test.ts b/test/main/presenter/agentPresenter/acp/agentBashHandler.test.ts
index af9fcfbb8..07ed95469 100644
--- a/test/main/presenter/agentPresenter/acp/agentBashHandler.test.ts
+++ b/test/main/presenter/agentPresenter/acp/agentBashHandler.test.ts
@@ -1,8 +1,11 @@
+import path from 'path'
 import { afterEach, describe, expect, it, vi } from 'vitest'
 import { backgroundExecSessionManager } from '../../../../../src/main/lib/agentRuntime/backgroundExecSessionManager'
 import { AgentBashHandler } from '../../../../../src/main/presenter/agentPresenter/acp/agentBashHandler'
 
 describe('AgentBashHandler', () => {
+  const workspaceRoot = path.resolve('/workspace')
+
   afterEach(() => {
     vi.restoreAllMocks()
   })
@@ -23,12 +26,14 @@ describe('AgentBashHandler', () => {
     const runShellProcess = vi
       .spyOn(handler as never, 'runShellProcess' as never)
       .mockResolvedValueOnce({
+        kind: 'completed',
         output: 'Error: rtk find does not support compound predicates or actions',
         exitCode: 2,
         timedOut: false,
         offloaded: false
       })
       .mockResolvedValueOnce({
+        kind: 'completed',
         output: './src/main.ts\n./src/App.vue\n',
         exitCode: 0,
         timedOut: false,
@@ -44,14 +49,14 @@ describe('AgentBashHandler', () => {
     expect(runShellProcess).toHaveBeenNthCalledWith(
       1,
       'rtk find . -type f -name "*.ts" -o -name "*.vue" | grep "^./src"',
-      '/workspace',
+      workspaceRoot,
       120000,
       expect.objectContaining({ env: { PATH: '/bin' } })
     )
     expect(runShellProcess).toHaveBeenNthCalledWith(
       2,
       originalCommand,
-      '/workspace',
+      workspaceRoot,
       120000,
       expect.objectContaining({ env: { PATH: '/bin' } })
     )
@@ -79,6 +84,7 @@ describe('AgentBashHandler', () => {
     const runShellProcess = vi
       .spyOn(handler as never, 'runShellProcess' as never)
       .mockResolvedValue({
+        kind: 'completed',
         output: 'permission denied',
         exitCode: 2,
         timedOut: false,
@@ -113,6 +119,7 @@ describe('AgentBashHandler', () => {
     const runShellProcess = vi
       .spyOn(handler as never, 'runShellProcess' as never)
       .mockResolvedValue({
+        kind: 'completed',
         output: 'Error: rtk find does not support compound predicates or actions',
         exitCode: null,
         timedOut: true,
@@ -162,10 +169,15 @@ describe('AgentBashHandler', () => {
     )
 
     expect(runShellProcess).not.toHaveBeenCalled()
-    expect(startSpy).toHaveBeenCalledWith('conv-1', originalCommand, '/workspace', {
-      timeout: 120000,
-      env: { PATH: '/bin' }
-    })
+    expect(startSpy).toHaveBeenCalledWith(
+      'conv-1',
+      originalCommand,
+      workspaceRoot,
+      expect.objectContaining({
+        timeout: 120000,
+        env: { PATH: '/bin' }
+      })
+    )
     expect(result.output).toEqual({ status: 'running', sessionId: 'bg_123' })
     expect(result.rtkApplied).toBe(false)
     expect(result.rtkMode).toBe('bypass')
@@ -173,4 +185,143 @@ describe('AgentBashHandler', () => {
       'Bypassed RTK rewrite: unsupported find compound predicates or actions'
     )
   })
+  // A foreground exec still running after yieldMs returns { status: 'running', sessionId }.
+  it('returns a running session when foreground exec exceeds yieldMs', async () => {
+    const handler = new AgentBashHandler(['/workspace'])
+
+    vi.spyOn(handler as never, 'prepareCommand' as never).mockResolvedValue({
+      originalCommand: 'bun run dev caps gpt-4o',
+      command: 'bun run dev caps gpt-4o',
+      env: { PATH: '/bin' },
+      rewritten: false,
+      rtkApplied: false,
+      rtkMode: 'bypass'
+    })
+    // The session manager is stubbed to report that the command outlived the yield window.
+    const startSpy = vi
+      .spyOn(backgroundExecSessionManager, 'start')
+      .mockResolvedValue({ sessionId: 'bg_yield', status: 'running' })
+    const waitSpy = vi
+      .spyOn(backgroundExecSessionManager, 'waitForCompletionOrYield')
+      .mockResolvedValue({ kind: 'running', sessionId: 'bg_yield' })
+    const writeSpy = vi.spyOn(backgroundExecSessionManager, 'write').mockImplementation(() => {})
+    const removeSpy = vi.spyOn(backgroundExecSessionManager, 'remove').mockResolvedValue()
+
+    const result = await handler.executeCommand(
+      {
+        command: 'bun run dev caps gpt-4o',
+        description: 'Start dev server',
+        yieldMs: 250
+      },
+      {
+        conversationId: 'conv-1'
+      }
+    )
+    // NOTE(review): write(..., '', true) presumably sends empty data with eof to close stdin — confirm.
+    expect(writeSpy).toHaveBeenCalledWith('conv-1', 'bg_yield', '', true)
+    expect(startSpy).toHaveBeenCalledWith(
+      'conv-1',
+      'bun run dev caps gpt-4o',
+      workspaceRoot,
+      expect.objectContaining({
+        timeout: 120000,
+        env: { PATH: '/bin' }
+      })
+    )
+    expect(waitSpy).toHaveBeenCalledWith('conv-1', 'bg_yield', 250)
+    expect(removeSpy).not.toHaveBeenCalled()
+    expect(result.output).toEqual({ status: 'running', sessionId: 'bg_yield' })
+  })
+  // A command that completes inside the yield window returns its output; the session is removed.
+  it('cleans up completed foreground sessions that finish inside the yield window', async () => {
+    const handler = new AgentBashHandler(['/workspace'])
+
+    vi.spyOn(handler as never, 'prepareCommand' as never).mockResolvedValue({
+      originalCommand: 'pnpm test --help',
+      command: 'pnpm test --help',
+      env: { PATH: '/bin' },
+      rewritten: false,
+      rtkApplied: false,
+      rtkMode: 'bypass'
+    })
+
+    vi.spyOn(backgroundExecSessionManager, 'start').mockResolvedValue({
+      sessionId: 'bg_done',
+      status: 'running'
+    })
+    const writeSpy = vi.spyOn(backgroundExecSessionManager, 'write').mockImplementation(() => {})
+    vi.spyOn(backgroundExecSessionManager, 'waitForCompletionOrYield').mockResolvedValue({
+      kind: 'completed',
+      result: {
+        status: 'done',
+        output: 'usage',
+        exitCode: 0,
+        offloaded: false,
+        timedOut: false
+      }
+    })
+    const removeSpy = vi.spyOn(backgroundExecSessionManager, 'remove').mockResolvedValue()
+
+    const result = await handler.executeCommand(
+      {
+        command: 'pnpm test --help',
+        description: 'Show help'
+      },
+      {
+        conversationId: 'conv-1'
+      }
+    )
+    // Output was not offloaded (offloaded: false), so the finished session is expected to be removed.
+    expect(writeSpy).toHaveBeenCalledWith('conv-1', 'bg_done', '', true)
+    expect(removeSpy).toHaveBeenCalledWith('conv-1', 'bg_done')
+    expect(result.output).toContain('usage')
+    expect(result.output).toContain('Exit Code: 0')
+  })
+  // When output was offloaded to a file, the completed session is kept rather than removed.
+  it('keeps completed foreground sessions when output was offloaded', async () => {
+    const handler = new AgentBashHandler(['/workspace'])
+
+    vi.spyOn(handler as never, 'prepareCommand' as never).mockResolvedValue({
+      originalCommand: 'pnpm test --reporter=json',
+      command: 'pnpm test --reporter=json',
+      env: { PATH: '/bin' },
+      rewritten: false,
+      rtkApplied: false,
+      rtkMode: 'bypass'
+    })
+
+    vi.spyOn(backgroundExecSessionManager, 'start').mockResolvedValue({
+      sessionId: 'bg_offloaded',
+      status: 'running'
+    })
+    vi.spyOn(backgroundExecSessionManager, 'waitForCompletionOrYield').mockResolvedValue({
+      kind: 'completed',
+      result: {
+        status: 'done',
+        output: 'last lines',
+        exitCode: 0,
+        offloaded: true,
+        outputFilePath: '/tmp/bgexec_bg_offloaded.log',
+        timedOut: false
+      }
+    })
+    const writeSpy = vi.spyOn(backgroundExecSessionManager, 'write').mockImplementation(() => {})
+    const removeSpy = vi.spyOn(backgroundExecSessionManager, 'remove').mockResolvedValue()
+
+    const result = await handler.executeCommand(
+      {
+        command: 'pnpm test --reporter=json',
+        description: 'Run tests'
+      },
+      {
+        conversationId: 'conv-1'
+      }
+    )
+    // The session is kept (presumably so the offloaded log stays reachable) and its path is reported.
+    expect(writeSpy).toHaveBeenCalledWith('conv-1', 'bg_offloaded', '', true)
+    expect(removeSpy).not.toHaveBeenCalled()
+    expect(result.output).toContain('last lines')
+    expect(result.output).toContain('Exit Code: 0')
+    expect(result.output).toContain('Output offloaded: /tmp/bgexec_bg_offloaded.log')
+  })
 })
diff --git a/test/main/presenter/agentPresenter/acp/backgroundExecSessionManager.test.ts b/test/main/presenter/agentPresenter/acp/backgroundExecSessionManager.test.ts
index c7f649ed3..5da43d700 100644
--- a/test/main/presenter/agentPresenter/acp/backgroundExecSessionManager.test.ts
+++ b/test/main/presenter/agentPresenter/acp/backgroundExecSessionManager.test.ts
@@ -33,6 +33,7 @@ describe('BackgroundExecSessionManager', () => {
   })
 
   afterEach(() => {
+    vi.useRealTimers()
     vi.restoreAllMocks()
     ;(manager as never).sessions.clear()
   })
@@ -55,6 +56,7 @@ describe('BackgroundExecSessionManager', () => {
     closePromise: Promise.resolve(),
     resolveClose: () => {},
     closeSettled: true,
+    timedOut: false,
     ...overrides
   })
 
@@ -123,4 +125,93 @@ describe('BackgroundExecSessionManager', () => {
       })
     }
   })
+  // A session that is already 'done' resolves as kind 'completed' with a snapshot of its result.
+  it('waits for completion and returns a completion snapshot before cleanup', async () => {
+    const session = createSession({
+      status: 'done',
+      outputBuffer: 'build complete'
+    })
+    setSession(session)
+
+    const result = await manager.waitForCompletionOrYield('conv-1', 'bg_123', 10)
+
+    expect(result).toEqual({
+      kind: 'completed',
+      result: {
+        status: 'done',
+        output: 'build complete',
+        exitCode: null,
+        offloaded: true,
+        outputFilePath: '/mock/session/bgexec_bg_123.log',
+        timedOut: false
+      }
+    })
+  })
+  // A session that has not closed when the yield window ends is reported as still running.
+  it('returns running when the session outlives the yield window', async () => {
+    vi.useFakeTimers()
+    // closePromise never settles, so only the yield timer can finish the wait.
+    const session = createSession({
+      status: 'running',
+      closePromise: new Promise<void>(() => {})
+    })
+    setSession(session)
+
+    const resultPromise = manager.waitForCompletionOrYield('conv-1', 'bg_123', 10)
+    await vi.advanceTimersByTimeAsync(10)
+
+    await expect(resultPromise).resolves.toEqual({
+      kind: 'running',
+      sessionId: 'bg_123'
+    })
+  })
+  // If the session closes before the yield window ends, the pending yield timer must be cleared.
+  it('clears the yield timer when the session closes before the yield window elapses', async () => {
+    vi.useFakeTimers()
+
+    const clearTimeoutSpy = vi.spyOn(globalThis, 'clearTimeout')
+    const session = createSession({
+      status: 'running',
+      outputBuffer: 'build complete'
+    })
+    // closePromise flips the session to 'done' on a microtask; the fake clock is never advanced.
+    session.closePromise = Promise.resolve().then(() => {
+      session.status = 'done'
+    })
+
+    setSession(session)
+
+    await expect(manager.waitForCompletionOrYield('conv-1', 'bg_123', 1000)).resolves.toEqual({
+      kind: 'completed',
+      result: {
+        status: 'done',
+        output: 'build complete',
+        exitCode: null,
+        offloaded: true,
+        outputFilePath: '/mock/session/bgexec_bg_123.log',
+        timedOut: false
+      }
+    })
+
+    expect(clearTimeoutSpy).toHaveBeenCalledTimes(1)
+  })
+  // poll() and log() both surface the session's timedOut flag alongside the buffered output.
+  it('exposes timedOut metadata through poll and log', async () => {
+    const session = createSession({
+      status: 'killed',
+      outputBuffer: 'timeout tail',
+      totalOutputLength: 12,
+      timedOut: true,
+      outputFilePath: null
+    })
+    setSession(session)
+
+    const poll = await manager.poll('conv-1', 'bg_123')
+    const log = await manager.log('conv-1', 'bg_123', 0, 20)
+
+    expect(poll.timedOut).toBe(true)
+    expect(log.timedOut).toBe(true)
+    expect(poll.output).toBe('timeout tail')
+    expect(log.output).toBe('timeout tail')
+  })
 })
diff --git a/test/main/presenter/agentPresenter/message/systemEnvPromptBuilder.test.ts b/test/main/presenter/agentPresenter/message/systemEnvPromptBuilder.test.ts
index d0f65d0c0..4fef8fe73 100644
--- a/test/main/presenter/agentPresenter/message/systemEnvPromptBuilder.test.ts
+++ b/test/main/presenter/agentPresenter/message/systemEnvPromptBuilder.test.ts
@@ -125,6 +125,7 @@ describe('systemEnvPromptBuilder', () => {
     })
 
     expect(prompt).toContain('exec(background: true)')
+    expect(prompt).toContain('yield window')
     expect(prompt).not.toContain('YoBrowser')
     expect(prompt).not.toContain('process(list|poll|log|write|kill|remove)')
   })
diff --git a/test/main/presenter/deepchatAgentPresenter/contextBuilder.test.ts b/test/main/presenter/deepchatAgentPresenter/contextBuilder.test.ts
index 46f551b06..3578d593f 100644
--- a/test/main/presenter/deepchatAgentPresenter/contextBuilder.test.ts
+++ b/test/main/presenter/deepchatAgentPresenter/contextBuilder.test.ts
@@ -2,6 +2,7 @@ import { describe, it, expect, vi, beforeEach } from 'vitest'
 import {
   buildContext,
   buildResumeContext,
+  fitMessagesToContextWindow,
   truncateContext
 } from '@/presenter/deepchatAgentPresenter/contextBuilder'
 
@@ -503,3 +504,26 @@ describe('buildResumeContext', () => {
     ])
   })
 })
+// Older history must be dropped before the trailing steer and queued user messages are touched.
+describe('fitMessagesToContextWindow', () => {
+  it('drops older history before protected steer and queued user tail', () => {
+    const result = fitMessagesToContextWindow(
+      [
+        { role: 'system', content: 'Sys' },
+        { role: 'user', content: 'A'.repeat(40) },
+        { role: 'assistant', content: 'B'.repeat(40) },
+        { role: 'user', content: 'Steer instruction' },
+        { role: 'user', content: 'Queued target' }
+      ],
+      14,
+      4,
+      2
+    )
+    // NOTE(review): 14 / 4 / 2 are presumably the token budget, a reserve and the protected tail size — confirm.
+    expect(result).toEqual([
+      { role: 'system', content: 'Sys' },
+      { role: 'user', content: 'Steer instruction' },
+      { role: 'user', content: 'Queued target' }
+    ])
+  })
+})
diff --git a/test/main/presenter/deepchatAgentPresenter/deepchatAgentPresenter.test.ts b/test/main/presenter/deepchatAgentPresenter/deepchatAgentPresenter.test.ts
index ba26d41bd..9fbf6e805 100644
--- a/test/main/presenter/deepchatAgentPresenter/deepchatAgentPresenter.test.ts
+++ b/test/main/presenter/deepchatAgentPresenter/deepchatAgentPresenter.test.ts
@@ -21,7 +21,8 @@ vi.mock('@/events', () => ({
     ACTIVATED: 'session:activated',
     DEACTIVATED: 'session:deactivated',
     STATUS_CHANGED: 'session:status-changed',
-    COMPACTION_UPDATED: 'session:compaction-updated'
+    COMPACTION_UPDATED: 'session:compaction-updated',
+    PENDING_INPUTS_UPDATED: 'session:pending-inputs-updated'
   },
   STREAM_EVENTS: {
     RESPONSE: 'stream:response',
@@ -147,6 +148,17 @@ function createMockSqlitePresenter() {
       listByMessageId: vi.fn().mockReturnValue([]),
       deleteByMessageIds: vi.fn(),
       deleteBySessionId: vi.fn()
+    },
+    deepchatPendingInputsTable: {
+      insert: vi.fn(),
+      get: vi.fn(),
+      listBySession: vi.fn().mockReturnValue([]),
+      listClaimed: vi.fn().mockReturnValue([]),
+      listActiveBySession: vi.fn().mockReturnValue([]),
+      countActiveBySession: vi.fn().mockReturnValue(0),
+      update: vi.fn(),
+      delete: vi.fn(),
+      deleteBySession: vi.fn()
     }
   } as any
 }
@@ -294,6 +306,54 @@ describe('DeepChatAgentPresenter', () => {
       )
       consoleSpy.mockRestore()
     })
+    // On construction, claimed inputs revert to 'pending' — but only for sessions that still exist.
+    it('only recovers claimed pending inputs for sessions that still exist', () => {
+      const consoleSpy = vi.spyOn(console, 'log').mockImplementation(() => {})
+      sqlitePresenter.deepchatPendingInputsTable.listClaimed.mockReturnValue([
+        {
+          id: 'pending-existing',
+          session_id: 's1',
+          mode: 'queue',
+          state: 'claimed',
+          payload_json: '{"text":"hello","files":[]}',
+          queue_order: 1,
+          claimed_at: 123,
+          consumed_at: null,
+          created_at: 1,
+          updated_at: 1
+        },
+        {
+          id: 'pending-missing',
+          session_id: 'missing-session',
+          mode: 'queue',
+          state: 'claimed',
+          payload_json: '{"text":"orphan","files":[]}',
+          queue_order: 2,
+          claimed_at: 456,
+          consumed_at: null,
+          created_at: 2,
+          updated_at: 2
+        }
+      ])
+      sqlitePresenter.deepchatSessionsTable.get.mockImplementation((sessionId: string) =>
+        sessionId === 's1' ? { id: 's1' } : null
+      )
+      // Recovery is triggered by the constructor itself; no further method call is made.
+      new DeepChatAgentPresenter(llmProvider, configPresenter, sqlitePresenter, toolPresenter)
+      // Only the row whose session exists is reset; the orphaned row is left untouched.
+      expect(sqlitePresenter.deepchatPendingInputsTable.update).toHaveBeenCalledTimes(1)
+      expect(sqlitePresenter.deepchatPendingInputsTable.update).toHaveBeenCalledWith(
+        'pending-existing',
+        {
+          state: 'pending',
+          claimed_at: null
+        }
+      )
+      expect(consoleSpy).toHaveBeenCalledWith(
+        'DeepChatAgent: recovered 1 sessions with claimed pending inputs'
+      )
+      consoleSpy.mockRestore()
+    })
   })
 
   describe('initSession', () => {
@@ -1171,7 +1231,7 @@ describe('DeepChatAgentPresenter', () => {
       await expect(agent.getGenerationSettings('unknown')).resolves.toBeNull()
     })
 
-    it('updates generation settings with sanitize and clamp', async () => {
+    it('updates generation settings with minimal validation and keeps invalid fields unchanged', async () => {
       await agent.initSession('s1', { providerId: 'openai', modelId: 'gpt-4' })
 
       const updated = await agent.updateGenerationSettings('s1', {
@@ -1183,40 +1243,54 @@ describe('DeepChatAgentPresenter', () => {
         verbosity: 'invalid' as any
       })
 
-      expect(updated.temperature).toBe(2)
-      expect(updated.contextLength).toBe(2048)
-      expect(updated.maxTokens).toBe(2048)
-      expect(updated.thinkingBudget).toBe(0)
+      expect(updated.temperature).toBe(9)
+      expect(updated.contextLength).toBe(128000)
+      expect(updated.maxTokens).toBe(4096)
+      expect(updated.thinkingBudget).toBe(512)
       expect(updated.reasoningEffort).toBe('minimal')
       expect(updated.verbosity).toBe('medium')
 
       expect(sqlitePresenter.deepchatSessionsTable.updateGenerationSettings).toHaveBeenCalledWith(
         's1',
         expect.objectContaining({
-          temperature: 2,
-          contextLength: 2048,
-          maxTokens: 2048,
-          thinkingBudget: 0,
+          temperature: 9,
+          contextLength: 128000,
+          maxTokens: 4096,
+          thinkingBudget: 512,
           reasoningEffort: 'minimal',
           verbosity: 'medium'
         })
       )
     })
 
-    it('preserves portrait sentinel budgets when updating generation settings', async () => {
-      configPresenter.getThinkingBudgetRange.mockReturnValue({ min: 0, max: 24576, default: -1 })
+    it('treats legacy negative thinking budget rows as disabled and ignores new negative updates', async () => {
+      sqlitePresenter.deepchatSessionsTable.get.mockReturnValue({
+        id: 's2',
+        provider_id: 'gemini',
+        model_id: 'gemini-2.5-pro',
+        permission_mode: 'full_access',
+        system_prompt: 'You are a helpful assistant.',
+        temperature: 0.7,
+        context_length: 128000,
+        max_tokens: 4096,
+        thinking_budget: -1,
+        reasoning_effort: 'medium',
+        verbosity: 'medium'
+      })
 
-      await agent.initSession('s1', { providerId: 'gemini', modelId: 'gemini-2.5-pro' })
+      const persisted = await agent.getGenerationSettings('s2')
+      expect(persisted).not.toHaveProperty('thinkingBudget')
 
+      await agent.initSession('s1', { providerId: 'openai', modelId: 'gpt-4' })
       const updated = await agent.updateGenerationSettings('s1', {
         thinkingBudget: -1
       })
 
-      expect(updated.thinkingBudget).toBe(-1)
+      expect(updated.thinkingBudget).toBe(512)
       expect(sqlitePresenter.deepchatSessionsTable.updateGenerationSettings).toHaveBeenCalledWith(
         's1',
         expect.objectContaining({
-          thinkingBudget: -1
+          thinkingBudget: 512
         })
       )
     })
diff --git a/test/main/presenter/newAgentPresenter/integration.test.ts b/test/main/presenter/newAgentPresenter/integration.test.ts
index 98f9bf935..33a47274b 100644
--- a/test/main/presenter/newAgentPresenter/integration.test.ts
+++ b/test/main/presenter/newAgentPresenter/integration.test.ts
@@ -1,6 +1,7 @@
 import { describe, it, expect, vi, beforeEach } from 'vitest'
 import { NewAgentPresenter } from '@/presenter/newAgentPresenter/index'
 import { DeepChatAgentPresenter } from '@/presenter/deepchatAgentPresenter/index'
+import { estimateMessagesTokens } from '@/presenter/deepchatAgentPresenter/contextBuilder'
 import { NewSessionHooksBridge } from '@/presenter/hooksNotifications/newSessionBridge'
 
 vi.mock('nanoid', () => {
@@ -22,7 +23,8 @@ vi.mock('@/events', async (importOriginal) => {
       ACTIVATED: 'session:activated',
       DEACTIVATED: 'session:deactivated',
       STATUS_CHANGED: 'session:status-changed',
-      COMPACTION_UPDATED: 'session:compaction-updated'
+      COMPACTION_UPDATED: 'session:compaction-updated',
+      PENDING_INPUTS_UPDATED: 'session:pending-inputs-updated'
     },
     STREAM_EVENTS: {
       RESPONSE: 'stream:response',
@@ -54,6 +56,7 @@ function createMockSqlitePresenter() {
   const sessionsStore = new Map<string, any>()
   const deepchatSessionsStore = new Map<string, any>()
   const messagesStore = new Map<string, any>()
+  const pendingInputsStore = new Map<string, any>()
   let messagesList: any[] = []
 
   return {
@@ -86,6 +89,11 @@ function createMockSqlitePresenter() {
       update: vi.fn(),
       delete: vi.fn((id: string) => sessionsStore.delete(id))
     },
+    newEnvironmentsTable: { // Mock table made of bare spies; only listPathsForSession has a canned return value.
+      syncPath: vi.fn(),
+      listPathsForSession: vi.fn().mockReturnValue([]), // always reports no paths
+      syncForSession: vi.fn()
+    },
     deepchatSessionsTable: {
       create: vi.fn(
         (
@@ -338,10 +346,81 @@ function createMockSqlitePresenter() {
       deleteByMessageIds: vi.fn(),
       deleteBySessionId: vi.fn()
     },
+    deepchatPendingInputsTable: { // In-memory mock backed by pendingInputsStore; rows are kept with snake_case keys.
+      insert: vi.fn((row: any) => { // Copies the camelCase input into a stored row keyed by row.id.
+        const now = row.createdAt ?? Date.now() // created_at defaults to the current time
+        pendingInputsStore.set(row.id, {
+          id: row.id,
+          session_id: row.sessionId,
+          mode: row.mode,
+          state: row.state ?? 'pending',
+          payload_json: row.payloadJson,
+          queue_order: row.queueOrder ?? null,
+          claimed_at: row.claimedAt ?? null,
+          consumed_at: row.consumedAt ?? null,
+          created_at: now,
+          updated_at: row.updatedAt ?? now // falls back to the creation timestamp
+        })
+      }),
+      get: vi.fn((id: string) => pendingInputsStore.get(id)), // undefined when the id is unknown
+      listBySession: vi.fn((sessionId: string) => // Every row of the session, oldest created_at first.
+        Array.from(pendingInputsStore.values())
+          .filter((row) => row.session_id === sessionId)
+          .sort((left, right) => left.created_at - right.created_at)
+      ),
+      listClaimed: vi.fn(() => // Rows in state 'claimed' across all sessions, oldest created_at first.
+        Array.from(pendingInputsStore.values())
+          .filter((row) => row.state === 'claimed')
+          .sort((left, right) => left.created_at - right.created_at)
+      ),
+      listActiveBySession: vi.fn((sessionId: string) => // Non-consumed rows of the session in processing order.
+        Array.from(pendingInputsStore.values())
+          .filter((row) => row.session_id === sessionId && row.state !== 'consumed')
+          .sort((left, right) => {
+            const modeDiff = left.mode === right.mode ? 0 : left.mode === 'steer' ? -1 : 1 // a 'steer' row sorts ahead of a row with a different mode
+            if (modeDiff !== 0) return modeDiff
+            const leftOrder = // 'queue' rows rank by queue_order (missing order sorts last); other modes rank by created_at
+              left.mode === 'queue' ? (left.queue_order ?? 2147483647) : left.created_at
+            const rightOrder =
+              right.mode === 'queue' ? (right.queue_order ?? 2147483647) : right.created_at
+            if (leftOrder !== rightOrder) return leftOrder - rightOrder
+            return left.created_at - right.created_at // tie-break on creation time
+          })
+      ),
+      countActiveBySession: vi.fn( // Counts non-consumed rows, leaving out 'queue' rows that are already claimed.
+        (sessionId: string) =>
+          Array.from(pendingInputsStore.values()).filter(
+            (row) =>
+              row.session_id === sessionId &&
+              row.state !== 'consumed' &&
+              !(row.mode === 'queue' && row.state === 'claimed')
+          ).length
+      ),
+      update: vi.fn((id: string, fields: any) => { // Shallow-merges fields as given (keys are not renamed) and bumps updated_at.
+        const row = pendingInputsStore.get(id)
+        if (!row) return // unknown id: nothing to update
+        pendingInputsStore.set(id, {
+          ...row,
+          ...fields,
+          updated_at: Date.now()
+        })
+      }),
+      delete: vi.fn((id: string) => {
+        pendingInputsStore.delete(id)
+      }),
+      deleteBySession: vi.fn((sessionId: string) => { // Removes every stored row that belongs to the session.
+        for (const [id, row] of pendingInputsStore.entries()) {
+          if (row.session_id === sessionId) {
+            pendingInputsStore.delete(id)
+          }
+        }
+      })
+    },
     // Expose internal stores for assertion
     _sessionsStore: sessionsStore,
     _deepchatSessionsStore: deepchatSessionsStore,
     _messagesStore: messagesStore,
+    _pendingInputsStore: pendingInputsStore,
     _getMessagesList: () => messagesList
   } as any
 }
@@ -633,6 +712,7 @@ describe('Integration: multi-turn context', () => {
   let sqlitePresenter: ReturnType<typeof createMockSqlitePresenter>
   let llmProvider: ReturnType<typeof createMockLlmProviderPresenter>
   let configPresenter: ReturnType<typeof createMockConfigPresenter>
+  let deepchatAgent: DeepChatAgentPresenter
   let agentPresenter: NewAgentPresenter
 
   beforeEach(() => {
@@ -641,7 +721,7 @@ describe('Integration: multi-turn context', () => {
     llmProvider = createMockLlmProviderPresenter()
     configPresenter = createMockConfigPresenter()
 
-    const deepchatAgent = new DeepChatAgentPresenter(
+    deepchatAgent = new DeepChatAgentPresenter(
       llmProvider,
       configPresenter,
       sqlitePresenter,
@@ -679,7 +759,6 @@ describe('Integration: multi-turn context', () => {
     const secondCallMessages = providerInstance.coreStream.mock.calls[1][0]
     expect(secondCallMessages[0].role).toBe('system')
     expect(secondCallMessages[0].content).toContain('You are a helpful assistant.')
-    expect(secondCallMessages[0].content).toContain('## Runtime Capabilities')
     // Should contain prior user and assistant messages before the new user message
     expect(secondCallMessages.length).toBeGreaterThanOrEqual(3) // system + at least history + new user
     expect(secondCallMessages[secondCallMessages.length - 1]).toEqual({
@@ -712,6 +791,355 @@ describe('Integration: multi-turn context', () => {
     expect(lastUserContent.text).toBe('Follow up (object)')
     expect(lastUserContent.files).toHaveLength(1)
   })
+
+  it('keeps queued messages out of formal history until the current turn completes', async () => {
+    let releaseFirstTurn: (() => void) | null = null // assigned inside the first mocked stream; calling it unblocks that stream
+    const providerInstance = {
+      coreStream: vi
+        .fn()
+        .mockImplementationOnce(async function* () { // first call: holds the turn open until released
+          await new Promise<void>((resolve) => {
+            releaseFirstTurn = resolve
+          })
+          yield { type: 'text', content: 'First response' }
+          yield { type: 'stop', stop_reason: 'end_turn' }
+        })
+        .mockImplementation(async function* () { // every later call: answers immediately
+          yield { type: 'text', content: 'Queued response' }
+          yield { type: 'stop', stop_reason: 'end_turn' }
+        })
+    }
+    llmProvider.getProviderInstance.mockReturnValue(providerInstance)
+
+    const session = await agentPresenter.createSession(
+      { agentId: 'deepchat', message: 'First turn', projectDir: null },
+      1
+    )
+    await new Promise((r) => setTimeout(r, 20)) // NOTE(review): presumably long enough for the first turn to reach coreStream - confirm
+
+    await agentPresenter.queuePendingInput(session.id, 'Queued follow up')
+
+    const pendingBeforeRelease = await agentPresenter.listPendingInputs(session.id)
+    expect(pendingBeforeRelease).toHaveLength(1)
+    expect(pendingBeforeRelease[0].mode).toBe('queue')
+
+    const beforeMessages = sqlitePresenter.deepchatMessagesTable.getBySession(session.id) // while the first turn is blocked, only its user message may be persisted
+    const beforeUserMessages = beforeMessages.filter((message: any) => message.role === 'user')
+    expect(beforeUserMessages).toHaveLength(1)
+    expect(JSON.parse(beforeUserMessages[0].content).text).toBe('First turn')
+
+    releaseFirstTurn?.() // no-op if the first stream never started; the assertions below would then fail
+    await new Promise((r) => setTimeout(r, 80)) // wait for the first turn to finish and the queued turn to run
+
+    const afterMessages = sqlitePresenter.deepchatMessagesTable.getBySession(session.id)
+    const afterUserMessages = afterMessages.filter((message: any) => message.role === 'user')
+    expect(afterUserMessages).toHaveLength(2) // the queued input is now a persisted user message
+    expect(JSON.parse(afterUserMessages[1].content).text).toBe('Queued follow up')
+    await expect(agentPresenter.listPendingInputs(session.id)).resolves.toEqual([]) // and it no longer shows up as pending
+  })
+
+  it('injects steer inputs before the next queued user message', async () => {
+    let releaseFirstTurn: (() => void) | null = null // assigned inside the first mocked stream; calling it unblocks that stream
+    const providerInstance = {
+      coreStream: vi
+        .fn()
+        .mockImplementationOnce(async function* () { // first call: holds the turn open until released
+          await new Promise<void>((resolve) => {
+            releaseFirstTurn = resolve
+          })
+          yield { type: 'text', content: 'First response' }
+          yield { type: 'stop', stop_reason: 'end_turn' }
+        })
+        .mockImplementation(async function* () { // every later call: answers immediately
+          yield { type: 'text', content: 'Second response' }
+          yield { type: 'stop', stop_reason: 'end_turn' }
+        })
+    }
+    llmProvider.getProviderInstance.mockReturnValue(providerInstance)
+
+    const session = await agentPresenter.createSession(
+      { agentId: 'deepchat', message: 'Turn one', projectDir: null },
+      1
+    )
+    await new Promise((r) => setTimeout(r, 20)) // NOTE(review): presumably long enough for the first turn to reach coreStream - confirm
+
+    await agentPresenter.queuePendingInput(session.id, 'Steer instruction') // both inputs start out as ordinary queued items
+    await agentPresenter.queuePendingInput(session.id, 'Queued target')
+
+    const pendingInputs = await agentPresenter.listPendingInputs(session.id)
+    expect(pendingInputs).toHaveLength(2)
+    await agentPresenter.convertPendingInputToSteer(session.id, pendingInputs[0].id) // promote the first listed input to steer mode
+
+    releaseFirstTurn?.()
+    await new Promise((r) => setTimeout(r, 80)) // wait for the first turn to finish and the next turn to run
+
+    expect(providerInstance.coreStream).toHaveBeenCalledTimes(2) // steer + queued input are expected to share one provider call
+    const secondCallMessages = providerInstance.coreStream.mock.calls[1][0]
+    const trailingUserMessages = secondCallMessages.filter( // all user-role messages of the second call; only the last two are inspected
+      (message: any) => message.role === 'user'
+    )
+
+    expect(trailingUserMessages[trailingUserMessages.length - 2]).toEqual({
+      role: 'user',
+      content: 'Steer instruction'
+    })
+    expect(trailingUserMessages[trailingUserMessages.length - 1]).toEqual({
+      role: 'user',
+      content: 'Queued target'
+    })
+    await expect(agentPresenter.listPendingInputs(session.id)).resolves.toEqual([])
+  })
+
+  it('rebudgets long steer inputs before streaming the next queued turn', async () => {
+    let releaseFirstTurn: (() => void) | null = null // assigned inside the first mocked stream; calling it unblocks that stream
+    const firstPrompt = 'P'.repeat(2000) // large first-turn texts that the test later expects to be absent from the second call
+    const firstResponse = 'R'.repeat(2000)
+    const steerFileContent = 'S'.repeat(8000) // attachment body for the steer input
+    const providerInstance = {
+      coreStream: vi
+        .fn()
+        .mockImplementationOnce(async function* () { // first call: holds the turn open until released
+          await new Promise<void>((resolve) => {
+            releaseFirstTurn = resolve
+          })
+          yield { type: 'text', content: firstResponse }
+          yield { type: 'stop', stop_reason: 'end_turn' }
+        })
+        .mockImplementation(async function* () { // every later call: answers immediately
+          yield { type: 'text', content: 'Second response' }
+          yield { type: 'stop', stop_reason: 'end_turn' }
+        })
+    }
+    llmProvider.getProviderInstance.mockReturnValue(providerInstance)
+
+    const session = await agentPresenter.createSession(
+      { agentId: 'deepchat', message: firstPrompt, projectDir: null },
+      1
+    )
+    await new Promise((r) => setTimeout(r, 20)) // NOTE(review): presumably long enough for the first turn to reach coreStream - confirm
+
+    await agentPresenter.updateSessionGenerationSettings(session.id, { // shrink the budget while the first turn is still blocked
+      contextLength: 2048,
+      maxTokens: 128
+    })
+
+    await agentPresenter.queuePendingInput(session.id, {
+      text: 'Steer with attachment',
+      files: [
+        {
+          name: 'steer.txt',
+          path: '/tmp/steer.txt',
+          mimeType: 'text/plain',
+          content: steerFileContent
+        } as any
+      ]
+    })
+    await agentPresenter.queuePendingInput(session.id, 'Queued target')
+
+    const pendingInputs = await agentPresenter.listPendingInputs(session.id)
+    expect(pendingInputs).toHaveLength(2)
+    await agentPresenter.convertPendingInputToSteer(session.id, pendingInputs[0].id) // promote the first listed input to steer mode
+
+    releaseFirstTurn?.()
+    await new Promise((r) => setTimeout(r, 80)) // wait for the first turn to finish and the next turn to run
+
+    expect(providerInstance.coreStream).toHaveBeenCalledTimes(2)
+    const secondCallMessages = providerInstance.coreStream.mock.calls[1][0]
+    const secondCallContents = secondCallMessages.map((message: any) => // one string per message so toContain can do exact-element checks
+      typeof message.content === 'string' ? message.content : JSON.stringify(message.content)
+    )
+    const trailingUserMessages = secondCallMessages.filter( // all user-role messages of the second call; only the last two are inspected
+      (message: any) => message.role === 'user'
+    )
+
+    expect(secondCallContents).not.toContain(firstPrompt) // array toContain: no message content equals the full first prompt
+    expect(secondCallContents).not.toContain(firstResponse)
+    expect(estimateMessagesTokens(secondCallMessages) + 128).toBeLessThanOrEqual(2048) // estimated prompt tokens + maxTokens fit in contextLength
+    expect(trailingUserMessages[trailingUserMessages.length - 2].content).toEqual(
+      expect.stringContaining('[Attached File 1]')
+    )
+    expect(trailingUserMessages[trailingUserMessages.length - 2].content).toEqual(
+      expect.stringContaining('steer.txt')
+    )
+    expect(trailingUserMessages[trailingUserMessages.length - 1]).toEqual({
+      role: 'user',
+      content: 'Queued target'
+    })
+  })
+
+  it('pauses queued prompts until a tool follow-up answer is actually sent', async () => {
+    const providerInstance = {
+      coreStream: vi.fn(async function* (messages: any[]) { // replies with the text of the last user message it was given
+        const lastUserMessage = messages.filter((message) => message.role === 'user').at(-1)
+        yield {
+          type: 'text',
+          content: `Handled: ${
+            typeof lastUserMessage?.content === 'string' ? lastUserMessage.content : 'unknown'
+          }`
+        }
+        yield { type: 'stop', stop_reason: 'end_turn' }
+      })
+    }
+    llmProvider.getProviderInstance.mockReturnValue(providerInstance)
+
+    await deepchatAgent.initSession('s-follow-up', { providerId: 'openai', modelId: 'gpt-4' })
+    ;(deepchatAgent as any).runtimeState.get('s-follow-up').status = 'generating' // pokes private state; NOTE(review): presumably so the next input stays queued - confirm
+
+    await deepchatAgent.queuePendingInput('s-follow-up', 'Older queued prompt')
+    expect(await deepchatAgent.listPendingInputs('s-follow-up')).toHaveLength(1)
+
+    sqlitePresenter.deepchatMessagesTable.insert({ // seed an assistant message holding a pending ask_question tool call and its question_request action
+      id: 'm-follow-up',
+      sessionId: 's-follow-up',
+      orderSeq: 1,
+      role: 'assistant',
+      content: JSON.stringify([
+        {
+          type: 'tool_call',
+          status: 'pending',
+          timestamp: 1,
+          tool_call: { id: 'tc-follow-up', name: 'ask_question', params: '{}', response: '' }
+        },
+        {
+          type: 'action',
+          action_type: 'question_request',
+          status: 'pending',
+          timestamp: 2,
+          content: 'Need more detail',
+          tool_call: { id: 'tc-follow-up', name: 'ask_question', params: '{}' },
+          extra: {
+            needsUserAction: true,
+            questionText: 'Need more detail'
+          }
+        }
+      ]),
+      status: 'pending'
+    })
+
+    await expect(
+      deepchatAgent.respondToolInteraction('s-follow-up', 'm-follow-up', 'tc-follow-up', {
+        kind: 'question_other'
+      })
+    ).resolves.toEqual({ resumed: false, waitingForUserMessage: true }) // the agent reports it is waiting for a user message
+
+    await new Promise((r) => setTimeout(r, 20))
+    expect(providerInstance.coreStream).not.toHaveBeenCalled() // the older queued prompt must not have started
+    await expect(deepchatAgent.listPendingInputs('s-follow-up')).resolves.toHaveLength(1)
+
+    await deepchatAgent.resumePendingQueue('s-follow-up') // an explicit resume is expected to be ignored as well
+    await new Promise((r) => setTimeout(r, 20))
+    expect(providerInstance.coreStream).not.toHaveBeenCalled()
+    await expect(deepchatAgent.listPendingInputs('s-follow-up')).resolves.toHaveLength(1)
+
+    await deepchatAgent.queuePendingInput('s-follow-up', 'Actual follow-up answer') // the follow-up answer arrives through the same queue API
+    await new Promise((r) => setTimeout(r, 80))
+
+    expect(providerInstance.coreStream).toHaveBeenCalledTimes(2) // one call for the answer, one for the older prompt
+    const firstFollowUpCall = providerInstance.coreStream.mock.calls[0][0]
+    const secondQueuedCall = providerInstance.coreStream.mock.calls[1][0]
+    expect(firstFollowUpCall.filter((message: any) => message.role === 'user').at(-1)).toEqual({ // the answer is handled first even though it was queued later
+      role: 'user',
+      content: 'Actual follow-up answer'
+    })
+    expect(secondQueuedCall.filter((message: any) => message.role === 'user').at(-1)).toEqual({
+      role: 'user',
+      content: 'Older queued prompt'
+    })
+
+    const userMessagesAfterFollowUp = sqlitePresenter.deepchatMessagesTable
+      .getBySession('s-follow-up')
+      .filter((message: any) => message.role === 'user')
+    expect(userMessagesAfterFollowUp).toHaveLength(2) // persisted order mirrors the processing order
+    expect(JSON.parse(userMessagesAfterFollowUp[0].content).text).toBe('Actual follow-up answer')
+    expect(JSON.parse(userMessagesAfterFollowUp[1].content).text).toBe('Older queued prompt')
+    await expect(deepchatAgent.listPendingInputs('s-follow-up')).resolves.toEqual([])
+  })
+
+  it('sendMessage starts a fresh turn from an errored session', async () => {
+    const providerInstance = {
+      coreStream: vi
+        .fn()
+        .mockImplementationOnce(async function* () { // first call: fails before yielding anything
+          throw new Error('provider offline')
+        })
+        .mockImplementation(async function* () { // every later call: succeeds
+          yield { type: 'text', content: 'Recovered response' }
+          yield { type: 'stop', stop_reason: 'end_turn' }
+        })
+    }
+    llmProvider.getProviderInstance.mockReturnValue(providerInstance)
+
+    const session = await agentPresenter.createSession(
+      { agentId: 'deepchat', message: 'Fail first', projectDir: null },
+      1
+    )
+    await new Promise((r) => setTimeout(r, 50)) // let the failing first turn settle
+
+    const failedSession = await agentPresenter.getSession(session.id)
+    expect(failedSession?.status).toBe('error')
+
+    await agentPresenter.sendMessage(session.id, 'Recover after error')
+    await new Promise((r) => setTimeout(r, 80)) // let the recovery turn complete
+
+    const recoveredSession = await agentPresenter.getSession(session.id)
+    expect(recoveredSession?.status).toBe('idle')
+    expect(providerInstance.coreStream).toHaveBeenCalledTimes(2) // the failed call plus the recovery call
+
+    const messages = sqlitePresenter.deepchatMessagesTable.getBySession(session.id)
+    const userMessages = messages.filter((message: any) => message.role === 'user')
+    expect(userMessages).toHaveLength(2)
+    expect(JSON.parse(userMessages[1].content).text).toBe('Recover after error')
+    await expect(agentPresenter.listPendingInputs(session.id)).resolves.toEqual([]) // nothing may be left behind in the pending list
+  })
+
+  it('resumePendingQueue drains queued turns after a session error', async () => {
+    let releaseFirstTurn: (() => void) | null = null // assigned inside the first mocked stream; calling it lets that stream throw
+    const providerInstance = {
+      coreStream: vi
+        .fn()
+        .mockImplementationOnce(async function* () { // first call: blocks, then fails once released
+          await new Promise<void>((resolve) => {
+            releaseFirstTurn = resolve
+          })
+          throw new Error('network down')
+        })
+        .mockImplementation(async function* () { // every later call: succeeds
+          yield { type: 'text', content: 'Recovered queued response' }
+          yield { type: 'stop', stop_reason: 'end_turn' }
+        })
+    }
+    llmProvider.getProviderInstance.mockReturnValue(providerInstance)
+
+    const session = await agentPresenter.createSession(
+      { agentId: 'deepchat', message: 'Turn that errors', projectDir: null },
+      1
+    )
+    await new Promise((r) => setTimeout(r, 20)) // NOTE(review): presumably long enough for the first turn to reach coreStream - confirm
+
+    await agentPresenter.queuePendingInput(session.id, 'Queued while failing')
+    releaseFirstTurn?.()
+    await new Promise((r) => setTimeout(r, 80)) // let the failure propagate
+
+    const failedSession = await agentPresenter.getSession(session.id)
+    expect(failedSession?.status).toBe('error')
+
+    const pendingAfterError = await agentPresenter.listPendingInputs(session.id) // the queued input must survive the error untouched
+    expect(pendingAfterError).toHaveLength(1)
+    expect(pendingAfterError[0].mode).toBe('queue')
+
+    await agentPresenter.resumePendingQueue(session.id)
+    await new Promise((r) => setTimeout(r, 80)) // let the resumed turn complete
+
+    const recoveredSession = await agentPresenter.getSession(session.id)
+    expect(recoveredSession?.status).toBe('idle')
+    expect(providerInstance.coreStream).toHaveBeenCalledTimes(2) // the failed call plus the resumed queued turn
+
+    const messages = sqlitePresenter.deepchatMessagesTable.getBySession(session.id)
+    const userMessages = messages.filter((message: any) => message.role === 'user')
+    expect(userMessages).toHaveLength(2)
+    expect(JSON.parse(userMessages[1].content).text).toBe('Queued while failing')
+    await expect(agentPresenter.listPendingInputs(session.id)).resolves.toEqual([])
+  })
 })
 
 describe('Integration: crash recovery', () => {
diff --git a/test/renderer/components/ChatPage.test.ts b/test/renderer/components/ChatPage.test.ts
index d5048210e..abf794b3c 100644
--- a/test/renderer/components/ChatPage.test.ts
+++ b/test/renderer/components/ChatPage.test.ts
@@ -8,7 +8,31 @@ const passthrough = (name: string) =>
     template: '<div><slot /></div>'
   })
 
-const setup = async () => {
+const buildAssistantMessage = (content: unknown) => ({ // Fixture: assistant message 'm1' of session 's1' with the given content serialized to JSON.
+  id: 'm1',
+  sessionId: 's1',
+  orderSeq: 1,
+  role: 'assistant' as const,
+  content: JSON.stringify(content),
+  status: 'sent' as const,
+  isContextEdge: 0,
+  metadata: JSON.stringify({ // metadata is stored as a JSON string as well
+    model: 'dimcode-acp',
+    provider: 'acp',
+    reasoningStartTime: 1_200,
+    reasoningEndTime: 4_500
+  }),
+  traceCount: 0,
+  createdAt: 1,
+  updatedAt: 1
+})
+
+type SetupOptions = { // Optional overrides accepted by setup().
+  messages?: Array<Record<string, unknown>> // replaces the default message list of the mocked message store
+  pendingInputStorePatch?: Record<string, unknown> // spread last into the mocked pending-input store
+}
+
+const setup = async (options: SetupOptions = {}) => {
   vi.resetModules()
 
   const sessionStore = reactive({
@@ -26,32 +50,15 @@ const setup = async () => {
   })
 
   const messageStore = reactive({
-    messages: [
-      {
-        id: 'm1',
-        sessionId: 's1',
-        orderSeq: 1,
-        role: 'assistant' as const,
-        content: JSON.stringify([
-          {
-            type: 'reasoning_content',
-            content: 'thinking',
-            status: 'success',
-            timestamp: 1
-          }
-        ]),
-        status: 'sent' as const,
-        isContextEdge: 0,
-        metadata: JSON.stringify({
-          model: 'dimcode-acp',
-          provider: 'acp',
-          reasoningStartTime: 1_200,
-          reasoningEndTime: 4_500
-        }),
-        traceCount: 0,
-        createdAt: 1,
-        updatedAt: 1
-      }
+    messages: options.messages ?? [
+      buildAssistantMessage([
+        {
+          type: 'reasoning_content',
+          content: 'thinking',
+          status: 'success',
+          timestamp: 1
+        }
+      ])
     ],
     isStreaming: false,
     streamingBlocks: [],
@@ -61,6 +68,22 @@ const setup = async () => {
     addOptimisticUserMessage: vi.fn()
   })
 
+  const pendingInputStore = reactive({ // Mock pending-input store: empty lists plus spy actions.
+    items: [],
+    steerItems: [],
+    queueItems: [],
+    isAtCapacity: false,
+    loadPendingInputs: vi.fn().mockResolvedValue(undefined),
+    queueInput: vi.fn().mockResolvedValue(undefined),
+    updateQueueInput: vi.fn().mockResolvedValue(undefined),
+    moveQueueInput: vi.fn().mockResolvedValue(undefined),
+    convertToSteer: vi.fn().mockResolvedValue(undefined),
+    deleteInput: vi.fn().mockResolvedValue(undefined),
+    resumeQueue: vi.fn().mockResolvedValue(undefined),
+    clear: vi.fn(),
+    ...options.pendingInputStorePatch // spread last so a test can override any default above
+  })
+
   const modelStore = reactive({
     findModelByIdOrName: vi.fn((id: string) => ({
       model: {
@@ -85,6 +108,9 @@ const setup = async () => {
   vi.doMock('@/stores/ui/message', () => ({
     useMessageStore: () => messageStore
   }))
+  vi.doMock('@/stores/ui/pendingInput', () => ({
+    usePendingInputStore: () => pendingInputStore
+  }))
   vi.doMock('@/stores/modelStore', () => ({
     useModelStore: () => modelStore
   }))
@@ -124,16 +150,61 @@ const setup = async () => {
     })
   }))
   vi.doMock('@/components/chat/ChatInputBox.vue', () => ({
-    default: passthrough('ChatInputBox')
+    default: defineComponent({
+      name: 'ChatInputBox',
+      props: {
+        files: {
+          type: Array,
+          default: () => []
+        },
+        submitDisabled: {
+          type: Boolean,
+          default: false
+        }
+      },
+      template: '<div class="chat-input-box-stub"><slot name="toolbar" /></div>'
+    })
   }))
   vi.doMock('@/components/chat/ChatInputToolbar.vue', () => ({
-    default: passthrough('ChatInputToolbar')
+    default: defineComponent({
+      name: 'ChatInputToolbar',
+      props: {
+        isGenerating: {
+          type: Boolean,
+          default: false
+        },
+        hasInput: {
+          type: Boolean,
+          default: false
+        },
+        sendDisabled: {
+          type: Boolean,
+          default: false
+        }
+      },
+      template: '<div class="chat-input-toolbar-stub" />'
+    })
+  }))
+  vi.doMock('@/components/chat/PendingInputLane.vue', () => ({
+    default: defineComponent({
+      name: 'PendingInputLane',
+      props: {
+        showResumeQueue: {
+          type: Boolean,
+          default: false
+        }
+      },
+      template: '<div class="pending-input-lane-stub" />'
+    })
   }))
   vi.doMock('@/components/chat/ChatStatusBar.vue', () => ({
     default: passthrough('ChatStatusBar')
   }))
   vi.doMock('@/components/chat/ChatToolInteractionOverlay.vue', () => ({
-    default: passthrough('ChatToolInteractionOverlay')
+    default: defineComponent({
+      name: 'ChatToolInteractionOverlay',
+      template: '<div class="chat-tool-interaction-overlay-stub" />'
+    })
   }))
   vi.doMock('@/components/trace/TraceDialog.vue', () => ({
     default: passthrough('TraceDialog')
@@ -150,7 +221,8 @@ const setup = async () => {
 
   return {
     wrapper,
-    messageStore
+    messageStore,
+    pendingInputStore
   }
 }
 
@@ -169,4 +241,139 @@ describe('ChatPage', () => {
     expect(messages[0].usage.reasoning_start_time).toBe(1_200)
     expect(messages[0].usage.reasoning_end_time).toBe(4_500)
   })
+
+  it('keeps pending lane visible below the tool interaction overlay', async () => {
+    const { wrapper } = await setup({
+      messages: [
+        buildAssistantMessage([ // a question_request action that is still pending
+          {
+            type: 'action',
+            action_type: 'question_request',
+            status: 'pending',
+            tool_call: {
+              id: 'tool-1',
+              name: 'question',
+              params: '{}'
+            }
+          }
+        ])
+      ],
+      pendingInputStorePatch: { // one queued input, present in both items and queueItems
+        items: [
+          {
+            id: 'p1',
+            mode: 'queue',
+            payload: { text: 'queued', files: [] }
+          }
+        ],
+        queueItems: [
+          {
+            id: 'p1',
+            mode: 'queue',
+            payload: { text: 'queued', files: [] }
+          }
+        ]
+      }
+    })
+
+    const html = wrapper.html()
+    expect(wrapper.find('.chat-tool-interaction-overlay-stub').exists()).toBe(true)
+    expect(wrapper.find('.pending-input-lane-stub').exists()).toBe(true)
+    expect(wrapper.find('.chat-input-box-stub').exists()).toBe(false) // the input box is expected to be absent here
+    expect(html.indexOf('chat-tool-interaction-overlay-stub')).toBeLessThan( // markup order: overlay first, lane after it
+      html.indexOf('pending-input-lane-stub')
+    )
+  })
+
+  it('renders pending lane above the input box when no tool interaction is active', async () => {
+    const { wrapper } = await setup({ // default messages from setup(); only the pending-input store is patched
+      pendingInputStorePatch: { // one queued input, present in both items and queueItems
+        items: [
+          {
+            id: 'p1',
+            mode: 'queue',
+            payload: { text: 'queued', files: [] }
+          }
+        ],
+        queueItems: [
+          {
+            id: 'p1',
+            mode: 'queue',
+            payload: { text: 'queued', files: [] }
+          }
+        ]
+      }
+    })
+
+    const html = wrapper.html()
+    expect(wrapper.find('.pending-input-lane-stub').exists()).toBe(true)
+    expect(wrapper.find('.chat-input-box-stub').exists()).toBe(true)
+    expect(wrapper.findComponent({ name: 'PendingInputLane' }).props('showResumeQueue')).toBe(true)
+    expect(html.indexOf('pending-input-lane-stub')).toBeLessThan( // markup order: lane first, input box after it
+      html.indexOf('chat-input-box-stub')
+    )
+  })
+
+  it('hides resume queue while waiting for a tool follow-up answer', async () => {
+    const { wrapper } = await setup({
+      messages: [
+        buildAssistantMessage([ // a question_request that already succeeded and was resolved as 'replied'
+          {
+            type: 'action',
+            action_type: 'question_request',
+            status: 'success',
+            tool_call: {
+              id: 'tool-1',
+              name: 'question',
+              params: '{}'
+            },
+            extra: {
+              needsUserAction: false,
+              questionResolution: 'replied'
+            }
+          }
+        ])
+      ],
+      pendingInputStorePatch: { // one queued input, present in both items and queueItems
+        items: [
+          {
+            id: 'p1',
+            mode: 'queue',
+            payload: { text: 'queued', files: [] }
+          }
+        ],
+        queueItems: [
+          {
+            id: 'p1',
+            mode: 'queue',
+            payload: { text: 'queued', files: [] }
+          }
+        ]
+      }
+    })
+
+    expect(wrapper.findComponent({ name: 'PendingInputLane' }).props('showResumeQueue')).toBe(false) // same queue as the previous test, but the resume control must be off
+  })
+
+  it('allows queueing attachment-only drafts', async () => {
+    const { wrapper, pendingInputStore } = await setup()
+    const file = { name: 'a.txt', path: '/tmp/a.txt', mimeType: 'text/plain' }
+
+    const inputBox = wrapper.findComponent({ name: 'ChatInputBox' })
+    inputBox.vm.$emit('update:files', [file]) // attach a file through the stub without entering any text
+    await flushPromises()
+
+    const toolbar = wrapper.findComponent({ name: 'ChatInputToolbar' })
+    expect(toolbar.props('hasInput')).toBe(true) // a lone attachment must count as input
+    expect(toolbar.props('sendDisabled')).toBe(false)
+    expect(inputBox.props('submitDisabled')).toBe(false)
+
+    inputBox.vm.$emit('submit')
+    await flushPromises()
+
+    expect(pendingInputStore.queueInput).toHaveBeenCalledWith('s1', { // the submit is expected to reach the store with empty text plus the file
+      text: '',
+      files: [file]
+    })
+  })
 })
diff --git a/test/renderer/components/ChatStatusBar.test.ts b/test/renderer/components/ChatStatusBar.test.ts
index 0a4d47800..cfaebc9db 100644
--- a/test/renderer/components/ChatStatusBar.test.ts
+++ b/test/renderer/components/ChatStatusBar.test.ts
@@ -11,9 +11,9 @@ type TestGenerationSettings = {
   temperature: number
   contextLength: number
   maxTokens: number
-  thinkingBudget: number
-  reasoningEffort: ReasoningEffort
-  verbosity: 'low' | 'medium' | 'high'
+  thinkingBudget?: number
+  reasoningEffort?: ReasoningEffort
+  verbosity?: 'low' | 'medium' | 'high'
 }
 
 type ExtraModelGroup = {
@@ -34,7 +34,8 @@ type SetupOptions = {
   preferredModel?: { providerId: string; modelId: string } | null
   extraModelGroups?: ExtraModelGroup[]
   reasoningEffortDefault?: ReasoningEffort
-  sessionSettings?: Partial<TestGenerationSettings>
+  sessionSettings?: Partial<TestGenerationSettings> | null
+  draftGenerationSettings?: Partial<TestGenerationSettings>
   reasoningPortrait?: ReasoningPortrait | null
   projectPath?: string | null
   acpDraftSessionId?: string | null
@@ -68,22 +69,14 @@ const ButtonStub = defineComponent({
     '<button v-bind="$attrs" :disabled="disabled" @click="$emit(\'click\', $event)"><slot /></button>'
 })
 
-const SliderStub = defineComponent({
-  name: 'Slider',
-  props: {
-    modelValue: { type: Array, default: () => [] }
-  },
-  emits: ['update:modelValue'],
-  template: '<div class="slider-stub" />'
-})
-
 const InputStub = defineComponent({
   name: 'Input',
   props: {
-    modelValue: { type: String, default: '' }
+    modelValue: { type: [String, Number], default: '' }
   },
   emits: ['update:modelValue'],
-  template: '<input class="input-stub" />'
+  template:
+    '<input class="input-stub" v-bind="$attrs" :value="modelValue ?? \'\'" @input="$emit(\'update:modelValue\', $event.target.value)" />'
 })
 
 const SelectStub = defineComponent({
@@ -103,7 +96,7 @@ const SwitchStub = defineComponent({
   },
   emits: ['update:modelValue'],
   template:
-    '<button class="switch-stub" :data-model-value="String(modelValue)" :disabled="disabled" @click="$emit(\'update:modelValue\', !modelValue)" />'
+    '<button class="switch-stub" v-bind="$attrs" :data-model-value="String(modelValue)" :disabled="disabled" @click="$emit(\'update:modelValue\', !modelValue)" />'
 })
 
 const createAcpConfigState = (
@@ -189,7 +182,7 @@ const setup = async (options: SetupOptions = {}) => {
     ({
       supported: true,
       defaultEnabled: true,
-      mode: 'effort',
+      mode: 'mixed',
       budget: { min: 0, max: 8192, default: 512 },
       ...(options.supportsEffort === false
         ? {}
@@ -295,9 +288,19 @@ const setup = async (options: SetupOptions = {}) => {
     thinkingBudget: undefined as number | undefined,
     reasoningEffort: undefined as 'minimal' | 'low' | 'medium' | 'high' | undefined,
     verbosity: undefined as 'low' | 'medium' | 'high' | undefined,
+    ...options.draftGenerationSettings,
     updateGenerationSettings: vi.fn((patch: Record<string, unknown>) =>
       Object.assign(draftStore, patch)
-    )
+    ),
+    resetGenerationSettings: vi.fn(() => {
+      draftStore.systemPrompt = undefined
+      draftStore.temperature = undefined
+      draftStore.contextLength = undefined
+      draftStore.maxTokens = undefined
+      draftStore.thinkingBudget = undefined
+      draftStore.reasoningEffort = undefined
+      draftStore.verbosity = undefined
+    })
   })
 
   const projectStore = reactive({
@@ -355,10 +358,13 @@ const setup = async (options: SetupOptions = {}) => {
     ...options.sessionSettings
   }
 
+  const sessionSettingsResult =
+    options.sessionSettings === null ? null : ({ ...baseSessionSettings } as TestGenerationSettings)
+
   const newAgentPresenter = {
     getPermissionMode: vi.fn().mockResolvedValue('full_access'),
     setPermissionMode: vi.fn().mockResolvedValue(undefined),
-    getSessionGenerationSettings: vi.fn().mockResolvedValue(baseSessionSettings),
+    getSessionGenerationSettings: vi.fn().mockResolvedValue(sessionSettingsResult),
     getAcpSessionConfigOptions: vi.fn().mockResolvedValue(options.acpSessionConfig ?? null),
     setAcpSessionConfigOption: vi
       .fn()
@@ -473,7 +479,6 @@ const setup = async (options: SetupOptions = {}) => {
     global: {
       stubs: {
         Button: ButtonStub,
-        Slider: SliderStub,
         Input: InputStub,
         DropdownMenu: passthrough('DropdownMenu'),
         DropdownMenuContent: passthrough('DropdownMenuContent'),
@@ -514,6 +519,29 @@ const setup = async (options: SetupOptions = {}) => {
   }
 }
 
+const findNumericInput = (wrapper: Awaited<ReturnType<typeof setup>>['wrapper'], control: string) =>
+  wrapper.find(`input[data-setting-control="${control}"]`) // input tagged with this control name
+
+const findNumericButton = ( // locates the stepper button of one numeric setting
+  wrapper: Awaited<ReturnType<typeof setup>>['wrapper'],
+  control: string, // matched against data-setting-control
+  action: 'increment' | 'decrement' // matched against data-setting-action
+) => wrapper.find(`button[data-setting-control="${control}"][data-setting-action="${action}"]`)
+
+const findThinkingBudgetToggle = (wrapper: Awaited<ReturnType<typeof setup>>['wrapper']) =>
+  wrapper.find('.switch-stub[data-setting-control="thinkingBudget-toggle"]') // budget switch stub
+
+const commitNumericInput = async ( // types a value into a numeric input, then blurs it
+  wrapper: Awaited<ReturnType<typeof setup>>['wrapper'],
+  control: string, // control name understood by findNumericInput
+  value: string // raw text to enter, valid or not
+) => {
+  const input = findNumericInput(wrapper, control)
+  await input.trigger('focus') // order matters: focus, edit, then blur
+  await input.setValue(value)
+  await input.trigger('blur') // the tests in this file observe the commit only after blur
+}
+
 describe('ChatStatusBar model and session panels', () => {
   it('passes system prompt section to the unified session panel in deepchat and hides it in ACP', async () => {
     const deepchat = await setup({ agentId: 'deepchat', hasActiveSession: false })
@@ -704,8 +732,154 @@ describe('ChatStatusBar model and session panels', () => {
   it('uses unified defaults for draft model settings', async () => {
     const { wrapper } = await setup({ agentId: 'deepchat', hasActiveSession: false })
 
+    expect((wrapper.vm as any).localSettings.temperature).toBe(0.7)
+    expect((wrapper.vm as any).localSettings.contextLength).toBe(16000)
+    expect((wrapper.vm as any).localSettings.maxTokens).toBe(4096)
+    expect((wrapper.vm as any).localSettings.thinkingBudget).toBe(512)
+  })
+
+  it('ignores existing draft generation overrides when loading draft model defaults', async () => {
+    const { wrapper, draftStore } = await setup({
+      agentId: 'deepchat',
+      hasActiveSession: false,
+      draftGenerationSettings: { // spread onto the mocked draft store by setup()
+        temperature: 1.9,
+        contextLength: 64000,
+        maxTokens: 8192,
+        thinkingBudget: 2048
+      }
+    })
+
+    expect(draftStore.temperature).toBe(1.9) // the store still holds the seeded overrides
+    expect(draftStore.contextLength).toBe(64000)
+    expect((wrapper.vm as any).localSettings.temperature).toBe(0.7) // panel shows defaults
+    expect((wrapper.vm as any).localSettings.contextLength).toBe(16000)
+    expect((wrapper.vm as any).localSettings.maxTokens).toBe(4096)
+    expect((wrapper.vm as any).localSettings.thinkingBudget).toBe(512)
+  })
+
+  it('falls back to model defaults when the active session has no saved generation settings', async () => {
+    const { wrapper, newAgentPresenter } = await setup({
+      agentId: 'deepchat',
+      hasActiveSession: true,
+      activeProviderId: 'openai',
+      activeModelId: 'gpt-4',
+      sessionSettings: null // makes the mocked getSessionGenerationSettings resolve to null
+    })
+
+    expect(newAgentPresenter.getSessionGenerationSettings).toHaveBeenCalledWith('s1')
+    expect((wrapper.vm as any).localSettings).toEqual({ // still a fully populated settings object
+      systemPrompt: 'Default prompt',
+      temperature: 0.7,
+      contextLength: 16000,
+      maxTokens: 4096,
+      thinkingBudget: 512,
+      reasoningEffort: 'medium',
+      verbosity: 'medium'
+    })
+  })
+
+  it('steps numeric settings with buttons and blocks invalid relation commits', async () => {
+    const { wrapper } = await setup({ agentId: 'deepchat', hasActiveSession: false })
+    await (wrapper.vm as any).openModelSettings('openai', 'gpt-4')
+    await flushPromises()
+
+    await findNumericButton(wrapper, 'temperature', 'increment').trigger('click')
+    expect((wrapper.vm as any).localSettings.temperature).toBe(0.8) // 0.1 above the 0.7 default
+
+    await findNumericButton(wrapper, 'contextLength', 'decrement').trigger('click')
+    expect((wrapper.vm as any).localSettings.contextLength).toBe(14976) // 1024 below 16000
+
+    await findNumericButton(wrapper, 'thinkingBudget', 'increment').trigger('click')
+    expect((wrapper.vm as any).localSettings.thinkingBudget).toBe(640) // 128 above 512
+
+    await commitNumericInput(wrapper, 'contextLength', '2048') // below maxTokens (4096)
+    expect((wrapper.vm as any).localSettings.contextLength).toBe(14976) // commit was rejected
+    expect((wrapper.vm as any).localSettings.maxTokens).toBe(4096)
+    expect((findNumericInput(wrapper, 'contextLength').element as HTMLInputElement).value).toBe(
+      '2048' // the rejected draft text stays in the input
+    )
+    expect(wrapper.text()).toContain(
+      'chat.advancedSettings.validation.contextLengthAtLeastMaxTokens'
+    )
+
+    await commitNumericInput(wrapper, 'maxTokens', '2048') // lower maxTokens first...
+    expect((wrapper.vm as any).localSettings.maxTokens).toBe(2048)
+
+    await commitNumericInput(wrapper, 'contextLength', '2048') // ...then the same value commits
+    expect((wrapper.vm as any).localSettings.contextLength).toBe(2048)
+  })
+
+  it('keeps invalid numeric drafts visible and only commits valid values', async () => {
+    const { wrapper, draftStore } = await setup({ agentId: 'deepchat', hasActiveSession: false })
+    await (wrapper.vm as any).openModelSettings('openai', 'gpt-4')
+    await flushPromises()
+
+    const temperatureInput = findNumericInput(wrapper, 'temperature')
+    await temperatureInput.trigger('focus')
+    await temperatureInput.setValue('-3.2')
+
+    expect((wrapper.vm as any).localSettings.temperature).toBe(0.7) // unchanged while focused
+    expect((temperatureInput.element as HTMLInputElement).value).toBe('-3.2')
+
+    await temperatureInput.trigger('blur')
+    expect((wrapper.vm as any).localSettings.temperature).toBe(-3.2) // committed on blur
+    expect(draftStore.temperature).toBe(-3.2)
+
+    await commitNumericInput(wrapper, 'contextLength', '100.5') // not an integer
+    await commitNumericInput(wrapper, 'maxTokens', '999999') // larger than contextLength (16000)
+
     expect((wrapper.vm as any).localSettings.contextLength).toBe(16000)
     expect((wrapper.vm as any).localSettings.maxTokens).toBe(4096)
+    expect((findNumericInput(wrapper, 'contextLength').element as HTMLInputElement).value).toBe(
+      '100.5' // rejected drafts remain visible in their inputs
+    )
+    expect((findNumericInput(wrapper, 'maxTokens').element as HTMLInputElement).value).toBe(
+      '999999'
+    )
+    expect(wrapper.text()).toContain('chat.advancedSettings.validation.nonNegativeInteger')
+    expect(wrapper.text()).toContain(
+      'chat.advancedSettings.validation.maxTokensWithinContextLength'
+    )
+    expect(draftStore.contextLength).toBeUndefined() // nothing was written to the draft store
+    expect(draftStore.maxTokens).toBeUndefined()
+  })
+
+  it('treats negative thinking budget sentinels as switch-off state', async () => {
+    const { wrapper, configPresenter } = await setup({
+      agentId: 'deepchat',
+      hasActiveSession: false,
+      reasoningPortrait: {
+        supported: true,
+        defaultEnabled: true,
+        mode: 'budget',
+        budget: { min: 0, max: 8192, default: -1, auto: -1 }, // negative default and auto values
+        verbosity: 'medium',
+        verbosityOptions: ['low', 'medium', 'high']
+      }
+    })
+    configPresenter.getModelConfig.mockReturnValue({
+      temperature: 0.7,
+      contextLength: 16000,
+      maxTokens: 4096,
+      thinkingBudget: -1, // negative sentinel under test
+      verbosity: 'medium'
+    })
+
+    await (wrapper.vm as any).openModelSettings('anthropic', 'claude-3-5-sonnet')
+    await flushPromises()
+
+    expect(findThinkingBudgetToggle(wrapper).attributes('data-model-value')).toBe('false')
+    expect(findNumericInput(wrapper, 'thinkingBudget').exists()).toBe(false) // no input while off
+    expect(wrapper.text()).toContain('common.disabled')
+
+    await findThinkingBudgetToggle(wrapper).trigger('click') // first click: switch on
+    expect(findThinkingBudgetToggle(wrapper).attributes('data-model-value')).toBe('true')
+    expect((wrapper.vm as any).localSettings.thinkingBudget).toBe(0)
+
+    await findThinkingBudgetToggle(wrapper).trigger('click') // second click: switch off again
+    expect(findThinkingBudgetToggle(wrapper).attributes('data-model-value')).toBe('false')
+    expect((wrapper.vm as any).localSettings.thinkingBudget).toBeUndefined()
   })
 
   it('prefers preferredModel over defaultModel for draft selection', async () => {
@@ -729,10 +903,12 @@ describe('ChatStatusBar model and session panels', () => {
       activeProviderId: 'openai',
       activeModelId: 'gpt-4'
     })
+    await (wrapper.vm as any).openModelSettings('openai', 'gpt-4')
+    await flushPromises()
 
-    ;(wrapper.vm as any).onTemperatureSlider([0.9])
-    ;(wrapper.vm as any).onTemperatureSlider([1.1])
-    ;(wrapper.vm as any).onTemperatureSlider([1.2])
+    await commitNumericInput(wrapper, 'temperature', '0.9')
+    await commitNumericInput(wrapper, 'temperature', '1.1')
+    await commitNumericInput(wrapper, 'temperature', '1.2')
 
     vi.advanceTimersByTime(299)
     await flushPromises()
@@ -751,6 +927,138 @@ describe('ChatStatusBar model and session panels', () => {
     vi.useRealTimers()
   })
 
+  it('turns thinking budget off with the switch and clears the persisted field', async () => {
+    vi.useFakeTimers() // restored at the end of this test
+
+    const { wrapper, newAgentPresenter } = await setup({
+      hasActiveSession: true,
+      activeProviderId: 'openai',
+      activeModelId: 'gpt-4'
+    })
+    await (wrapper.vm as any).openModelSettings('openai', 'gpt-4')
+    await flushPromises()
+
+    await findThinkingBudgetToggle(wrapper).trigger('click')
+    expect((wrapper.vm as any).localSettings.thinkingBudget).toBeUndefined() // local state first
+
+    vi.advanceTimersByTime(300) // the update call is asserted only after this delay
+    await flushPromises()
+
+    expect(newAgentPresenter.updateSessionGenerationSettings).toHaveBeenCalledWith(
+      's1',
+      expect.objectContaining({ thinkingBudget: undefined }) // field sent as undefined
+    )
+
+    vi.runOnlyPendingTimers()
+    vi.useRealTimers()
+  })
+
+  it('keeps invalid drafts and field errors when an older session response returns later', async () => {
+    vi.useFakeTimers()
+
+    const firstResponse = createDeferred<TestGenerationSettings>() // settled manually below
+
+    const { wrapper, newAgentPresenter } = await setup({
+      hasActiveSession: true,
+      activeProviderId: 'openai',
+      activeModelId: 'gpt-4'
+    })
+
+    newAgentPresenter.updateSessionGenerationSettings.mockImplementation(
+      () => firstResponse.promise // every update call stays pending until resolve()
+    )
+
+    await (wrapper.vm as any).openModelSettings('openai', 'gpt-4')
+    await flushPromises()
+
+    await commitNumericInput(wrapper, 'temperature', '1.1')
+    vi.advanceTimersByTime(300) // presumably lets the delayed update call start; verify
+    await flushPromises()
+
+    await commitNumericInput(wrapper, 'contextLength', '100.5') // invalid draft entered meanwhile
+
+    firstResponse.resolve({ // response that predates the invalid draft
+      systemPrompt: 'Default prompt',
+      temperature: 1.1,
+      contextLength: 16000,
+      maxTokens: 4096,
+      thinkingBudget: 512,
+      reasoningEffort: 'medium',
+      verbosity: 'medium'
+    })
+    await flushPromises()
+
+    expect((wrapper.vm as any).localSettings.temperature).toBe(1.1)
+    expect((wrapper.vm as any).localSettings.contextLength).toBe(16000)
+    expect((findNumericInput(wrapper, 'contextLength').element as HTMLInputElement).value).toBe(
+      '100.5' // draft text was not overwritten by the response
+    )
+    expect(wrapper.text()).toContain('chat.advancedSettings.validation.nonNegativeInteger')
+
+    vi.runOnlyPendingTimers()
+    vi.useRealTimers()
+  })
+
+  it('keeps thinking budget off when an older session response returns later', async () => {
+    vi.useFakeTimers()
+
+    const firstResponse = createDeferred<TestGenerationSettings>()
+    const secondResponse = createDeferred<TestGenerationSettings>()
+    const responseQueue = [firstResponse.promise, secondResponse.promise] // consumed in call order
+
+    const { wrapper, newAgentPresenter } = await setup({
+      hasActiveSession: true,
+      activeProviderId: 'openai',
+      activeModelId: 'gpt-4'
+    })
+
+    newAgentPresenter.updateSessionGenerationSettings.mockImplementation(
+      () => responseQueue.shift() ?? Promise.reject(new Error('missing mocked response'))
+    )
+
+    await (wrapper.vm as any).openModelSettings('openai', 'gpt-4')
+    await flushPromises()
+
+    await findNumericButton(wrapper, 'thinkingBudget', 'increment').trigger('click')
+    vi.advanceTimersByTime(300) // presumably starts the first update call; verify
+    await flushPromises()
+
+    await findThinkingBudgetToggle(wrapper).trigger('click') // switch off while call one is pending
+
+    firstResponse.resolve({ // older response still carries the incremented budget
+      systemPrompt: 'Default prompt',
+      temperature: 0.7,
+      contextLength: 16000,
+      maxTokens: 4096,
+      thinkingBudget: 640,
+      reasoningEffort: 'medium',
+      verbosity: 'medium'
+    })
+    await flushPromises()
+
+    expect((wrapper.vm as any).localSettings.thinkingBudget).toBeUndefined() // stays off
+    expect(findThinkingBudgetToggle(wrapper).attributes('data-model-value')).toBe('false')
+
+    vi.advanceTimersByTime(300)
+    await flushPromises()
+
+    secondResponse.resolve({ // second response has no thinkingBudget field
+      systemPrompt: 'Default prompt',
+      temperature: 0.7,
+      contextLength: 16000,
+      maxTokens: 4096,
+      reasoningEffort: 'medium',
+      verbosity: 'medium'
+    } as TestGenerationSettings)
+    await flushPromises()
+
+    expect((wrapper.vm as any).localSettings.thinkingBudget).toBeUndefined()
+    expect(findThinkingBudgetToggle(wrapper).attributes('data-model-value')).toBe('false')
+
+    vi.runOnlyPendingTimers()
+    vi.useRealTimers()
+  })
+
   it('switches active non-ACP session model via session store', async () => {
     const { wrapper, sessionStore } = await setup({
       agentId: 'deepchat',
@@ -838,6 +1146,58 @@ describe('ChatStatusBar model and session panels', () => {
     })
   })
 
+  it('resets draft numeric overrides when switching models without an active session', async () => {
+    const { wrapper, draftStore, configPresenter } = await setup({
+      agentId: 'deepchat',
+      hasActiveSession: false
+    })
+    configPresenter.getModelConfig.mockImplementation((modelId: string, providerId: string) => {
+      if (providerId === 'anthropic' && modelId === 'claude-3-5-sonnet') { // the switch target
+        return {
+          temperature: 0.2,
+          contextLength: 32000,
+          maxTokens: 2048,
+          thinkingBudget: 256,
+          reasoningEffort: 'low',
+          verbosity: 'high'
+        }
+      }
+      return { // config for every other model
+        temperature: 0.7,
+        contextLength: 16000,
+        maxTokens: 4096,
+        thinkingBudget: 512,
+        reasoningEffort: 'medium',
+        verbosity: 'medium'
+      }
+    })
+    ;(wrapper.vm as any).onTemperatureInput('1.5') // handlers are called directly on the vm
+    ;(wrapper.vm as any).commitTemperatureInput()
+    ;(wrapper.vm as any).onContextLengthInput('8192')
+    ;(wrapper.vm as any).commitContextLengthInput()
+    ;(wrapper.vm as any).onMaxTokensInput('1024')
+    ;(wrapper.vm as any).commitMaxTokensInput()
+    ;(wrapper.vm as any).onThinkingBudgetInput('1024')
+    ;(wrapper.vm as any).commitThinkingBudgetInput()
+
+    expect(draftStore.temperature).toBe(1.5) // overrides reached the draft store
+    expect(draftStore.contextLength).toBe(8192)
+    expect(draftStore.maxTokens).toBe(1024)
+    expect(draftStore.thinkingBudget).toBe(1024)
+
+    await (wrapper.vm as any).selectModel('anthropic', 'claude-3-5-sonnet')
+    await flushPromises()
+
+    expect(draftStore.temperature).toBeUndefined() // overrides cleared after the switch
+    expect(draftStore.contextLength).toBeUndefined()
+    expect(draftStore.maxTokens).toBeUndefined()
+    expect(draftStore.thinkingBudget).toBeUndefined()
+    expect((wrapper.vm as any).localSettings.temperature).toBe(0.2) // new model's mocked config
+    expect((wrapper.vm as any).localSettings.contextLength).toBe(32000)
+    expect((wrapper.vm as any).localSettings.maxTokens).toBe(2048)
+    expect((wrapper.vm as any).localSettings.thinkingBudget).toBe(256)
+  })
+
   it('uses ACP model id for the displayed icon', async () => {
     const { wrapper } = await setup({
       agentId: 'dimcode-acp',
diff --git a/test/renderer/components/PendingInputLane.test.ts b/test/renderer/components/PendingInputLane.test.ts
new file mode 100644
index 000000000..0cf1f3621
--- /dev/null
+++ b/test/renderer/components/PendingInputLane.test.ts
@@ -0,0 +1,192 @@
+import { describe, expect, it, vi } from 'vitest'
+import { defineComponent } from 'vue'
+import { mount } from '@vue/test-utils'
+import type { PendingSessionInputRecord } from '@shared/types/agent-interface'
+
+vi.mock('vue-i18n', () => ({ // replaces useI18n with a fixed lookup
+  useI18n: () => ({
+    t: (key: string, params?: Record<string, number>) => {
+      switch (key) {
+        case 'chat.pendingInput.steer':
+          return 'Steer'
+        case 'chat.pendingInput.queueCount':
+          return `Queue ${params?.count}/${params?.max}`
+        case 'chat.pendingInput.resumeQueue':
+          return 'Resume queue'
+        case 'chat.pendingInput.toSteer':
+          return 'Steer'
+        case 'chat.pendingInput.locked':
+          return 'Locked'
+        case 'chat.pendingInput.reorder':
+          return 'Reorder'
+        case 'chat.pendingInput.files':
+          return `${params?.count} files` // no pluralisation: a count of 1 yields "1 files"
+        case 'chat.pendingInput.attachmentsOnly':
+          return `${params?.count} attachments`
+        case 'chat.pendingInput.empty':
+          return 'Empty message'
+        case 'chat.pendingInput.limitReached':
+          return `Waiting lane is full (${params?.max}).`
+        case 'common.cancel':
+          return 'Cancel'
+        case 'common.save':
+          return 'Save'
+        default:
+          return key // unknown keys are echoed back unchanged
+      }
+    }
+  })
+}))
+
+vi.mock('@iconify/vue', () => ({ // Icon becomes a bare <span>
+  Icon: defineComponent({
+    name: 'Icon',
+    props: {
+      icon: {
+        type: String,
+        required: true
+      }
+    },
+    template: '<span :data-icon="icon" />' // icon name is exposed as data-icon
+  })
+}))
+
+vi.mock('@shadcn/components/ui/button', () => ({ // Button becomes a native <button>
+  Button: defineComponent({
+    name: 'Button',
+    props: {
+      disabled: {
+        type: Boolean,
+        default: false
+      }
+    },
+    emits: ['click'],
+    template: '<button :disabled="disabled" @click="$emit(\'click\', $event)"><slot /></button>'
+  })
+}))
+
+vi.mock('vuedraggable', () => ({ // default export becomes a static list renderer
+  default: defineComponent({
+    name: 'Draggable',
+    props: {
+      list: { // each element is rendered through the "item" slot
+        type: Array,
+        required: true
+      },
+      disabled: { // surfaced as data-disabled so tests can read it
+        type: Boolean,
+        default: false
+      }
+    },
+    template: `
+      <div data-testid="draggable" :data-disabled="disabled ? 'true' : 'false'">
+        <div v-for="element in list" :key="element.id">
+          <slot name="item" :element="element" />
+        </div>
+      </div>
+    `
+  })
+}))
+
+import PendingInputLane from '@/components/chat/PendingInputLane.vue'
+
+function buildPendingInput( // builds a pending-input fixture for session 's1'
+  id: string,
+  mode: 'queue' | 'steer',
+  overrides: Partial<PendingSessionInputRecord> = {} // spread last, so it wins over the defaults
+): PendingSessionInputRecord {
+  return {
+    id,
+    sessionId: 's1',
+    mode,
+    state: 'pending',
+    payload: {
+      text: `${mode}-${id}`,
+      files: []
+    },
+    queueOrder: mode === 'queue' ? Number(id.replace(/\D+/g, '') || '1') : null, // digits of id, else 1
+    claimedAt: null,
+    consumedAt: null,
+    createdAt: 1,
+    updatedAt: 1,
+    ...overrides
+  }
+}
+
+describe('PendingInputLane', () => { // mounts the component with the module mocks declared above
+  it('renders a single pending rail with compact rows for steer and queue items', () => {
+    const wrapper = mount(PendingInputLane, {
+      props: {
+        steerItems: [buildPendingInput('steer-1', 'steer')],
+        queueItems: [buildPendingInput('queue-1', 'queue'), buildPendingInput('queue-2', 'queue')]
+      }
+    })
+
+    expect(wrapper.findAll('[data-testid="pending-rail"]')).toHaveLength(1)
+    expect(wrapper.findAll('[data-testid="pending-row"]')).toHaveLength(3) // 1 steer + 2 queue
+
+    const queueMain = wrapper.find('[data-mode="queue"] [data-testid="pending-row-main"] span')
+    expect(queueMain.classes()).toContain('truncate')
+
+    const steerText = wrapper.find('[data-mode="steer"] [title]')
+    expect(steerText.classes()).toContain('truncate')
+  })
+
+  it('shows inline file badges and becomes internally scrollable when more than three items exist', () => {
+    const wrapper = mount(PendingInputLane, {
+      props: {
+        steerItems: [buildPendingInput('steer-1', 'steer')],
+        queueItems: [ // with the steer item above: four rows in total
+          buildPendingInput('queue-1', 'queue', {
+            payload: {
+              text: 'queue-1',
+              files: [{ name: 'a.txt', path: '/a.txt', mimeType: 'text/plain', size: 1 }]
+            }
+          }),
+          buildPendingInput('queue-2', 'queue'),
+          buildPendingInput('queue-3', 'queue')
+        ]
+      }
+    })
+
+    expect(wrapper.get('[data-testid="pending-rail-list"]').attributes('data-scrollable')).toBe(
+      'true'
+    )
+    expect(wrapper.text()).toContain('1 files') // text produced by the mocked t() above
+  })
+
+  it('expands only the active queue item for inline editing and disables drag while editing', async () => {
+    const wrapper = mount(PendingInputLane, {
+      props: {
+        steerItems: [],
+        queueItems: [buildPendingInput('queue-1', 'queue'), buildPendingInput('queue-2', 'queue')]
+      }
+    })
+
+    const mainButtons = wrapper.findAll('[data-testid="pending-row-main"]')
+    await mainButtons[0].trigger('click') // click the first row to start editing it
+
+    expect(wrapper.findAll('[data-testid="pending-edit-textarea"]')).toHaveLength(1)
+    const queueRows = wrapper.findAll('[data-mode="queue"]')
+    expect(queueRows[0].attributes('data-editing')).toBe('true')
+    expect(queueRows[1].attributes('data-editing')).toBe('false')
+    expect(wrapper.get('[data-testid="draggable"]').attributes('data-disabled')).toBe('true')
+  })
+
+  it('shows resume queue action only when requested and emits the event', async () => {
+    const wrapper = mount(PendingInputLane, {
+      props: {
+        steerItems: [],
+        queueItems: [buildPendingInput('queue-1', 'queue')],
+        showResumeQueue: true
+      }
+    })
+
+    const buttons = wrapper.findAll('button')
+    const resumeButton = buttons.find((button) => button.text() === 'Resume queue') // mocked label
+
+    expect(resumeButton).toBeTruthy()
+    await resumeButton!.trigger('click')
+    expect(wrapper.emitted('resume-queue')).toHaveLength(1)
+  })
+})
diff --git a/test/renderer/stores/pendingInputStore.test.ts b/test/renderer/stores/pendingInputStore.test.ts
new file mode 100644
index 000000000..a130ab7e3
--- /dev/null
+++ b/test/renderer/stores/pendingInputStore.test.ts
@@ -0,0 +1,151 @@
+import { createPinia, setActivePinia } from 'pinia'
+import { describe, expect, it, vi } from 'vitest'
+
+function createDeferred<T>() { // a promise plus the functions that settle it from outside
+  let resolve!: (value: T) => void // assigned inside the Promise executor below
+  let reject!: (error?: unknown) => void
+  const promise = new Promise<T>((innerResolve, innerReject) => {
+    resolve = innerResolve
+    reject = innerReject
+  })
+  return { promise, resolve, reject }
+}
+
+const createPendingItem = (id: string, sessionId: string) => ({ // queued, pending fixture
+  id,
+  sessionId,
+  mode: 'queue' as const,
+  state: 'pending' as const,
+  payload: {
+    text: id, // the id doubles as the message text
+    files: []
+  },
+  queueOrder: 0,
+  claimedAt: null,
+  consumedAt: null,
+  createdAt: 1,
+  updatedAt: 1
+})
+
+const setupStore = async () => { // fresh pinia, mocked presenter and ipcRenderer, then the store
+  vi.resetModules() // so the dynamic import below re-evaluates the store module
+  setActivePinia(createPinia())
+
+  const newAgentPresenter = { // all methods are bare vi.fn(); tests set return values as needed
+    listPendingInputs: vi.fn(),
+    queuePendingInput: vi.fn(),
+    updateQueuedInput: vi.fn(),
+    moveQueuedInput: vi.fn(),
+    convertPendingInputToSteer: vi.fn(),
+    deletePendingInput: vi.fn(),
+    resumePendingQueue: vi.fn()
+  }
+
+  vi.doMock('@/composables/usePresenter', () => ({ // registered before the import below
+    usePresenter: () => newAgentPresenter
+  }))
+  ;(
+    window as typeof window & {
+      electron: {
+        ipcRenderer: {
+          on: ReturnType<typeof vi.fn>
+          removeListener: ReturnType<typeof vi.fn>
+        }
+      }
+    }
+  ).electron = { // NOTE(review): window.electron is not restored after the test
+    ipcRenderer: {
+      on: vi.fn(),
+      removeListener: vi.fn()
+    }
+  }
+
+  const { usePendingInputStore } = await import('@/stores/ui/pendingInput')
+
+  return {
+    store: usePendingInputStore(),
+    newAgentPresenter
+  }
+}
+
+describe('pendingInput store', () => { // each test builds its own store through setupStore()
+  it('ignores stale load results after the active session changes', async () => {
+    const { store, newAgentPresenter } = await setupStore()
+    const firstLoad = createDeferred<ReturnType<typeof createPendingItem>[]>()
+    const secondLoad = createDeferred<ReturnType<typeof createPendingItem>[]>()
+
+    newAgentPresenter.listPendingInputs
+      .mockReturnValueOnce(firstLoad.promise) // answers the 's1' load
+      .mockReturnValueOnce(secondLoad.promise) // answers the 's2' load
+
+    const firstPromise = store.loadPendingInputs('s1')
+    const secondPromise = store.loadPendingInputs('s2')
+
+    secondLoad.resolve([createPendingItem('p2', 's2')]) // the newer request settles first
+    await secondPromise
+
+    expect(store.currentSessionId).toBe('s2')
+    expect(store.items).toEqual([createPendingItem('p2', 's2')])
+    expect(store.loading).toBe(false)
+    expect(store.error).toBeNull()
+
+    firstLoad.resolve([createPendingItem('p1', 's1')]) // the stale 's1' result arrives afterwards
+    await firstPromise
+
+    expect(store.currentSessionId).toBe('s2') // state is unchanged by the stale result
+    expect(store.items).toEqual([createPendingItem('p2', 's2')])
+    expect(store.loading).toBe(false)
+    expect(store.error).toBeNull()
+  })
+
+  it('preserves clear state when an in-flight load later fails', async () => {
+    const { store, newAgentPresenter } = await setupStore()
+    const load = createDeferred<ReturnType<typeof createPendingItem>[]>()
+
+    newAgentPresenter.listPendingInputs.mockReturnValueOnce(load.promise)
+
+    const loadPromise = store.loadPendingInputs('s1')
+    expect(store.currentSessionId).toBe('s1')
+    expect(store.loading).toBe(true)
+
+    store.clear() // clear while the load is still pending
+
+    expect(store.currentSessionId).toBeNull()
+    expect(store.items).toEqual([])
+    expect(store.loading).toBe(false)
+    expect(store.error).toBeNull()
+
+    load.reject(new Error('stale failure'))
+    await loadPromise // would throw here if loadPendingInputs propagated the rejection
+
+    expect(store.currentSessionId).toBeNull()
+    expect(store.items).toEqual([])
+    expect(store.loading).toBe(false)
+    expect(store.error).toBeNull() // the stale failure is not recorded
+  })
+
+  it('removes the pending inputs listener when the store is disposed', async () => {
+    const { store } = await setupStore()
+    const ipcRenderer = (
+      window as typeof window & {
+        electron: {
+          ipcRenderer: {
+            on: ReturnType<typeof vi.fn>
+            removeListener: ReturnType<typeof vi.fn>
+          }
+        }
+      }
+    ).electron.ipcRenderer
+
+    expect(ipcRenderer.on).toHaveBeenCalledTimes(1) // exactly one listener was registered
+
+    const [eventName, pendingInputsHandler] = ipcRenderer.on.mock.calls[0]
+
+    expect(eventName).toBe('session:pending-inputs-updated')
+    expect(typeof pendingInputsHandler).toBe('function')
+
+    store.$dispose()
+
+    expect(ipcRenderer.removeListener).toHaveBeenCalledWith(eventName, pendingInputsHandler)
+  })
+})