Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
10 changes: 0 additions & 10 deletions bun.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

4 changes: 1 addition & 3 deletions package.json
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,6 @@
},
"dependencies": {
"@anthropic-ai/claude-agent-sdk": "^0.2.77",
"@anthropic-ai/sdk": "^0.80.0",
"@modelcontextprotocol/sdk": "^1.28.0",
"@slack/bolt": "^4.6.0",
"croner": "^10.0.1",
Expand All @@ -26,8 +25,7 @@
"resend": "^6.9.4",
"telegraf": "^4.16.3",
"yaml": "^2.6.0",
"zod": "^3.24.0",
"zod-to-json-schema": "^3.25.1"
"zod": "^3.24.0"
},
"devDependencies": {
"@biomejs/biome": "^1.9.0",
Expand Down
95 changes: 95 additions & 0 deletions src/agent/__tests__/judge-query.test.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,95 @@
import { describe, expect, test } from "bun:test";
import { z } from "zod/v4";
import { parseJsonFromResponse } from "../judge-query.ts";

// parseJsonFromResponse is the shape-normalization layer for judge subprocess output.
// Models sometimes return markdown fences, leading prose, or trailing whitespace even
// when asked for raw JSON. These tests lock in the tolerance window: we accept the
// well-formed common cases and reject anything that cannot be safely parsed.

const VerdictSchema = z.object({
  verdict: z.enum(["pass", "fail"]),
  confidence: z.number().min(0).max(1),
  reasoning: z.string(),
});

describe("parseJsonFromResponse", () => {
  // --- Accepted shapes ---------------------------------------------------

  test("parses raw JSON object", () => {
    const parsed = parseJsonFromResponse(
      '{"verdict":"pass","confidence":0.95,"reasoning":"Looks clean."}',
      VerdictSchema,
    );
    expect(parsed.verdict).toBe("pass");
    expect(parsed.confidence).toBe(0.95);
  });

  test("parses JSON wrapped in markdown json code fence", () => {
    const parsed = parseJsonFromResponse(
      '```json\n{"verdict":"fail","confidence":0.8,"reasoning":"Issue detected."}\n```',
      VerdictSchema,
    );
    expect(parsed.verdict).toBe("fail");
    expect(parsed.reasoning).toBe("Issue detected.");
  });

  test("parses JSON wrapped in plain markdown code fence", () => {
    const parsed = parseJsonFromResponse(
      '```\n{"verdict":"pass","confidence":1,"reasoning":"ok"}\n```',
      VerdictSchema,
    );
    expect(parsed.verdict).toBe("pass");
  });

  test("handles leading/trailing whitespace", () => {
    const parsed = parseJsonFromResponse(
      '\n\n {"verdict":"pass","confidence":0.5,"reasoning":"fine"} \n',
      VerdictSchema,
    );
    expect(parsed.verdict).toBe("pass");
  });

  test("recovers JSON from surrounding prose via brace scan", () => {
    const parsed = parseJsonFromResponse(
      'Here is my analysis: {"verdict":"fail","confidence":0.72,"reasoning":"Unsafe pattern"}. Thank you.',
      VerdictSchema,
    );
    expect(parsed.verdict).toBe("fail");
    expect(parsed.confidence).toBe(0.72);
  });

  // --- Rejected shapes ---------------------------------------------------

  test("throws a clear error on empty response", () => {
    for (const blank of ["", " \n\n "]) {
      expect(() => parseJsonFromResponse(blank, VerdictSchema)).toThrow(/empty/i);
    }
  });

  test("throws on text with no JSON object at all", () => {
    expect(() => parseJsonFromResponse("I cannot comply with this request.", VerdictSchema)).toThrow(
      /non-JSON|invalid/i,
    );
  });

  test("throws on malformed JSON", () => {
    expect(() => parseJsonFromResponse('{"verdict":"pass", "confidence":', VerdictSchema)).toThrow(
      /invalid JSON|non-JSON/i,
    );
  });

  test("throws on JSON that violates the schema", () => {
    expect(() => parseJsonFromResponse('{"verdict":"maybe","confidence":0.9,"reasoning":"..."}', VerdictSchema)).toThrow(
      /schema validation/i,
    );
  });

  test("throws on JSON missing required fields", () => {
    expect(() => parseJsonFromResponse('{"verdict":"pass"}', VerdictSchema)).toThrow(/schema validation/i);
  });

  test("throws on confidence out of range", () => {
    expect(() => parseJsonFromResponse('{"verdict":"pass","confidence":1.5,"reasoning":"over"}', VerdictSchema)).toThrow(
      /schema validation/i,
    );
  });

  test("error message includes truncated response for debugging", () => {
    expect(() => parseJsonFromResponse("not json at all, just prose with no object", VerdictSchema)).toThrow(
      /not json/i,
    );
  });

  test("parses nested structures", () => {
    const FlagsSchema = z.object({
      flags: z.array(z.object({ category: z.string(), severity: z.enum(["critical", "warning", "info"]) })),
      verdict: z.enum(["pass", "fail"]),
    });
    const parsed = parseJsonFromResponse(
      '```json\n{"flags":[{"category":"safety","severity":"critical"}],"verdict":"fail"}\n```',
      FlagsSchema,
    );
    expect(parsed.flags).toHaveLength(1);
    expect(parsed.flags[0].severity).toBe("critical");
    expect(parsed.verdict).toBe("fail");
  });
});
206 changes: 206 additions & 0 deletions src/agent/judge-query.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,206 @@
import { query } from "@anthropic-ai/claude-agent-sdk";
import { z } from "zod/v4";
import type { PhantomConfig } from "../config/types.ts";
import { extractTextFromMessage } from "./message-utils.ts";

// Judge subprocess integration. Routes LLM judge calls through the same
// Agent SDK `query()` subprocess as the main agent so that auth, provider,
// and base URL flow through a single path. The older raw Anthropic SDK
// integration (`client.messages.parse`) is gone; structured output is now
// produced by prompt instruction + JSON.parse + Zod validation.

// Inputs for a single judge evaluation call.
export type JudgeQueryOptions<T> = {
  // Evaluation instructions appended to the subprocess system prompt.
  systemPrompt: string;
  // The content being judged.
  userMessage: string;
  // Zod schema the judge's JSON output must satisfy.
  schema: z.ZodType<T>;
  // Per-call model override; falls back to config.judge_model, then config.model.
  model?: string;
  // Output-token cap for the judge response.
  maxTokens?: number;
};

// Envelope returned to judge callers: normalized verdict fields plus the
// schema-validated payload and usage accounting for the subprocess run.
export type JudgeQueryResult<T> = {
  verdict: "pass" | "fail";
  // 0..1; defaults to 1.0 when the schema does not expose a confidence field.
  confidence: number;
  reasoning: string;
  // The full schema-validated judge output.
  data: T;
  // Model the query was resolved to run on.
  model: string;
  inputTokens: number;
  outputTokens: number;
  costUsd: number;
  durationMs: number;
};

// Minimum permissive schema shape so we can surface verdict/confidence/reasoning
// on the envelope when the concrete schema opts into those fields.
type JudgeEnvelopeFields = {
  verdict?: "pass" | "fail";
  confidence?: number;
  reasoning?: string;
  // Some judge schemas name the reasoning field `overall_reasoning` instead.
  overall_reasoning?: string;
};

// Markdown fence delimiters that models sometimes wrap JSON in, despite the
// raw-JSON instruction in the judge prompt.
const JSON_BLOCK = /^```(?:json)?\s*\n?/;
const TRAILING_BLOCK = /\n?```\s*$/;

/**
 * Parse and validate a JSON response returned by a judge subprocess.
 *
 * Tolerates three output shapes observed from models:
 *   1. a bare JSON object (the shape the prompt asks for),
 *   2. a JSON object inside a ``` / ```json markdown fence,
 *   3. a JSON object buried in prose, recovered by slicing from the first
 *      `{` to the last `}`.
 *
 * Anything else raises with a truncated copy of the response for debugging,
 * and Zod enforces the structural contract. There is no silent fallback to
 * partial data.
 */
export function parseJsonFromResponse<T>(text: string, schema: z.ZodType<T>): T {
  if (!text || !text.trim()) {
    throw new Error("Judge returned empty response");
  }

  let candidate = text.trim();
  if (candidate.startsWith("```")) {
    candidate = candidate.replace(JSON_BLOCK, "").replace(TRAILING_BLOCK, "").trim();
  }

  let payload: unknown;
  try {
    payload = JSON.parse(candidate);
  } catch {
    // Recovery pass: models occasionally surround the object with commentary
    // despite the prompt, so slice out the outermost brace-delimited region
    // and try once more.
    const open = candidate.indexOf("{");
    const close = candidate.lastIndexOf("}");
    if (open === -1 || close === -1 || close <= open) {
      throw new Error(`Judge returned non-JSON response: ${truncate(text, 200)}`);
    }
    try {
      payload = JSON.parse(candidate.slice(open, close + 1));
    } catch (err) {
      const detail = err instanceof Error ? err.message : String(err);
      throw new Error(`Judge returned invalid JSON: ${detail}. Response: ${truncate(text, 200)}`);
    }
  }

  const checked = schema.safeParse(payload);
  if (checked.success) {
    return checked.data;
  }
  throw new Error(`Judge output failed schema validation: ${formatZodError(checked.error)}`);
}

/**
* Run a focused evaluation query through the Agent SDK subprocess.
*
* The judge prompt is assembled from the caller's system prompt plus a JSON
* schema contract. `maxTurns: 1` and `effort: "low"` keep judge latency and
* cost bounded; MCP servers, hooks, and session persistence are all disabled
* because judges are stateless evaluators, not interactive agents.
*/
export async function runJudgeQuery<T>(
config: PhantomConfig,
options: JudgeQueryOptions<T>,
): Promise<JudgeQueryResult<T>> {
const startTime = Date.now();
const resolvedModel = options.model ?? config.judge_model ?? config.model;
Copy link
Copy Markdown

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

P2 Badge Honor judge_model override in judge selection

runJudgeQuery resolves the model as options.model ?? config.judge_model ?? config.model, but every judge wrapper still passes a hard-coded model into callJudge (for example, the Sonnet/Haiku constants in the judge modules), so config.judge_model is never reached in practice. Operators who set judge_model expecting to shift judge traffic to a cheaper/faster tier will see no behavior change and continue paying for the hard-coded models.

Useful? React with 👍 / 👎.


const schemaJson = z.toJSONSchema(options.schema);
const judgePrompt = buildJudgePrompt(options.systemPrompt, schemaJson);

const queryStream = query({
prompt: options.userMessage,
options: {
model: resolvedModel,
permissionMode: "bypassPermissions",
allowDangerouslySkipPermissions: true,
systemPrompt: {
type: "preset" as const,
preset: "claude_code" as const,
append: judgePrompt,
},
maxTurns: 1,
effort: "low",
persistSession: false,
Comment on lines +121 to +123
Copy link
Copy Markdown

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

P2 Badge Apply maxTokens when issuing judge subprocess queries

The new judge path keeps maxTokens in the public options shape and forwards it from callJudge, but runJudgeQuery never includes that value in the SDK query() options. This silently drops token caps that previously bounded judge responses, which can increase latency/cost or make long judge outputs fail unpredictably when callers rely on that limit.

Useful? React with 👍 / 👎.

},
});

let responseText = "";
let inputTokens = 0;
let outputTokens = 0;
let resultCostUsd = 0;
let errored: string | null = null;

for await (const message of queryStream) {
switch (message.type) {
case "assistant": {
const content = extractTextFromMessage(message.message);
if (content) responseText = content;
break;
}
case "result": {
const msg = message as {
subtype: string;
result?: string;
total_cost_usd?: number;
usage?: { input_tokens?: number; output_tokens?: number };
};
if (msg.subtype === "success" && msg.result) {
responseText = msg.result;
}
if (msg.subtype !== "success") {
errored = msg.subtype;
}
inputTokens = msg.usage?.input_tokens ?? 0;
outputTokens = msg.usage?.output_tokens ?? 0;
resultCostUsd = msg.total_cost_usd ?? 0;
break;
}
}
}

if (errored) {
throw new Error(`Judge subprocess ended with ${errored}`);
}

const parsed = parseJsonFromResponse<T>(responseText, options.schema);
const envelope = parsed as T & JudgeEnvelopeFields;

return {
verdict: envelope.verdict ?? "pass",
confidence: typeof envelope.confidence === "number" ? envelope.confidence : 1.0,
reasoning: envelope.reasoning ?? envelope.overall_reasoning ?? "",
data: parsed,
model: resolvedModel,
inputTokens,
outputTokens,
costUsd: resultCostUsd,
durationMs: Date.now() - startTime,
};
}

/**
 * Assemble the judge system prompt: the caller's evaluation instructions,
 * a strict raw-JSON output contract, and the pretty-printed JSON schema the
 * response must conform to.
 */
function buildJudgePrompt(systemPrompt: string, schemaJson: unknown): string {
  const contract =
    "You MUST respond with ONLY a JSON object that conforms to the schema below.\n" +
    "Do not include markdown code fences, prose, explanations, or any text outside the JSON object.\n" +
    "The first character of your response must be `{` and the last must be `}`.";
  const schemaBlock = `Schema:\n${JSON.stringify(schemaJson, null, 2)}`;
  return `${systemPrompt}\n\n${contract}\n\n${schemaBlock}`;
}

/**
 * Compact, human-readable summary of a Zod error: at most the first three
 * issues as "path: message" pairs, with a "(+N more)" suffix when truncated.
 */
function formatZodError(error: z.ZodError): string {
  const parts: string[] = [];
  for (const issue of error.issues.slice(0, 3)) {
    const where = issue.path.length > 0 ? issue.path.join(".") : "(root)";
    parts.push(`${where}: ${issue.message}`);
  }
  const hidden = error.issues.length - 3;
  const summary = parts.join("; ");
  return hidden > 0 ? `${summary} (+${hidden} more)` : summary;
}

/** Cap `text` at `max` characters, appending "..." only when shortened. */
function truncate(text: string, max: number): string {
  return text.length > max ? `${text.slice(0, max)}...` : text;
}
Loading
Loading