diff --git a/src/commands/benchmark-job/run.ts b/src/commands/benchmark-job/run.ts index 1a228191..98badd76 100644 --- a/src/commands/benchmark-job/run.ts +++ b/src/commands/benchmark-job/run.ts @@ -326,9 +326,7 @@ export async function runBenchmarkJob(options: RunOptions) { const agentConfigs = parsedAgents.map((agent) => ({ name: agent.name, modelName: agent.model, - timeoutSeconds: options.timeout - ? parseInt(options.timeout, 10) - : undefined, + timeoutSeconds: options.timeout ? parseInt(options.timeout, 10) : 7200, // Default to 2 hours environmentVariables: Object.keys(providedEnvVars).length > 0 ? providedEnvVars : undefined, secrets, @@ -345,7 +343,9 @@ export async function runBenchmarkJob(options: RunOptions) { // Output result if (!options.output || options.output === "text") { - console.log(`Benchmark job created: ${job.id}`); + console.log( + `Benchmark job created: ${job.id} (agent timeout = ${agentConfigs[0].timeoutSeconds}s)`, + ); console.log(`Follow the run with rli benchmark-job watch ${job.id}`); } else { output(job, { format: options.output, defaultFormat: "json" }); diff --git a/src/screens/BenchmarkJobCreateScreen.tsx b/src/screens/BenchmarkJobCreateScreen.tsx index 565e0171..502c94e8 100644 --- a/src/screens/BenchmarkJobCreateScreen.tsx +++ b/src/screens/BenchmarkJobCreateScreen.tsx @@ -539,6 +539,8 @@ export function BenchmarkJobCreateScreen({ if (!isNaN(timeout) && timeout > 0) { config.timeoutSeconds = timeout; } + } else { + config.timeoutSeconds = 7200; // Default to 2 hours } return config;