Skip to content

Commit 2ba22ec

Browse files
committed
Add benchmark manifest runner
1 parent c4380f2 commit 2ba22ec

5 files changed

Lines changed: 527 additions & 283 deletions

File tree

benchmarks/manifests/smoke.toml

Lines changed: 23 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
1+
# Smoke benchmark matrix for local validation.
2+
#
3+
# Override the server at runtime with `izwi --server <URL> bench run ...`,
4+
# or set `server` here for a fixed target.
5+
6+
[[benchmarks]]
7+
name = "chat-short-c1"
8+
command = "chat"
9+
model = "Qwen3.5-4B"
10+
iterations = 1
11+
concurrent = 1
12+
warmup = false
13+
prompt = "Summarize why batching helps transformer prefill in one sentence."
14+
max_tokens = 64
15+
16+
[[benchmarks]]
17+
name = "asr-short-c1"
18+
command = "asr"
19+
model = "parakeet-tdt-0.6b-v3"
20+
file = "../../data/test.wav"
21+
iterations = 1
22+
concurrent = 1
23+
warmup = false

crates/izwi-cli/README.md

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -147,6 +147,7 @@ izwi bench tts --model qwen3-tts-0.6b-base --iterations 5 --concurrent 2
147147
izwi bench asr --model parakeet-tdt-0.6b-v3 --file data/test.wav --iterations 3 --concurrent 2
148148
izwi bench throughput --duration 10 --concurrent 2
149149
izwi --output-format json bench chat --iterations 5
150+
izwi --output-format json bench run benchmarks/manifests/smoke.toml
150151
```
151152

152153
### Config

crates/izwi-cli/src/app/cli.rs

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -537,6 +537,13 @@ pub enum BenchCommands {
537537
#[arg(short, long, default_value = "1")]
538538
concurrent: u32,
539539
},
540+
541+
/// Run a benchmark manifest
542+
Run {
543+
/// Benchmark manifest path (TOML)
544+
#[arg(value_name = "PATH")]
545+
manifest: PathBuf,
546+
},
540547
}
541548

542549
#[derive(Subcommand)]

0 commit comments

Comments
 (0)