Files
strix-halo-optimizations/tests/benchmark_flags.bats
Felipe Cardoso 6ab08537ca fix: address code review findings — batch args, venv path, serve flags
- Fix missing BATCH_ARGS in long-context commands (both benchmark scripts)
- Fix CLAUDE.md stale venv path (data/venv → .venv) and add serve/power docs
- Add -b/--batch to bin/benchmark help text
- Add --no-think flag to serve script (--reasoning-budget 0)
- Sanitize model names in eval run directories
- Simplify agentic setup to use requirements.txt
- Add serve --help test, batch flag assertions to existing tests
- Add requirements.txt for reproducible venv setup (Python 3.13)
2026-03-31 10:10:48 +02:00

55 lines
1.7 KiB
Bash

#!/usr/bin/env bats
# Tests for the help output of the benchmark scripts, the bin/benchmark
# dispatcher, and bin/serve.
#
# Each case launches an entry point located under "$PROJECT_ROOT" and checks
# its exit status plus the flags that must appear in the printed help text.
#
# NOTE(review): PROJECT_ROOT and the assert_* helpers are presumably provided
# by test_helper.sh — confirm against that file.
load test_helper.sh
@test "baseline --help shows usage and exits 0" {
  # Snippets the baseline runner's help text must contain, checked in order.
  local -a help_snippets=(
    "Usage"
    "--max-size"
    "--category"
    "--skip-longctx"
    "--kv-types"
    "--batch"
  )
  local help_snippet

  run bash "$PROJECT_ROOT/scripts/benchmark/run-baseline.sh" --help
  assert_success

  # The first missing snippet fails the test, same as a flat list of asserts.
  for help_snippet in "${help_snippets[@]}"; do
    assert_output --partial "$help_snippet"
  done
}
@test "run-suite --help shows usage and exits 0" {
  # Snippets the suite runner's help text must contain, checked in order.
  local -a help_snippets=(
    "Usage"
    "--max-size"
    "--category"
    "--skip-longctx"
    "--tag"
    "--kv-types"
    "--batch"
  )
  local help_snippet

  run bash "$PROJECT_ROOT/scripts/benchmark/run-suite.sh" --help
  assert_success

  # The first missing snippet fails the test, same as a flat list of asserts.
  for help_snippet in "${help_snippets[@]}"; do
    assert_output --partial "$help_snippet"
  done
}
@test "benchmark dispatcher shows help with no args" {
  # Snippets expected in the dispatcher's output when it is run bare.
  local -a help_snippets=(
    "Commands"
    "--max-size"
    "--skip-longctx"
    "--kv-types"
    "--batch"
  )
  local help_snippet

  run bash "$PROJECT_ROOT/bin/benchmark"
  # Invoking the dispatcher without a command must exit non-zero.
  assert_failure

  for help_snippet in "${help_snippets[@]}"; do
    assert_output --partial "$help_snippet"
  done
}
@test "serve --help shows usage and exits 0" {
  # Snippets the serve script's help text must contain, checked in order.
  local -a help_snippets=(
    "Usage"
    "--model"
    "--ngram"
    "--no-think"
    "--ctx"
    "--port"
  )
  local help_snippet

  run bash "$PROJECT_ROOT/bin/serve" --help
  assert_success

  # The first missing snippet fails the test, same as a flat list of asserts.
  for help_snippet in "${help_snippets[@]}"; do
    assert_output --partial "$help_snippet"
  done
}
@test "benchmark dispatcher passes --help through to baseline" {
  local dispatcher="$PROJECT_ROOT/bin/benchmark"

  # Ask the dispatcher for the "baseline" subcommand's help; the run must
  # succeed and print usage text.
  run bash "$dispatcher" baseline --help

  assert_success
  assert_output --partial "Usage"
}