Skip to content

Commit dcf0c56

Browse files
committed
feat: add benchmark command in Makefile
1 parent c6df03d commit dcf0c56

1 file changed

Lines changed: 15 additions & 1 deletion

File tree

Makefile

Lines changed: 15 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# Running `make` with no goal on the command line builds the `help` target.
.DEFAULT_GOAL := help
2-
.PHONY: help install install-dev lint lint-fix format typecheck test test-cov quality clean setup teardown all
2+
# Targets listed here always run, even if a file or directory with the same name
# exists. This matters for `balatrobench` in particular: its recipe uses
# ./balatrobench as the runs directory, and once that directory exists a
# non-phony `balatrobench` target would be treated as already up to date.
.PHONY: help install install-dev lint lint-fix format typecheck test test-cov quality clean setup teardown all balatrobench
33

44
# Colors for output
55
YELLOW := \033[33m
@@ -91,3 +91,17 @@ teardown: ## Stop LiteLLM server and Balatro processes
9191
@echo "$(YELLOW)Stopping Balatro...$(RESET)"
9292
@./balatro.sh --kill 2>/dev/null || true
9393
@echo "$(GREEN)✓ Services stopped$(RESET)"
94+
95+
# Models exercised by `make balatrobench`, run in the order listed.
# Override from the command line or environment to benchmark a subset, e.g.
#   make balatrobench BALATROBENCH_MODELS="groq/openai/gpt-oss-20b"
BALATROBENCH_MODELS ?= \
    cerebras/gpt-oss-120b \
    cerebras/qwen-3-235b-a22b-thinking-2507 \
    cerebras/qwen-3-235b-a22b-instruct-2507 \
    groq/openai/gpt-oss-20b

# Number of runs requested per model (passed to `balatrollm --runs`).
BALATROBENCH_RUNS ?= 3

# Runs every model in BALATROBENCH_MODELS, then generates the benchmark analysis.
#
# Model runs are best-effort: a failing model does not abort the target, so the
# remaining models still run and the analysis step still executes. Unlike a bare
# `|| true`, each failure is reported together with its exit status so that a
# partial benchmark is visible in the output.
#
# NOTE(review): the runs are started with `--runs-dir ./balatrobench`, while the
# analysis reads `balatrobench/runs`. Presumably balatrollm creates a `runs/`
# subdirectory under the given directory; confirm against the balatrollm CLI.
balatrobench: ## Run benchmark for all models and generate analysis
	@echo "$(YELLOW)Starting benchmark runs for all models...$(RESET)"
	@for model in $(BALATROBENCH_MODELS); do \
		echo "$(YELLOW)Running $$model...$(RESET)"; \
		balatrollm --runs-dir ./balatrobench --runs $(BALATROBENCH_RUNS) --model "$$model" \
			|| echo "$(YELLOW)⚠ $$model failed (exit $$?); continuing with remaining models$(RESET)"; \
	done
	@echo "$(YELLOW)Generating benchmark analysis...$(RESET)"
	@balatrollm benchmark --runs-dir balatrobench/runs --output-dir balatrobench/benchmarks
	@echo "$(GREEN)✓ Benchmark completed$(RESET)"

0 commit comments

Comments
 (0)