Skip to content

Commit a57e4af

Browse files
committed
test: configure raw diversity eval budgets
1 parent 86f30c6 commit a57e4af

File tree

3 files changed

+6
-1
lines changed

3 files changed

+6
-1
lines changed

benchmarks/baselines/eval-baseline-summary.json

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,8 @@
1919
"hitAt10": 1,
2020
"mrrAt10": 0.875,
2121
"ndcgAt10": 0.9127302324517832,
22+
"distinctTop3Ratio": 1,
23+
"rawDistinctTop3Ratio": 1,
2224
"latencyMs": {
2325
"p50": 26.173166000000037,
2426
"p95": 52.931082999999944,

benchmarks/budgets/default.json

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,9 +5,11 @@
55
"thresholds": {
66
"hitAt5MaxDrop": 0.03,
77
"mrrAt10MaxDrop": 0.03,
8+
"rawDistinctTop3RatioMaxDrop": 0.1,
89
"p95LatencyMaxMultiplier": 1.35,
910
"p95LatencyMaxAbsoluteMs": 4000,
1011
"minHitAt5": 0.4,
11-
"minMrrAt10": 0.25
12+
"minMrrAt10": 0.25,
13+
"minRawDistinctTop3Ratio": 0.5
1214
}
1315
}

benchmarks/budgets/github-models.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,7 @@
44
"thresholds": {
55
"minHitAt5": 0.5,
66
"minMrrAt10": 0.45,
7+
"minRawDistinctTop3Ratio": 0.5,
78
"p95LatencyMaxAbsoluteMs": 500
89
}
910
}

0 commit comments

Comments
 (0)