test: update retrieval accuracy benchmarks

This commit is contained in:
Johann Schopplich
2025-10-27 13:45:48 +01:00
parent b2c58d2b97
commit 1a5e6199ac
10 changed files with 5686 additions and 5709 deletions

View File

@@ -19,8 +19,8 @@ export interface EvaluationResult {
expected: string
actual: string
correct: boolean
-inputTokens: number
-outputTokens: number
+inputTokens?: number
+outputTokens?: number
latencyMs: number
}
@@ -28,8 +28,7 @@ export interface FormatResult {
format: string
accuracy: number
totalTokens: number
-avgInputTokens: number
-avgLatency: number
+averageLatency: number
correctCount: number
totalCount: number
}