mirror of
https://github.com/voson-wang/toon.git
synced 2026-01-29 23:34:10 +08:00
test: refactor accuracy benchmark generation
This commit is contained in:
@@ -18,7 +18,7 @@ export interface EvaluationResult {
   model: string
   expected: string
   actual: string
-  correct: boolean
+  isCorrect: boolean
   inputTokens?: number
   outputTokens?: number
   latencyMs: number
Reference in New Issue
Block a user