refactor: token efficiency benchmark code

2026-01-29 23:34:10 +08:00 · 2025-10-28 07:42:49 +01:00
parent 8836831de3
commit 8b9924ff05
3 changed files with 52 additions and 41 deletions
--- a/benchmarks/src/evaluate.ts
+++ b/benchmarks/src/evaluate.ts
@@ -81,7 +81,8 @@ async function validateAnswer(
  }:
  { actual: string, expected: string, question: string },
 ): Promise<boolean> {
-  const prompt = `You are validating answers to questions about structured data.
+  const prompt = `
+You are validating answers to questions about structured data.

 Question: ${question}
 Expected answer: ${expected}
@@ -93,7 +94,8 @@ Is the actual answer correct? Consider:
 - Minor formatting differences are acceptable
 - Case-insensitive comparison for text

-Respond with only "YES" or "NO".`
+Respond with only "YES" or "NO".
+`.trim()

  try {
    const { text } = await generateText({