refactor: benchmarks code style

This commit is contained in:
Johann Schopplich
2025-10-28 08:02:57 +01:00
parent 833c99ea38
commit cdd4a20c67
3 changed files with 24 additions and 8 deletions

View File

@@ -28,8 +28,20 @@ export const models: Record<string, LanguageModelV2> = {
* Evaluate a single question with a specific format and model
*/
export async function evaluateQuestion(
{ question, formatName, formattedData, model, modelName}:
{ question: Question, formatName: string, formattedData: string, model: LanguageModelV2, modelName: string },
{
question,
formatName,
formattedData,
model,
modelName,
}:
{
question: Question
formatName: string
formattedData: string
model: LanguageModelV2
modelName: string
},
): Promise<EvaluationResult> {
const prompt = `
Given the following data in ${formatName} format:
@@ -79,7 +91,11 @@ async function validateAnswer(
expected,
question,
}:
{ actual: string, expected: string, question: string },
{
actual: string
expected: string
question: string
},
): Promise<boolean> {
const prompt = `
You are validating answers to questions about structured data.