mirror of
https://github.com/voson-wang/toon.git
synced 2026-01-29 23:34:10 +08:00
1416 lines
35 KiB
JSON
1416 lines
35 KiB
JSON
[
|
|
{
|
|
"id": "q1",
|
|
"prompt": "What is the salary of Constance Mante?",
|
|
"groundTruth": "56176",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q2",
|
|
"prompt": "What department does Alfonso Leffler work in?",
|
|
"groundTruth": "Marketing",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q3",
|
|
"prompt": "What is the email address of Mr. Corey Pfeffer?",
|
|
"groundTruth": "lorenza.kunze@yahoo.com",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q4",
|
|
"prompt": "How many years of experience does Mr. Brendan Harvey have?",
|
|
"groundTruth": "22",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q5",
|
|
"prompt": "Is Tracy Gleason an active employee?",
|
|
"groundTruth": "no",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q6",
|
|
"prompt": "What is the salary of Terri Wilkinson?",
|
|
"groundTruth": "133081",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q7",
|
|
"prompt": "What department does Aubrey Koss work in?",
|
|
"groundTruth": "Engineering",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q8",
|
|
"prompt": "What is the email address of Darren Homenick?",
|
|
"groundTruth": "delpha.russel@gmail.com",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q9",
|
|
"prompt": "How many years of experience does Dr. Ken Heller have?",
|
|
"groundTruth": "5",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q10",
|
|
"prompt": "Is Mr. Wade Collier an active employee?",
|
|
"groundTruth": "yes",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q11",
|
|
"prompt": "What is the salary of Hannah Waelchi?",
|
|
"groundTruth": "109064",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q12",
|
|
"prompt": "What department does Emily Harvey work in?",
|
|
"groundTruth": "Operations",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q13",
|
|
"prompt": "What is the email address of Chester Crist?",
|
|
"groundTruth": "henderson70@yahoo.com",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q14",
|
|
"prompt": "How many years of experience does Barbara Emard have?",
|
|
"groundTruth": "23",
|
|
"type": "field-retrieval",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q15",
|
|
"prompt": "How many employees work in Engineering?",
|
|
"groundTruth": "17",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q16",
|
|
"prompt": "How many employees work in Sales?",
|
|
"groundTruth": "17",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q17",
|
|
"prompt": "How many employees work in Marketing?",
|
|
"groundTruth": "17",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q18",
|
|
"prompt": "How many employees work in HR?",
|
|
"groundTruth": "17",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q19",
|
|
"prompt": "How many employees have a salary greater than 60000?",
|
|
"groundTruth": "91",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q20",
|
|
"prompt": "How many employees have a salary greater than 80000?",
|
|
"groundTruth": "67",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q21",
|
|
"prompt": "How many employees have a salary greater than 100000?",
|
|
"groundTruth": "41",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q22",
|
|
"prompt": "How many employees have a salary greater than 120000?",
|
|
"groundTruth": "26",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q23",
|
|
"prompt": "How many employees are in the dataset?",
|
|
"groundTruth": "100",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q24",
|
|
"prompt": "What is the average salary across all employees?",
|
|
"groundTruth": "96503",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q25",
|
|
"prompt": "How many employees are active?",
|
|
"groundTruth": "78",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q26",
|
|
"prompt": "How many employees are inactive?",
|
|
"groundTruth": "22",
|
|
"type": "aggregation",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q27",
|
|
"prompt": "How many employees in Engineering have a salary greater than 80000?",
|
|
"groundTruth": "12",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q28",
|
|
"prompt": "How many employees in Sales have a salary greater than 80000?",
|
|
"groundTruth": "11",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q29",
|
|
"prompt": "How many employees in Marketing have a salary greater than 80000?",
|
|
"groundTruth": "11",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q30",
|
|
"prompt": "How many employees in HR have a salary greater than 80000?",
|
|
"groundTruth": "12",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q31",
|
|
"prompt": "How many employees in Operations have a salary greater than 80000?",
|
|
"groundTruth": "11",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q32",
|
|
"prompt": "How many active employees have more than 5 years of experience?",
|
|
"groundTruth": "63",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q33",
|
|
"prompt": "How many active employees have more than 10 years of experience?",
|
|
"groundTruth": "53",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q34",
|
|
"prompt": "How many active employees have more than 15 years of experience?",
|
|
"groundTruth": "39",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q35",
|
|
"prompt": "How many employees in Engineering have more than 10 years of experience?",
|
|
"groundTruth": "11",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q36",
|
|
"prompt": "How many employees in Sales have more than 10 years of experience?",
|
|
"groundTruth": "8",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q37",
|
|
"prompt": "How many employees in Marketing have more than 10 years of experience?",
|
|
"groundTruth": "15",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q38",
|
|
"prompt": "How many active employees work in Engineering?",
|
|
"groundTruth": "12",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q39",
|
|
"prompt": "How many active employees work in Sales?",
|
|
"groundTruth": "11",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q40",
|
|
"prompt": "How many active employees work in Marketing?",
|
|
"groundTruth": "14",
|
|
"type": "filtering",
|
|
"dataset": "tabular"
|
|
},
|
|
{
|
|
"id": "q41",
|
|
"prompt": "What is the total for order ORD-0001?",
|
|
"groundTruth": "103.86",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q42",
|
|
"prompt": "What is the status of order ORD-0003?",
|
|
"groundTruth": "shipped",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q43",
|
|
"prompt": "What is the total for order ORD-0005?",
|
|
"groundTruth": "422.5",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q44",
|
|
"prompt": "What is the status of order ORD-0007?",
|
|
"groundTruth": "processing",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q45",
|
|
"prompt": "What is the total for order ORD-0009?",
|
|
"groundTruth": "1822.85",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q46",
|
|
"prompt": "What is the status of order ORD-0011?",
|
|
"groundTruth": "pending",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q47",
|
|
"prompt": "What is the total for order ORD-0013?",
|
|
"groundTruth": "1311.35",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q48",
|
|
"prompt": "What is the status of order ORD-0015?",
|
|
"groundTruth": "cancelled",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q49",
|
|
"prompt": "What is the customer name for order ORD-0002?",
|
|
"groundTruth": "Debbie O'Kon I",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q50",
|
|
"prompt": "What is the customer email for order ORD-0004?",
|
|
"groundTruth": "demetris.hoeger-pollich@yahoo.com",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q51",
|
|
"prompt": "What is the order date for order ORD-0006?",
|
|
"groundTruth": "2025-09-15",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q52",
|
|
"prompt": "How many items are in order ORD-0008?",
|
|
"groundTruth": "3",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q53",
|
|
"prompt": "What is the customer name for order ORD-0010?",
|
|
"groundTruth": "Patty Senger",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q54",
|
|
"prompt": "What is the customer email for order ORD-0012?",
|
|
"groundTruth": "viva.paucek@gmail.com",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q55",
|
|
"prompt": "What is the order date for order ORD-0014?",
|
|
"groundTruth": "2025-09-20",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q56",
|
|
"prompt": "How many items are in order ORD-0016?",
|
|
"groundTruth": "2",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q57",
|
|
"prompt": "What is the customer name for order ORD-0018?",
|
|
"groundTruth": "Dennis Wunsch",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q58",
|
|
"prompt": "What is the customer email for order ORD-0020?",
|
|
"groundTruth": "wilton.oconnell@yahoo.com",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q59",
|
|
"prompt": "How many orders have status \"pending\"?",
|
|
"groundTruth": "10",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q60",
|
|
"prompt": "How many orders have status \"processing\"?",
|
|
"groundTruth": "10",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q61",
|
|
"prompt": "How many orders have status \"shipped\"?",
|
|
"groundTruth": "10",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q62",
|
|
"prompt": "How many orders have status \"delivered\"?",
|
|
"groundTruth": "10",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q63",
|
|
"prompt": "How many orders have status \"cancelled\"?",
|
|
"groundTruth": "10",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q64",
|
|
"prompt": "What is the total revenue across all orders?",
|
|
"groundTruth": "34904.81",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q65",
|
|
"prompt": "What is the average order value?",
|
|
"groundTruth": "698.10",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q66",
|
|
"prompt": "How many orders are in the dataset?",
|
|
"groundTruth": "50",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q67",
|
|
"prompt": "What is the highest order total?",
|
|
"groundTruth": "2152.82",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q68",
|
|
"prompt": "How many orders have a total greater than 200?",
|
|
"groundTruth": "43",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q69",
|
|
"prompt": "How many orders have a total greater than 400?",
|
|
"groundTruth": "37",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q70",
|
|
"prompt": "How many orders have a total greater than 600?",
|
|
"groundTruth": "28",
|
|
"type": "aggregation",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q71",
|
|
"prompt": "How many orders have status \"pending\" and total greater than 300?",
|
|
"groundTruth": "8",
|
|
"type": "filtering",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q72",
|
|
"prompt": "How many orders have status \"processing\" and total greater than 300?",
|
|
"groundTruth": "6",
|
|
"type": "filtering",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q73",
|
|
"prompt": "How many orders have status \"shipped\" and total greater than 300?",
|
|
"groundTruth": "10",
|
|
"type": "filtering",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q74",
|
|
"prompt": "How many orders have status \"delivered\" and total greater than 300?",
|
|
"groundTruth": "9",
|
|
"type": "filtering",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q75",
|
|
"prompt": "How many orders have status \"cancelled\" and total greater than 300?",
|
|
"groundTruth": "8",
|
|
"type": "filtering",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q76",
|
|
"prompt": "How many orders have status \"pending\" and at least 3 items?",
|
|
"groundTruth": "3",
|
|
"type": "filtering",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q77",
|
|
"prompt": "How many orders have status \"processing\" and at least 3 items?",
|
|
"groundTruth": "3",
|
|
"type": "filtering",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q78",
|
|
"prompt": "How many orders have status \"shipped\" and at least 3 items?",
|
|
"groundTruth": "5",
|
|
"type": "filtering",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q79",
|
|
"prompt": "How many orders have a total greater than 300 and at least 3 items?",
|
|
"groundTruth": "20",
|
|
"type": "filtering",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q80",
|
|
"prompt": "How many orders have a total greater than 500 and at least 3 items?",
|
|
"groundTruth": "19",
|
|
"type": "filtering",
|
|
"dataset": "nested"
|
|
},
|
|
{
|
|
"id": "q81",
|
|
"prompt": "What are the views for 2025-01-01?",
|
|
"groundTruth": "4322",
|
|
"type": "field-retrieval",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q82",
|
|
"prompt": "What is the revenue for 2025-01-04?",
|
|
"groundTruth": "10432.04",
|
|
"type": "field-retrieval",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q83",
|
|
"prompt": "What is the bounce rate for 2025-01-07?",
|
|
"groundTruth": "0.53",
|
|
"type": "field-retrieval",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q84",
|
|
"prompt": "How many conversions were there on 2025-01-10?",
|
|
"groundTruth": "32",
|
|
"type": "field-retrieval",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q85",
|
|
"prompt": "What are the views for 2025-01-13?",
|
|
"groundTruth": "4096",
|
|
"type": "field-retrieval",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q86",
|
|
"prompt": "What is the revenue for 2025-01-16?",
|
|
"groundTruth": "4533.1",
|
|
"type": "field-retrieval",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q87",
|
|
"prompt": "What is the bounce rate for 2025-01-19?",
|
|
"groundTruth": "0.63",
|
|
"type": "field-retrieval",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q88",
|
|
"prompt": "How many conversions were there on 2025-01-22?",
|
|
"groundTruth": "25",
|
|
"type": "field-retrieval",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q89",
|
|
"prompt": "What are the views for 2025-01-25?",
|
|
"groundTruth": "4076",
|
|
"type": "field-retrieval",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q90",
|
|
"prompt": "How many days of data are in the dataset?",
|
|
"groundTruth": "60",
|
|
"type": "aggregation",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q91",
|
|
"prompt": "What is the total number of views across all dates?",
|
|
"groundTruth": "328320",
|
|
"type": "aggregation",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q92",
|
|
"prompt": "What is the total number of conversions across all dates?",
|
|
"groundTruth": "1791",
|
|
"type": "aggregation",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q93",
|
|
"prompt": "What is the total revenue across all dates?",
|
|
"groundTruth": "311695.88",
|
|
"type": "aggregation",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q94",
|
|
"prompt": "What is the average bounce rate?",
|
|
"groundTruth": "0.53",
|
|
"type": "aggregation",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q95",
|
|
"prompt": "How many days had more than 5000 views?",
|
|
"groundTruth": "33",
|
|
"type": "aggregation",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q96",
|
|
"prompt": "How many days had more than 7000 views?",
|
|
"groundTruth": "14",
|
|
"type": "aggregation",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q97",
|
|
"prompt": "How many days had more than 10 conversions?",
|
|
"groundTruth": "57",
|
|
"type": "aggregation",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q98",
|
|
"prompt": "How many days had more than 30 conversions?",
|
|
"groundTruth": "26",
|
|
"type": "aggregation",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q99",
|
|
"prompt": "How many days had more than 6000 views and more than 15 conversions?",
|
|
"groundTruth": "20",
|
|
"type": "filtering",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q100",
|
|
"prompt": "How many days had more than 7000 views and more than 15 conversions?",
|
|
"groundTruth": "14",
|
|
"type": "filtering",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q101",
|
|
"prompt": "How many days had revenue greater than 500 with views above 6000?",
|
|
"groundTruth": "22",
|
|
"type": "filtering",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q102",
|
|
"prompt": "How many days had revenue greater than 1000 with views above 6000?",
|
|
"groundTruth": "22",
|
|
"type": "filtering",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q103",
|
|
"prompt": "How many days had revenue greater than 1500 with views above 6000?",
|
|
"groundTruth": "22",
|
|
"type": "filtering",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q104",
|
|
"prompt": "How many days had revenue greater than 2000 with views above 6000?",
|
|
"groundTruth": "20",
|
|
"type": "filtering",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q105",
|
|
"prompt": "How many days had revenue greater than 2500 with views above 6000?",
|
|
"groundTruth": "18",
|
|
"type": "filtering",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q106",
|
|
"prompt": "How many days had more than 250 clicks and more than 15 conversions?",
|
|
"groundTruth": "32",
|
|
"type": "filtering",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q107",
|
|
"prompt": "How many days had more than 400 clicks and more than 15 conversions?",
|
|
"groundTruth": "9",
|
|
"type": "filtering",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q108",
|
|
"prompt": "How many days had revenue greater than 1000 with bounce rate below 0.5?",
|
|
"groundTruth": "22",
|
|
"type": "filtering",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q109",
|
|
"prompt": "How many days had revenue greater than 1500 with bounce rate below 0.5?",
|
|
"groundTruth": "22",
|
|
"type": "filtering",
|
|
"dataset": "analytics"
|
|
},
|
|
{
|
|
"id": "q110",
|
|
"prompt": "How many stars does undefined/freeCodeCamp have?",
|
|
"groundTruth": "430886",
|
|
"type": "field-retrieval",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q111",
|
|
"prompt": "How many forks does undefined/system-design-primer have?",
|
|
"groundTruth": "52904",
|
|
"type": "field-retrieval",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q112",
|
|
"prompt": "How many watchers does undefined/vue have?",
|
|
"groundTruth": "5786",
|
|
"type": "field-retrieval",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q113",
|
|
"prompt": "What is the main branch of undefined/CS-Notes?",
|
|
"groundTruth": "master",
|
|
"type": "field-retrieval",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q114",
|
|
"prompt": "How many stars does undefined/gitignore have?",
|
|
"groundTruth": "170327",
|
|
"type": "field-retrieval",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q115",
|
|
"prompt": "How many forks does undefined/n8n have?",
|
|
"groundTruth": "48578",
|
|
"type": "field-retrieval",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q116",
|
|
"prompt": "How many watchers does undefined/yt-dlp have?",
|
|
"groundTruth": "678",
|
|
"type": "field-retrieval",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q117",
|
|
"prompt": "What is the main branch of undefined/PowerToys?",
|
|
"groundTruth": "main",
|
|
"type": "field-retrieval",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q118",
|
|
"prompt": "How many stars does undefined/free-programming-books-zh_CN have?",
|
|
"groundTruth": "115543",
|
|
"type": "field-retrieval",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q119",
|
|
"prompt": "How many forks does undefined/three.js have?",
|
|
"groundTruth": "36054",
|
|
"type": "field-retrieval",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q120",
|
|
"prompt": "How many watchers does undefined/GitHub-Chinese-Top-Charts have?",
|
|
"groundTruth": "2607",
|
|
"type": "field-retrieval",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q121",
|
|
"prompt": "How many repositories are in the dataset?",
|
|
"groundTruth": "100",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q122",
|
|
"prompt": "What is the total number of stars across all repositories?",
|
|
"groundTruth": "15413563",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q123",
|
|
"prompt": "What is the total number of forks across all repositories?",
|
|
"groundTruth": "2528243",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q124",
|
|
"prompt": "What is the average number of stars per repository?",
|
|
"groundTruth": "154136",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q125",
|
|
"prompt": "How many repositories use \"main\" as their default branch?",
|
|
"groundTruth": "41",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q126",
|
|
"prompt": "How many repositories use \"master\" as their default branch?",
|
|
"groundTruth": "53",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q127",
|
|
"prompt": "How many repositories have more than 100000 stars?",
|
|
"groundTruth": "77",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q128",
|
|
"prompt": "How many repositories have more than 150000 stars?",
|
|
"groundTruth": "37",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q129",
|
|
"prompt": "How many repositories have more than 200000 stars?",
|
|
"groundTruth": "16",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q130",
|
|
"prompt": "How many repositories have more than 20000 forks?",
|
|
"groundTruth": "49",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q131",
|
|
"prompt": "How many repositories have more than 35000 forks?",
|
|
"groundTruth": "23",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q132",
|
|
"prompt": "How many repositories have more than 50000 forks?",
|
|
"groundTruth": "11",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q133",
|
|
"prompt": "How many repositories have more than 5000 watchers?",
|
|
"groundTruth": "19",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q134",
|
|
"prompt": "How many repositories have more than 8000 watchers?",
|
|
"groundTruth": "4",
|
|
"type": "aggregation",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q135",
|
|
"prompt": "How many repositories have more than 75000 stars and more than 15000 forks?",
|
|
"groundTruth": "57",
|
|
"type": "filtering",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q136",
|
|
"prompt": "How many repositories have more than 100000 stars and more than 20000 forks?",
|
|
"groundTruth": "43",
|
|
"type": "filtering",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q137",
|
|
"prompt": "How many repositories have more than 150000 stars and more than 30000 forks?",
|
|
"groundTruth": "25",
|
|
"type": "filtering",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q138",
|
|
"prompt": "How many repositories have more than 200000 stars and more than 45000 forks?",
|
|
"groundTruth": "6",
|
|
"type": "filtering",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q139",
|
|
"prompt": "How many repositories have more than 100000 stars and more than 7000 watchers?",
|
|
"groundTruth": "6",
|
|
"type": "filtering",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q140",
|
|
"prompt": "How many repositories have more than 150000 stars and more than 9000 watchers?",
|
|
"groundTruth": "1",
|
|
"type": "filtering",
|
|
"dataset": "github"
|
|
},
|
|
{
|
|
"id": "q141",
|
|
"prompt": "What is the level of the log at 2025-11-02T16:55:04.316Z?",
|
|
"groundTruth": "error",
|
|
"type": "field-retrieval",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q142",
|
|
"prompt": "What is the endpoint for the log at 2025-10-31T02:31:28.977Z?",
|
|
"groundTruth": "/api/users",
|
|
"type": "field-retrieval",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q143",
|
|
"prompt": "What is the status code for the log at 2025-11-01T23:56:56.929Z?",
|
|
"groundTruth": "424",
|
|
"type": "field-retrieval",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q144",
|
|
"prompt": "What is the response time for the log at 2025-11-03T12:14:31.017Z?",
|
|
"groundTruth": "2849",
|
|
"type": "field-retrieval",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q145",
|
|
"prompt": "What is the level of the log at 2025-11-01T22:06:30.814Z?",
|
|
"groundTruth": "info",
|
|
"type": "field-retrieval",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q146",
|
|
"prompt": "What is the endpoint for the log at 2025-11-06T05:48:07.260Z?",
|
|
"groundTruth": "/api/orders",
|
|
"type": "field-retrieval",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q147",
|
|
"prompt": "What is the status code for the log at 2025-11-05T23:46:00.144Z?",
|
|
"groundTruth": "435",
|
|
"type": "field-retrieval",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q148",
|
|
"prompt": "What is the response time for the log at 2025-10-31T23:56:23.022Z?",
|
|
"groundTruth": "408",
|
|
"type": "field-retrieval",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q149",
|
|
"prompt": "What is the level of the log at 2025-11-06T01:23:44.734Z?",
|
|
"groundTruth": "error",
|
|
"type": "field-retrieval",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q150",
|
|
"prompt": "What is the endpoint for the log at 2025-11-03T21:54:27.889Z?",
|
|
"groundTruth": "/api/users",
|
|
"type": "field-retrieval",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q151",
|
|
"prompt": "How many log entries are in the dataset?",
|
|
"groundTruth": "75",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q152",
|
|
"prompt": "What is the average response time across all logs?",
|
|
"groundTruth": "2453.41",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q153",
|
|
"prompt": "How many log entries have level \"error\"?",
|
|
"groundTruth": "29",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q154",
|
|
"prompt": "How many log entries have level \"warn\"?",
|
|
"groundTruth": "17",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q155",
|
|
"prompt": "How many log entries have level \"info\"?",
|
|
"groundTruth": "29",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q156",
|
|
"prompt": "How many log entries are for endpoint \"/api/products\"?",
|
|
"groundTruth": "11",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q157",
|
|
"prompt": "How many log entries are for endpoint \"/api/users\"?",
|
|
"groundTruth": "18",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q158",
|
|
"prompt": "How many log entries are for endpoint \"/api/auth\"?",
|
|
"groundTruth": "21",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q159",
|
|
"prompt": "How many log entries are for endpoint \"/api/orders\"?",
|
|
"groundTruth": "11",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q160",
|
|
"prompt": "How many log entries have a status code indicating an error (>= 400)?",
|
|
"groundTruth": "33",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q161",
|
|
"prompt": "How many log entries have a successful status code (200-299)?",
|
|
"groundTruth": "42",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q162",
|
|
"prompt": "How many log entries have a retryable error?",
|
|
"groundTruth": "25",
|
|
"type": "aggregation",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q163",
|
|
"prompt": "How many log entries have level \"error\" and status code >= 400?",
|
|
"groundTruth": "29",
|
|
"type": "filtering",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q164",
|
|
"prompt": "How many log entries have level \"warn\" and status code >= 400?",
|
|
"groundTruth": "4",
|
|
"type": "filtering",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q165",
|
|
"prompt": "How many log entries have level \"info\" and status code >= 400?",
|
|
"groundTruth": "0",
|
|
"type": "filtering",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q166",
|
|
"prompt": "How many log entries are for endpoint \"/api/products\" with status code >= 500?",
|
|
"groundTruth": "5",
|
|
"type": "filtering",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q167",
|
|
"prompt": "How many log entries are for endpoint \"/api/users\" with status code >= 500?",
|
|
"groundTruth": "2",
|
|
"type": "filtering",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q168",
|
|
"prompt": "How many log entries are for endpoint \"/api/auth\" with status code >= 500?",
|
|
"groundTruth": "3",
|
|
"type": "filtering",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q169",
|
|
"prompt": "How many log entries for endpoint \"/api/products\" have a retryable error?",
|
|
"groundTruth": "4",
|
|
"type": "filtering",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q170",
|
|
"prompt": "How many log entries for endpoint \"/api/users\" have a retryable error?",
|
|
"groundTruth": "5",
|
|
"type": "filtering",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q171",
|
|
"prompt": "How many log entries for endpoint \"/api/auth\" have a retryable error?",
|
|
"groundTruth": "7",
|
|
"type": "filtering",
|
|
"dataset": "event-logs"
|
|
},
|
|
{
|
|
"id": "q172",
|
|
"prompt": "What is the environment in the configuration?",
|
|
"groundTruth": "development",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q173",
|
|
"prompt": "What is the database host?",
|
|
"groundTruth": "guilty-cake.org",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q174",
|
|
"prompt": "What is the database port?",
|
|
"groundTruth": "5432",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q175",
|
|
"prompt": "What is the maximum connection pool size?",
|
|
"groundTruth": "37",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q176",
|
|
"prompt": "What is the session duration?",
|
|
"groundTruth": "86400",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q177",
|
|
"prompt": "What is the minimum connection pool size?",
|
|
"groundTruth": "2",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q178",
|
|
"prompt": "What is the connection pool idle timeout?",
|
|
"groundTruth": "30000",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q179",
|
|
"prompt": "What is the database name?",
|
|
"groundTruth": "real",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q180",
|
|
"prompt": "What is the session refresh threshold?",
|
|
"groundTruth": "3600",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q181",
|
|
"prompt": "What is the version in the configuration?",
|
|
"groundTruth": "6.8.3",
|
|
"type": "field-retrieval",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q182",
|
|
"prompt": "How many roles are defined in permissions?",
|
|
"groundTruth": "3",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q183",
|
|
"prompt": "How many groups are defined in permissions?",
|
|
"groundTruth": "2",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q184",
|
|
"prompt": "How many authentication providers are configured?",
|
|
"groundTruth": "2",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q185",
|
|
"prompt": "How many feature flags are defined?",
|
|
"groundTruth": "2",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q186",
|
|
"prompt": "How many database replicas are configured?",
|
|
"groundTruth": "3",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q187",
|
|
"prompt": "How many authentication providers include the \"admin\" scope?",
|
|
"groundTruth": "1",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q188",
|
|
"prompt": "How many feature flags are enabled?",
|
|
"groundTruth": "0",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q189",
|
|
"prompt": "How many permissions does the admin role have?",
|
|
"groundTruth": "5",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q190",
|
|
"prompt": "What is the total number of permissions across all roles?",
|
|
"groundTruth": "8",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q191",
|
|
"prompt": "How many distinct permissions are defined across all roles?",
|
|
"groundTruth": "5",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q192",
|
|
"prompt": "How many distinct scopes are defined across all authentication providers?",
|
|
"groundTruth": "3",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q193",
|
|
"prompt": "What is the total number of variants across all feature flags?",
|
|
"groundTruth": "3",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q194",
|
|
"prompt": "How many database replicas have a priority greater than 2?",
|
|
"groundTruth": "1",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q195",
|
|
"prompt": "How many feature flags have a rollout percentage greater than 50?",
|
|
"groundTruth": "0",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q196",
|
|
"prompt": "How many groups have more than one role assigned?",
|
|
"groundTruth": "1",
|
|
"type": "aggregation",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q197",
|
|
"prompt": "How many feature flags are enabled with rollout greater than 50%?",
|
|
"groundTruth": "0",
|
|
"type": "filtering",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q198",
|
|
"prompt": "How many groups have the admin role?",
|
|
"groundTruth": "1",
|
|
"type": "filtering",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q199",
|
|
"prompt": "How many database replicas have priority greater than 2 and port 5432?",
|
|
"groundTruth": "1",
|
|
"type": "filtering",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q200",
|
|
"prompt": "How many authentication providers have more than 2 scopes?",
|
|
"groundTruth": "1",
|
|
"type": "filtering",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q201",
|
|
"prompt": "How many roles have at least 5 permissions?",
|
|
"groundTruth": "1",
|
|
"type": "filtering",
|
|
"dataset": "nested-config"
|
|
},
|
|
{
|
|
"id": "q202",
|
|
"prompt": "How many feature flags are disabled with rollout less than 25%?",
|
|
"groundTruth": "2",
|
|
"type": "filtering",
|
|
"dataset": "nested-config"
|
|
}
|
|
] |