Benchmark Run Details

System Prompt

You are a linguistics assistant. For each question, identify which word from the provided 
candidates is the antonym of the given word. Respond with only the antonym word.

Run Summary

Model gemini-2.5-flash-preview-04-17
Benchmark 0016_antonym
Normed Score 100
Run Timestamp 2025-04-24 19:20:08

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0016_antonym:adjectives:0 100 1431 { "model_answer": "sad", "correct_answer": "sad", "is_correct": true }
[+]
0016_antonym:adjectives:1 100 1247 { "model_answer": "dark", "correct_answer": "dark", "is_correct": true }
[+]
0016_antonym:adjectives:10 100 1736 { "model_answer": "flexible", "correct_answer": "flexible", "is_correct": true }
[+]
0016_antonym:adjectives:11 100 1537 { "model_answer": "frugal", "correct_answer": "frugal", "is_correct": true }
[+]
0016_antonym:adjectives:12 100 1841 { "model_answer": "extraordinary", "correct_answer": "extraordinary", "is_correct": true }
[+]
0016_antonym:adjectives:13 100 2151 { "model_answer": "eager", "correct_answer": "eager", "is_correct": true }
[+]
0016_antonym:adjectives:14 100 1736 { "model_answer": "timid", "correct_answer": "timid", "is_correct": true }
[+]
0016_antonym:adjectives:15 100 1144 { "model_answer": "benevolent", "correct_answer": "benevolent", "is_correct": true }
[+]
0016_antonym:adjectives:16 100 1355 { "model_answer": "fake", "correct_answer": "fake", "is_correct": true }
[+]
0016_antonym:adjectives:17 100 1710 { "model_answer": "scarce", "correct_answer": "scarce", "is_correct": true }
[+]
0016_antonym:adjectives:18 100 1161 { "model_answer": "irrational", "correct_answer": "irrational", "is_correct": true }
[+]
0016_antonym:adjectives:19 100 2248 { "model_answer": "varied", "correct_answer": "varied", "is_correct": true }
[+]
0016_antonym:adjectives:2 100 2026 { "model_answer": "stingy", "correct_answer": "stingy", "is_correct": true }
[+]
0016_antonym:adjectives:3 100 1224 { "model_answer": "modern", "correct_answer": "modern", "is_correct": true }
[+]
0016_antonym:adjectives:4 100 1899 { "model_answer": "opaque", "correct_answer": "opaque", "is_correct": true }
[+]
0016_antonym:adjectives:5 100 2397 { "model_answer": "concise", "correct_answer": "concise", "is_correct": true }
[+]
0016_antonym:adjectives:6 100 1646 { "model_answer": "stable", "correct_answer": "stable", "is_correct": true }
[+]
0016_antonym:adjectives:7 100 2246 { "model_answer": "careless", "correct_answer": "careless", "is_correct": true }
[+]
0016_antonym:adjectives:8 100 819 { "model_answer": "deep", "correct_answer": "deep", "is_correct": true }
[+]
0016_antonym:adjectives:9 100 1842 { "model_answer": "fine", "correct_answer": "fine", "is_correct": true }
[+]
0016_antonym:verbs:0 100 2240 { "model_answer": "destroy", "correct_answer": "destroy", "is_correct": true }
[+]
0016_antonym:verbs:1 100 1436 { "model_answer": "decrease", "correct_answer": "decrease", "is_correct": true }
[+]
0016_antonym:verbs:10 100 2108 { "model_answer": "permit", "correct_answer": "permit", "is_correct": true }
[+]
0016_antonym:verbs:11 100 1284 { "model_answer": "gather", "correct_answer": "gather", "is_correct": true }
[+]
0016_antonym:verbs:12 100 1475 { "model_answer": "augment", "correct_answer": "augment", "is_correct": true }
[+]
0016_antonym:verbs:13 100 1540 { "model_answer": "obscure", "correct_answer": "obscure", "is_correct": true }
[+]
0016_antonym:verbs:14 100 1327 { "model_answer": "alleviate", "correct_answer": "alleviate", "is_correct": true }
[+]
0016_antonym:verbs:15 100 1734 { "model_answer": "affirm", "correct_answer": "affirm", "is_correct": true }
[+]
0016_antonym:verbs:16 100 1610 { "model_answer": "encourage", "correct_answer": "encourage", "is_correct": true }
[+]
0016_antonym:verbs:17 100 2288 { "model_answer": "delay", "correct_answer": "delay", "is_correct": true }
[+]
0016_antonym:verbs:18 100 1579 { "model_answer": "confine", "correct_answer": "confine", "is_correct": true }
[+]
0016_antonym:verbs:19 100 1391 { "model_answer": "conclude", "correct_answer": "conclude", "is_correct": true }
[+]
0016_antonym:verbs:2 100 1635 { "model_answer": "depart", "correct_answer": "depart", "is_correct": true }
[+]
0016_antonym:verbs:3 100 1110 { "model_answer": "reject", "correct_answer": "reject", "is_correct": true }
[+]
0016_antonym:verbs:4 100 1100 { "model_answer": "demolish", "correct_answer": "demolish", "is_correct": true }
[+]
0016_antonym:verbs:5 100 1204 { "model_answer": "decelerate", "correct_answer": "decelerate", "is_correct": true }
[+]
0016_antonym:verbs:6 100 1327 { "model_answer": "weaken", "correct_answer": "weaken", "is_correct": true }
[+]
0016_antonym:verbs:7 100 1595 { "model_answer": "criticize", "correct_answer": "criticize", "is_correct": true }
[+]
0016_antonym:verbs:8 100 1146 { "model_answer": "descend", "correct_answer": "descend", "is_correct": true }
[+]
0016_antonym:verbs:9 100 1269 { "model_answer": "reveal", "correct_answer": "reveal", "is_correct": true }
[+]