Benchmark Run Details

Run Summary

Model gemma3:1b:Q4_K_M
Benchmark 0011_word_length
Normed Score 7
Run Timestamp 2025-04-01 18:58:45

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0011_word_length:0 100 694 { "prompt": "How many letters are in the word 'reaction'?", "response": { "length": 8 }, "expected": 8, "is_correct": true }
[+]
0011_word_length:1 0 236 { "prompt": "How many letters are in the word 'game'?", "response": { "length": 5 }, "expected": 4, "is_correct": false }
[+]
0011_word_length:10 0 253 { "prompt": "How many letters are in the word 'understanding'?", "response": { "length": 12 }, "expected": 13, "is_correct": false }
[+]
0011_word_length:11 0 255 { "prompt": "How many letters are in the word 'music'?", "response": { "length": 8 }, "expected": 5, "is_correct": false }
[+]
0011_word_length:12 0 234 { "prompt": "How many letters are in the word 'journey'?", "response": { "length": 8 }, "expected": 7, "is_correct": false }
[+]
0011_word_length:13 0 237 { "prompt": "How many letters are in the word 'significant'?", "response": { "length": 9 }, "expected": 11, "is_correct": false }
[+]
0011_word_length:14 0 234 { "prompt": "How many letters are in the word 'game'?", "response": { "length": 5 }, "expected": 4, "is_correct": false }
[+]
0011_word_length:15 0 232 { "prompt": "How many letters are in the word 'challenge'?", "response": { "length": 7 }, "expected": 9, "is_correct": false }
[+]
0011_word_length:16 0 262 { "prompt": "How many letters are in the word 'excitement'?", "response": { "length": 16 }, "expected": 10, "is_correct": false }
[+]
0011_word_length:17 0 257 { "prompt": "How many letters are in the word 'generation'?", "response": { "length": 18 }, "expected": 10, "is_correct": false }
[+]
0011_word_length:18 0 234 { "prompt": "How many letters are in the word 'technology'?", "response": { "length": 9 }, "expected": 10, "is_correct": false }
[+]
0011_word_length:19 0 246 { "prompt": "How many letters are in the word 'difficult'?", "response": { "length": 19 }, "expected": 9, "is_correct": false }
[+]
0011_word_length:2 0 234 { "prompt": "How many letters are in the word 'cake'?", "response": { "length": 6 }, "expected": 4, "is_correct": false }
[+]
0011_word_length:20 0 257 { "prompt": "How many letters are in the word 'abundance'?", "response": { "length": 11 }, "expected": 9, "is_correct": false }
[+]
0011_word_length:21 0 268 { "prompt": "How many letters are in the word 'education'?", "response": { "length": 10 }, "expected": 9, "is_correct": false }
[+]
0011_word_length:22 0 256 { "prompt": "How many letters are in the word 'mountain'?", "response": { "length": 11 }, "expected": 8, "is_correct": false }
[+]
0011_word_length:23 0 247 { "prompt": "How many letters are in the word 'understanding'?", "response": { "length": 12 }, "expected": 13, "is_correct": false }
[+]
0011_word_length:24 100 243 { "prompt": "How many letters are in the word 'performance'?", "response": { "length": 11 }, "expected": 11, "is_correct": true }
[+]
0011_word_length:25 0 252 { "prompt": "How many letters are in the word 'yesterday'?", "response": { "length": 19 }, "expected": 9, "is_correct": false }
[+]
0011_word_length:26 0 233 { "prompt": "How many letters are in the word 'farm'?", "response": { "length": 8 }, "expected": 4, "is_correct": false }
[+]
0011_word_length:27 0 248 { "prompt": "How many letters are in the word 'conversation'?", "response": { "length": 21 }, "expected": 12, "is_correct": false }
[+]
0011_word_length:28 0 247 { "prompt": "How many letters are in the word 'universe'?", "response": { "length": 44 }, "expected": 8, "is_correct": false }
[+]
0011_word_length:29 0 233 { "prompt": "How many letters are in the word 'garden'?", "response": { "length": 7 }, "expected": 6, "is_correct": false }
[+]
0011_word_length:3 0 234 { "prompt": "How many letters are in the word 'delicious'?", "response": { "length": 8 }, "expected": 9, "is_correct": false }
[+]
0011_word_length:30 0 248 { "prompt": "How many letters are in the word 'notebook'?", "response": { "length": 11 }, "expected": 8, "is_correct": false }
[+]
0011_word_length:31 0 251 { "prompt": "How many letters are in the word 'generation'?", "response": { "length": 18 }, "expected": 10, "is_correct": false }
[+]
0011_word_length:32 0 228 { "prompt": "How many letters are in the word 'hat'?", "response": { "length": 5 }, "expected": 3, "is_correct": false }
[+]
0011_word_length:33 0 249 { "prompt": "How many letters are in the word 'ocean'?", "response": { "length": 10 }, "expected": 5, "is_correct": false }
[+]
0011_word_length:34 0 248 { "prompt": "How many letters are in the word 'important'?", "response": { "length": 16 }, "expected": 9, "is_correct": false }
[+]
0011_word_length:35 0 254 { "prompt": "How many letters are in the word 'profession'?", "response": { "length": 11 }, "expected": 10, "is_correct": false }
[+]
0011_word_length:36 0 233 { "prompt": "How many letters are in the word 'road'?", "response": { "length": 5 }, "expected": 4, "is_correct": false }
[+]
0011_word_length:37 0 253 { "prompt": "How many letters are in the word 'difficult'?", "response": { "length": 19 }, "expected": 9, "is_correct": false }
[+]
0011_word_length:38 0 228 { "prompt": "How many letters are in the word 'music'?", "response": { "length": 8 }, "expected": 5, "is_correct": false }
[+]
0011_word_length:39 0 232 { "prompt": "How many letters are in the word 'sun'?", "response": { "length": 5 }, "expected": 3, "is_correct": false }
[+]
0011_word_length:4 0 229 { "prompt": "How many letters are in the word 'hat'?", "response": { "length": 5 }, "expected": 3, "is_correct": false }
[+]
0011_word_length:5 0 237 { "prompt": "How many letters are in the word 'game'?", "response": { "length": 5 }, "expected": 4, "is_correct": false }
[+]
0011_word_length:6 0 234 { "prompt": "How many letters are in the word 'jelly'?", "response": { "length": 6 }, "expected": 5, "is_correct": false }
[+]
0011_word_length:7 0 252 { "prompt": "How many letters are in the word 'freedom'?", "response": { "length": 16 }, "expected": 7, "is_correct": false }
[+]
0011_word_length:8 0 232 { "prompt": "How many letters are in the word 'farm'?", "response": { "length": 8 }, "expected": 4, "is_correct": false }
[+]
0011_word_length:9 100 239 { "prompt": "How many letters are in the word 'computer'?", "response": { "length": 8 }, "expected": 8, "is_correct": true }
[+]