Benchmark Run Details

System Prompt

You are a spell checking assistant. For each sentence, identify:
1. The incorrectly spelled word exactly as it appears
2. The correct spelling of that word

Run Summary

Model qwen3:4b:Q4_K_M
Benchmark 0015_spell_check
Normed Score 92
Run Timestamp 2025-04-29 04:36:24

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0015_spell_check:attention:0 100 2277 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:1 100 2551 { "response": { "incorrect": "attantion", "correct": "attention" }, "expected": { "incorrect": "attantion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:2 100 2117 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:3 100 2654 { "response": { "incorrect": "attnetion", "correct": "attention" }, "expected": { "incorrect": "attnetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:4 100 2688 { "response": { "incorrect": "attntion", "correct": "attention" }, "expected": { "incorrect": "attntion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:5 100 2326 { "response": { "incorrect": "attenion", "correct": "attention" }, "expected": { "incorrect": "attenion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:6 100 2438 { "response": { "incorrect": "attenion", "correct": "attention" }, "expected": { "incorrect": "attenion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:7 100 2506 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:8 100 2897 { "response": { "incorrect": "atttention", "correct": "attention" }, "expected": { "incorrect": "atttention", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:9 100 2547 { "response": { "incorrect": "attenttion", "correct": "attention" }, "expected": { "incorrect": "attenttion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:0 100 2389 { "response": { "incorrect": "demonstraite", "correct": "demonstrate" }, "expected": { "incorrect": "demonstraite", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:1 100 2637 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:2 100 2823 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:3 100 2757 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:4 100 2769 { "response": { "incorrect": "demanstrate", "correct": "demonstrate" }, "expected": { "incorrect": "demanstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:5 100 2574 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:6 100 2413 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:7 100 2521 { "response": { "incorrect": "demonstarte", "correct": "demonstrate" }, "expected": { "incorrect": "demonstarte", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:8 100 2489 { "response": { "incorrect": "deomstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:9 100 2630 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:laboratory:0 100 2456 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:1 100 2783 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:2 100 2460 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:3 100 2396 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:4 100 2457 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:5 100 2438 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:6 100 2555 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:7 100 2724 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:8 100 2561 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:9 100 2324 { "response": { "incorrect": "laberatory", "correct": "laboratory" }, "expected": { "incorrect": "laberatory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laughter:0 100 2031 { "response": { "incorrect": "laughterr", "correct": "laughter" }, "expected": { "incorrect": "laughterr", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:1 100 2065 { "response": { "incorrect": "laghter", "correct": "laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:2 100 1895 { "response": { "incorrect": "laghter", "correct": "laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:3 100 2411 { "response": { "incorrect": "laghter", "correct": "laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:4 100 2144 { "response": { "incorrect": "lafter", "correct": "laughter" }, "expected": { "incorrect": "lafter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:5 100 2096 { "response": { "incorrect": "laghter", "correct": "laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:6 100 2618 { "response": { "incorrect": "laugther", "correct": "laughter" }, "expected": { "incorrect": "laugther", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:7 100 2423 { "response": { "incorrect": "laughtter", "correct": "laughter" }, "expected": { "incorrect": "laughtter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:8 100 2219 { "response": { "incorrect": "laughtur", "correct": "laughter" }, "expected": { "incorrect": "laughtur", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:9 0 2194 { "response": { "incorrect": "laugther", "correct": "laugh" }, "expected": { "incorrect": "laugther", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:liaison:0 100 2347 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:1 100 2003 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:2 100 2109 { "response": { "incorrect": "liasion", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:3 100 2441 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:4 100 2423 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:5 100 2432 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:6 100 2467 { "response": { "incorrect": "liasion", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:7 0 1931 { "response": { "incorrect": "leason", "correct": "mediator" }, "expected": { "incorrect": "leason", "correct": "liaison" }, "is_correct": false }
[+]
0015_spell_check:liaison:8 100 2685 { "response": { "incorrect": "liasion", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:9 100 2490 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:orange:0 0 1932 { "response": { "incorrect": "orange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": false }
[+]
0015_spell_check:orange:1 0 1807 { "response": { "incorrect": "orange", "correct": "orange" }, "expected": { "incorrect": "oranje", "correct": "orange" }, "is_correct": false }
[+]
0015_spell_check:orange:2 100 2146 { "response": { "incorrect": "orang", "correct": "orange" }, "expected": { "incorrect": "orang", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:3 100 2071 { "response": { "incorrect": "oranage", "correct": "orange" }, "expected": { "incorrect": "oranage", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:4 100 2555 { "response": { "incorrect": "oranage", "correct": "orange" }, "expected": { "incorrect": "oranage", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:5 100 2499 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:6 100 2215 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:7 100 2369 { "response": { "incorrect": "oringe", "correct": "orange" }, "expected": { "incorrect": "oringe", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:8 100 2638 { "response": { "incorrect": "orennge", "correct": "orange" }, "expected": { "incorrect": "orennge", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:9 0 2418 { "response": { "incorrect": "orange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": false }
[+]
0015_spell_check:partition:0 100 2198 { "response": { "incorrect": "partioned", "correct": "partitioned" }, "expected": { "incorrect": "partioned", "correct": "partitioned" }, "is_correct": true }
[+]
0015_spell_check:partition:1 100 2110 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:2 100 2486 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:3 100 2748 { "response": { "incorrect": "partionned", "correct": "partitioned" }, "expected": { "incorrect": "partionned", "correct": "partitioned" }, "is_correct": true }
[+]
0015_spell_check:partition:4 100 2614 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:5 100 2297 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:6 100 2049 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:7 100 2490 { "response": { "incorrect": "particion", "correct": "partition" }, "expected": { "incorrect": "particion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:8 100 2384 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:9 100 2178 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:party:0 100 2702 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:1 100 2697 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:2 0 2122 { "response": { "incorrect": "parry", "correct": "party" }, "expected": { "incorrect": "pary", "correct": "party" }, "is_correct": false }
[+]
0015_spell_check:party:3 100 1945 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:4 100 2439 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:5 100 2588 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:6 100 2737 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:7 0 2830 { "response": { "incorrect": "partee", "correct": "partie" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": false }
[+]
0015_spell_check:party:8 100 1787 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:9 0 2616 { "response": { "incorrect": "parry", "correct": "party" }, "expected": { "incorrect": "pary", "correct": "party" }, "is_correct": false }
[+]
0015_spell_check:stable:0 100 2779 { "response": { "incorrect": "staable", "correct": "stable" }, "expected": { "incorrect": "staable", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:1 100 2466 { "response": { "incorrect": "stabe", "correct": "stable" }, "expected": { "incorrect": "stabe", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:2 100 2398 { "response": { "incorrect": "stabal", "correct": "stable" }, "expected": { "incorrect": "stabal", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:3 100 2257 { "response": { "incorrect": "staible", "correct": "stable" }, "expected": { "incorrect": "staible", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:4 100 2126 { "response": { "incorrect": "stabel", "correct": "stable" }, "expected": { "incorrect": "stabel", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:5 100 1971 { "response": { "incorrect": "staible", "correct": "stable" }, "expected": { "incorrect": "staible", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:6 100 2013 { "response": { "incorrect": "stabl", "correct": "stable" }, "expected": { "incorrect": "stabl", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:7 100 2003 { "response": { "incorrect": "stabe", "correct": "stable" }, "expected": { "incorrect": "stabe", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:8 100 2017 { "response": { "incorrect": "stabble", "correct": "stable" }, "expected": { "incorrect": "stabble", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:9 100 2413 { "response": { "incorrect": "stayble", "correct": "stable" }, "expected": { "incorrect": "stayble", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:table:0 100 2660 { "response": { "incorrect": "tabele", "correct": "table" }, "expected": { "incorrect": "tabele", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:1 100 2046 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:2 100 2859 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:3 100 2655 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:4 100 2768 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:5 100 2457 { "response": { "incorrect": "tabl", "correct": "table" }, "expected": { "incorrect": "tabl", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:6 100 3242 { "response": { "incorrect": "tabl", "correct": "table" }, "expected": { "incorrect": "tabl", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:7 100 2054 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:8 100 2051 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:9 100 2169 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]