Benchmark Run Details

System Prompt

You are a spell checking assistant. For each sentence, identify:
1. The incorrectly spelled word exactly as it appears
2. The correct spelling of that word

Run Summary

Model granite3.3:8b:Q4_K_M
Benchmark 0015_spell_check
Normed Score 81
Run Timestamp 2025-04-28 00:14:36

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0015_spell_check:attention:0 100 3851 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:1 100 2932 { "response": { "incorrect": "attantion", "correct": "attention" }, "expected": { "incorrect": "attantion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:2 100 2648 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:3 100 2868 { "response": { "incorrect": "attnetion", "correct": "attention" }, "expected": { "incorrect": "attnetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:4 0 3420 { "response": { "incorrect": "her children's attntion", "correct": "her children's attention" }, "expected": { "incorrect": "attntion", "correct": "attention" }, "is_correct": false }
[+]
0015_spell_check:attention:5 100 2824 { "response": { "incorrect": "attenion", "correct": "attention" }, "expected": { "incorrect": "attenion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:6 0 2636 { "response": { "incorrect": "your", "correct": "you're" }, "expected": { "incorrect": "attenion", "correct": "attention" }, "is_correct": false }
[+]
0015_spell_check:attention:7 100 2752 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:8 100 2770 { "response": { "incorrect": "atttention", "correct": "attention" }, "expected": { "incorrect": "atttention", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:9 0 3138 { "response": { "incorrect": "her attenttion", "correct": "her attention" }, "expected": { "incorrect": "attenttion", "correct": "attention" }, "is_correct": false }
[+]
0015_spell_check:demonstrate:0 100 3973 { "response": { "incorrect": "demonstraite", "correct": "demonstrate" }, "expected": { "incorrect": "demonstraite", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:1 100 3895 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:2 100 4063 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:3 100 3724 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:4 100 3699 { "response": { "incorrect": "demanstrate", "correct": "demonstrate" }, "expected": { "incorrect": "demanstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:5 100 3471 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:6 100 3348 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:7 100 3320 { "response": { "incorrect": "demonstarte", "correct": "demonstrate" }, "expected": { "incorrect": "demonstarte", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:8 100 3249 { "response": { "incorrect": "deomstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:9 100 2868 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:laboratory:0 100 2793 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:1 100 2761 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:2 100 3150 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:3 100 3062 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:4 100 3108 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:5 100 2745 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:6 100 2825 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:7 100 3196 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:8 100 3864 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:9 100 3486 { "response": { "incorrect": "laberatory", "correct": "laboratory" }, "expected": { "incorrect": "laberatory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laughter:0 0 3624 { "response": { "incorrect": "infectious laughterr", "correct": "infectious laughter" }, "expected": { "incorrect": "laughterr", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:1 100 2933 { "response": { "incorrect": "laghter", "correct": "laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:2 0 3225 { "response": { "incorrect": "contagious laghter", "correct": "contagious laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:3 0 3593 { "response": { "incorrect": "contagious laghter", "correct": "contagious laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:4 0 2733 { "response": { "incorrect": "infectious", "correct": "laughter" }, "expected": { "incorrect": "lafter", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:5 0 2996 { "response": { "incorrect": "contagious laghter", "correct": "laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:6 0 4411 { "response": { "incorrect": "infectious", "correct": "infectious" }, "expected": { "incorrect": "laugther", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:7 0 4119 { "response": { "incorrect": "contagious laughtter", "correct": "contagious laughter" }, "expected": { "incorrect": "laughtter", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:8 0 5885 { "response": { "incorrect": "contagious laughtur", "correct": "contagious laughter" }, "expected": { "incorrect": "laughtur", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:9 0 5124 { "response": { "incorrect": "contagious", "correct": "contagious" }, "expected": { "incorrect": "laugther", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:liaison:0 100 3399 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:1 100 4029 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:2 0 3231 { "response": { "incorrect": "schools", "correct": "school's" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": false }
[+]
0015_spell_check:liaison:3 100 2591 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:4 100 2615 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:5 100 3808 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:6 100 4665 { "response": { "incorrect": "liasion", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:7 0 3920 { "response": { "incorrect": "leason", "correct": "lesson" }, "expected": { "incorrect": "leason", "correct": "liaison" }, "is_correct": false }
[+]
0015_spell_check:liaison:8 0 4435 { "response": { "incorrect": "liaison", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": false }
[+]
0015_spell_check:liaison:9 100 3915 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:orange:0 100 2884 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:1 100 3009 { "response": { "incorrect": "oranje", "correct": "orange" }, "expected": { "incorrect": "oranje", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:2 100 3156 { "response": { "incorrect": "orang", "correct": "orange" }, "expected": { "incorrect": "orang", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:3 100 2853 { "response": { "incorrect": "oranage", "correct": "orange" }, "expected": { "incorrect": "oranage", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:4 100 2896 { "response": { "incorrect": "oranage", "correct": "orange" }, "expected": { "incorrect": "oranage", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:5 100 2674 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:6 100 3121 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:7 0 2596 { "response": { "incorrect": "orangee", "correct": "orange" }, "expected": { "incorrect": "oringe", "correct": "orange" }, "is_correct": false }
[+]
0015_spell_check:orange:8 0 2945 { "response": { "incorrect": "orennege", "correct": "orange" }, "expected": { "incorrect": "orennge", "correct": "orange" }, "is_correct": false }
[+]
0015_spell_check:orange:9 100 2331 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:partition:0 100 3524 { "response": { "incorrect": "partioned", "correct": "partitioned" }, "expected": { "incorrect": "partioned", "correct": "partitioned" }, "is_correct": true }
[+]
0015_spell_check:partition:1 100 2940 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:2 100 2559 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:3 100 2973 { "response": { "incorrect": "partionned", "correct": "partitioned" }, "expected": { "incorrect": "partionned", "correct": "partitioned" }, "is_correct": true }
[+]
0015_spell_check:partition:4 100 2440 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:5 100 2631 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:6 100 2854 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:7 100 3849 { "response": { "incorrect": "particion", "correct": "partition" }, "expected": { "incorrect": "particion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:8 100 3082 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:9 100 3062 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:party:0 100 3605 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:1 100 2750 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:2 0 2540 { "response": { "incorrect": "party", "correct": "pary" }, "expected": { "incorrect": "pary", "correct": "party" }, "is_correct": false }
[+]
0015_spell_check:party:3 100 2681 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:4 100 2554 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:5 100 2584 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:6 100 2726 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:7 100 2820 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:8 100 2712 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:9 0 2743 { "response": { "incorrect": "party", "correct": "pary" }, "expected": { "incorrect": "pary", "correct": "party" }, "is_correct": false }
[+]
0015_spell_check:stable:0 100 2397 { "response": { "incorrect": "staable", "correct": "stable" }, "expected": { "incorrect": "staable", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:1 100 2552 { "response": { "incorrect": "stabe", "correct": "stable" }, "expected": { "incorrect": "stabe", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:2 100 2629 { "response": { "incorrect": "stabal", "correct": "stable" }, "expected": { "incorrect": "stabal", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:3 100 2635 { "response": { "incorrect": "staible", "correct": "stable" }, "expected": { "incorrect": "staible", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:4 100 2771 { "response": { "incorrect": "stabel", "correct": "stable" }, "expected": { "incorrect": "stabel", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:5 100 2281 { "response": { "incorrect": "staible", "correct": "stable" }, "expected": { "incorrect": "staible", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:6 100 2341 { "response": { "incorrect": "stabl", "correct": "stable" }, "expected": { "incorrect": "stabl", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:7 100 2741 { "response": { "incorrect": "stabe", "correct": "stable" }, "expected": { "incorrect": "stabe", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:8 100 3239 { "response": { "incorrect": "stabble", "correct": "stable" }, "expected": { "incorrect": "stabble", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:9 100 4318 { "response": { "incorrect": "stayble", "correct": "stable" }, "expected": { "incorrect": "stayble", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:table:0 100 4160 { "response": { "incorrect": "tabele", "correct": "table" }, "expected": { "incorrect": "tabele", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:1 100 4303 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:2 100 4073 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:3 100 3768 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:4 100 4229 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:5 100 3932 { "response": { "incorrect": "tabl", "correct": "table" }, "expected": { "incorrect": "tabl", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:6 100 3992 { "response": { "incorrect": "tabl", "correct": "table" }, "expected": { "incorrect": "tabl", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:7 100 3791 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:8 100 3780 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:9 100 3634 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]