Benchmark Run Details

System Prompt

You are a spell checking assistant. For each sentence, identify:
1. The incorrectly spelled word exactly as it appears
2. The correct spelling of that word

Run Summary

Model lmstudio/granite-3.3-8b-instruct
Benchmark 0015_spell_check
Normed Score 78
Run Timestamp 2025-04-29 17:11:43

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0015_spell_check:attention:0 100 1991 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:1 100 1814 { "response": { "incorrect": "attantion", "correct": "attention" }, "expected": { "incorrect": "attantion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:2 100 1839 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:3 100 1907 { "response": { "incorrect": "attnetion", "correct": "attention" }, "expected": { "incorrect": "attnetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:4 0 1978 { "response": { "incorrect": "attention", "correct": "attntion" }, "expected": { "incorrect": "attntion", "correct": "attention" }, "is_correct": false }
[+]
0015_spell_check:attention:5 100 1953 { "response": { "incorrect": "attenion", "correct": "attention" }, "expected": { "incorrect": "attenion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:6 100 1973 { "response": { "incorrect": "attenion", "correct": "attention" }, "expected": { "incorrect": "attenion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:7 100 2139 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:8 100 2070 { "response": { "incorrect": "atttention", "correct": "attention" }, "expected": { "incorrect": "atttention", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:9 0 2284 { "response": { "incorrect": "her attenttion", "correct": "her attention" }, "expected": { "incorrect": "attenttion", "correct": "attention" }, "is_correct": false }
[+]
0015_spell_check:demonstrate:0 100 2194 { "response": { "incorrect": "demonstraite", "correct": "demonstrate" }, "expected": { "incorrect": "demonstraite", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:1 100 2245 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:2 100 2214 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:3 100 2234 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:4 100 2122 { "response": { "incorrect": "demanstrate", "correct": "demonstrate" }, "expected": { "incorrect": "demanstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:5 100 2298 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:6 100 2247 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:7 100 2400 { "response": { "incorrect": "demonstarte", "correct": "demonstrate" }, "expected": { "incorrect": "demonstarte", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:8 100 1848 { "response": { "incorrect": "deomstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:9 0 3296 { "response": { "type": "object", "properties": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "required": [ "incorrect", "correct" ] }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": false }
[+]
0015_spell_check:laboratory:0 100 1891 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:1 100 1820 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:2 100 1770 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:3 100 1896 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:4 100 1891 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:5 100 1802 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:6 100 1868 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:7 100 1788 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:8 100 1802 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:9 0 4604 { "response": { "type": "object", "properties": { "incorrect": { "type": "string", "value": "laberatory" }, "correct": { "type": "string", "value": "laboratory" } }, "required": [ "incorrect", "correct" ] }, "expected": { "incorrect": "laberatory", "correct": "laboratory" }, "is_correct": false }
[+]
0015_spell_check:laughter:0 0 4603 { "response": { "type": "object", "properties": { "incorrect": { "type": "string", "value": "laughterr" }, "correct": { "type": "string", "value": "laughter" } }, "required": [ "incorrect", "correct" ] }, "expected": { "incorrect": "laughterr", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:1 0 2089 { "response": { "incorrect": "contagious laghter", "correct": "contagious laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:2 0 2203 { "response": { "incorrect": "contagious laghter", "correct": "contagious laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:3 0 2183 { "response": { "incorrect": "contagious laghter", "correct": "contagious laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:4 0 2075 { "response": { "incorrect": "infectious lafter", "correct": "infectious laughter" }, "expected": { "incorrect": "lafter", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:5 0 2165 { "response": { "incorrect": "contagious laghter", "correct": "contagious laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:6 0 2122 { "response": { "incorrect": "infectious laugther", "correct": "infectious laughter" }, "expected": { "incorrect": "laugther", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:7 0 2399 { "response": { "incorrect": "contagious laughtter", "correct": "contagious laughter" }, "expected": { "incorrect": "laughtter", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:8 0 1966 { "response": { "incorrect": "contagious laughtur", "correct": "contagious laughter" }, "expected": { "incorrect": "laughtur", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:laughter:9 0 2164 { "response": { "incorrect": "contagious laugther", "correct": "contagious laughter" }, "expected": { "incorrect": "laugther", "correct": "laughter" }, "is_correct": false }
[+]
0015_spell_check:liaison:0 100 1791 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:1 100 1907 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:2 100 1776 { "response": { "incorrect": "liasion", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:3 100 1945 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:4 100 1885 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:5 100 1861 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:6 100 1917 { "response": { "incorrect": "liasion", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:7 0 2159 { "response": { "incorrect": "leason", "correct": "lesson" }, "expected": { "incorrect": "leason", "correct": "liaison" }, "is_correct": false }
[+]
0015_spell_check:liaison:8 100 1922 { "response": { "incorrect": "liasion", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:9 100 1805 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:orange:0 100 1804 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:1 100 1814 { "response": { "incorrect": "oranje", "correct": "orange" }, "expected": { "incorrect": "oranje", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:2 100 1787 { "response": { "incorrect": "orang", "correct": "orange" }, "expected": { "incorrect": "orang", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:3 100 1769 { "response": { "incorrect": "oranage", "correct": "orange" }, "expected": { "incorrect": "oranage", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:4 100 1719 { "response": { "incorrect": "oranage", "correct": "orange" }, "expected": { "incorrect": "oranage", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:5 100 1789 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:6 100 1730 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:7 0 5593 { "response": { "error": "Failed to parse JSON: {\n \"incorrect\": \"incorrectly-spelled\",\n \"correct\": \"incorrect\"\n}\n\n{\n \"type\": \"object\",\n \"properties\": {\n \"incorrect\": {\n \"type\": \"string\",\n \"value\": \"oringe\"\n },\n \"correct\": {\n \"type\": \"string\",\n \"value\": \"orange\"\n }\n },\n \"required\": [\n \"incorrect\",\n \"correct\"\n ]\n}" }, "expected": { "incorrect": "oringe", "correct": "orange" }, "is_correct": false }
[+]
0015_spell_check:orange:8 0 1780 { "response": { "incorrect": "orennege", "correct": "orange" }, "expected": { "incorrect": "orennge", "correct": "orange" }, "is_correct": false }
[+]
0015_spell_check:orange:9 0 5863 { "response": { "error": "Failed to parse JSON: {\n \"incorrect\": \"incomly\",\n \"correct\": \"correct\"\n} \n\nCorrection: The sentence provided for checking does not contain an incorrectly spelled word. It seems there might have been a misunderstanding. The correctly spelled sentence is \"I love to eat a slice of orange in the morning.\" \n\nHere's the corrected JSON format:\n\n```json\n{\n \"incorrect\": \"correct\",\n \"correct\": \"correct\" \n}\n```" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": false }
[+]
0015_spell_check:partition:0 100 1792 { "response": { "incorrect": "partioned", "correct": "partitioned" }, "expected": { "incorrect": "partioned", "correct": "partitioned" }, "is_correct": true }
[+]
0015_spell_check:partition:1 100 1701 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:2 100 1741 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:3 100 1789 { "response": { "incorrect": "partionned", "correct": "partitioned" }, "expected": { "incorrect": "partionned", "correct": "partitioned" }, "is_correct": true }
[+]
0015_spell_check:partition:4 100 1704 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:5 100 1904 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:6 100 1716 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:7 100 1734 { "response": { "incorrect": "particion", "correct": "partition" }, "expected": { "incorrect": "particion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:8 100 1761 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:9 100 1695 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:party:0 100 1750 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:1 100 1726 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:2 100 1783 { "response": { "incorrect": "pary", "correct": "party" }, "expected": { "incorrect": "pary", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:3 100 1732 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:4 100 1773 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:5 100 1801 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:6 100 1760 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:7 100 1756 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:8 100 1735 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:9 100 1721 { "response": { "incorrect": "pary", "correct": "party" }, "expected": { "incorrect": "pary", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:stable:0 100 1825 { "response": { "incorrect": "staable", "correct": "stable" }, "expected": { "incorrect": "staable", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:1 100 1742 { "response": { "incorrect": "stabe", "correct": "stable" }, "expected": { "incorrect": "stabe", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:2 100 1751 { "response": { "incorrect": "stabal", "correct": "stable" }, "expected": { "incorrect": "stabal", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:3 100 1785 { "response": { "incorrect": "staible", "correct": "stable" }, "expected": { "incorrect": "staible", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:4 100 1764 { "response": { "incorrect": "stabel", "correct": "stable" }, "expected": { "incorrect": "stabel", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:5 0 1732 { "response": { "incorrect": "staible", "correct": "steady" }, "expected": { "incorrect": "staible", "correct": "stable" }, "is_correct": false }
[+]
0015_spell_check:stable:6 100 1688 { "response": { "incorrect": "stabl", "correct": "stable" }, "expected": { "incorrect": "stabl", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:7 0 1834 { "response": { "incorrect": "stabe", "correct": "steady" }, "expected": { "incorrect": "stabe", "correct": "stable" }, "is_correct": false }
[+]
0015_spell_check:stable:8 100 1707 { "response": { "incorrect": "stabble", "correct": "stable" }, "expected": { "incorrect": "stabble", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:9 100 1721 { "response": { "incorrect": "stayble", "correct": "stable" }, "expected": { "incorrect": "stayble", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:table:0 100 1708 { "response": { "incorrect": "tabele", "correct": "table" }, "expected": { "incorrect": "tabele", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:1 100 1700 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:2 100 1648 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:3 0 1693 { "response": { "incorrect": "tabple", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": false }
[+]
0015_spell_check:table:4 100 1703 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:5 100 1747 { "response": { "incorrect": "tabl", "correct": "table" }, "expected": { "incorrect": "tabl", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:6 100 1741 { "response": { "incorrect": "tabl", "correct": "table" }, "expected": { "incorrect": "tabl", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:7 100 1655 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:8 0 3048 { "response": { "type": "object", "properties": { "incorrect": "tabel", "correct": "table" }, "required": [ "incorrect", "correct" ] }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": false }
[+]
0015_spell_check:table:9 100 1651 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]