Benchmark Run Details

System Prompt

You are a spell checking assistant. For each sentence, identify:
1. The incorrectly spelled word exactly as it appears
2. The correct spelling of that word

Run Summary

Model gemini-2.5-flash-preview-04-17
Benchmark 0015_spell_check
Normed Score 99
Run Timestamp 2025-04-24 19:25:47

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0015_spell_check:attention:0 100 1218 { "response": { "correct": "attention", "incorrect": "attetion" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:1 100 1788 { "response": { "correct": "attention", "incorrect": "attantion" }, "expected": { "incorrect": "attantion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:2 100 2259 { "response": { "correct": "attention", "incorrect": "attetion" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:3 100 1290 { "response": { "correct": "attention", "incorrect": "attnetion" }, "expected": { "incorrect": "attnetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:4 100 918 { "response": { "correct": "attention", "incorrect": "attntion" }, "expected": { "incorrect": "attntion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:5 100 914 { "response": { "correct": "attention", "incorrect": "attenion" }, "expected": { "incorrect": "attenion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:6 100 1448 { "response": { "correct": "attention", "incorrect": "attenion" }, "expected": { "incorrect": "attenion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:7 100 1568 { "response": { "correct": "attention", "incorrect": "attetion" }, "expected": { "incorrect": "attetion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:8 100 1336 { "response": { "correct": "attention", "incorrect": "atttention" }, "expected": { "incorrect": "atttention", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:attention:9 100 1111 { "response": { "correct": "attention", "incorrect": "attenttion" }, "expected": { "incorrect": "attenttion", "correct": "attention" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:0 100 1227 { "response": { "correct": "demonstrate", "incorrect": "demonstraite" }, "expected": { "incorrect": "demonstraite", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:1 100 2009 { "response": { "correct": "demonstrate", "incorrect": "deomonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:2 100 1287 { "response": { "correct": "demonstrate", "incorrect": "deomonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:3 100 977 { "response": { "correct": "demonstrate", "incorrect": "deomonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:4 100 1531 { "response": { "correct": "demonstrate", "incorrect": "demanstrate" }, "expected": { "incorrect": "demanstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:5 100 1329 { "response": { "correct": "demonstrate", "incorrect": "deomonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:6 100 1540 { "response": { "correct": "demonstrate", "incorrect": "deomonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:7 100 1139 { "response": { "correct": "demonstrate", "incorrect": "demonstarte" }, "expected": { "incorrect": "demonstarte", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:8 100 1096 { "response": { "correct": "demonstrate", "incorrect": "deomstrate" }, "expected": { "incorrect": "deomstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:demonstrate:9 100 1095 { "response": { "correct": "demonstrate", "incorrect": "deomonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "is_correct": true }
[+]
0015_spell_check:laboratory:0 100 1622 { "response": { "correct": "laboratory", "incorrect": "labratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:1 100 1492 { "response": { "correct": "laboratory", "incorrect": "labratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:2 100 1425 { "response": { "correct": "laboratory", "incorrect": "labratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:3 100 1341 { "response": { "correct": "laboratory", "incorrect": "labratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:4 100 1064 { "response": { "correct": "laboratory", "incorrect": "labratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:5 100 1244 { "response": { "correct": "laboratory", "incorrect": "labratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:6 100 1592 { "response": { "correct": "laboratory", "incorrect": "labratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:7 100 1122 { "response": { "correct": "laboratory", "incorrect": "labratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:8 100 828 { "response": { "correct": "laboratory", "incorrect": "labratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laboratory:9 100 1485 { "response": { "correct": "laboratory", "incorrect": "laberatory" }, "expected": { "incorrect": "laberatory", "correct": "laboratory" }, "is_correct": true }
[+]
0015_spell_check:laughter:0 100 1440 { "response": { "correct": "laughter", "incorrect": "laughterr" }, "expected": { "incorrect": "laughterr", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:1 100 956 { "response": { "correct": "laughter", "incorrect": "laghter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:2 100 1021 { "response": { "correct": "laughter", "incorrect": "laghter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:3 100 1610 { "response": { "correct": "laughter", "incorrect": "laghter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:4 100 1860 { "response": { "correct": "laughter", "incorrect": "lafter" }, "expected": { "incorrect": "lafter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:5 100 1288 { "response": { "correct": "laughter", "incorrect": "laghter" }, "expected": { "incorrect": "laghter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:6 100 2145 { "response": { "correct": "laughter", "incorrect": "laugther" }, "expected": { "incorrect": "laugther", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:7 100 1307 { "response": { "correct": "laughter", "incorrect": "laughtter" }, "expected": { "incorrect": "laughtter", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:8 100 1187 { "response": { "correct": "laughter", "incorrect": "laughtur" }, "expected": { "incorrect": "laughtur", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:laughter:9 100 1604 { "response": { "correct": "laughter", "incorrect": "laugther" }, "expected": { "incorrect": "laugther", "correct": "laughter" }, "is_correct": true }
[+]
0015_spell_check:liaison:0 100 1226 { "response": { "correct": "liaison", "incorrect": "liason" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:1 100 1676 { "response": { "correct": "liaison", "incorrect": "liason" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:2 0 2131 { "response": { "correct": "liaison", "incorrect": "liasoin" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": false }
[+]
0015_spell_check:liaison:3 100 1802 { "response": { "correct": "liaison", "incorrect": "liason" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:4 100 1284 { "response": { "correct": "liaison", "incorrect": "liason" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:5 100 1107 { "response": { "correct": "liaison", "incorrect": "liason" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:6 100 1150 { "response": { "correct": "liaison", "incorrect": "liasion" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:7 100 835 { "response": { "correct": "liaison", "incorrect": "leason" }, "expected": { "incorrect": "leason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:8 100 1004 { "response": { "correct": "liaison", "incorrect": "liasion" }, "expected": { "incorrect": "liasion", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:liaison:9 100 1273 { "response": { "correct": "liaison", "incorrect": "liason" }, "expected": { "incorrect": "liason", "correct": "liaison" }, "is_correct": true }
[+]
0015_spell_check:orange:0 100 1398 { "response": { "correct": "orange", "incorrect": "orrange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:1 100 1645 { "response": { "correct": "orange", "incorrect": "oranje" }, "expected": { "incorrect": "oranje", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:2 100 1477 { "response": { "correct": "orange", "incorrect": "orang" }, "expected": { "incorrect": "orang", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:3 100 1128 { "response": { "correct": "orange", "incorrect": "oranage" }, "expected": { "incorrect": "oranage", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:4 100 1221 { "response": { "correct": "orange", "incorrect": "oranage" }, "expected": { "incorrect": "oranage", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:5 100 1570 { "response": { "correct": "orange", "incorrect": "orrange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:6 100 1531 { "response": { "correct": "orange", "incorrect": "orrange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:7 100 852 { "response": { "correct": "orange", "incorrect": "oringe" }, "expected": { "incorrect": "oringe", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:8 100 1187 { "response": { "correct": "orange", "incorrect": "orennge" }, "expected": { "incorrect": "orennge", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:orange:9 100 2218 { "response": { "correct": "orange", "incorrect": "orrange" }, "expected": { "incorrect": "orrange", "correct": "orange" }, "is_correct": true }
[+]
0015_spell_check:partition:0 100 1004 { "response": { "correct": "partitioned", "incorrect": "partioned" }, "expected": { "incorrect": "partioned", "correct": "partitioned" }, "is_correct": true }
[+]
0015_spell_check:partition:1 100 2031 { "response": { "correct": "partition", "incorrect": "partion" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:2 100 1330 { "response": { "correct": "partition", "incorrect": "partion" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:3 100 956 { "response": { "correct": "partitioned", "incorrect": "partionned" }, "expected": { "incorrect": "partionned", "correct": "partitioned" }, "is_correct": true }
[+]
0015_spell_check:partition:4 100 1900 { "response": { "correct": "partition", "incorrect": "partion" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:5 100 1729 { "response": { "correct": "partition", "incorrect": "partion" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:6 100 2834 { "response": { "correct": "partition", "incorrect": "partion" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:7 100 1123 { "response": { "correct": "partition", "incorrect": "particion" }, "expected": { "incorrect": "particion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:8 100 1118 { "response": { "correct": "partition", "incorrect": "partion" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:partition:9 100 1568 { "response": { "correct": "partition", "incorrect": "partion" }, "expected": { "incorrect": "partion", "correct": "partition" }, "is_correct": true }
[+]
0015_spell_check:party:0 100 1544 { "response": { "correct": "party", "incorrect": "partee" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:1 100 914 { "response": { "correct": "party", "incorrect": "partee" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:2 100 2950 { "response": { "correct": "party", "incorrect": "pary" }, "expected": { "incorrect": "pary", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:3 100 1152 { "response": { "correct": "party", "incorrect": "partee" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:4 100 1437 { "response": { "correct": "party", "incorrect": "partee" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:5 100 1738 { "response": { "correct": "party", "incorrect": "partee" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:6 100 1447 { "response": { "correct": "party", "incorrect": "partee" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:7 100 1006 { "response": { "correct": "party", "incorrect": "partee" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:8 100 1529 { "response": { "correct": "party", "incorrect": "partee" }, "expected": { "incorrect": "partee", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:party:9 100 1336 { "response": { "correct": "party", "incorrect": "pary" }, "expected": { "incorrect": "pary", "correct": "party" }, "is_correct": true }
[+]
0015_spell_check:stable:0 100 1119 { "response": { "correct": "stable", "incorrect": "staable" }, "expected": { "incorrect": "staable", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:1 100 1111 { "response": { "correct": "stable", "incorrect": "stabe" }, "expected": { "incorrect": "stabe", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:2 100 1548 { "response": { "correct": "stable", "incorrect": "stabal" }, "expected": { "incorrect": "stabal", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:3 100 1207 { "response": { "correct": "stable", "incorrect": "staible" }, "expected": { "incorrect": "staible", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:4 100 1319 { "response": { "correct": "stable", "incorrect": "stabel" }, "expected": { "incorrect": "stabel", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:5 100 1577 { "response": { "correct": "stable", "incorrect": "staible" }, "expected": { "incorrect": "staible", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:6 100 1230 { "response": { "correct": "stable", "incorrect": "stabl" }, "expected": { "incorrect": "stabl", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:7 100 1632 { "response": { "correct": "stable", "incorrect": "stabe" }, "expected": { "incorrect": "stabe", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:8 100 1224 { "response": { "correct": "stable", "incorrect": "stabble" }, "expected": { "incorrect": "stabble", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:stable:9 100 1249 { "response": { "correct": "stable", "incorrect": "stayble" }, "expected": { "incorrect": "stayble", "correct": "stable" }, "is_correct": true }
[+]
0015_spell_check:table:0 100 1104 { "response": { "correct": "table", "incorrect": "tabele" }, "expected": { "incorrect": "tabele", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:1 100 2193 { "response": { "correct": "table", "incorrect": "tabble" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:2 100 1181 { "response": { "correct": "table", "incorrect": "tabel" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:3 100 1229 { "response": { "correct": "table", "incorrect": "tabble" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:4 100 1230 { "response": { "correct": "table", "incorrect": "tabble" }, "expected": { "incorrect": "tabble", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:5 100 1021 { "response": { "correct": "table", "incorrect": "tabl" }, "expected": { "incorrect": "tabl", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:6 100 1111 { "response": { "correct": "table", "incorrect": "tabl" }, "expected": { "incorrect": "tabl", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:7 100 1545 { "response": { "correct": "table", "incorrect": "tabel" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:8 100 2461 { "response": { "correct": "table", "incorrect": "tabel" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]
0015_spell_check:table:9 100 1530 { "response": { "correct": "table", "incorrect": "tabel" }, "expected": { "incorrect": "tabel", "correct": "table" }, "is_correct": true }
[+]