Benchmark Run Details

Run Summary

Model qwen2.5:7b:Q4_K_M
Benchmark 0015_spell_check
Normed Score 96
Run Timestamp 2025-03-26 18:22:37

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0015_spell_check:attention:0 100 4665 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" } }
[+]
0015_spell_check:attention:1 100 1142 { "response": { "incorrect": "attantion", "correct": "attention" }, "expected": { "incorrect": "attantion", "correct": "attention" } }
[+]
0015_spell_check:attention:2 100 1155 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" } }
[+]
0015_spell_check:attention:3 100 1247 { "response": { "incorrect": "attnetion", "correct": "attention" }, "expected": { "incorrect": "attnetion", "correct": "attention" } }
[+]
0015_spell_check:attention:4 100 2102 { "response": { "incorrect": "attntion", "correct": "attention" }, "expected": { "incorrect": "attntion", "correct": "attention" } }
[+]
0015_spell_check:attention:5 100 1463 { "response": { "incorrect": "attenion", "correct": "attention" }, "expected": { "incorrect": "attenion", "correct": "attention" } }
[+]
0015_spell_check:attention:6 100 1782 { "response": { "incorrect": "attenion", "correct": "attention" }, "expected": { "incorrect": "attenion", "correct": "attention" } }
[+]
0015_spell_check:attention:7 100 1827 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" } }
[+]
0015_spell_check:attention:8 100 1557 { "response": { "incorrect": "atttention", "correct": "attention" }, "expected": { "incorrect": "atttention", "correct": "attention" } }
[+]
0015_spell_check:attention:9 100 1647 { "response": { "incorrect": "attenttion", "correct": "attention" }, "expected": { "incorrect": "attenttion", "correct": "attention" } }
[+]
0015_spell_check:demonstrate:0 100 1816 { "response": { "incorrect": "demonstraite", "correct": "demonstrate" }, "expected": { "incorrect": "demonstraite", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:1 100 1752 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:2 100 1808 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:3 100 1747 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:4 100 1780 { "response": { "incorrect": "demanstrate", "correct": "demonstrate" }, "expected": { "incorrect": "demanstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:5 100 1962 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:6 100 2042 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:7 100 1919 { "response": { "incorrect": "demonstarte", "correct": "demonstrate" }, "expected": { "incorrect": "demonstarte", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:8 100 1811 { "response": { "incorrect": "deomstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:9 100 1793 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:laboratory:0 100 1799 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:1 100 1806 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:2 100 1797 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:3 100 1796 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:4 100 1792 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:5 100 1817 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:6 100 1782 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:7 100 1797 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:8 100 1814 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:9 100 1798 { "response": { "incorrect": "laberatory", "correct": "laboratory" }, "expected": { "incorrect": "laberatory", "correct": "laboratory" } }
[+]
0015_spell_check:laughter:0 100 1634 { "response": { "incorrect": "laughterr", "correct": "laughter" }, "expected": { "incorrect": "laughterr", "correct": "laughter" } }
[+]
0015_spell_check:laughter:1 0 1700 { "response": { "incorrect": "laghter", "correct": "laugh" }, "expected": { "incorrect": "laghter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:2 0 1705 { "response": { "incorrect": "laghter", "correct": "laugh" }, "expected": { "incorrect": "laghter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:3 100 1642 { "response": { "incorrect": "laghter", "correct": "laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:4 100 1565 { "response": { "incorrect": "lafter", "correct": "laughter" }, "expected": { "incorrect": "lafter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:5 100 1653 { "response": { "incorrect": "laghter", "correct": "laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:6 100 1611 { "response": { "incorrect": "laugther", "correct": "laughter" }, "expected": { "incorrect": "laugther", "correct": "laughter" } }
[+]
0015_spell_check:laughter:7 100 1624 { "response": { "incorrect": "laughtter", "correct": "laughter" }, "expected": { "incorrect": "laughtter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:8 100 1635 { "response": { "incorrect": "laughtur", "correct": "laughter" }, "expected": { "incorrect": "laughtur", "correct": "laughter" } }
[+]
0015_spell_check:laughter:9 100 1605 { "response": { "incorrect": "laugther", "correct": "laughter" }, "expected": { "incorrect": "laugther", "correct": "laughter" } }
[+]
0015_spell_check:liaison:0 100 1641 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:1 100 1608 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:2 100 1643 { "response": { "incorrect": "liasion", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" } }
[+]
0015_spell_check:liaison:3 100 1622 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:4 100 1605 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:5 100 1621 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:6 100 1601 { "response": { "incorrect": "liasion", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" } }
[+]
0015_spell_check:liaison:7 100 1664 { "response": { "incorrect": "leason", "correct": "liaison" }, "expected": { "incorrect": "leason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:8 100 1581 { "response": { "incorrect": "liasion", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" } }
[+]
0015_spell_check:liaison:9 100 1682 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:orange:0 100 1517 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" } }
[+]
0015_spell_check:orange:1 0 1462 { "response": { "incorrect": "orange", "correct": "orange" }, "expected": { "incorrect": "oranje", "correct": "orange" } }
[+]
0015_spell_check:orange:2 100 1499 { "response": { "incorrect": "orang", "correct": "orange" }, "expected": { "incorrect": "orang", "correct": "orange" } }
[+]
0015_spell_check:orange:3 100 1533 { "response": { "incorrect": "oranage", "correct": "orange" }, "expected": { "incorrect": "oranage", "correct": "orange" } }
[+]
0015_spell_check:orange:4 100 1556 { "response": { "incorrect": "oranage", "correct": "orange" }, "expected": { "incorrect": "oranage", "correct": "orange" } }
[+]
0015_spell_check:orange:5 100 1566 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" } }
[+]
0015_spell_check:orange:6 100 1541 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" } }
[+]
0015_spell_check:orange:7 100 1570 { "response": { "incorrect": "oringe", "correct": "orange" }, "expected": { "incorrect": "oringe", "correct": "orange" } }
[+]
0015_spell_check:orange:8 100 1546 { "response": { "incorrect": "orennge", "correct": "orange" }, "expected": { "incorrect": "orennge", "correct": "orange" } }
[+]
0015_spell_check:orange:9 100 1551 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" } }
[+]
0015_spell_check:partition:0 100 1642 { "response": { "incorrect": "partioned", "correct": "partitioned" }, "expected": { "incorrect": "partioned", "correct": "partitioned" } }
[+]
0015_spell_check:partition:1 100 1575 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:2 100 1544 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:3 100 1722 { "response": { "incorrect": "partionned", "correct": "partitioned" }, "expected": { "incorrect": "partionned", "correct": "partitioned" } }
[+]
0015_spell_check:partition:4 100 1583 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:5 100 1581 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:6 100 1664 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:7 100 1591 { "response": { "incorrect": "particion", "correct": "partition" }, "expected": { "incorrect": "particion", "correct": "partition" } }
[+]
0015_spell_check:partition:8 100 1601 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:9 100 1596 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:party:0 100 1580 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:1 100 1603 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:2 100 1633 { "response": { "incorrect": "pary", "correct": "party" }, "expected": { "incorrect": "pary", "correct": "party" } }
[+]
0015_spell_check:party:3 100 1640 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:4 100 1617 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:5 100 1598 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:6 100 1645 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:7 100 1580 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:8 100 1580 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:9 100 1586 { "response": { "incorrect": "pary", "correct": "party" }, "expected": { "incorrect": "pary", "correct": "party" } }
[+]
0015_spell_check:stable:0 100 1621 { "response": { "incorrect": "staable", "correct": "stable" }, "expected": { "incorrect": "staable", "correct": "stable" } }
[+]
0015_spell_check:stable:1 100 1618 { "response": { "incorrect": "stabe", "correct": "stable" }, "expected": { "incorrect": "stabe", "correct": "stable" } }
[+]
0015_spell_check:stable:2 100 1620 { "response": { "incorrect": "stabal", "correct": "stable" }, "expected": { "incorrect": "stabal", "correct": "stable" } }
[+]
0015_spell_check:stable:3 100 1665 { "response": { "incorrect": "staible", "correct": "stable" }, "expected": { "incorrect": "staible", "correct": "stable" } }
[+]
0015_spell_check:stable:4 100 1694 { "response": { "incorrect": "stabel", "correct": "stable" }, "expected": { "incorrect": "stabel", "correct": "stable" } }
[+]
0015_spell_check:stable:5 100 1610 { "response": { "incorrect": "staible", "correct": "stable" }, "expected": { "incorrect": "staible", "correct": "stable" } }
[+]
0015_spell_check:stable:6 100 1663 { "response": { "incorrect": "stabl", "correct": "stable" }, "expected": { "incorrect": "stabl", "correct": "stable" } }
[+]
0015_spell_check:stable:7 100 1626 { "response": { "incorrect": "stabe", "correct": "stable" }, "expected": { "incorrect": "stabe", "correct": "stable" } }
[+]
0015_spell_check:stable:8 100 1609 { "response": { "incorrect": "stabble", "correct": "stable" }, "expected": { "incorrect": "stabble", "correct": "stable" } }
[+]
0015_spell_check:stable:9 0 1688 { "response": { "incorrect": "stayble", "correct": "stale" }, "expected": { "incorrect": "stayble", "correct": "stable" } }
[+]
0015_spell_check:table:0 100 1636 { "response": { "incorrect": "tabele", "correct": "table" }, "expected": { "incorrect": "tabele", "correct": "table" } }
[+]
0015_spell_check:table:1 100 1599 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" } }
[+]
0015_spell_check:table:2 100 1620 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" } }
[+]
0015_spell_check:table:3 100 1604 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" } }
[+]
0015_spell_check:table:4 100 1571 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" } }
[+]
0015_spell_check:table:5 100 1532 { "response": { "incorrect": "tabl", "correct": "table" }, "expected": { "incorrect": "tabl", "correct": "table" } }
[+]
0015_spell_check:table:6 100 1495 { "response": { "incorrect": "tabl", "correct": "table" }, "expected": { "incorrect": "tabl", "correct": "table" } }
[+]
0015_spell_check:table:7 100 1571 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" } }
[+]
0015_spell_check:table:8 100 1592 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" } }
[+]
0015_spell_check:table:9 100 1632 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" } }
[+]