Benchmark Run Details

Run Summary

Model smollm2:1.7b:Q8_0
Benchmark 0015_spell_check
Normed Score 54
Run Timestamp 2025-03-26 18:14:46

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0015_spell_check:attention:0 100 1811 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" } }
[+]
0015_spell_check:attention:1 100 589 { "response": { "incorrect": "attantion", "correct": "attention" }, "expected": { "incorrect": "attantion", "correct": "attention" } }
[+]
0015_spell_check:attention:2 100 619 { "response": { "incorrect": "attetion", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" } }
[+]
0015_spell_check:attention:3 100 574 { "response": { "incorrect": "attnetion", "correct": "attention" }, "expected": { "incorrect": "attnetion", "correct": "attention" } }
[+]
0015_spell_check:attention:4 0 807 { "response": { "incorrect": "§attentãn", "correct": "attention" }, "expected": { "incorrect": "attntion", "correct": "attention" } }
[+]
0015_spell_check:attention:5 0 521 { "response": { "incorrect": "pay", "correct": "pays" }, "expected": { "incorrect": "attenion", "correct": "attention" } }
[+]
0015_spell_check:attention:6 0 528 { "response": { "incorrect": "attention", "correct": "attention" }, "expected": { "incorrect": "attenion", "correct": "attention" } }
[+]
0015_spell_check:attention:7 0 554 { "response": { "incorrect": "attentation", "correct": "attention" }, "expected": { "incorrect": "attetion", "correct": "attention" } }
[+]
0015_spell_check:attention:8 100 590 { "response": { "incorrect": "atttention", "correct": "attention" }, "expected": { "incorrect": "atttention", "correct": "attention" } }
[+]
0015_spell_check:attention:9 100 599 { "response": { "incorrect": "attenttion", "correct": "attention" }, "expected": { "incorrect": "attenttion", "correct": "attention" } }
[+]
0015_spell_check:demonstrate:0 100 652 { "response": { "incorrect": "demonstraite", "correct": "demonstrate" }, "expected": { "incorrect": "demonstraite", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:1 0 576 { "response": { "incorrect": "demonstrate", "correct": "display" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:2 0 598 { "response": { "incorrect": "dance", "correct": "dance" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:3 100 623 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:4 0 643 { "response": { "incorrect": "demonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "demanstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:5 100 655 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:6 100 651 { "response": { "incorrect": "deomonstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:7 0 775 { "response": { "incorrect": "demonstriant", "correct": "demonstrate" }, "expected": { "incorrect": "demonstarte", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:8 100 761 { "response": { "incorrect": "deomstrate", "correct": "demonstrate" }, "expected": { "incorrect": "deomstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:demonstrate:9 0 671 { "response": { "incorrect": "demonstrate", "correct": "display" }, "expected": { "incorrect": "deomonstrate", "correct": "demonstrate" } }
[+]
0015_spell_check:laboratory:0 100 719 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:1 0 689 { "response": { "incorrect": "labrary", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:2 100 752 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:3 100 731 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:4 0 1700 { "response": { "incorrect": "§»´²¹¼ laboratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:5 0 670 { "response": { "incorrect": "laboratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:6 0 680 { "response": { "incorrect": "labrancy", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:7 100 650 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:8 100 642 { "response": { "incorrect": "labratory", "correct": "laboratory" }, "expected": { "incorrect": "labratory", "correct": "laboratory" } }
[+]
0015_spell_check:laboratory:9 100 684 { "response": { "incorrect": "laberatory", "correct": "laboratory" }, "expected": { "incorrect": "laberatory", "correct": "laboratory" } }
[+]
0015_spell_check:laughter:0 0 700 { "response": { "incorrect": "laughterr", "correct": "laughing" }, "expected": { "incorrect": "laughterr", "correct": "laughter" } }
[+]
0015_spell_check:laughter:1 0 995 { "response": { "incorrect": "£laughter£", "correct": "laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:2 0 1189 { "response": { "incorrect": "“contagious”", "correct": "contagious" }, "expected": { "incorrect": "laghter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:3 0 955 { "response": { "incorrect": "contagious laughter", "correct": "contagious laugh" }, "expected": { "incorrect": "laghter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:4 0 843 { "response": { "incorrect": "infectous lather", "correct": "infectious laughter" }, "expected": { "incorrect": "lafter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:5 0 664 { "response": { "incorrect": "laughter", "correct": "laughter" }, "expected": { "incorrect": "laghter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:6 0 702 { "response": { "incorrect": "infectious laughter", "correct": "laughter" }, "expected": { "incorrect": "laugther", "correct": "laughter" } }
[+]
0015_spell_check:laughter:7 0 610 { "response": { "incorrect": "laughter", "correct": "laughter" }, "expected": { "incorrect": "laughtter", "correct": "laughter" } }
[+]
0015_spell_check:laughter:8 0 773 { "response": { "incorrect": "contagious laughur", "correct": "contagious laughter" }, "expected": { "incorrect": "laughtur", "correct": "laughter" } }
[+]
0015_spell_check:laughter:9 0 819 { "response": { "incorrect": "contagious laughter", "correct": "contagious laughter" }, "expected": { "incorrect": "laugther", "correct": "laughter" } }
[+]
0015_spell_check:liaison:0 100 600 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:1 0 549 { "response": { "incorrect": "liaison", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:2 100 546 { "response": { "incorrect": "liasion", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" } }
[+]
0015_spell_check:liaison:3 0 626 { "response": { "incorrect": "liaison", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:4 0 621 { "response": { "incorrect": "liaison", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:5 100 636 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:6 0 639 { "response": { "incorrect": "liaison", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" } }
[+]
0015_spell_check:liaison:7 0 573 { "response": { "incorrect": "leason", "correct": "lesson" }, "expected": { "incorrect": "leason", "correct": "liaison" } }
[+]
0015_spell_check:liaison:8 0 677 { "response": { "incorrect": "liaison", "correct": "liaison" }, "expected": { "incorrect": "liasion", "correct": "liaison" } }
[+]
0015_spell_check:liaison:9 100 617 { "response": { "incorrect": "liason", "correct": "liaison" }, "expected": { "incorrect": "liason", "correct": "liaison" } }
[+]
0015_spell_check:orange:0 0 1040 { "response": { "incorrect": "“”", "correct": "“orange”" }, "expected": { "incorrect": "orrange", "correct": "orange" } }
[+]
0015_spell_check:orange:1 100 517 { "response": { "incorrect": "oranje", "correct": "orange" }, "expected": { "incorrect": "oranje", "correct": "orange" } }
[+]
0015_spell_check:orange:2 100 518 { "response": { "incorrect": "orang", "correct": "orange" }, "expected": { "incorrect": "orang", "correct": "orange" } }
[+]
0015_spell_check:orange:3 100 586 { "response": { "incorrect": "oranage", "correct": "orange" }, "expected": { "incorrect": "oranage", "correct": "orange" } }
[+]
0015_spell_check:orange:4 100 579 { "response": { "incorrect": "oranage", "correct": "orange" }, "expected": { "incorrect": "oranage", "correct": "orange" } }
[+]
0015_spell_check:orange:5 100 596 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" } }
[+]
0015_spell_check:orange:6 100 559 { "response": { "incorrect": "orrange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" } }
[+]
0015_spell_check:orange:7 100 514 { "response": { "incorrect": "oringe", "correct": "orange" }, "expected": { "incorrect": "oringe", "correct": "orange" } }
[+]
0015_spell_check:orange:8 100 568 { "response": { "incorrect": "orennge", "correct": "orange" }, "expected": { "incorrect": "orennge", "correct": "orange" } }
[+]
0015_spell_check:orange:9 0 599 { "response": { "incorrect": "orange", "correct": "orange" }, "expected": { "incorrect": "orrange", "correct": "orange" } }
[+]
0015_spell_check:partition:0 100 605 { "response": { "incorrect": "partioned", "correct": "partitioned" }, "expected": { "incorrect": "partioned", "correct": "partitioned" } }
[+]
0015_spell_check:partition:1 0 607 { "response": { "incorrect": "partitioned", "correct": "painted" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:2 100 592 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:3 0 588 { "response": { "incorrect": "partioned", "correct": "partitioned" }, "expected": { "incorrect": "partionned", "correct": "partitioned" } }
[+]
0015_spell_check:partition:4 100 574 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:5 100 603 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:6 100 579 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:7 100 652 { "response": { "incorrect": "particion", "correct": "partition" }, "expected": { "incorrect": "particion", "correct": "partition" } }
[+]
0015_spell_check:partition:8 100 549 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:partition:9 100 587 { "response": { "incorrect": "partion", "correct": "partition" }, "expected": { "incorrect": "partion", "correct": "partition" } }
[+]
0015_spell_check:party:0 0 516 { "response": { "incorrect": "party", "correct": "parties" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:1 100 529 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:2 100 514 { "response": { "incorrect": "pary", "correct": "party" }, "expected": { "incorrect": "pary", "correct": "party" } }
[+]
0015_spell_check:party:3 0 684 { "response": { "incorrect": "·partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:4 0 564 { "response": { "incorrect": "party", "correct": "parties" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:5 100 533 { "response": { "incorrect": "partee", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:6 0 498 { "response": { "incorrect": "party", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:7 0 556 { "response": { "incorrect": "party", "correct": "parties" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:8 0 491 { "response": { "incorrect": "party", "correct": "party" }, "expected": { "incorrect": "partee", "correct": "party" } }
[+]
0015_spell_check:party:9 100 550 { "response": { "incorrect": "pary", "correct": "party" }, "expected": { "incorrect": "pary", "correct": "party" } }
[+]
0015_spell_check:stable:0 0 516 { "response": { "incorrect": "staible", "correct": "stable" }, "expected": { "incorrect": "staable", "correct": "stable" } }
[+]
0015_spell_check:stable:1 100 520 { "response": { "incorrect": "stabe", "correct": "stable" }, "expected": { "incorrect": "stabe", "correct": "stable" } }
[+]
0015_spell_check:stable:2 100 563 { "response": { "incorrect": "stabal", "correct": "stable" }, "expected": { "incorrect": "stabal", "correct": "stable" } }
[+]
0015_spell_check:stable:3 100 639 { "response": { "incorrect": "staible", "correct": "stable" }, "expected": { "incorrect": "staible", "correct": "stable" } }
[+]
0015_spell_check:stable:4 100 559 { "response": { "incorrect": "stabel", "correct": "stable" }, "expected": { "incorrect": "stabel", "correct": "stable" } }
[+]
0015_spell_check:stable:5 100 601 { "response": { "incorrect": "staible", "correct": "stable" }, "expected": { "incorrect": "staible", "correct": "stable" } }
[+]
0015_spell_check:stable:6 100 553 { "response": { "incorrect": "stabl", "correct": "stable" }, "expected": { "incorrect": "stabl", "correct": "stable" } }
[+]
0015_spell_check:stable:7 100 588 { "response": { "incorrect": "stabe", "correct": "stable" }, "expected": { "incorrect": "stabe", "correct": "stable" } }
[+]
0015_spell_check:stable:8 0 620 { "response": { "incorrect": "stabile", "correct": "stable" }, "expected": { "incorrect": "stabble", "correct": "stable" } }
[+]
0015_spell_check:stable:9 0 915 { "response": { "incorrect": "“stayble”", "correct": "stability" }, "expected": { "incorrect": "stayble", "correct": "stable" } }
[+]
0015_spell_check:table:0 100 545 { "response": { "incorrect": "tabele", "correct": "table" }, "expected": { "incorrect": "tabele", "correct": "table" } }
[+]
0015_spell_check:table:1 0 556 { "response": { "incorrect": "tabtable", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" } }
[+]
0015_spell_check:table:2 0 559 { "response": { "incorrect": "table", "correct": "tablet" }, "expected": { "incorrect": "tabel", "correct": "table" } }
[+]
0015_spell_check:table:3 100 634 { "response": { "incorrect": "tabble", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" } }
[+]
0015_spell_check:table:4 0 527 { "response": { "incorrect": "tabled", "correct": "table" }, "expected": { "incorrect": "tabble", "correct": "table" } }
[+]
0015_spell_check:table:5 100 523 { "response": { "incorrect": "tabl", "correct": "table" }, "expected": { "incorrect": "tabl", "correct": "table" } }
[+]
0015_spell_check:table:6 100 624 { "response": { "incorrect": "tabl", "correct": "table" }, "expected": { "incorrect": "tabl", "correct": "table" } }
[+]
0015_spell_check:table:7 100 575 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" } }
[+]
0015_spell_check:table:8 0 585 { "response": { "incorrect": "table", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" } }
[+]
0015_spell_check:table:9 100 598 { "response": { "incorrect": "tabel", "correct": "table" }, "expected": { "incorrect": "tabel", "correct": "table" } }
[+]