Benchmark Run Details

Run Summary

Model smollm2:1.7b:Q8_0
Benchmark 0050_translation_sw_ko
Normed Score 3
Run Timestamp 2025-03-26 19:57:30

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0050_translation_sw_ko:0 0 1953 { "response": "둥근", "expected": "꽃" }
[+]
0050_translation_sw_ko:1 0 638 { "response": "따뜻한", "expected": "운전하다" }
[+]
0050_translation_sw_ko:10 0 586 { "response": "친구", "expected": "산" }
[+]
0050_translation_sw_ko:11 0 500 { "response": "책", "expected": "노래하다" }
[+]
0050_translation_sw_ko:12 0 623 { "response": "춤추다", "expected": "심장" }
[+]
0050_translation_sw_ko:13 0 473 { "response": "별", "expected": "밝은" }
[+]
0050_translation_sw_ko:14 0 565 { "response": "빠른", "expected": "춤추다" }
[+]
0050_translation_sw_ko:15 0 524 { "response": "둥근", "expected": "조용한" }
[+]
0050_translation_sw_ko:16 0 667 { "response": "매끄러운", "expected": "나무" }
[+]
0050_translation_sw_ko:17 0 547 { "response": "추운", "expected": "쓰다" }
[+]
0050_translation_sw_ko:18 0 542 { "response": "바람", "expected": "하늘" }
[+]
0050_translation_sw_ko:19 0 663 { "response": "미소짓다", "expected": "신선한" }
[+]
0050_translation_sw_ko:2 0 710 { "response": "명령행", "expected": "가장 강한" }
[+]
0050_translation_sw_ko:20 0 454 { "response": "산", "expected": "친구" }
[+]
0050_translation_sw_ko:21 0 525 { "response": "모래", "expected": "달리다" }
[+]
0050_translation_sw_ko:22 0 971 { "response": "번역 결과: 딱 다자", "expected": "둥근" }
[+]
0050_translation_sw_ko:23 0 458 { "response": "꽃", "expected": "바람" }
[+]
0050_translation_sw_ko:24 0 617 { "response": "달콤한", "expected": "따뜻한" }
[+]
0050_translation_sw_ko:25 0 480 { "response": "뚫기", "expected": "돌" }
[+]
0050_translation_sw_ko:26 0 442 { "response": "새", "expected": "깊은" }
[+]
0050_translation_sw_ko:27 0 489 { "response": "깊은", "expected": "수영하다" }
[+]
0050_translation_sw_ko:28 0 555 { "response": "신선한", "expected": "새" }
[+]
0050_translation_sw_ko:29 100 530 {}
[+]
0050_translation_sw_ko:3 0 576 { "response": "날다", "expected": "책" }
[+]
0050_translation_sw_ko:30 0 595 { "response": "수영하다", "expected": "구름" }
[+]
0050_translation_sw_ko:31 0 521 { "response": "둥근", "expected": "미소짓다" }
[+]
0050_translation_sw_ko:32 0 525 { "response": "친구", "expected": "부드러운" }
[+]
0050_translation_sw_ko:33 0 566 { "response": "숨쉬다", "expected": "비" }
[+]
0050_translation_sw_ko:34 0 661 { "response": "날카로우", "expected": "자라다" }
[+]
0050_translation_sw_ko:35 0 565 { "response": "춤추다", "expected": "빠른" }
[+]
0050_translation_sw_ko:36 0 516 { "response": "구름", "expected": "별" }
[+]
0050_translation_sw_ko:37 0 654 { "response": "미소짓다", "expected": "춤추다" }
[+]
0050_translation_sw_ko:38 0 551 { "response": "둥근", "expected": "무거운" }
[+]
0050_translation_sw_ko:39 0 439 { "response": "소", "expected": "불" }
[+]
0050_translation_sw_ko:4 0 728 { "response": "운전하다", "expected": "먹다" }
[+]
0050_translation_sw_ko:40 0 587 { "response": "달콤한", "expected": "숨쉬다" }
[+]
0050_translation_sw_ko:41 0 452 { "response": "별", "expected": "날카로운" }
[+]
0050_translation_sw_ko:42 0 1231 { "response": "じんにち世痒", "expected": "소금" }
[+]
0050_translation_sw_ko:43 0 529 { "response": "둥근", "expected": "숨다" }
[+]
0050_translation_sw_ko:44 0 627 { "response": "가홫", "expected": "매끄러운" }
[+]
0050_translation_sw_ko:45 0 526 { "response": "달콤한", "expected": "잔디" }
[+]
0050_translation_sw_ko:46 0 616 { "response": "조용한", "expected": "날다" }
[+]
0050_translation_sw_ko:47 0 558 { "response": "달콤한", "expected": "추운" }
[+]
0050_translation_sw_ko:48 0 455 { "response": "책", "expected": "모래" }
[+]
0050_translation_sw_ko:49 0 553 { "response": "웃다", "expected": "떨어지다" }
[+]
0050_translation_sw_ko:5 0 692 { "response": "따뜻한", "expected": "아름다운" }
[+]
0050_translation_sw_ko:50 100 601 {}
[+]
0050_translation_sw_ko:6 0 731 { "response": "무거운", "expected": "물" }
[+]
0050_translation_sw_ko:7 0 605 { "response": "짓다", "expected": "자다" }
[+]
0050_translation_sw_ko:8 0 520 { "response": "물", "expected": "달" }
[+]
0050_translation_sw_ko:9 0 572 { "response": "구름", "expected": "웃다" }
[+]