Benchmark Run Details

Run Summary

Model llama3.2:3b:Q4_K_M
Benchmark 0050_translation_sw_ko
Normed Score 25
Run Timestamp 2025-03-26 20:03:32

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0050_translation_sw_ko:0 0 2201 { "response": "비", "expected": "꽃" }
[+]
0050_translation_sw_ko:1 100 540 {}
[+]
0050_translation_sw_ko:10 100 453 {}
[+]
0050_translation_sw_ko:11 0 459 { "response": "책", "expected": "노래하다" }
[+]
0050_translation_sw_ko:12 100 475 {}
[+]
0050_translation_sw_ko:13 0 475 { "response": "별", "expected": "밝은" }
[+]
0050_translation_sw_ko:14 0 484 { "response": "play", "expected": "춤추다" }
[+]
0050_translation_sw_ko:15 0 478 { "response": "san", "expected": "조용한" }
[+]
0050_translation_sw_ko:16 0 554 { "response": "simjang", "expected": "나무" }
[+]
0050_translation_sw_ko:17 0 495 { "response": "書く", "expected": "쓰다" }
[+]
0050_translation_sw_ko:18 0 466 { "response": "wind", "expected": "하늘" }
[+]
0050_translation_sw_ko:19 0 493 { "response": "dance", "expected": "신선한" }
[+]
0050_translation_sw_ko:2 0 465 { "response": "drive", "expected": "가장 강한" }
[+]
0050_translation_sw_ko:20 0 542 { "response": "friend", "expected": "친구" }
[+]
0050_translation_sw_ko:21 100 617 {}
[+]
0050_translation_sw_ko:22 100 640 {}
[+]
0050_translation_sw_ko:23 0 537 { "response": "나무", "expected": "바람" }
[+]
0050_translation_sw_ko:24 100 596 {}
[+]
0050_translation_sw_ko:25 0 412 { "response": "dust", "expected": "돌" }
[+]
0050_translation_sw_ko:26 0 636 { "response": "새", "expected": "깊은" }
[+]
0050_translation_sw_ko:27 0 549 { "response": "산", "expected": "수영하다" }
[+]
0050_translation_sw_ko:28 100 639 {}
[+]
0050_translation_sw_ko:29 0 675 { "response": "운전하다", "expected": "달콤한" }
[+]
0050_translation_sw_ko:3 100 579 {}
[+]
0050_translation_sw_ko:30 0 663 { "response": "수영하다", "expected": "구름" }
[+]
0050_translation_sw_ko:31 0 673 { "response": "비", "expected": "미소짓다" }
[+]
0050_translation_sw_ko:32 0 556 { "response": "朋友", "expected": "부드러운" }
[+]
0050_translation_sw_ko:33 100 567 {}
[+]
0050_translation_sw_ko:34 0 683 { "response": "비", "expected": "자라다" }
[+]
0050_translation_sw_ko:35 0 1146 { "response": " 快速하게走다", "expected": "빠른" }
[+]
0050_translation_sw_ko:36 100 603 {}
[+]
0050_translation_sw_ko:37 0 750 { "response": "ダンスする", "expected": "춤추다" }
[+]
0050_translation_sw_ko:38 0 721 { "response": "dumebi", "expected": "무거운" }
[+]
0050_translation_sw_ko:39 0 599 { "response": "riding", "expected": "불" }
[+]
0050_translation_sw_ko:4 0 440 { "response": "drive", "expected": "먹다" }
[+]
0050_translation_sw_ko:40 0 603 { "response": "san", "expected": "숨쉬다" }
[+]
0050_translation_sw_ko:41 0 591 { "response": "산", "expected": "날카로운" }
[+]
0050_translation_sw_ko:42 0 676 { "response": "수영하다", "expected": "소금" }
[+]
0050_translation_sw_ko:43 0 640 { "response": "book", "expected": "숨다" }
[+]
0050_translation_sw_ko:44 0 683 { "response": "소금", "expected": "매끄러운" }
[+]
0050_translation_sw_ko:45 0 758 { "response": "달콤한", "expected": "잔디" }
[+]
0050_translation_sw_ko:46 0 841 { "response": "가벼운", "expected": "날다" }
[+]
0050_translation_sw_ko:47 0 751 { "response": "cold", "expected": "추운" }
[+]
0050_translation_sw_ko:48 0 789 { "response": "책", "expected": "모래" }
[+]
0050_translation_sw_ko:49 0 790 { "response": "웃다", "expected": "떨어지다" }
[+]
0050_translation_sw_ko:5 0 538 { "response": "따뜻한", "expected": "아름다운" }
[+]
0050_translation_sw_ko:50 0 682 { "response": "산", "expected": "가벼운" }
[+]
0050_translation_sw_ko:6 100 464 {}
[+]
0050_translation_sw_ko:7 100 479 {}
[+]
0050_translation_sw_ko:8 100 470 {}
[+]
0050_translation_sw_ko:9 0 548 { "response": "매끄러운", "expected": "웃다" }
[+]