Benchmark Run Details

System Prompt

You are helping with a language translation task.
When translating a word from SW to KO:
- Provide the most direct and common translation
- Give only the base form of the word
- Do not include articles unless they are part of the standard translation
- Do not provide explanations or alternative translations

Run Summary

Model gpt-4.1-mini-2025-04-14
Benchmark 0050_translation_sw_ko
Normed Score 80
Run Timestamp 2025-04-24 18:08:20

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0050_translation_sw_ko:0 0 584 { "response": "비", "expected": "꽃", "is_correct": false }
[+]
0050_translation_sw_ko:1 100 614 { "response": "운전하다", "expected": "운전하다", "is_correct": true }
[+]
0050_translation_sw_ko:10 100 857 { "response": "산", "expected": "산", "is_correct": true }
[+]
0050_translation_sw_ko:11 100 548 { "response": "노래하다", "expected": "노래하다", "is_correct": true }
[+]
0050_translation_sw_ko:12 100 977 { "response": "심장", "expected": "심장", "is_correct": true }
[+]
0050_translation_sw_ko:13 0 482 { "response": "별", "expected": "밝은", "is_correct": false }
[+]
0050_translation_sw_ko:14 100 520 { "response": "춤추다", "expected": "춤추다", "is_correct": true }
[+]
0050_translation_sw_ko:15 0 607 { "response": "화학", "expected": "조용한", "is_correct": false }
[+]
0050_translation_sw_ko:16 100 729 { "response": "나무", "expected": "나무", "is_correct": true }
[+]
0050_translation_sw_ko:17 100 428 { "response": "쓰다", "expected": "쓰다", "is_correct": true }
[+]
0050_translation_sw_ko:18 0 958 { "response": "불", "expected": "하늘", "is_correct": false }
[+]
0050_translation_sw_ko:19 100 984 { "response": "신선한", "expected": "신선한", "is_correct": true }
[+]
0050_translation_sw_ko:2 100 616 { "response": "가장 강한", "expected": "가장 강한", "is_correct": true }
[+]
0050_translation_sw_ko:20 100 498 { "response": "친구", "expected": "친구", "is_correct": true }
[+]
0050_translation_sw_ko:21 100 1110 { "response": "달리다", "expected": "달리다", "is_correct": true }
[+]
0050_translation_sw_ko:22 0 1001 { "response": "바람", "expected": "둥근", "is_correct": false }
[+]
0050_translation_sw_ko:23 100 998 { "response": "바람", "expected": "바람", "is_correct": true }
[+]
0050_translation_sw_ko:24 100 663 { "response": "따뜻한", "expected": "따뜻한", "is_correct": true }
[+]
0050_translation_sw_ko:25 100 716 { "response": "돌", "expected": "돌", "is_correct": true }
[+]
0050_translation_sw_ko:26 0 538 { "response": "모래", "expected": "깊은", "is_correct": false }
[+]
0050_translation_sw_ko:27 100 1169 { "response": "수영하다", "expected": "수영하다", "is_correct": true }
[+]
0050_translation_sw_ko:28 100 551 { "response": "새", "expected": "새", "is_correct": true }
[+]
0050_translation_sw_ko:29 100 1126 { "response": "달콤한", "expected": "달콤한", "is_correct": true }
[+]
0050_translation_sw_ko:3 100 1629 { "response": "책", "expected": "책", "is_correct": true }
[+]
0050_translation_sw_ko:30 100 1114 { "response": "구름", "expected": "구름", "is_correct": true }
[+]
0050_translation_sw_ko:31 100 515 { "response": "미소짓다", "expected": "미소짓다", "is_correct": true }
[+]
0050_translation_sw_ko:32 100 1229 { "response": "부드러운", "expected": "부드러운", "is_correct": true }
[+]
0050_translation_sw_ko:33 100 1018 { "response": "비", "expected": "비", "is_correct": true }
[+]
0050_translation_sw_ko:34 100 1223 { "response": "자라다", "expected": "자라다", "is_correct": true }
[+]
0050_translation_sw_ko:35 100 548 { "response": "빠른", "expected": "빠른", "is_correct": true }
[+]
0050_translation_sw_ko:36 100 937 { "response": "별", "expected": "별", "is_correct": true }
[+]
0050_translation_sw_ko:37 100 1068 { "response": "춤추다", "expected": "춤추다", "is_correct": true }
[+]
0050_translation_sw_ko:38 0 1090 { "response": "둥근", "expected": "무거운", "is_correct": false }
[+]
0050_translation_sw_ko:39 0 758 { "response": "산", "expected": "불", "is_correct": false }
[+]
0050_translation_sw_ko:4 0 504 { "response": "소금", "expected": "먹다", "is_correct": false }
[+]
0050_translation_sw_ko:40 100 997 { "response": "숨쉬다", "expected": "숨쉬다", "is_correct": true }
[+]
0050_translation_sw_ko:41 100 1156 { "response": "날카로운", "expected": "날카로운", "is_correct": true }
[+]
0050_translation_sw_ko:42 100 1159 { "response": "소금", "expected": "소금", "is_correct": true }
[+]
0050_translation_sw_ko:43 100 590 { "response": "숨다", "expected": "숨다", "is_correct": true }
[+]
0050_translation_sw_ko:44 100 708 { "response": "매끄러운", "expected": "매끄러운", "is_correct": true }
[+]
0050_translation_sw_ko:45 100 851 { "response": "잔디", "expected": "잔디", "is_correct": true }
[+]
0050_translation_sw_ko:46 100 826 { "response": "날다", "expected": "날다", "is_correct": true }
[+]
0050_translation_sw_ko:47 100 966 { "response": "추운", "expected": "추운", "is_correct": true }
[+]
0050_translation_sw_ko:48 100 1043 { "response": "모래", "expected": "모래", "is_correct": true }
[+]
0050_translation_sw_ko:49 100 1222 { "response": "떨어지다", "expected": "떨어지다", "is_correct": true }
[+]
0050_translation_sw_ko:5 100 550 { "response": "아름다운", "expected": "아름다운", "is_correct": true }
[+]
0050_translation_sw_ko:50 100 770 { "response": "가벼운", "expected": "가벼운", "is_correct": true }
[+]
0050_translation_sw_ko:6 100 596 { "response": "물", "expected": "물", "is_correct": true }
[+]
0050_translation_sw_ko:7 100 540 { "response": "자다", "expected": "자다", "is_correct": true }
[+]
0050_translation_sw_ko:8 100 468 { "response": "달", "expected": "달", "is_correct": true }
[+]
0050_translation_sw_ko:9 0 575 { "response": "운전하다", "expected": "웃다", "is_correct": false }
[+]