Benchmark Run Details

System Prompt

You are helping with a language translation task.
When translating a word from SW to KO:
- Provide the most direct and common translation
- Give only the base form of the word
- Do not include articles unless they are part of the standard translation
- Do not provide explanations or alternative translations

Run Summary

Model gpt-4.1-nano-2025-04-14
Benchmark 0050_translation_sw_ko
Normed Score 80
Run Timestamp 2025-04-24 18:07:37

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0050_translation_sw_ko:0 0 379 { "response": "숨다", "expected": "꽃", "is_correct": false }
[+]
0050_translation_sw_ko:1 100 710 { "response": "운전하다", "expected": "운전하다", "is_correct": true }
[+]
0050_translation_sw_ko:10 100 393 { "response": "산", "expected": "산", "is_correct": true }
[+]
0050_translation_sw_ko:11 100 434 { "response": "노래하다", "expected": "노래하다", "is_correct": true }
[+]
0050_translation_sw_ko:12 100 439 { "response": "심장", "expected": "심장", "is_correct": true }
[+]
0050_translation_sw_ko:13 0 416 { "response": "별", "expected": "밝은", "is_correct": false }
[+]
0050_translation_sw_ko:14 100 472 { "response": "춤추다", "expected": "춤추다", "is_correct": true }
[+]
0050_translation_sw_ko:15 100 459 { "response": "조용한", "expected": "조용한", "is_correct": true }
[+]
0050_translation_sw_ko:16 0 529 { "response": "돌", "expected": "나무", "is_correct": false }
[+]
0050_translation_sw_ko:17 100 380 { "response": "쓰다", "expected": "쓰다", "is_correct": true }
[+]
0050_translation_sw_ko:18 0 380 { "response": "바람", "expected": "하늘", "is_correct": false }
[+]
0050_translation_sw_ko:19 100 694 { "response": "신선한", "expected": "신선한", "is_correct": true }
[+]
0050_translation_sw_ko:2 100 418 { "response": "가장 강한", "expected": "가장 강한", "is_correct": true }
[+]
0050_translation_sw_ko:20 100 432 { "response": "친구", "expected": "친구", "is_correct": true }
[+]
0050_translation_sw_ko:21 100 479 { "response": "달리다", "expected": "달리다", "is_correct": true }
[+]
0050_translation_sw_ko:22 100 453 { "response": "둥근", "expected": "둥근", "is_correct": true }
[+]
0050_translation_sw_ko:23 100 391 { "response": "바람", "expected": "바람", "is_correct": true }
[+]
0050_translation_sw_ko:24 0 766 { "response": "심장", "expected": "따뜻한", "is_correct": false }
[+]
0050_translation_sw_ko:25 100 426 { "response": "돌", "expected": "돌", "is_correct": true }
[+]
0050_translation_sw_ko:26 0 463 { "response": "모래", "expected": "깊은", "is_correct": false }
[+]
0050_translation_sw_ko:27 100 547 { "response": "수영하다", "expected": "수영하다", "is_correct": true }
[+]
0050_translation_sw_ko:28 100 426 { "response": "새", "expected": "새", "is_correct": true }
[+]
0050_translation_sw_ko:29 100 492 { "response": "달콤한", "expected": "달콤한", "is_correct": true }
[+]
0050_translation_sw_ko:3 100 399 { "response": "책", "expected": "책", "is_correct": true }
[+]
0050_translation_sw_ko:30 100 422 { "response": "구름", "expected": "구름", "is_correct": true }
[+]
0050_translation_sw_ko:31 100 443 { "response": "미소짓다", "expected": "미소짓다", "is_correct": true }
[+]
0050_translation_sw_ko:32 0 444 { "response": "친구", "expected": "부드러운", "is_correct": false }
[+]
0050_translation_sw_ko:33 100 517 { "response": "비", "expected": "비", "is_correct": true }
[+]
0050_translation_sw_ko:34 100 429 { "response": "자라다", "expected": "자라다", "is_correct": true }
[+]
0050_translation_sw_ko:35 100 1227 { "response": "빠른", "expected": "빠른", "is_correct": true }
[+]
0050_translation_sw_ko:36 100 498 { "response": "별", "expected": "별", "is_correct": true }
[+]
0050_translation_sw_ko:37 100 451 { "response": "춤추다", "expected": "춤추다", "is_correct": true }
[+]
0050_translation_sw_ko:38 0 394 { "response": "잔디", "expected": "무거운", "is_correct": false }
[+]
0050_translation_sw_ko:39 100 484 { "response": "불", "expected": "불", "is_correct": true }
[+]
0050_translation_sw_ko:4 0 416 { "response": "운전하다", "expected": "먹다", "is_correct": false }
[+]
0050_translation_sw_ko:40 100 347 { "response": "숨쉬다", "expected": "숨쉬다", "is_correct": true }
[+]
0050_translation_sw_ko:41 0 474 { "response": "별", "expected": "날카로운", "is_correct": false }
[+]
0050_translation_sw_ko:42 100 404 { "response": "소금", "expected": "소금", "is_correct": true }
[+]
0050_translation_sw_ko:43 100 419 { "response": "숨다", "expected": "숨다", "is_correct": true }
[+]
0050_translation_sw_ko:44 100 485 { "response": "매끄러운", "expected": "매끄러운", "is_correct": true }
[+]
0050_translation_sw_ko:45 100 627 { "response": "잔디", "expected": "잔디", "is_correct": true }
[+]
0050_translation_sw_ko:46 100 404 { "response": "날다", "expected": "날다", "is_correct": true }
[+]
0050_translation_sw_ko:47 100 438 { "response": "추운", "expected": "추운", "is_correct": true }
[+]
0050_translation_sw_ko:48 100 391 { "response": "모래", "expected": "모래", "is_correct": true }
[+]
0050_translation_sw_ko:49 100 410 { "response": "떨어지다", "expected": "떨어지다", "is_correct": true }
[+]
0050_translation_sw_ko:5 100 724 { "response": "아름다운", "expected": "아름다운", "is_correct": true }
[+]
0050_translation_sw_ko:50 100 484 { "response": "가벼운", "expected": "가벼운", "is_correct": true }
[+]
0050_translation_sw_ko:6 100 414 { "response": "물", "expected": "물", "is_correct": true }
[+]
0050_translation_sw_ko:7 100 457 { "response": "자다", "expected": "자다", "is_correct": true }
[+]
0050_translation_sw_ko:8 100 406 { "response": "달", "expected": "달", "is_correct": true }
[+]
0050_translation_sw_ko:9 100 574 { "response": "웃다", "expected": "웃다", "is_correct": true }
[+]