Benchmark Run Details

Run Summary

Model qwen2.5:1.5b:Q4_K_M
Benchmark 0050_translation_sw_ko
Normed Score 19
Run Timestamp 2025-03-26 20:10:43

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0050_translation_sw_ko:0 0 1099 { "response": "비", "expected": "꽃" }
[+]
0050_translation_sw_ko:1 0 266 { "response": "따뜻한", "expected": "운전하다" }
[+]
0050_translation_sw_ko:10 100 332 {}
[+]
0050_translation_sw_ko:11 0 499 { "response": "책", "expected": "노래하다" }
[+]
0050_translation_sw_ko:12 100 768 {}
[+]
0050_translation_sw_ko:13 0 449 { "response": "별", "expected": "밝은" }
[+]
0050_translation_sw_ko:14 0 383 { "response": "친구", "expected": "춤추다" }
[+]
0050_translation_sw_ko:15 0 340 { "response": "kimya", "expected": "조용한" }
[+]
0050_translation_sw_ko:16 0 326 { "response": "소금", "expected": "나무" }
[+]
0050_translation_sw_ko:17 0 329 { "response": "추운", "expected": "쓰다" }
[+]
0050_translation_sw_ko:18 0 324 { "response": "바람", "expected": "하늘" }
[+]
0050_translation_sw_ko:19 0 319 { "response": "물", "expected": "신선한" }
[+]
0050_translation_sw_ko:2 0 263 { "response": "심장", "expected": "가장 강한" }
[+]
0050_translation_sw_ko:20 0 388 { "response": "수영하다", "expected": "친구" }
[+]
0050_translation_sw_ko:21 0 339 { "response": "꽃", "expected": "달리다" }
[+]
0050_translation_sw_ko:22 0 488 { "response": "매끄러운", "expected": "둥근" }
[+]
0050_translation_sw_ko:23 0 1087 { "response": "모래", "expected": "바람" }
[+]
0050_translation_sw_ko:24 0 694 { "response": "달콤한", "expected": "따뜻한" }
[+]
0050_translation_sw_ko:25 0 404 { "response": "책", "expected": "돌" }
[+]
0050_translation_sw_ko:26 0 330 { "response": "새", "expected": "깊은" }
[+]
0050_translation_sw_ko:27 0 311 { "response": "깊은", "expected": "수영하다" }
[+]
0050_translation_sw_ko:28 100 278 {}
[+]
0050_translation_sw_ko:29 100 293 {}
[+]
0050_translation_sw_ko:3 100 243 {}
[+]
0050_translation_sw_ko:30 100 309 {}
[+]
0050_translation_sw_ko:31 0 337 { "response": "밝은", "expected": "미소짓다" }
[+]
0050_translation_sw_ko:32 0 370 { "response": "친구", "expected": "부드러운" }
[+]
0050_translation_sw_ko:33 0 419 { "response": "부드러운", "expected": "비" }
[+]
0050_translation_sw_ko:34 0 345 { "response": "돌", "expected": "자라다" }
[+]
0050_translation_sw_ko:35 0 427 { "response": "춤추다", "expected": "빠른" }
[+]
0050_translation_sw_ko:36 100 404 {}
[+]
0050_translation_sw_ko:37 100 470 {}
[+]
0050_translation_sw_ko:38 0 457 { "response": "소리", "expected": "무거운" }
[+]
0050_translation_sw_ko:39 0 448 { "response": "춤추다", "expected": "불" }
[+]
0050_translation_sw_ko:4 0 289 { "response": "달리다", "expected": "먹다" }
[+]
0050_translation_sw_ko:40 0 473 { "response": "달콤한", "expected": "숨쉬다" }
[+]
0050_translation_sw_ko:41 0 336 { "response": "물", "expected": "날카로운" }
[+]
0050_translation_sw_ko:42 0 417 { "response": "수영하다", "expected": "소금" }
[+]
0050_translation_sw_ko:43 0 401 { "response": "자다", "expected": "숨다" }
[+]
0050_translation_sw_ko:44 0 403 { "response": "소금", "expected": "매끄러운" }
[+]
0050_translation_sw_ko:45 0 399 { "response": "달", "expected": "잔디" }
[+]
0050_translation_sw_ko:46 0 364 { "response": "달", "expected": "날다" }
[+]
0050_translation_sw_ko:47 0 395 { "response": "달콤한", "expected": "추운" }
[+]
0050_translation_sw_ko:48 0 370 { "response": "장마", "expected": "모래" }
[+]
0050_translation_sw_ko:49 0 332 { "response": "웃다", "expected": "떨어지다" }
[+]
0050_translation_sw_ko:5 0 274 { "response": "먹다", "expected": "아름다운" }
[+]
0050_translation_sw_ko:50 0 301 { "response": "새", "expected": "가벼운" }
[+]
0050_translation_sw_ko:6 100 260 {}
[+]
0050_translation_sw_ko:7 0 256 { "response": "돌", "expected": "자다" }
[+]
0050_translation_sw_ko:8 100 252 {}
[+]
0050_translation_sw_ko:9 0 284 { "response": "구름", "expected": "웃다" }
[+]