Benchmark Run Details

Run Summary

Model gemma3:1b:Q4_K_M
Benchmark 0050_translation_sw_ko
Normed Score 9
Run Timestamp 2025-03-26 20:09:41

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0050_translation_sw_ko:0 0 828 { "response": "가장 강한", "expected": "꽃" }
[+]
0050_translation_sw_ko:1 0 277 { "response": "kuendesha", "expected": "운전하다" }
[+]
0050_translation_sw_ko:10 0 359 { "response": "친구", "expected": "산" }
[+]
0050_translation_sw_ko:11 0 337 { "response": "신선한", "expected": "노래하다" }
[+]
0050_translation_sw_ko:12 0 318 { "response": "춤추다", "expected": "심장" }
[+]
0050_translation_sw_ko:13 0 287 { "response": "별", "expected": "밝은" }
[+]
0050_translation_sw_ko:14 100 298 {}
[+]
0050_translation_sw_ko:15 0 335 { "response": "미소짓다", "expected": "조용한" }
[+]
0050_translation_sw_ko:16 0 314 { "response": "심장", "expected": "나무" }
[+]
0050_translation_sw_ko:17 0 362 { "response": "숨다", "expected": "쓰다" }
[+]
0050_translation_sw_ko:18 0 447 { "response": "바람", "expected": "하늘" }
[+]
0050_translation_sw_ko:19 0 532 { "response": "춤추다", "expected": "신선한" }
[+]
0050_translation_sw_ko:2 0 262 { "response": "மிகவும்", "expected": "가장 강한" }
[+]
0050_translation_sw_ko:20 0 495 { "response": "숨쉬다", "expected": "친구" }
[+]
0050_translation_sw_ko:21 0 438 { "response": "숨쉬다", "expected": "달리다" }
[+]
0050_translation_sw_ko:22 100 365 {}
[+]
0050_translation_sw_ko:23 0 328 { "response": "upepo", "expected": "바람" }
[+]
0050_translation_sw_ko:24 0 295 { "response": "심장", "expected": "따뜻한" }
[+]
0050_translation_sw_ko:25 100 316 {}
[+]
0050_translation_sw_ko:26 0 345 { "response": "돌", "expected": "깊은" }
[+]
0050_translation_sw_ko:27 0 384 { "response": "깊은", "expected": "수영하다" }
[+]
0050_translation_sw_ko:28 0 473 { "response": "신선한", "expected": "새" }
[+]
0050_translation_sw_ko:29 0 640 { "response": "운전하다", "expected": "달콤한" }
[+]
0050_translation_sw_ko:3 100 242 {}
[+]
0050_translation_sw_ko:30 0 478 { "response": "수영하다", "expected": "구름" }
[+]
0050_translation_sw_ko:31 0 429 { "response": "tabasamu", "expected": "미소짓다" }
[+]
0050_translation_sw_ko:32 0 422 { "response": "가장 강한", "expected": "부드러운" }
[+]
0050_translation_sw_ko:33 0 371 { "response": "부드러운", "expected": "비" }
[+]
0050_translation_sw_ko:34 0 313 { "response": "돌", "expected": "자라다" }
[+]
0050_translation_sw_ko:35 0 322 { "response": "춤추다", "expected": "빠른" }
[+]
0050_translation_sw_ko:36 0 295 { "response": "돌", "expected": "별" }
[+]
0050_translation_sw_ko:37 100 403 {}
[+]
0050_translation_sw_ko:38 0 420 { "response": "둥근", "expected": "무거운" }
[+]
0050_translation_sw_ko:39 0 398 { "response": "산", "expected": "불" }
[+]
0050_translation_sw_ko:4 0 301 { "response": "자라다", "expected": "먹다" }
[+]
0050_translation_sw_ko:40 0 470 { "response": "kupumua", "expected": "숨쉬다" }
[+]
0050_translation_sw_ko:41 0 348 { "response": "kali", "expected": "날카로운" }
[+]
0050_translation_sw_ko:42 0 339 { "response": "책", "expected": "소금" }
[+]
0050_translation_sw_ko:43 0 376 { "response": "춤추다", "expected": "숨다" }
[+]
0050_translation_sw_ko:44 0 337 { "response": "laini", "expected": "매끄러운" }
[+]
0050_translation_sw_ko:45 0 349 { "response": "달콤한", "expected": "잔디" }
[+]
0050_translation_sw_ko:46 0 341 { "response": "달", "expected": "날다" }
[+]
0050_translation_sw_ko:47 0 319 { "response": "나무", "expected": "추운" }
[+]
0050_translation_sw_ko:48 0 359 { "response": "가장 강한", "expected": "모래" }
[+]
0050_translation_sw_ko:49 0 362 { "response": "웃다", "expected": "떨어지다" }
[+]
0050_translation_sw_ko:5 0 309 { "response": "따뜻한", "expected": "아름다운" }
[+]
0050_translation_sw_ko:50 0 311 { "response": "나무", "expected": "가벼운" }
[+]
0050_translation_sw_ko:6 0 297 { "response": "무거운", "expected": "물" }
[+]
0050_translation_sw_ko:7 0 360 { "response": "미소짓다", "expected": "자다" }
[+]
0050_translation_sw_ko:8 0 1038 { "response": "물", "expected": "달" }
[+]
0050_translation_sw_ko:9 0 678 { "response": "구름", "expected": "웃다" }
[+]