Benchmark Run Details

Run Summary

Model phi4:14b:Q4_K_M
Benchmark 0051_pinyin_letters
Normed Score 42
Run Timestamp 2025-04-01 19:08:46

Question-Level Details

Question ID Score Evaluation Time (ms) Debug Info
0051_pinyin_letters:0 100 11007 { "question": "Count how many times the letter 'I' appears in the Pinyin representation of the following Chinese sentence: 我喜欢学习中文", "expected_count": 2, "model_count": 2, "is_correct": true }
[+]
0051_pinyin_letters:1 0 1609 { "question": "Count how many times the letter 'G' appears in the Pinyin representation of the following Chinese sentence: 北京是中国的首都", "expected_count": 3, "model_count": 1, "is_correct": false }
[+]
0051_pinyin_letters:10 0 1614 { "question": "Count how many times the letter 'I' appears in the Pinyin representation of the following Chinese sentence: 你好吗?", "expected_count": 1, "model_count": 2, "is_correct": false }
[+]
0051_pinyin_letters:11 100 1734 { "question": "Count how many times the letter 'C' appears in the Pinyin representation of the following Chinese sentence: 我喜欢吃饭。", "expected_count": 1, "model_count": 1, "is_correct": true }
[+]
0051_pinyin_letters:12 0 1769 { "question": "Count how many times the letter 'I' appears in the Pinyin representation of the following Chinese sentence: 天气很好。", "expected_count": 2, "model_count": 1, "is_correct": false }
[+]
0051_pinyin_letters:13 100 1806 { "question": "Count how many times the letter 'M' appears in the Pinyin representation of the following Chinese sentence: 我叫李明。", "expected_count": 1, "model_count": 1, "is_correct": true }
[+]
0051_pinyin_letters:14 100 1755 { "question": "Count how many times the letter 'E' appears in the Pinyin representation of the following Chinese sentence: 今天很忙。", "expected_count": 1, "model_count": 1, "is_correct": true }
[+]
0051_pinyin_letters:15 100 1668 { "question": "Count how many times the letter 'Q' appears in the Pinyin representation of the following Chinese sentence: 多少钱?", "expected_count": 1, "model_count": 1, "is_correct": true }
[+]
0051_pinyin_letters:16 100 1646 { "question": "Count how many times the letter 'T' appears in the Pinyin representation of the following Chinese sentence: 他去学校了。", "expected_count": 1, "model_count": 1, "is_correct": true }
[+]
0051_pinyin_letters:17 100 1659 { "question": "Count how many times the letter 'S' appears in the Pinyin representation of the following Chinese sentence: 你想喝水吗?", "expected_count": 1, "model_count": 1, "is_correct": true }
[+]
0051_pinyin_letters:18 0 1808 { "question": "Count how many times the letter 'N' appears in the Pinyin representation of the following Chinese sentence: 再见,朋友。", "expected_count": 2, "model_count": 1, "is_correct": false }
[+]
0051_pinyin_letters:2 0 1619 { "question": "Count how many times the letter 'Q' appears in the Pinyin representation of the following Chinese sentence: 今天天气很好", "expected_count": 1, "model_count": 2, "is_correct": false }
[+]
0051_pinyin_letters:3 0 1616 { "question": "Count how many times the letter 'G' appears in the Pinyin representation of the following Chinese sentence: 他的哥哥八岁了", "expected_count": 2, "model_count": 1, "is_correct": false }
[+]
0051_pinyin_letters:4 0 1690 { "question": "Count how many times the letter 'A' appears in the Pinyin representation of the following Chinese sentence: 我们一起去公园吧", "expected_count": 2, "model_count": 1, "is_correct": false }
[+]
0051_pinyin_letters:5 0 1662 { "question": "Count how many times the letter 'U' appears in the Pinyin representation of the following Chinese sentence: 这本书非常有趣", "expected_count": 3, "model_count": 1, "is_correct": false }
[+]
0051_pinyin_letters:6 0 1609 { "question": "Count how many times the letter 'I' appears in the Pinyin representation of the following Chinese sentence: 你明天有什么计划", "expected_count": 4, "model_count": 1, "is_correct": false }
[+]
0051_pinyin_letters:7 0 2055 { "question": "Count how many times the letter 'S' appears in the Pinyin representation of the following Chinese sentence: 我的猫喜欢睡觉", "expected_count": 1, "model_count": 2, "is_correct": false }
[+]
0051_pinyin_letters:8 0 1639 { "question": "Count how many times the letter 'U' appears in the Pinyin representation of the following Chinese sentence: 中国有很长的历史", "expected_count": 2, "model_count": 3, "is_correct": false }
[+]
0051_pinyin_letters:9 100 1619 { "question": "Count how many times the letter 'E' appears in the Pinyin representation of the following Chinese sentence: 昨天我去了图书馆", "expected_count": 1, "model_count": 1, "is_correct": true }
[+]