File size: 5,775 Bytes
50ad069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
[
    {
        "id": "polyphone_polyphone5",
        "input_path": "/input/polyphone/polyphone5.wav",
        "text": "Is there anything wrong with my pronunciation in the following sentence?: 'I will live (/lɪv/) to see the live (/lɪv/) performance tomorrow night.'",
        "task": "Polyphonic word comprehension",
        "task_description": "Can the model accurately understand polyphonic word?",
        "output_path_4o": "/output/ChatGPT-4o/polyphone/polyphone5/polyphone5.wav",
        "output_path_miniomni": "/output/Mini-Omni/polyphone/00.wav",
        "output_path_speechgpt": "/output/SpeechGPT/polyphone/polyphone5.wav",
        "output_path_funaudio": "/output/FunAudioLLM/polyphone/audio_4.wav",
        "text_cn": "以下句子中我的发音有问题吗?:我将活着观看明晚的现场表演。",
        "language": "English",
        "category": "Education",
        "output_path_4o_cascade": "/output/cascade/polyphone/polyphone5.wav",
        "output_path_4o_llama_omni": "/output/LLaMA_omni/polyphone/polyphone5.wav",
        "level": "L1"
    },
    {
        "id": "polyphone_polyphone6",
        "input_path": "/input/polyphone/polyphone6.wav",
        "text": "Is there anything wrong with my pronunciation in the following sentence?: 'Try not to tear (/tɪər/) the paper, or it may bring a tear (/tɛər/) to your eye.'",
        "task": "Polyphonic word comprehension",
        "task_description": "Can the model accurately understand polyphonic word?",
        "output_path_4o": "/output/ChatGPT-4o/polyphone/polyphone6/polyphone6.wav",
        "output_path_miniomni": "/output/Mini-Omni/polyphone/01.wav",
        "output_path_speechgpt": "/output/SpeechGPT/polyphone/polyphone6.wav",
        "output_path_funaudio": "/output/FunAudioLLM/polyphone/audio_5.wav",
        "text_cn": "以下句子中我的发音有问题吗?:尽量不要撕纸张,否则可能会让你的眼睛流泪。",
        "language": "English",
        "category": "Education",
        "output_path_4o_cascade": "/output/cascade/polyphone/polyphone6.wav",
        "output_path_4o_llama_omni": "/output/LLaMA_omni/polyphone/polyphone6.wav",
        "level": "L1"
    },
    {
        "id": "polyphone_audio_0",
        "input_path": "/input/polyphone/audio_0.mp3",
        "text": "下面这句话是什么意思:“我们要给行长送行。”",
        "task": "Polyphonic word comprehension",
        "task_description": "Can the model accurately understand polyphonic word?",
        "output_path_4o": "/output/ChatGPT-4o/polyphone/audio_0/audio_0.wav",
        "output_path_miniomni": "/output/Mini-Omni/polyphone/02.wav",
        "output_path_speechgpt": "/output/SpeechGPT/polyphone/audio_0.wav",
        "output_path_funaudio": "/output/FunAudioLLM/polyphone/audio_0.wav",
        "language": "Chinese",
        "category": "Education",
        "output_path_4o_cascade": "/output/cascade/polyphone/audio_0.wav",
        "output_path_4o_llama_omni": "/output/LLaMA_omni/polyphone/audio_0.wav",
        "level": "L1"
    },
    {
        "id": "polyphone_audio_1",
        "input_path": "/input/polyphone/audio_1.mp3",
        "text": "下面这句话是什么意思:“他没参加校园活动,也没参加校正发音的活动。”",
        "task": "Polyphonic word comprehension",
        "task_description": "Can the model accurately understand polyphonic word?",
        "output_path_4o": "/output/ChatGPT-4o/polyphone/audio_1/audio_1.wav",
        "output_path_miniomni": "/output/Mini-Omni/polyphone/03.wav",
        "output_path_speechgpt": "/output/SpeechGPT/polyphone/audio_1.wav",
        "output_path_funaudio": "/output/FunAudioLLM/polyphone/audio_1.wav",
        "language": "Chinese",
        "category": "Education",
        "output_path_4o_cascade": "/output/cascade/polyphone/audio_1.wav",
        "output_path_4o_llama_omni": "/output/LLaMA_omni/polyphone/audio_1.wav",
        "level": "L1"
    },
    {
        "id": "polyphone_audio_2",
        "input_path": "/input/polyphone/audio_2.mp3",
        "text": "下面这句话我的读音有误吗?“这个掌(长)期计划非常重要,而他的长乏(发)也很特别。”",
        "task": "Polyphonic word comprehension",
        "task_description": "Can the model accurately understand polyphonic word?",
        "output_path_4o": "/output/ChatGPT-4o/polyphone/audio_2/audio_2.wav",
        "output_path_miniomni": "/output/Mini-Omni/polyphone/04.wav",
        "output_path_speechgpt": "/output/SpeechGPT/polyphone/audio_2.wav",
        "output_path_funaudio": "/output/FunAudioLLM/polyphone/audio_2.wav",
        "language": "Chinese",
        "category": "Education",
        "output_path_4o_cascade": "/output/cascade/polyphone/audio_2.wav",
        "output_path_4o_llama_omni": "/output/LLaMA_omni/polyphone/audio_2.wav",
        "level": "L1"
    },
    {
        "id": "polyphone_audio_3",
        "input_path": "/input/polyphone/audio_3.mp3",
        "text": "纠正我下面这句话的发音:“今天的月(乐)趣很多,我特别喜欢那首乐曲。”",
        "task": "Polyphonic word comprehension",
        "task_description": "Can the model accurately understand polyphonic word?",
        "output_path_4o": "/output/ChatGPT-4o/polyphone/audio_3/audio_3.wav",
        "output_path_miniomni": "/output/Mini-Omni/polyphone/05.wav",
        "output_path_speechgpt": "/output/SpeechGPT/polyphone/audio_3.wav",
        "output_path_funaudio": "/output/FunAudioLLM/polyphone/audio_3.wav",
        "language": "Chinese",
        "category": "Education",
        "output_path_4o_cascade": "/output/cascade/polyphone/audio_3.wav",
        "output_path_4o_llama_omni": "/output/LLaMA_omni/polyphone/audio_3.wav",
        "level": "L1"
    }
]