File size: 7,274 Bytes
50ad069 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 |
[
{
"id": "crosstalk_audio_0",
"input_path": "/input/crosstalk/audio_0.mp3",
"text": "请说一段经典的相声,题材可以是关于医生和病人的趣事。",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_0/audio_0.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/00.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_0.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_0.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_0.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_0.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_1",
"input_path": "/input/crosstalk/audio_1.mp3",
"text": "你来扮演捧哏,我说:“这家店的老板怎么这么小气?”,你怎么接话?",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_1/audio_1.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/01.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_1.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_1.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_1.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_1.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_2",
"input_path": "/input/crosstalk/audio_2.mp3",
"text": "现在你来扮演逗哏角色,想象我是捧哏,我说:“今天的天气真不错啊!”,你该怎么接下去?",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_2/audio_2.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/02.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_2.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_2.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_2.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_2.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_3",
"input_path": "/input/crosstalk/audio_3.mp3",
"text": "讲一段融合现代元素(比如互联网语言)的相声,内容关于在网上购物的经历。",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_3/audio_3.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/03.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_3.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_3.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_3.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_3.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_4",
"input_path": "/input/crosstalk/audio_4.mp3",
"text": "我会说出一个情景,你作为相声演员要即兴发挥,继续扩展故事。情景是:在火车站不小心丢了票。",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_4/audio_4.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/04.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_4.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_4.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_4.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_4.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_5",
"input_path": "/input/crosstalk/audio_5.mp3",
"text": "试着讲一段涉及中西文化差异的相声,比如中国的春节与西方的圣诞节的对比。",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_5/audio_5.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/05.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_5.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_5.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_5.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_5.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_6",
"input_path": "/input/crosstalk/audio_6.mp3",
"text": "模仿郭德纲的风格,说一段关于“互联网生活”的相声。",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_6/audio_6.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/06.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_6.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_6.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_6.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_6.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_7",
"input_path": "/input/crosstalk/audio_7.mp3",
"text": "通过相声风格来解释一下:“为什么学习编程这么难?”",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_7/audio_7.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/07.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_7.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_7.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_7.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_7.wav",
"level": "L2"
}
] |