S2S_Evaluation / data /crosstalk.json
KurtDu's picture
Upload 21 files
50ad069 verified
raw
history blame
7.27 kB
[
{
"id": "crosstalk_audio_0",
"input_path": "/input/crosstalk/audio_0.mp3",
"text": "请说一段经典的相声,题材可以是关于医生和病人的趣事。",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_0/audio_0.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/00.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_0.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_0.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_0.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_0.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_1",
"input_path": "/input/crosstalk/audio_1.mp3",
"text": "你来扮演捧哏,我说:“这家店的老板怎么这么小气?”,你怎么接话?",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_1/audio_1.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/01.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_1.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_1.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_1.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_1.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_2",
"input_path": "/input/crosstalk/audio_2.mp3",
"text": "现在你来扮演逗哏角色,想象我是捧哏,我说:“今天的天气真不错啊!”,你该怎么接下去?",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_2/audio_2.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/02.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_2.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_2.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_2.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_2.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_3",
"input_path": "/input/crosstalk/audio_3.mp3",
"text": "讲一段融合现代元素(比如互联网语言)的相声,内容关于在网上购物的经历。",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_3/audio_3.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/03.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_3.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_3.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_3.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_3.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_4",
"input_path": "/input/crosstalk/audio_4.mp3",
"text": "我会说出一个情景,你作为相声演员要即兴发挥,继续扩展故事。情景是:在火车站不小心丢了票。",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_4/audio_4.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/04.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_4.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_4.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_4.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_4.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_5",
"input_path": "/input/crosstalk/audio_5.mp3",
"text": "试着讲一段涉及中西文化差异的相声,比如中国的春节与西方的圣诞节的对比。",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_5/audio_5.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/05.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_5.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_5.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_5.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_5.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_6",
"input_path": "/input/crosstalk/audio_6.mp3",
"text": "模仿郭德纲的风格,说一段关于“互联网生活”的相声。",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_6/audio_6.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/06.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_6.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_6.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_6.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_6.wav",
"level": "L2"
},
{
"id": "crosstalk_audio_7",
"input_path": "/input/crosstalk/audio_7.mp3",
"text": "通过相声风格来解释一下:“为什么学习编程这么难?”",
"task": "Crosstalk ability",
"task_description": "Can the model perform a skit, playing both roles in a comedic dialogue?",
"output_path_4o": "/output/ChatGPT-4o/crosstalk/audio_7/audio_7.wav",
"output_path_miniomni": "/output/Mini-Omni/crosstalk/07.wav",
"output_path_speechgpt": "/output/SpeechGPT/crosstalk/answer_7.wav",
"output_path_funaudio": "/output/FunAudioLLM/crosstalk/audio_7.wav",
"language": "Chinese",
"category": "Entertainment",
"output_path_4o_cascade": "/output/cascade/crosstalk/audio_7.wav",
"output_path_4o_llama_omni": "/output/LLaMA_omni/crosstalk/audio_7.wav",
"level": "L2"
}
]