File size: 5,079 Bytes
50ad069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
[
    {
        "id": "story_audio_0",
        "input_path": "/input/story/audio_0.mp3",
        "text": "Tell a sad story, such as the journey of a little kitten being abandoned and later adopted by a kind person.",
        "task": "Storytelling",
        "task_description": "Can the model narrate a story with emotional depth?",
        "output_path_4o": "/output/ChatGPT-4o/story/audio_0/audio_0.wav",
        "output_path_miniomni": "/output/Mini-Omni/story/00.wav",
        "output_path_speechgpt": "/output/SpeechGPT/story/answer_0.wav",
        "output_path_funaudio": "/output/FunAudioLLM/story/audio_0.wav",
        "text_cn": "讲一个悲伤的故事,例如一只小猫被抛弃并后来被一个善良的人收养的旅程。",
        "language": "English",
        "category": "Entertainment",
        "output_path_4o_cascade": "/output/cascade/story/audio_0.wav",
        "output_path_4o_llama_omni": "/output/LLaMA_omni/story/audio_0.wav",
        "level": "L2"
    },
    {
        "id": "story_audio_1",
        "input_path": "/input/story/audio_1.mp3",
        "text": "Begin a mysterious story set in an ancient, abandoned castle.",
        "task": "Storytelling",
        "task_description": "Can the model narrate a story with emotional depth?",
        "output_path_4o": "/output/ChatGPT-4o/story/audio_1/audio_1.wav",
        "output_path_miniomni": "/output/Mini-Omni/story/01.wav",
        "output_path_speechgpt": "/output/SpeechGPT/story/answer_1.wav",
        "output_path_funaudio": "/output/FunAudioLLM/story/audio_1.wav",
        "text_cn": "在一个古老的废弃城堡中开始一个神秘的故事。",
        "language": "English",
        "category": "Entertainment",
        "output_path_4o_cascade": "/output/cascade/story/audio_1.wav",
        "output_path_4o_llama_omni": "/output/LLaMA_omni/story/audio_1.wav",
        "level": "L2"
    },
    {
        "id": "story_audio_2",
        "input_path": "/input/story/audio_2.mp3",
        "text": "Describe a story where a little boy discovers a lost puppy in the snow, detailing their first meeting.",
        "task": "Storytelling",
        "task_description": "Can the model narrate a story with emotional depth?",
        "output_path_4o": "/output/ChatGPT-4o/story/audio_2/audio_2.wav",
        "output_path_miniomni": "/output/Mini-Omni/story/02.wav",
        "output_path_speechgpt": "/output/SpeechGPT/story/answer_2.wav",
        "output_path_funaudio": "/output/FunAudioLLM/story/audio_2.wav",
        "text_cn": "描述一个故事,一个小男孩在雪中发现一只走失的小狗,并详细描述他们的第一次见面。",
        "language": "English",
        "category": "Entertainment",
        "output_path_4o_cascade": "/output/cascade/story/audio_2.wav",
        "output_path_4o_llama_omni": "/output/LLaMA_omni/story/audio_2.wav",
        "level": "L2"
    },
    {
        "id": "story_story0_CopyMachine_1",
        "input_path": "/input/noise/story0_CopyMachine_1.wav",
        "text": "[Add CopyMachine noise]Tell a sad story, such as the journey of a little kitten being abandoned and later adopted by a kind person.",
        "noise":"Add CopyMachine noise",
        "task": "Storytelling",
        "task_description": "Can the model narrate a story with emotional depth?",
        "output_path_4o": "/output/ChatGPT-4o/noise/story0_CopyMachine_1/story0_CopyMachine_1.wav",
        "output_path_miniomni": "/output/Mini-Omni/noise/10.wav",
        "output_path_speechgpt": "/output/SpeechGPT/noise/story0_CopyMachine_1.wav",
        "output_path_funaudio": "/output/FunAudioLLM/noise/audio_10.wav",
        "text_cn": "讲一个悲伤的故事,例如一只小猫被抛弃并后来被一个善良的人收养的旅程。",
        "language": "English",
        "category": "Entertainment",
        "output_path_4o_cascade": "/output/cascade/noise/story0_CopyMachine_1.wav",
        "output_path_4o_llama_omni": "/output/LLaMA_omni/noise/story0_CopyMachine_1.wav",
        "level": "L2"
    },
    {
        "id": "story_story1_CopyMachine_1",
        "input_path": "/input/noise/story1_CopyMachine_1.wav",
        "text": "[Add CopyMachine noise]Begin a mysterious story set in an ancient, abandoned castle.",
        "noise":"Add CopyMachine noise",
        "task": "Storytelling",
        "task_description": "Can the model narrate a story with emotional depth?",
        "output_path_4o": "/output/ChatGPT-4o/noise/story1_CopyMachine_1/story1_CopyMachine_1.wav",
        "output_path_miniomni": "/output/Mini-Omni/noise/11.wav",
        "output_path_speechgpt": "/output/SpeechGPT/noise/story1_CopyMachine_1.wav",
        "output_path_funaudio": "/output/FunAudioLLM/noise/audio_11.wav",
        "text_cn": "在一个古老的废弃城堡中开始一个神秘的故事。",
        "language": "English",
        "category": "Entertainment",
        "output_path_4o_cascade": "/output/cascade/noise/story1_CopyMachine_1.wav",
        "output_path_4o_llama_omni": "/output/LLaMA_omni/noise/story1_CopyMachine_1.wav",
        "level": "L2"
    }
]