Spaces:
Runtime error
Runtime error
zdxiaoda
committed on
Commit
•
35b318d
1
Parent(s):
f3367c4
update
Browse files- models/Mona/G_GenshinMona.pth +3 -0
- models/Mona/config.json +67 -0
- models/Trump/G_18500.pth +3 -0
- models/Trump/config.json +62 -0
- models/alice/G_alice.pth +3 -0
- models/alice/config.json +62 -0
- models/alice/cover.png +0 -0
- models/sora_mix/config.json +1 -1
- models/sora_speak/config.json +1 -1
- models/teio/G_teio.pth +3 -0
- models/teio/config.json +62 -0
- models/teio/cover.png +0 -0
- models/sora_speak/kmeans_10000.pt → so-vits-svc/pretrain/nsf_hifigan/nsf_hifigan.ckpt +2 -2
- so-vits-svc/sovits4_for_colab.ipynb +0 -0
- so-vits-svc/webUI.py +1 -1
models/Mona/G_GenshinMona.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2788326783fd64037b666680828969b40a3d86435f9d78d45c96708bcaa3c2b2
|
3 |
+
size 542789469
|
models/Mona/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"train": {
|
3 |
+
"log_interval": 200,
|
4 |
+
"eval_interval": 800,
|
5 |
+
"seed": 1234,
|
6 |
+
"epochs": 10000,
|
7 |
+
"learning_rate": 0.0001,
|
8 |
+
"betas": [0.8, 0.99],
|
9 |
+
"eps": 1e-9,
|
10 |
+
"batch_size": 16,
|
11 |
+
"fp16_run": false,
|
12 |
+
"bf16_run": false,
|
13 |
+
"lr_decay": 0.999875,
|
14 |
+
"segment_size": 10240,
|
15 |
+
"init_lr_ratio": 1,
|
16 |
+
"warmup_epochs": 0,
|
17 |
+
"c_mel": 45,
|
18 |
+
"c_kl": 1.0,
|
19 |
+
"use_sr": true,
|
20 |
+
"max_speclen": 512,
|
21 |
+
"port": "8001",
|
22 |
+
"keep_ckpts": 3,
|
23 |
+
"num_workers": 4,
|
24 |
+
"log_version": 0,
|
25 |
+
"ckpt_name_by_step": false,
|
26 |
+
"accumulate_grad_batches": 1
|
27 |
+
},
|
28 |
+
"data": {
|
29 |
+
"training_files": "filelists/44k/train.txt",
|
30 |
+
"validation_files": "filelists/44k/val.txt",
|
31 |
+
"max_wav_value": 32768.0,
|
32 |
+
"sampling_rate": 44100,
|
33 |
+
"filter_length": 2048,
|
34 |
+
"hop_length": 512,
|
35 |
+
"win_length": 2048,
|
36 |
+
"n_mel_channels": 80,
|
37 |
+
"mel_fmin": 0.0,
|
38 |
+
"mel_fmax": 22050
|
39 |
+
},
|
40 |
+
"model": {
|
41 |
+
"inter_channels": 192,
|
42 |
+
"hidden_channels": 192,
|
43 |
+
"filter_channels": 768,
|
44 |
+
"n_heads": 2,
|
45 |
+
"n_layers": 6,
|
46 |
+
"kernel_size": 3,
|
47 |
+
"p_dropout": 0.1,
|
48 |
+
"resblock": "1",
|
49 |
+
"resblock_kernel_sizes": [3, 7, 11],
|
50 |
+
"resblock_dilation_sizes": [
|
51 |
+
[1, 3, 5],
|
52 |
+
[1, 3, 5],
|
53 |
+
[1, 3, 5]
|
54 |
+
],
|
55 |
+
"upsample_rates": [8, 8, 2, 2, 2],
|
56 |
+
"upsample_initial_channel": 512,
|
57 |
+
"upsample_kernel_sizes": [16, 16, 4, 4, 4],
|
58 |
+
"n_layers_q": 3,
|
59 |
+
"use_spectral_norm": false,
|
60 |
+
"gin_channels": 256,
|
61 |
+
"ssl_dim": 256,
|
62 |
+
"n_speakers": 200
|
63 |
+
},
|
64 |
+
"spk": {
|
65 |
+
"Genshin_Mona_莫娜": 0
|
66 |
+
}
|
67 |
+
}
|
models/Trump/G_18500.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:059b1dc76e356fc5d9d0374d200fd459804ad74957d25ad0dc01be24cb94cbc0
|
3 |
+
size 542789469
|
models/Trump/config.json
ADDED
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"train": {
|
3 |
+
"log_interval": 100,
|
4 |
+
"eval_interval": 500,
|
5 |
+
"seed": 1234,
|
6 |
+
"epochs": 10001,
|
7 |
+
"learning_rate": 0.0001,
|
8 |
+
"betas": [0.8, 0.99],
|
9 |
+
"eps": 1e-9,
|
10 |
+
"batch_size": 6,
|
11 |
+
"fp16_run": false,
|
12 |
+
"lr_decay": 0.999875,
|
13 |
+
"segment_size": 10240,
|
14 |
+
"init_lr_ratio": 1,
|
15 |
+
"warmup_epochs": 0,
|
16 |
+
"c_mel": 45,
|
17 |
+
"c_kl": 1.0,
|
18 |
+
"use_sr": true,
|
19 |
+
"max_speclen": 512,
|
20 |
+
"port": "8001",
|
21 |
+
"keep_ckpts": 3
|
22 |
+
},
|
23 |
+
"data": {
|
24 |
+
"training_files": "filelists/44k/train.txt",
|
25 |
+
"validation_files": "filelists/44k/val.txt",
|
26 |
+
"max_wav_value": 32768.0,
|
27 |
+
"sampling_rate": 44100,
|
28 |
+
"filter_length": 2048,
|
29 |
+
"hop_length": 512,
|
30 |
+
"win_length": 2048,
|
31 |
+
"n_mel_channels": 80,
|
32 |
+
"mel_fmin": 0.0,
|
33 |
+
"mel_fmax": 22050
|
34 |
+
},
|
35 |
+
"model": {
|
36 |
+
"inter_channels": 192,
|
37 |
+
"hidden_channels": 192,
|
38 |
+
"filter_channels": 768,
|
39 |
+
"n_heads": 2,
|
40 |
+
"n_layers": 6,
|
41 |
+
"kernel_size": 3,
|
42 |
+
"p_dropout": 0.1,
|
43 |
+
"resblock": "1",
|
44 |
+
"resblock_kernel_sizes": [3, 7, 11],
|
45 |
+
"resblock_dilation_sizes": [
|
46 |
+
[1, 3, 5],
|
47 |
+
[1, 3, 5],
|
48 |
+
[1, 3, 5]
|
49 |
+
],
|
50 |
+
"upsample_rates": [8, 8, 2, 2, 2],
|
51 |
+
"upsample_initial_channel": 512,
|
52 |
+
"upsample_kernel_sizes": [16, 16, 4, 4, 4],
|
53 |
+
"n_layers_q": 3,
|
54 |
+
"use_spectral_norm": false,
|
55 |
+
"gin_channels": 256,
|
56 |
+
"ssl_dim": 256,
|
57 |
+
"n_speakers": 200
|
58 |
+
},
|
59 |
+
"spk": {
|
60 |
+
"Trump_唐纳德·特朗普": 0
|
61 |
+
}
|
62 |
+
}
|
models/alice/G_alice.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d1bef76e26beeadcae5f716cc0b60abb2aac4aae1316cac709cc439726cf533
|
3 |
+
size 180883747
|
models/alice/config.json
ADDED
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"train": {
|
3 |
+
"log_interval": 200,
|
4 |
+
"eval_interval": 800,
|
5 |
+
"seed": 1234,
|
6 |
+
"epochs": 10000,
|
7 |
+
"learning_rate": 0.0001,
|
8 |
+
"betas": [0.8, 0.99],
|
9 |
+
"eps": 1e-9,
|
10 |
+
"batch_size": 32,
|
11 |
+
"fp16_run": false,
|
12 |
+
"lr_decay": 0.999875,
|
13 |
+
"segment_size": 10240,
|
14 |
+
"init_lr_ratio": 1,
|
15 |
+
"warmup_epochs": 0,
|
16 |
+
"c_mel": 45,
|
17 |
+
"c_kl": 1.0,
|
18 |
+
"use_sr": true,
|
19 |
+
"max_speclen": 512,
|
20 |
+
"port": "8001",
|
21 |
+
"keep_ckpts": 99
|
22 |
+
},
|
23 |
+
"data": {
|
24 |
+
"training_files": "filelists/train.txt",
|
25 |
+
"validation_files": "filelists/val.txt",
|
26 |
+
"max_wav_value": 32768.0,
|
27 |
+
"sampling_rate": 44100,
|
28 |
+
"filter_length": 2048,
|
29 |
+
"hop_length": 512,
|
30 |
+
"win_length": 2048,
|
31 |
+
"n_mel_channels": 80,
|
32 |
+
"mel_fmin": 0.0,
|
33 |
+
"mel_fmax": 22050
|
34 |
+
},
|
35 |
+
"model": {
|
36 |
+
"inter_channels": 192,
|
37 |
+
"hidden_channels": 192,
|
38 |
+
"filter_channels": 768,
|
39 |
+
"n_heads": 2,
|
40 |
+
"n_layers": 6,
|
41 |
+
"kernel_size": 3,
|
42 |
+
"p_dropout": 0.1,
|
43 |
+
"resblock": "1",
|
44 |
+
"resblock_kernel_sizes": [3, 7, 11],
|
45 |
+
"resblock_dilation_sizes": [
|
46 |
+
[1, 3, 5],
|
47 |
+
[1, 3, 5],
|
48 |
+
[1, 3, 5]
|
49 |
+
],
|
50 |
+
"upsample_rates": [8, 8, 2, 2, 2],
|
51 |
+
"upsample_initial_channel": 512,
|
52 |
+
"upsample_kernel_sizes": [16, 16, 4, 4, 4],
|
53 |
+
"n_layers_q": 3,
|
54 |
+
"use_spectral_norm": false,
|
55 |
+
"gin_channels": 256,
|
56 |
+
"ssl_dim": 256,
|
57 |
+
"n_speakers": 200
|
58 |
+
},
|
59 |
+
"spk": {
|
60 |
+
"Blue_Archive_Tendou_Arisu_天童爱丽丝": 0
|
61 |
+
}
|
62 |
+
}
|
models/alice/cover.png
ADDED
models/sora_mix/config.json
CHANGED
@@ -58,6 +58,6 @@
|
|
58 |
"n_speakers": 1
|
59 |
},
|
60 |
"spk": {
|
61 |
-
"
|
62 |
}
|
63 |
}
|
|
|
58 |
"n_speakers": 1
|
59 |
},
|
60 |
"spk": {
|
61 |
+
"缘之空_SoraKasugano_Sora_春日野穹_mix": 0
|
62 |
}
|
63 |
}
|
models/sora_speak/config.json
CHANGED
@@ -58,6 +58,6 @@
|
|
58 |
"n_speakers": 1
|
59 |
},
|
60 |
"spk": {
|
61 |
-
"
|
62 |
}
|
63 |
}
|
|
|
58 |
"n_speakers": 1
|
59 |
},
|
60 |
"spk": {
|
61 |
+
"缘之空_SoraKasugano_Sora_春日野穹_speak": 0
|
62 |
}
|
63 |
}
|
models/teio/G_teio.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:305cbd8bc9bc468f2744d0fc425d1c7363a6232140728d403e90486dc2921160
|
3 |
+
size 180883747
|
models/teio/config.json
ADDED
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"train": {
|
3 |
+
"log_interval": 200,
|
4 |
+
"eval_interval": 800,
|
5 |
+
"seed": 1234,
|
6 |
+
"epochs": 10000,
|
7 |
+
"learning_rate": 0.0001,
|
8 |
+
"betas": [0.8, 0.99],
|
9 |
+
"eps": 1e-9,
|
10 |
+
"batch_size": 32,
|
11 |
+
"fp16_run": false,
|
12 |
+
"lr_decay": 0.999875,
|
13 |
+
"segment_size": 10240,
|
14 |
+
"init_lr_ratio": 1,
|
15 |
+
"warmup_epochs": 0,
|
16 |
+
"c_mel": 45,
|
17 |
+
"c_kl": 1.0,
|
18 |
+
"use_sr": true,
|
19 |
+
"max_speclen": 512,
|
20 |
+
"port": "8001",
|
21 |
+
"keep_ckpts": 99
|
22 |
+
},
|
23 |
+
"data": {
|
24 |
+
"training_files": "filelists/train.txt",
|
25 |
+
"validation_files": "filelists/val.txt",
|
26 |
+
"max_wav_value": 32768.0,
|
27 |
+
"sampling_rate": 44100,
|
28 |
+
"filter_length": 2048,
|
29 |
+
"hop_length": 512,
|
30 |
+
"win_length": 2048,
|
31 |
+
"n_mel_channels": 80,
|
32 |
+
"mel_fmin": 0.0,
|
33 |
+
"mel_fmax": 22050
|
34 |
+
},
|
35 |
+
"model": {
|
36 |
+
"inter_channels": 192,
|
37 |
+
"hidden_channels": 192,
|
38 |
+
"filter_channels": 768,
|
39 |
+
"n_heads": 2,
|
40 |
+
"n_layers": 6,
|
41 |
+
"kernel_size": 3,
|
42 |
+
"p_dropout": 0.1,
|
43 |
+
"resblock": "1",
|
44 |
+
"resblock_kernel_sizes": [3, 7, 11],
|
45 |
+
"resblock_dilation_sizes": [
|
46 |
+
[1, 3, 5],
|
47 |
+
[1, 3, 5],
|
48 |
+
[1, 3, 5]
|
49 |
+
],
|
50 |
+
"upsample_rates": [8, 8, 2, 2, 2],
|
51 |
+
"upsample_initial_channel": 512,
|
52 |
+
"upsample_kernel_sizes": [16, 16, 4, 4, 4],
|
53 |
+
"n_layers_q": 3,
|
54 |
+
"use_spectral_norm": false,
|
55 |
+
"gin_channels": 256,
|
56 |
+
"ssl_dim": 256,
|
57 |
+
"n_speakers": 200
|
58 |
+
},
|
59 |
+
"spk": {
|
60 |
+
"Pretty_Derby_Tokai_Teio_��������": 0
|
61 |
+
}
|
62 |
+
}
|
models/teio/cover.png
ADDED
models/sora_speak/kmeans_10000.pt → so-vits-svc/pretrain/nsf_hifigan/nsf_hifigan.ckpt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c576b63b7ed952161b70fad34e0562ace502ce689195520d8a2a6c051de29d6
|
3 |
+
size 56825430
|
so-vits-svc/sovits4_for_colab.ipynb
DELETED
The diff for this file is too large to render.
See raw diff
|
|
so-vits-svc/webUI.py
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
import io
|
2 |
import os
|
3 |
|
4 |
-
os.system("wget -nc -P hubert/ https://huggingface.co/spaces/innnky/nanami/resolve/main/checkpoint_best_legacy_500.pt")
|
5 |
import gradio as gr
|
6 |
import gradio.processing_utils as gr_pu
|
7 |
import librosa
|
|
|
1 |
import io
|
2 |
import os
|
3 |
|
4 |
+
#os.system("wget -nc -P hubert/ https://huggingface.co/spaces/innnky/nanami/resolve/main/checkpoint_best_legacy_500.pt")
|
5 |
import gradio as gr
|
6 |
import gradio.processing_utils as gr_pu
|
7 |
import librosa
|