zdxiaoda committed on
Commit
35b318d
1 Parent(s): f3367c4
models/Mona/G_GenshinMona.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2788326783fd64037b666680828969b40a3d86435f9d78d45c96708bcaa3c2b2
3
+ size 542789469
models/Mona/config.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "train": {
3
+ "log_interval": 200,
4
+ "eval_interval": 800,
5
+ "seed": 1234,
6
+ "epochs": 10000,
7
+ "learning_rate": 0.0001,
8
+ "betas": [0.8, 0.99],
9
+ "eps": 1e-9,
10
+ "batch_size": 16,
11
+ "fp16_run": false,
12
+ "bf16_run": false,
13
+ "lr_decay": 0.999875,
14
+ "segment_size": 10240,
15
+ "init_lr_ratio": 1,
16
+ "warmup_epochs": 0,
17
+ "c_mel": 45,
18
+ "c_kl": 1.0,
19
+ "use_sr": true,
20
+ "max_speclen": 512,
21
+ "port": "8001",
22
+ "keep_ckpts": 3,
23
+ "num_workers": 4,
24
+ "log_version": 0,
25
+ "ckpt_name_by_step": false,
26
+ "accumulate_grad_batches": 1
27
+ },
28
+ "data": {
29
+ "training_files": "filelists/44k/train.txt",
30
+ "validation_files": "filelists/44k/val.txt",
31
+ "max_wav_value": 32768.0,
32
+ "sampling_rate": 44100,
33
+ "filter_length": 2048,
34
+ "hop_length": 512,
35
+ "win_length": 2048,
36
+ "n_mel_channels": 80,
37
+ "mel_fmin": 0.0,
38
+ "mel_fmax": 22050
39
+ },
40
+ "model": {
41
+ "inter_channels": 192,
42
+ "hidden_channels": 192,
43
+ "filter_channels": 768,
44
+ "n_heads": 2,
45
+ "n_layers": 6,
46
+ "kernel_size": 3,
47
+ "p_dropout": 0.1,
48
+ "resblock": "1",
49
+ "resblock_kernel_sizes": [3, 7, 11],
50
+ "resblock_dilation_sizes": [
51
+ [1, 3, 5],
52
+ [1, 3, 5],
53
+ [1, 3, 5]
54
+ ],
55
+ "upsample_rates": [8, 8, 2, 2, 2],
56
+ "upsample_initial_channel": 512,
57
+ "upsample_kernel_sizes": [16, 16, 4, 4, 4],
58
+ "n_layers_q": 3,
59
+ "use_spectral_norm": false,
60
+ "gin_channels": 256,
61
+ "ssl_dim": 256,
62
+ "n_speakers": 200
63
+ },
64
+ "spk": {
65
+ "Genshin_Mona_莫娜": 0
66
+ }
67
+ }
models/Trump/G_18500.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:059b1dc76e356fc5d9d0374d200fd459804ad74957d25ad0dc01be24cb94cbc0
3
+ size 542789469
models/Trump/config.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "train": {
3
+ "log_interval": 100,
4
+ "eval_interval": 500,
5
+ "seed": 1234,
6
+ "epochs": 10001,
7
+ "learning_rate": 0.0001,
8
+ "betas": [0.8, 0.99],
9
+ "eps": 1e-9,
10
+ "batch_size": 6,
11
+ "fp16_run": false,
12
+ "lr_decay": 0.999875,
13
+ "segment_size": 10240,
14
+ "init_lr_ratio": 1,
15
+ "warmup_epochs": 0,
16
+ "c_mel": 45,
17
+ "c_kl": 1.0,
18
+ "use_sr": true,
19
+ "max_speclen": 512,
20
+ "port": "8001",
21
+ "keep_ckpts": 3
22
+ },
23
+ "data": {
24
+ "training_files": "filelists/44k/train.txt",
25
+ "validation_files": "filelists/44k/val.txt",
26
+ "max_wav_value": 32768.0,
27
+ "sampling_rate": 44100,
28
+ "filter_length": 2048,
29
+ "hop_length": 512,
30
+ "win_length": 2048,
31
+ "n_mel_channels": 80,
32
+ "mel_fmin": 0.0,
33
+ "mel_fmax": 22050
34
+ },
35
+ "model": {
36
+ "inter_channels": 192,
37
+ "hidden_channels": 192,
38
+ "filter_channels": 768,
39
+ "n_heads": 2,
40
+ "n_layers": 6,
41
+ "kernel_size": 3,
42
+ "p_dropout": 0.1,
43
+ "resblock": "1",
44
+ "resblock_kernel_sizes": [3, 7, 11],
45
+ "resblock_dilation_sizes": [
46
+ [1, 3, 5],
47
+ [1, 3, 5],
48
+ [1, 3, 5]
49
+ ],
50
+ "upsample_rates": [8, 8, 2, 2, 2],
51
+ "upsample_initial_channel": 512,
52
+ "upsample_kernel_sizes": [16, 16, 4, 4, 4],
53
+ "n_layers_q": 3,
54
+ "use_spectral_norm": false,
55
+ "gin_channels": 256,
56
+ "ssl_dim": 256,
57
+ "n_speakers": 200
58
+ },
59
+ "spk": {
60
+ "Trump_唐纳德·特朗普": 0
61
+ }
62
+ }
models/alice/G_alice.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d1bef76e26beeadcae5f716cc0b60abb2aac4aae1316cac709cc439726cf533
3
+ size 180883747
models/alice/config.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "train": {
3
+ "log_interval": 200,
4
+ "eval_interval": 800,
5
+ "seed": 1234,
6
+ "epochs": 10000,
7
+ "learning_rate": 0.0001,
8
+ "betas": [0.8, 0.99],
9
+ "eps": 1e-9,
10
+ "batch_size": 32,
11
+ "fp16_run": false,
12
+ "lr_decay": 0.999875,
13
+ "segment_size": 10240,
14
+ "init_lr_ratio": 1,
15
+ "warmup_epochs": 0,
16
+ "c_mel": 45,
17
+ "c_kl": 1.0,
18
+ "use_sr": true,
19
+ "max_speclen": 512,
20
+ "port": "8001",
21
+ "keep_ckpts": 99
22
+ },
23
+ "data": {
24
+ "training_files": "filelists/train.txt",
25
+ "validation_files": "filelists/val.txt",
26
+ "max_wav_value": 32768.0,
27
+ "sampling_rate": 44100,
28
+ "filter_length": 2048,
29
+ "hop_length": 512,
30
+ "win_length": 2048,
31
+ "n_mel_channels": 80,
32
+ "mel_fmin": 0.0,
33
+ "mel_fmax": 22050
34
+ },
35
+ "model": {
36
+ "inter_channels": 192,
37
+ "hidden_channels": 192,
38
+ "filter_channels": 768,
39
+ "n_heads": 2,
40
+ "n_layers": 6,
41
+ "kernel_size": 3,
42
+ "p_dropout": 0.1,
43
+ "resblock": "1",
44
+ "resblock_kernel_sizes": [3, 7, 11],
45
+ "resblock_dilation_sizes": [
46
+ [1, 3, 5],
47
+ [1, 3, 5],
48
+ [1, 3, 5]
49
+ ],
50
+ "upsample_rates": [8, 8, 2, 2, 2],
51
+ "upsample_initial_channel": 512,
52
+ "upsample_kernel_sizes": [16, 16, 4, 4, 4],
53
+ "n_layers_q": 3,
54
+ "use_spectral_norm": false,
55
+ "gin_channels": 256,
56
+ "ssl_dim": 256,
57
+ "n_speakers": 200
58
+ },
59
+ "spk": {
60
+ "Blue_Archive_Tendou_Arisu_天童爱丽丝": 0
61
+ }
62
+ }
models/alice/cover.png ADDED
models/sora_mix/config.json CHANGED
@@ -58,6 +58,6 @@
58
  "n_speakers": 1
59
  },
60
  "spk": {
61
- "春日野穹_mix": 0
62
  }
63
  }
 
58
  "n_speakers": 1
59
  },
60
  "spk": {
61
+ "缘之空_SoraKasugano_Sora_春日野穹_mix": 0
62
  }
63
  }
models/sora_speak/config.json CHANGED
@@ -58,6 +58,6 @@
58
  "n_speakers": 1
59
  },
60
  "spk": {
61
- "春日野穹_speak": 0
62
  }
63
  }
 
58
  "n_speakers": 1
59
  },
60
  "spk": {
61
+ "缘之空_SoraKasugano_Sora_春日野穹_speak": 0
62
  }
63
  }
models/teio/G_teio.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:305cbd8bc9bc468f2744d0fc425d1c7363a6232140728d403e90486dc2921160
3
+ size 180883747
models/teio/config.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "train": {
3
+ "log_interval": 200,
4
+ "eval_interval": 800,
5
+ "seed": 1234,
6
+ "epochs": 10000,
7
+ "learning_rate": 0.0001,
8
+ "betas": [0.8, 0.99],
9
+ "eps": 1e-9,
10
+ "batch_size": 32,
11
+ "fp16_run": false,
12
+ "lr_decay": 0.999875,
13
+ "segment_size": 10240,
14
+ "init_lr_ratio": 1,
15
+ "warmup_epochs": 0,
16
+ "c_mel": 45,
17
+ "c_kl": 1.0,
18
+ "use_sr": true,
19
+ "max_speclen": 512,
20
+ "port": "8001",
21
+ "keep_ckpts": 99
22
+ },
23
+ "data": {
24
+ "training_files": "filelists/train.txt",
25
+ "validation_files": "filelists/val.txt",
26
+ "max_wav_value": 32768.0,
27
+ "sampling_rate": 44100,
28
+ "filter_length": 2048,
29
+ "hop_length": 512,
30
+ "win_length": 2048,
31
+ "n_mel_channels": 80,
32
+ "mel_fmin": 0.0,
33
+ "mel_fmax": 22050
34
+ },
35
+ "model": {
36
+ "inter_channels": 192,
37
+ "hidden_channels": 192,
38
+ "filter_channels": 768,
39
+ "n_heads": 2,
40
+ "n_layers": 6,
41
+ "kernel_size": 3,
42
+ "p_dropout": 0.1,
43
+ "resblock": "1",
44
+ "resblock_kernel_sizes": [3, 7, 11],
45
+ "resblock_dilation_sizes": [
46
+ [1, 3, 5],
47
+ [1, 3, 5],
48
+ [1, 3, 5]
49
+ ],
50
+ "upsample_rates": [8, 8, 2, 2, 2],
51
+ "upsample_initial_channel": 512,
52
+ "upsample_kernel_sizes": [16, 16, 4, 4, 4],
53
+ "n_layers_q": 3,
54
+ "use_spectral_norm": false,
55
+ "gin_channels": 256,
56
+ "ssl_dim": 256,
57
+ "n_speakers": 200
58
+ },
59
+ "spk": {
60
+ "Pretty_Derby_Tokai_Teio_东海帝王": 0
61
+ }
62
+ }
models/teio/cover.png ADDED
models/sora_speak/kmeans_10000.pt → so-vits-svc/pretrain/nsf_hifigan/nsf_hifigan.ckpt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:225146a37386b9504f485a2db89011d6482244930c3ced1864fb822ba61a861b
3
- size 15427449
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c576b63b7ed952161b70fad34e0562ace502ce689195520d8a2a6c051de29d6
3
+ size 56825430
so-vits-svc/sovits4_for_colab.ipynb DELETED
The diff for this file is too large to render. See raw diff
 
so-vits-svc/webUI.py CHANGED
@@ -1,7 +1,7 @@
1
  import io
2
  import os
3
 
4
- os.system("wget -nc -P hubert/ https://huggingface.co/spaces/innnky/nanami/resolve/main/checkpoint_best_legacy_500.pt")
5
  import gradio as gr
6
  import gradio.processing_utils as gr_pu
7
  import librosa
 
1
  import io
2
  import os
3
 
4
+ #os.system("wget -nc -P hubert/ https://huggingface.co/spaces/innnky/nanami/resolve/main/checkpoint_best_legacy_500.pt")
5
  import gradio as gr
6
  import gradio.processing_utils as gr_pu
7
  import librosa