Spaces:
Running
on
T4
Running
on
T4
initial code release
Browse files
- README.md +4 -6
- app.py +11 -0
- packages.txt +5 -0
- requirements.txt +35 -0
README.md
CHANGED
@@ -1,13 +1,11 @@
|
|
1 |
---
|
2 |
title: MassivelyMultilingualTTS
|
3 |
-
emoji:
|
4 |
colorFrom: indigo
|
5 |
colorTo: purple
|
6 |
sdk: gradio
|
7 |
-
sdk_version: 4.
|
8 |
app_file: app.py
|
9 |
-
pinned:
|
10 |
license: mit
|
11 |
-
---
|
12 |
-
|
13 |
-
Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
|
|
|
1 |
---
|
2 |
title: MassivelyMultilingualTTS
|
3 |
+
emoji: 🌍🦜
|
4 |
colorFrom: indigo
|
5 |
colorTo: purple
|
6 |
sdk: gradio
|
7 |
+
sdk_version: 4.32.2
|
8 |
app_file: app.py
|
9 |
+
pinned: true
|
10 |
license: mit
|
11 |
+
---
|
|
|
|
app.py
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import os
|
2 |
+
import torch
|
3 |
+
|
4 |
+
os.system("git clone --branch v3.1 https://github.com/DigitalPhonetics/IMS-Toucan.git toucan_codebase")
|
5 |
+
os.system("mv toucan_codebase/* .")
|
6 |
+
|
7 |
+
from run_model_downloader import download_models
|
8 |
+
from run_GUI_demo import TTSWebUI
|
9 |
+
|
10 |
+
download_models()
|
11 |
+
TTSWebUI(gpu_id="cuda" if torch.cuda.is_available() else "cpu")
|
packages.txt
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
libsndfile1
|
2 |
+
espeak-ng
|
3 |
+
ffmpeg
|
4 |
+
libasound-dev
|
5 |
+
libportaudio2
|
requirements.txt
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
torch_complex~=0.4.3
|
2 |
+
tqdm~=4.64.1
|
3 |
+
scipy~=1.9.3
|
4 |
+
librosa~=0.9.2
|
5 |
+
scikit-learn~=1.1.3
|
6 |
+
praat-parselmouth~=0.4.2
|
7 |
+
torch~=2.3.0
|
8 |
+
numpy~=1.23.4
|
9 |
+
torchaudio~=2.3.0
|
10 |
+
soundfile~=0.12.0
|
11 |
+
pypinyin~=0.47.1
|
12 |
+
pyloudnorm~=0.1.0
|
13 |
+
numba~=0.56.4
|
14 |
+
cvxopt~=1.3.0
|
15 |
+
sounddevice~=0.4.5
|
16 |
+
matplotlib~=3.6.2
|
17 |
+
phonemizer~=3.2.1
|
18 |
+
wandb~=0.13.5
|
19 |
+
speechbrain~=0.5.13
|
20 |
+
dragonmapper~=0.2.6
|
21 |
+
auraloss~=0.2.2
|
22 |
+
alias_free_torch~=0.0.6
|
23 |
+
dotwiz==0.4.0
|
24 |
+
transphone==1.5.3
|
25 |
+
phonepiece==1.4.2
|
26 |
+
geopy==2.4.1
|
27 |
+
einops==0.7.0
|
28 |
+
torchvision~=0.18.0
|
29 |
+
sklearn~=0.0
|
30 |
+
datasets~=2.10.1
|
31 |
+
pandas~=1.5.0
|
32 |
+
rich~=13.4.2
|
33 |
+
PyYAML~=6.0
|
34 |
+
imageio~=2.34.0
|
35 |
+
pykakasi~=2.2.1
|