Spaces:
Sleeping
Sleeping
Hugo Flores Garcia
committed on
Commit
•
03107fd
1
Parent(s):
c039932
cleaning up
Browse files
- .gitignore +3 -1
- README.md +1 -2
- conf/{interface/maestro.yml → interface.yml} +6 -6
- conf/interface/jazzpop.yml +0 -10
- conf/interface/spotdl.yml +0 -12
- conf/interface/xeno-canto.yml +0 -11
- demo.py +5 -47
.gitignore
CHANGED
@@ -177,4 +177,6 @@ samples-*/**
|
|
177 |
|
178 |
gradio-outputs/
|
179 |
models/
|
180 |
-
samples*/
|
|
|
|
|
|
177 |
|
178 |
gradio-outputs/
|
179 |
models/
|
180 |
+
samples*/
|
181 |
+
models-all/
|
182 |
+
models.zip
|
README.md
CHANGED
@@ -10,7 +10,6 @@ install [audiotools](https://github.com/descriptinc/audiotools.git)
|
|
10 |
```bash
|
11 |
git clone https://github.com/descriptinc/audiotools.git
|
12 |
cd audiotools
|
13 |
-
git checkout f35914b5b3c6f1bf589cd09481478d741538828e
|
14 |
pip install -e .
|
15 |
```
|
16 |
|
@@ -51,7 +50,7 @@ source ./env/env.sh
|
|
51 |
You can launch a gradio UI to play with vampnet.
|
52 |
|
53 |
```bash
|
54 |
-
python demo.py --args.load conf/interface
|
55 |
```
|
56 |
|
57 |
# Training / Fine-tuning
|
|
|
10 |
```bash
|
11 |
git clone https://github.com/descriptinc/audiotools.git
|
12 |
cd audiotools
|
|
|
13 |
pip install -e .
|
14 |
```
|
15 |
|
|
|
50 |
You can launch a gradio UI to play with vampnet.
|
51 |
|
52 |
```bash
|
53 |
+
python demo.py --args.load conf/interface.yml --Interface.device cuda
|
54 |
```
|
55 |
|
56 |
# Training / Fine-tuning
|
conf/{interface/maestro.yml → interface.yml}
RENAMED
@@ -1,10 +1,10 @@
|
|
1 |
-
Interface.coarse_ckpt: ./models/
|
2 |
-
Interface.coarse2fine_ckpt: ./models/
|
3 |
-
Interface.codec_ckpt: ./models/
|
4 |
-
Interface.coarse_chunk_size_s:
|
5 |
Interface.coarse2fine_chunk_size_s: 3
|
6 |
Interface.wavebeat_ckpt: ./models/wavebeat.pth
|
7 |
|
8 |
-
|
9 |
AudioLoader.sources:
|
10 |
-
- /
|
|
|
|
1 |
+
Interface.coarse_ckpt: ./models/vampnet/coarse.pth
|
2 |
+
Interface.coarse2fine_ckpt: ./models/vampnet/c2f.pth
|
3 |
+
Interface.codec_ckpt: ./models/vampnet/codec.pth
|
4 |
+
Interface.coarse_chunk_size_s: 10
|
5 |
Interface.coarse2fine_chunk_size_s: 3
|
6 |
Interface.wavebeat_ckpt: ./models/wavebeat.pth
|
7 |
|
|
|
8 |
AudioLoader.sources:
|
9 |
+
- /media/CHONK/null
|
10 |
+
|
conf/interface/jazzpop.yml
DELETED
@@ -1,10 +0,0 @@
|
|
1 |
-
Interface.coarse_ckpt: ./models/jazzpop/coarse.pth
|
2 |
-
Interface.coarse2fine_ckpt: ./models/jazzpop/c2f.pth
|
3 |
-
Interface.codec_ckpt: ./models/jazzpop/codec.pth
|
4 |
-
Interface.coarse_chunk_size_s: 5
|
5 |
-
Interface.coarse2fine_chunk_size_s: 3
|
6 |
-
Interface.wavebeat_ckpt: ./models/wavebeat.pth
|
7 |
-
|
8 |
-
AudioLoader.sources:
|
9 |
-
- /data/spotdl-jazzpop/audio/val
|
10 |
-
- /data/spotdl-jazzpop/audio/test
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
conf/interface/spotdl.yml
DELETED
@@ -1,12 +0,0 @@
|
|
1 |
-
Interface.coarse_ckpt: ./models/spotdl/coarse.pth
|
2 |
-
Interface.coarse2fine_ckpt: ./models/spotdl/c2f.pth
|
3 |
-
Interface.codec_ckpt: ./models/spotdl/codec.pth
|
4 |
-
Interface.coarse_chunk_size_s: 10
|
5 |
-
Interface.coarse2fine_chunk_size_s: 3
|
6 |
-
# Interface.wavebeat_ckpt: ./models/wavebeat.pth
|
7 |
-
|
8 |
-
|
9 |
-
AudioLoader.sources:
|
10 |
-
# - /media/CHONK/hugo/spotdl/subsets/jazz-blues/
|
11 |
-
- /media/CHONK/null
|
12 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
conf/interface/xeno-canto.yml
DELETED
@@ -1,11 +0,0 @@
|
|
1 |
-
Interface.coarse_ckpt: ./runs/xeno-canto-2/coarse/best/vampnet/weights.pth
|
2 |
-
Interface.coarse2fine_ckpt: ./runs/xeno-canto-2/c2f/best/vampnet/weights.pth
|
3 |
-
Interface.codec_ckpt: ./models/spotdl/codec.pth
|
4 |
-
Interface.coarse_chunk_size_s: 10
|
5 |
-
Interface.coarse2fine_chunk_size_s: 3
|
6 |
-
# Interface.wavebeat_ckpt: ./models/wavebeat.pth
|
7 |
-
|
8 |
-
|
9 |
-
AudioLoader.sources:
|
10 |
-
- /media/CHONK/hugo/xeno-canto-2
|
11 |
-
- /media/CHONK/hugo/xeno-canto-2
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
demo.py
CHANGED
@@ -33,56 +33,14 @@ dataset = at.data.datasets.AudioDataset(
|
|
33 |
|
34 |
|
35 |
checkpoints = {
|
36 |
-
"
|
37 |
-
"coarse": "./models/
|
38 |
-
"c2f": "./models/
|
39 |
-
"codec": "./models/
|
40 |
"full_ckpt": True
|
41 |
},
|
42 |
-
"berta": {
|
43 |
-
"coarse": "./models/finetuned/berta-goldman-speech/coarse.pth",
|
44 |
-
"c2f": "./models/finetuned/berta-goldman-speech/c2f.pth",
|
45 |
-
"codec": "./model/spotdl/codec.pth",
|
46 |
-
"full_ckpt": True
|
47 |
-
},
|
48 |
-
"xeno-canto-2": {
|
49 |
-
"coarse": "./models/finetuned/xeno-canto-2/coarse.pth",
|
50 |
-
"c2f": "./models/finetuned/xeno-canto-2/c2f.pth",
|
51 |
-
"codec": "./models/spotdl/codec.pth",
|
52 |
-
"full_ckpt": True
|
53 |
-
},
|
54 |
-
"panchos": {
|
55 |
-
"coarse": "./models/finetuned/panchos/coarse.pth",
|
56 |
-
"c2f": "./models/finetuned/panchos/c2f.pth",
|
57 |
-
"codec": "./models/spotdl/codec.pth",
|
58 |
-
"full_ckpt": False
|
59 |
-
},
|
60 |
-
"tv-choir": {
|
61 |
-
"coarse": "./models/finetuned/tv-choir/coarse.pth",
|
62 |
-
"c2f": "./models/finetuned/tv-choir/c2f.pth",
|
63 |
-
"codec": "./models/spotdl/codec.pth",
|
64 |
-
"full_ckpt": False
|
65 |
-
},
|
66 |
-
"titi": {
|
67 |
-
"coarse": "./models/finetuned/titi/coarse.pth",
|
68 |
-
"c2f": "./models/finetuned/titi/c2f.pth",
|
69 |
-
"codec": "./models/spotdl/codec.pth",
|
70 |
-
"full_ckpt": False
|
71 |
-
},
|
72 |
-
"titi-clean": {
|
73 |
-
"coarse": "./models/finetuned/titi-clean/coarse.pth",
|
74 |
-
"c2f": "./models/finetuned/titi-clean/c2f.pth",
|
75 |
-
"codec": "./models/spotdl/codec.pth",
|
76 |
-
"full_ckpt": False
|
77 |
-
},
|
78 |
-
"breaks-steps": {
|
79 |
-
"coarse": "./models/finetuned/breaks-steps/coarse.pth",
|
80 |
-
"c2f": None, #"./models/finetuned/breaks-steps/c2f.pth",
|
81 |
-
"codec": "./models/spotdl/codec.pth",
|
82 |
-
"full_ckpt": False
|
83 |
-
},
|
84 |
}
|
85 |
-
interface.checkpoint_key = "
|
86 |
|
87 |
|
88 |
OUT_DIR = Path("gradio-outputs")
|
|
|
33 |
|
34 |
|
35 |
checkpoints = {
|
36 |
+
"vampnet": {
|
37 |
+
"coarse": "./models/vampnet/coarse.pth",
|
38 |
+
"c2f": "./models/vampnet/c2f.pth",
|
39 |
+
"codec": "./models/vampnet/codec.pth",
|
40 |
"full_ckpt": True
|
41 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
42 |
}
|
43 |
+
interface.checkpoint_key = "vampnet"
|
44 |
|
45 |
|
46 |
OUT_DIR = Path("gradio-outputs")
|