Hugo Flores Garcia committed on
Commit
03107fd
1 Parent(s): c039932

cleaning up

Browse files
.gitignore CHANGED
@@ -177,4 +177,6 @@ samples-*/**
177
 
178
  gradio-outputs/
179
  models/
180
- samples*/
 
 
 
177
 
178
  gradio-outputs/
179
  models/
180
+ samples*/
181
+ models-all/
182
+ models.zip
README.md CHANGED
@@ -10,7 +10,6 @@ install [audiotools](https://github.com/descriptinc/audiotools.git)
10
  ```bash
11
  git clone https://github.com/descriptinc/audiotools.git
12
  cd audiotools
13
- git checkout f35914b5b3c6f1bf589cd09481478d741538828e
14
  pip install -e .
15
  ```
16
 
@@ -51,7 +50,7 @@ source ./env/env.sh
51
  You can launch a gradio UI to play with vampnet.
52
 
53
  ```bash
54
- python demo.py --args.load conf/interface/spotdl.yml --Interface.device cuda
55
  ```
56
 
57
  # Training / Fine-tuning
 
10
  ```bash
11
  git clone https://github.com/descriptinc/audiotools.git
12
  cd audiotools
 
13
  pip install -e .
14
  ```
15
 
 
50
  You can launch a gradio UI to play with vampnet.
51
 
52
  ```bash
53
+ python demo.py --args.load conf/interface.yml --Interface.device cuda
54
  ```
55
 
56
  # Training / Fine-tuning
conf/{interface/maestro.yml → interface.yml} RENAMED
@@ -1,10 +1,10 @@
1
- Interface.coarse_ckpt: ./models/maestro/coarse.pth
2
- Interface.coarse2fine_ckpt: ./models/maestro/c2f.pth
3
- Interface.codec_ckpt: ./models/maestro/codec.pth
4
- Interface.coarse_chunk_size_s: 12
5
  Interface.coarse2fine_chunk_size_s: 3
6
  Interface.wavebeat_ckpt: ./models/wavebeat.pth
7
 
8
-
9
  AudioLoader.sources:
10
- - /data/maestro-reorg/test
 
 
1
+ Interface.coarse_ckpt: ./models/vampnet/coarse.pth
2
+ Interface.coarse2fine_ckpt: ./models/vampnet/c2f.pth
3
+ Interface.codec_ckpt: ./models/vampnet/codec.pth
4
+ Interface.coarse_chunk_size_s: 10
5
  Interface.coarse2fine_chunk_size_s: 3
6
  Interface.wavebeat_ckpt: ./models/wavebeat.pth
7
 
 
8
  AudioLoader.sources:
9
+ - /media/CHONK/null
10
+
conf/interface/jazzpop.yml DELETED
@@ -1,10 +0,0 @@
1
- Interface.coarse_ckpt: ./models/jazzpop/coarse.pth
2
- Interface.coarse2fine_ckpt: ./models/jazzpop/c2f.pth
3
- Interface.codec_ckpt: ./models/jazzpop/codec.pth
4
- Interface.coarse_chunk_size_s: 5
5
- Interface.coarse2fine_chunk_size_s: 3
6
- Interface.wavebeat_ckpt: ./models/wavebeat.pth
7
-
8
- AudioLoader.sources:
9
- - /data/spotdl-jazzpop/audio/val
10
- - /data/spotdl-jazzpop/audio/test
 
 
 
 
 
 
 
 
 
 
 
conf/interface/spotdl.yml DELETED
@@ -1,12 +0,0 @@
1
- Interface.coarse_ckpt: ./models/spotdl/coarse.pth
2
- Interface.coarse2fine_ckpt: ./models/spotdl/c2f.pth
3
- Interface.codec_ckpt: ./models/spotdl/codec.pth
4
- Interface.coarse_chunk_size_s: 10
5
- Interface.coarse2fine_chunk_size_s: 3
6
- # Interface.wavebeat_ckpt: ./models/wavebeat.pth
7
-
8
-
9
- AudioLoader.sources:
10
- # - /media/CHONK/hugo/spotdl/subsets/jazz-blues/
11
- - /media/CHONK/null
12
-
 
 
 
 
 
 
 
 
 
 
 
 
 
conf/interface/xeno-canto.yml DELETED
@@ -1,11 +0,0 @@
1
- Interface.coarse_ckpt: ./runs/xeno-canto-2/coarse/best/vampnet/weights.pth
2
- Interface.coarse2fine_ckpt: ./runs/xeno-canto-2/c2f/best/vampnet/weights.pth
3
- Interface.codec_ckpt: ./models/spotdl/codec.pth
4
- Interface.coarse_chunk_size_s: 10
5
- Interface.coarse2fine_chunk_size_s: 3
6
- # Interface.wavebeat_ckpt: ./models/wavebeat.pth
7
-
8
-
9
- AudioLoader.sources:
10
- - /media/CHONK/hugo/xeno-canto-2
11
- - /media/CHONK/hugo/xeno-canto-2
 
 
 
 
 
 
 
 
 
 
 
 
demo.py CHANGED
@@ -33,56 +33,14 @@ dataset = at.data.datasets.AudioDataset(
33
 
34
 
35
  checkpoints = {
36
- "spotdl": {
37
- "coarse": "./models/spotdl/coarse.pth",
38
- "c2f": "./models/spotdl/c2f.pth",
39
- "codec": "./models/spotdl/codec.pth",
40
  "full_ckpt": True
41
  },
42
- "berta": {
43
- "coarse": "./models/finetuned/berta-goldman-speech/coarse.pth",
44
- "c2f": "./models/finetuned/berta-goldman-speech/c2f.pth",
45
- "codec": "./model/spotdl/codec.pth",
46
- "full_ckpt": True
47
- },
48
- "xeno-canto-2": {
49
- "coarse": "./models/finetuned/xeno-canto-2/coarse.pth",
50
- "c2f": "./models/finetuned/xeno-canto-2/c2f.pth",
51
- "codec": "./models/spotdl/codec.pth",
52
- "full_ckpt": True
53
- },
54
- "panchos": {
55
- "coarse": "./models/finetuned/panchos/coarse.pth",
56
- "c2f": "./models/finetuned/panchos/c2f.pth",
57
- "codec": "./models/spotdl/codec.pth",
58
- "full_ckpt": False
59
- },
60
- "tv-choir": {
61
- "coarse": "./models/finetuned/tv-choir/coarse.pth",
62
- "c2f": "./models/finetuned/tv-choir/c2f.pth",
63
- "codec": "./models/spotdl/codec.pth",
64
- "full_ckpt": False
65
- },
66
- "titi": {
67
- "coarse": "./models/finetuned/titi/coarse.pth",
68
- "c2f": "./models/finetuned/titi/c2f.pth",
69
- "codec": "./models/spotdl/codec.pth",
70
- "full_ckpt": False
71
- },
72
- "titi-clean": {
73
- "coarse": "./models/finetuned/titi-clean/coarse.pth",
74
- "c2f": "./models/finetuned/titi-clean/c2f.pth",
75
- "codec": "./models/spotdl/codec.pth",
76
- "full_ckpt": False
77
- },
78
- "breaks-steps": {
79
- "coarse": "./models/finetuned/breaks-steps/coarse.pth",
80
- "c2f": None, #"./models/finetuned/breaks-steps/c2f.pth",
81
- "codec": "./models/spotdl/codec.pth",
82
- "full_ckpt": False
83
- },
84
  }
85
- interface.checkpoint_key = "spotdl"
86
 
87
 
88
  OUT_DIR = Path("gradio-outputs")
 
33
 
34
 
35
  checkpoints = {
36
+ "vampnet": {
37
+ "coarse": "./models/vampnet/coarse.pth",
38
+ "c2f": "./models/vampnet/c2f.pth",
39
+ "codec": "./models/vampnet/codec.pth",
40
  "full_ckpt": True
41
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
42
  }
43
+ interface.checkpoint_key = "vampnet"
44
 
45
 
46
  OUT_DIR = Path("gradio-outputs")