Spaces:
Running
on
T4
Running
on
T4
Hugo Flores Garcia
committed on
Commit
•
4687dd9
1
Parent(s):
0a036ac
per-instrument models
Browse files
- conf/vampnet-groovemidi.yml +54 -0
- conf/vampnet-maestro.yml +21 -0
- conf/vampnet.yml +1 -1
- vampnet/modules/transformer.py +2 -1
conf/vampnet-groovemidi.yml
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
$include:
|
2 |
+
- conf/vampnet.yml
|
3 |
+
|
4 |
+
VampNet.embedding_dim: 512
|
5 |
+
VampNet.n_layers: 12
|
6 |
+
VampNet.n_heads: 8
|
7 |
+
|
8 |
+
AudioDataset.duration: 12.0
|
9 |
+
|
10 |
+
train/AudioDataset.n_examples: 10000000
|
11 |
+
train/AudioLoader.sources:
|
12 |
+
# drummer 1 sessions 1, 2, and 3
|
13 |
+
- /data/e-gmd-v1.0.0/drummer1/session1
|
14 |
+
- /data/e-gmd-v1.0.0/drummer1/session2
|
15 |
+
- /data/e-gmd-v1.0.0/drummer1/session3
|
16 |
+
# drummer 3 sessions 1 and 2
|
17 |
+
- /data/e-gmd-v1.0.0/drummer3/session1
|
18 |
+
- /data/e-gmd-v1.0.0/drummer3/session2
|
19 |
+
# drummer 4 session 1
|
20 |
+
- /data/e-gmd-v1.0.0/drummer4/session1
|
21 |
+
# drummer 5 sessions 1 and 2
|
22 |
+
- /data/e-gmd-v1.0.0/drummer5/session1
|
23 |
+
- /data/e-gmd-v1.0.0/drummer5/session2
|
24 |
+
# drummer 6 sessions 1, 2, and 3
|
25 |
+
- /data/e-gmd-v1.0.0/drummer6/session1
|
26 |
+
- /data/e-gmd-v1.0.0/drummer6/session2
|
27 |
+
- /data/e-gmd-v1.0.0/drummer6/session3
|
28 |
+
# drummer 7 sessions 1, 2, and 3
|
29 |
+
- /data/e-gmd-v1.0.0/drummer7/session1
|
30 |
+
- /data/e-gmd-v1.0.0/drummer7/session2
|
31 |
+
- /data/e-gmd-v1.0.0/drummer7/session3
|
32 |
+
# drummer 8 session 1
|
33 |
+
- /data/e-gmd-v1.0.0/drummer8/session1
|
34 |
+
# drummer 9 session 1
|
35 |
+
- /data/e-gmd-v1.0.0/drummer9/session1
|
36 |
+
# drummer 10 session 1
|
37 |
+
- /data/e-gmd-v1.0.0/drummer10/session1
|
38 |
+
|
39 |
+
|
40 |
+
val/AudioDataset.n_examples: 500
|
41 |
+
val/AudioLoader.sources:
|
42 |
+
# drummer 1 eval session
|
43 |
+
- /data/e-gmd-v1.0.0/drummer1/eval_session
|
44 |
+
# drummer 5 eval session
|
45 |
+
- /data/e-gmd-v1.0.0/drummer5/eval_session
|
46 |
+
# drummer 7 eval session
|
47 |
+
- /data/e-gmd-v1.0.0/drummer7/eval_session
|
48 |
+
|
49 |
+
|
50 |
+
|
51 |
+
test/AudioDataset.n_examples: 1000
|
52 |
+
test/AudioLoader.sources:
|
53 |
+
# drummer 8 eval session
|
54 |
+
- /data/e-gmd-v1.0.0/drummer8/eval_session
|
conf/vampnet-maestro.yml
ADDED
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
$include:
|
2 |
+
- conf/vampnet.yml
|
3 |
+
|
4 |
+
VampNet.embedding_dim: 512
|
5 |
+
VampNet.n_layers: 12
|
6 |
+
VampNet.n_heads: 8
|
7 |
+
|
8 |
+
AudioDataset.duration: 12.0
|
9 |
+
|
10 |
+
train/AudioDataset.n_examples: 10000000
|
11 |
+
train/AudioLoader.sources:
|
12 |
+
- /data/maestro-reorg/train
|
13 |
+
|
14 |
+
val/AudioDataset.n_examples: 500
|
15 |
+
val/AudioLoader.sources:
|
16 |
+
- /data/maestro-reorg/val
|
17 |
+
|
18 |
+
|
19 |
+
test/AudioDataset.n_examples: 1000
|
20 |
+
test/AudioLoader.sources:
|
21 |
+
- /data/maestro-reorg/test
|
conf/vampnet.yml
CHANGED
@@ -34,7 +34,7 @@ VampNet.embedding_dim: 1280
|
|
34 |
VampNet.n_layers: 20
|
35 |
VampNet.n_heads: 20
|
36 |
VampNet.flash_attn: false
|
37 |
-
VampNet.dropout: 0.
|
38 |
|
39 |
AudioLoader.relative_path: /data/
|
40 |
AudioDataset.loudness_cutoff: -30.0
|
|
|
34 |
VampNet.n_layers: 20
|
35 |
VampNet.n_heads: 20
|
36 |
VampNet.flash_attn: false
|
37 |
+
VampNet.dropout: 0.1
|
38 |
|
39 |
AudioLoader.relative_path: /data/
|
40 |
AudioDataset.loudness_cutoff: -30.0
|
vampnet/modules/transformer.py
CHANGED
@@ -445,6 +445,7 @@ class VampNet(VampBase):
|
|
445 |
vocab_size: int = 1024,
|
446 |
flash_attn: bool = True,
|
447 |
noise_mode: str = "mask",
|
|
|
448 |
):
|
449 |
super().__init__()
|
450 |
self.n_heads = n_heads
|
@@ -485,7 +486,7 @@ class VampNet(VampBase):
|
|
485 |
bidirectional=True,
|
486 |
flash_attn=flash_attn,
|
487 |
is_decoder=False,
|
488 |
-
dropout=
|
489 |
)
|
490 |
|
491 |
# Add final conv layer
|
|
|
445 |
vocab_size: int = 1024,
|
446 |
flash_attn: bool = True,
|
447 |
noise_mode: str = "mask",
|
448 |
+
dropout: float = 0.1
|
449 |
):
|
450 |
super().__init__()
|
451 |
self.n_heads = n_heads
|
|
|
486 |
bidirectional=True,
|
487 |
flash_attn=flash_attn,
|
488 |
is_decoder=False,
|
489 |
+
dropout=dropout,
|
490 |
)
|
491 |
|
492 |
# Add final conv layer
|