Hugo Flores Garcia committed on
Commit
4687dd9
1 Parent(s): 0a036ac

per-instrument models

Browse files
conf/vampnet-groovemidi.yml ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ $include:
2
+ - conf/vampnet.yml
3
+
4
+ VampNet.embedding_dim: 512
5
+ VampNet.n_layers: 12
6
+ VampNet.n_heads: 8
7
+
8
+ AudioDataset.duration: 12.0
9
+
10
+ train/AudioDataset.n_examples: 10000000
11
+ train/AudioLoader.sources:
12
+ # drummer 1 sessions 1, 2, and 3
13
+ - /data/e-gmd-v1.0.0/drummer1/session1
14
+ - /data/e-gmd-v1.0.0/drummer1/session2
15
+ - /data/e-gmd-v1.0.0/drummer1/session3
16
+ # drummer 3 sessions 1 and 2
17
+ - /data/e-gmd-v1.0.0/drummer3/session1
18
+ - /data/e-gmd-v1.0.0/drummer3/session2
19
+ # drummer 4 session 1
20
+ - /data/e-gmd-v1.0.0/drummer4/session1
21
+ # drummer 5 sessions 1 and 2
22
+ - /data/e-gmd-v1.0.0/drummer5/session1
23
+ - /data/e-gmd-v1.0.0/drummer5/session2
24
+ # drummer 6 sessions 1, 2, and 3
25
+ - /data/e-gmd-v1.0.0/drummer6/session1
26
+ - /data/e-gmd-v1.0.0/drummer6/session2
27
+ - /data/e-gmd-v1.0.0/drummer6/session3
28
+ # drummer 7 sessions 1, 2, and 3
29
+ - /data/e-gmd-v1.0.0/drummer7/session1
30
+ - /data/e-gmd-v1.0.0/drummer7/session2
31
+ - /data/e-gmd-v1.0.0/drummer7/session3
32
+ # drummer 8 session 1
33
+ - /data/e-gmd-v1.0.0/drummer8/session1
34
+ # drummer 9 session 1
35
+ - /data/e-gmd-v1.0.0/drummer9/session1
36
+ # drummer 10 session 1
37
+ - /data/e-gmd-v1.0.0/drummer10/session1
38
+
39
+
40
+ val/AudioDataset.n_examples: 500
41
+ val/AudioLoader.sources:
42
+ # drummer 1 eval session
43
+ - /data/e-gmd-v1.0.0/drummer1/eval_session
44
+ # drummer 5 eval session
45
+ - /data/e-gmd-v1.0.0/drummer5/eval_session
46
+ # drummer 7 eval session
47
+ - /data/e-gmd-v1.0.0/drummer7/eval_session
48
+
49
+
50
+
51
+ test/AudioDataset.n_examples: 1000
52
+ test/AudioLoader.sources:
53
+ # drummer 8 eval session
54
+ - /data/e-gmd-v1.0.0/drummer8/eval_session
conf/vampnet-maestro.yml ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ $include:
2
+ - conf/vampnet.yml
3
+
4
+ VampNet.embedding_dim: 512
5
+ VampNet.n_layers: 12
6
+ VampNet.n_heads: 8
7
+
8
+ AudioDataset.duration: 12.0
9
+
10
+ train/AudioDataset.n_examples: 10000000
11
+ train/AudioLoader.sources:
12
+ - /data/maestro-reorg/train
13
+
14
+ val/AudioDataset.n_examples: 500
15
+ val/AudioLoader.sources:
16
+ - /data/maestro-reorg/val
17
+
18
+
19
+ test/AudioDataset.n_examples: 1000
20
+ test/AudioLoader.sources:
21
+ - /data/maestro-reorg/test
conf/vampnet.yml CHANGED
@@ -34,7 +34,7 @@ VampNet.embedding_dim: 1280
34
  VampNet.n_layers: 20
35
  VampNet.n_heads: 20
36
  VampNet.flash_attn: false
37
- VampNet.dropout: 0.05
38
 
39
  AudioLoader.relative_path: /data/
40
  AudioDataset.loudness_cutoff: -30.0
 
34
  VampNet.n_layers: 20
35
  VampNet.n_heads: 20
36
  VampNet.flash_attn: false
37
+ VampNet.dropout: 0.1
38
 
39
  AudioLoader.relative_path: /data/
40
  AudioDataset.loudness_cutoff: -30.0
vampnet/modules/transformer.py CHANGED
@@ -445,6 +445,7 @@ class VampNet(VampBase):
445
  vocab_size: int = 1024,
446
  flash_attn: bool = True,
447
  noise_mode: str = "mask",
 
448
  ):
449
  super().__init__()
450
  self.n_heads = n_heads
@@ -485,7 +486,7 @@ class VampNet(VampBase):
485
  bidirectional=True,
486
  flash_attn=flash_attn,
487
  is_decoder=False,
488
- dropout=0.1,
489
  )
490
 
491
  # Add final conv layer
 
445
  vocab_size: int = 1024,
446
  flash_attn: bool = True,
447
  noise_mode: str = "mask",
448
+ dropout: float = 0.1
449
  ):
450
  super().__init__()
451
  self.n_heads = n_heads
 
486
  bidirectional=True,
487
  flash_attn=flash_attn,
488
  is_decoder=False,
489
+ dropout=dropout,
490
  )
491
 
492
  # Add final conv layer