Spaces:
Runtime error
Runtime error
Hugo Flores Garcia
committed on
Commit
·
4687dd9
1
Parent(s):
0a036ac
per-instrument models
Browse files
- conf/vampnet-groovemidi.yml +54 -0
- conf/vampnet-maestro.yml +21 -0
- conf/vampnet.yml +1 -1
- vampnet/modules/transformer.py +2 -1
conf/vampnet-groovemidi.yml
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
$include:
|
| 2 |
+
- conf/vampnet.yml
|
| 3 |
+
|
| 4 |
+
VampNet.embedding_dim: 512
|
| 5 |
+
VampNet.n_layers: 12
|
| 6 |
+
VampNet.n_heads: 8
|
| 7 |
+
|
| 8 |
+
AudioDataset.duration: 12.0
|
| 9 |
+
|
| 10 |
+
train/AudioDataset.n_examples: 10000000
|
| 11 |
+
train/AudioLoader.sources:
|
| 12 |
+
# drummer 1 sessions 1, 2, and 3
|
| 13 |
+
- /data/e-gmd-v1.0.0/drummer1/session1
|
| 14 |
+
- /data/e-gmd-v1.0.0/drummer1/session2
|
| 15 |
+
- /data/e-gmd-v1.0.0/drummer1/session3
|
| 16 |
+
# drummer 3 sessions 1 and 2
|
| 17 |
+
- /data/e-gmd-v1.0.0/drummer3/session1
|
| 18 |
+
- /data/e-gmd-v1.0.0/drummer3/session2
|
| 19 |
+
# drummer 4 session 1
|
| 20 |
+
- /data/e-gmd-v1.0.0/drummer4/session1
|
| 21 |
+
# drummer 5 sessions 1 and 2
|
| 22 |
+
- /data/e-gmd-v1.0.0/drummer5/session1
|
| 23 |
+
- /data/e-gmd-v1.0.0/drummer5/session2
|
| 24 |
+
# drummer 6 sessions 1, 2, and 3
|
| 25 |
+
- /data/e-gmd-v1.0.0/drummer6/session1
|
| 26 |
+
- /data/e-gmd-v1.0.0/drummer6/session2
|
| 27 |
+
- /data/e-gmd-v1.0.0/drummer6/session3
|
| 28 |
+
# drummer 7 sessions 1, 2, and 3
|
| 29 |
+
- /data/e-gmd-v1.0.0/drummer7/session1
|
| 30 |
+
- /data/e-gmd-v1.0.0/drummer7/session2
|
| 31 |
+
- /data/e-gmd-v1.0.0/drummer7/session3
|
| 32 |
+
# drummer 8 session 1
|
| 33 |
+
- /data/e-gmd-v1.0.0/drummer8/session1
|
| 34 |
+
# drummer 9 session 1
|
| 35 |
+
- /data/e-gmd-v1.0.0/drummer9/session1
|
| 36 |
+
# drummer 10 session 1
|
| 37 |
+
- /data/e-gmd-v1.0.0/drummer10/session1
|
| 38 |
+
|
| 39 |
+
|
| 40 |
+
val/AudioDataset.n_examples: 500
|
| 41 |
+
val/AudioLoader.sources:
|
| 42 |
+
# drummer 1 eval session
|
| 43 |
+
- /data/e-gmd-v1.0.0/drummer1/eval_session
|
| 44 |
+
# drummer 5 eval session
|
| 45 |
+
- /data/e-gmd-v1.0.0/drummer5/eval_session
|
| 46 |
+
# drummer 7 eval session
|
| 47 |
+
- /data/e-gmd-v1.0.0/drummer7/eval_session
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
|
| 51 |
+
test/AudioDataset.n_examples: 1000
|
| 52 |
+
test/AudioLoader.sources:
|
| 53 |
+
# drummer 8 eval session
|
| 54 |
+
- /data/e-gmd-v1.0.0/drummer8/eval_session
|
conf/vampnet-maestro.yml
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
$include:
|
| 2 |
+
- conf/vampnet.yml
|
| 3 |
+
|
| 4 |
+
VampNet.embedding_dim: 512
|
| 5 |
+
VampNet.n_layers: 12
|
| 6 |
+
VampNet.n_heads: 8
|
| 7 |
+
|
| 8 |
+
AudioDataset.duration: 12.0
|
| 9 |
+
|
| 10 |
+
train/AudioDataset.n_examples: 10000000
|
| 11 |
+
train/AudioLoader.sources:
|
| 12 |
+
- /data/maestro-reorg/train
|
| 13 |
+
|
| 14 |
+
val/AudioDataset.n_examples: 500
|
| 15 |
+
val/AudioLoader.sources:
|
| 16 |
+
- /data/maestro-reorg/val
|
| 17 |
+
|
| 18 |
+
|
| 19 |
+
test/AudioDataset.n_examples: 1000
|
| 20 |
+
test/AudioLoader.sources:
|
| 21 |
+
- /data/maestro-reorg/test
|
conf/vampnet.yml
CHANGED
|
@@ -34,7 +34,7 @@ VampNet.embedding_dim: 1280
|
|
| 34 |
VampNet.n_layers: 20
|
| 35 |
VampNet.n_heads: 20
|
| 36 |
VampNet.flash_attn: false
|
| 37 |
-
VampNet.dropout: 0.
|
| 38 |
|
| 39 |
AudioLoader.relative_path: /data/
|
| 40 |
AudioDataset.loudness_cutoff: -30.0
|
|
|
|
| 34 |
VampNet.n_layers: 20
|
| 35 |
VampNet.n_heads: 20
|
| 36 |
VampNet.flash_attn: false
|
| 37 |
+
VampNet.dropout: 0.1
|
| 38 |
|
| 39 |
AudioLoader.relative_path: /data/
|
| 40 |
AudioDataset.loudness_cutoff: -30.0
|
vampnet/modules/transformer.py
CHANGED
|
@@ -445,6 +445,7 @@ class VampNet(VampBase):
|
|
| 445 |
vocab_size: int = 1024,
|
| 446 |
flash_attn: bool = True,
|
| 447 |
noise_mode: str = "mask",
|
|
|
|
| 448 |
):
|
| 449 |
super().__init__()
|
| 450 |
self.n_heads = n_heads
|
|
@@ -485,7 +486,7 @@ class VampNet(VampBase):
|
|
| 485 |
bidirectional=True,
|
| 486 |
flash_attn=flash_attn,
|
| 487 |
is_decoder=False,
|
| 488 |
-
dropout=
|
| 489 |
)
|
| 490 |
|
| 491 |
# Add final conv layer
|
|
|
|
| 445 |
vocab_size: int = 1024,
|
| 446 |
flash_attn: bool = True,
|
| 447 |
noise_mode: str = "mask",
|
| 448 |
+
dropout: float = 0.1
|
| 449 |
):
|
| 450 |
super().__init__()
|
| 451 |
self.n_heads = n_heads
|
|
|
|
| 486 |
bidirectional=True,
|
| 487 |
flash_attn=flash_attn,
|
| 488 |
is_decoder=False,
|
| 489 |
+
dropout=dropout,
|
| 490 |
)
|
| 491 |
|
| 492 |
# Add final conv layer
|