flexthink
/

ttseval-wavlm-transformer

Model card Files Files and versions

flexthink committed on Feb 29, 2024

Commit

c33d085

·

1 Parent(s): 772ca28

Initial import of the model

Files changed (2) hide show

hyperparams.yaml +57 -0
model.ckpt +3 -0

hyperparams.yaml ADDED Viewed

	@@ -0,0 +1,57 @@

+# ############################################################################
+# Model: TTS evaluation - pretrained WavLM encoder with a Transformer regression head
+# Authors:  Artem Ploujnikov, Yingzhi Wang
+# ############################################################################
+# Seed needs to be set at top of yaml, before objects with parameters are instantiated
+seed: 42
+__set_seed: !apply:torch.manual_seed [!ref <seed>]  # !apply calls torch.manual_seed(<seed>) while this YAML is being loaded
+train_regression_metric: True  # not referenced elsewhere in this file; presumably read by the training script - TODO confirm
+batch_size: 4  # not referenced elsewhere in this file
+num_workers: 4  # not referenced elsewhere in this file
+src_sample_rate: 24000  # presumably the sample rate (Hz) of the source audio - TODO confirm
+tgt_sample_rate: 16000  # presumably the rate (Hz) audio is resampled to before the encoder - TODO confirm
+contrastive: False  # not referenced elsewhere in this file
+lr: 0.00001  # not referenced elsewhere in this file; no optimizer is defined here
+number_of_epochs: 10  # not referenced elsewhere in this file
+ckpt_interval_minutes: 15  # not referenced elsewhere in this file
+activation: !name:torch.nn.LeakyReLU  # !name hands over the callable itself, not an instance
+d_model: 512  # forwarded to TransformerRegression below
+d_ffn: 2048  # forwarded to TransformerRegression below
+num_layers: 3  # forwarded to TransformerRegression below
+nhead: 4  # forwarded to TransformerRegression below
+dropout: 0.5  # forwarded to TransformerRegression below
+wavlm_source: microsoft/wavlm-large  # passed as `source` to the WavLM wrapper below
+wavlm_save_path: .  # passed as `save_path` to the WavLM wrapper; "." is the current working directory
+splits: ["train", "valid", "test"]  # not referenced elsewhere in this file
+subset: "full"  # not referenced elsewhere in this file
+skip_prep: False  # not referenced elsewhere in this file
+wavlm: !new:speechbrain.lobes.models.huggingface_transformers.wavlm.WavLM  # !new instantiates the class with the keyword arguments below
+  source: !ref <wavlm_source>
+  output_norm: True
+  save_path: !ref <wavlm_save_path>
+model: !new:speechbrain.lobes.models.eval.ssl.TransformerRegression  # regression model; receives the WavLM instance as base_model
+  base_model: !ref <wavlm>
+  d_model: !ref <d_model>
+  d_ffn: !ref <d_ffn>
+  num_layers: !ref <num_layers>
+  nhead: !ref <nhead>
+  dropout: !ref <dropout>
+  activation: !ref <activation>
+modules:  # mapping that exposes the model under the key "model"
+  model: !ref <model>
+pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer  # registers <model> as the only loadable
+    loadables:
+        model: !ref <model>  # key "model" presumably pairs with the model.ckpt file in this commit - TODO confirm

model.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:92a1dbd86f911d1c261b7638282f1f5ceb0aea95a7337602263ca50bf43d2374
+size 1281843773