mtauro committed on
Commit
235b080
1 Parent(s): 36495c5

Upload hyperparams.yaml

Browse files
Files changed (1) hide show
  1. hyperparams.yaml +65 -0
hyperparams.yaml ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ############################################################################
2
+ # Model: WavLM large (loaded via the HuggingFaceWav2Vec2 wrapper) for Emotion Recognition
3
+ # ############################################################################
4
+ # Hparams Needed
5
+ HPARAMS_NEEDED: [ "out_n_neurons", "label_encoder", ]
6
+ # Modules Needed
7
+ MODULES_NEEDED: ["transf", "avg_pool", "enc", 'classifier']
8
+
9
+ # Feature parameters
10
+ wavlm_hub: "microsoft/wavlm-large"
11
+
12
+ # Pretrained checkpoint folder (HuggingFace)
13
+ pretrained_path: "mtauro/wavlm_vrs_ck_iva_k492"
14
+
15
+ # parameters
16
+ #encoder_dim: 768
17
+ out_n_neurons: 2
18
+
19
+ transf: !new:speechbrain.lobes.models.huggingface_wav2vec.HuggingFaceWav2Vec2
20
+ source: !ref <wavlm_hub>
21
+ save_path: wavlm_checkpoint
22
+
23
+ avg_pool: !new:speechbrain.nnet.pooling.StatisticsPooling
24
+ return_std: False
25
+
26
+ enc: !new:speechbrain.lobes.models.VanillaNN.VanillaNN
27
+ input_shape: [null, null, 1024]
28
+ dnn_blocks: 1
29
+ dnn_neurons: 1024 # this is the output size of the 3rd (last) dimension
30
+
31
+
32
+ classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
33
+ input_size: 1024 # 192 for ECAPA, double number of channels
34
+ out_neurons: !ref <out_n_neurons>
35
+
36
+ softmax: !new:speechbrain.nnet.activations.Softmax
37
+
38
+ model: !new:torch.nn.ModuleList
39
+ - [!ref <avg_pool>, !ref <enc>, !ref <classifier>]
40
+
41
+ modules:
42
+ transf: !ref <transf>
43
+ avg_pool: !ref <avg_pool>
44
+ enc: !ref <enc>
45
+ classifier: !ref <classifier>
46
+
47
+
48
+ label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
49
+
50
+
51
+ pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
52
+ loadables:
53
+ transf: !ref <transf>
54
+ avg_pool: !ref <avg_pool>
55
+ enc: !ref <enc>
56
+ classifier: !ref <classifier>
57
+ label_encoder: !ref <label_encoder>
58
+ paths:
59
+ transf: !ref <pretrained_path>/transf.ckpt
60
+ avg_pool: !ref <pretrained_path>/avg_pool.ckpt
61
+ enc: !ref <pretrained_path>/enc.ckpt
62
+ classifier: !ref <pretrained_path>/classifier.ckpt
63
+ label_encoder: !ref <pretrained_path>/label_encoder.txt
64
+
65
+