Commit
·
ed407bf
1
Parent(s):
0b9d6a7
Delete hyperparams.yaml
Browse files- hyperparams.yaml +0 -120
hyperparams.yaml
DELETED
@@ -1,120 +0,0 @@
|
|
1 |
-
# ################################
|
2 |
-
# Model: Fastspeech2 for TTS
|
3 |
-
# Authors: Sathvik Udupa, Yingzhi Wang
|
4 |
-
# ################################
|
5 |
-
n_symbols: 62 # fixed, depending on the symbols in textToSequence
|
6 |
-
n_mel_channels: 80
|
7 |
-
padding_idx: 0
|
8 |
-
|
9 |
-
# Encoder parameters
|
10 |
-
enc_num_layers: 4
|
11 |
-
enc_num_head: 2
|
12 |
-
enc_d_model: 384
|
13 |
-
enc_ffn_dim: 1024
|
14 |
-
enc_k_dim: 384
|
15 |
-
enc_v_dim: 384
|
16 |
-
enc_dropout: 0.1
|
17 |
-
|
18 |
-
# Decoder parameters
|
19 |
-
dec_num_layers: 4
|
20 |
-
dec_num_head: 2
|
21 |
-
dec_d_model: 384
|
22 |
-
dec_ffn_dim: 1024
|
23 |
-
dec_k_dim: 384
|
24 |
-
dec_v_dim: 384
|
25 |
-
dec_dropout: 0.1
|
26 |
-
|
27 |
-
# common
|
28 |
-
normalize_before: True
|
29 |
-
ffn_type: 1dcnn #1dcnn or ffn
|
30 |
-
dur_pred_kernel_size: 3
|
31 |
-
pitch_pred_kernel_size: 3
|
32 |
-
energy_pred_kernel_size: 3
|
33 |
-
|
34 |
-
model: !new:speechbrain.lobes.models.FastSpeech2.FastSpeech2
|
35 |
-
enc_num_layers: !ref <enc_num_layers>
|
36 |
-
enc_num_head: !ref <enc_num_head>
|
37 |
-
enc_d_model: !ref <enc_d_model>
|
38 |
-
enc_ffn_dim: !ref <enc_ffn_dim>
|
39 |
-
enc_k_dim: !ref <enc_k_dim>
|
40 |
-
enc_v_dim: !ref <enc_v_dim>
|
41 |
-
enc_dropout: !ref <enc_dropout>
|
42 |
-
dec_num_layers: !ref <dec_num_layers>
|
43 |
-
dec_num_head: !ref <dec_num_head>
|
44 |
-
dec_d_model: !ref <dec_d_model>
|
45 |
-
dec_ffn_dim: !ref <dec_ffn_dim>
|
46 |
-
dec_k_dim: !ref <dec_k_dim>
|
47 |
-
dec_v_dim: !ref <dec_v_dim>
|
48 |
-
dec_dropout: !ref <dec_dropout>
|
49 |
-
normalize_before: !ref <normalize_before>
|
50 |
-
ffn_type: !ref <ffn_type>
|
51 |
-
n_char: !ref <n_symbols>
|
52 |
-
n_mels: !ref <n_mel_channels>
|
53 |
-
padding_idx: !ref <padding_idx>
|
54 |
-
dur_pred_kernel_size: !ref <dur_pred_kernel_size>
|
55 |
-
pitch_pred_kernel_size: !ref <pitch_pred_kernel_size>
|
56 |
-
energy_pred_kernel_size: !ref <energy_pred_kernel_size>
|
57 |
-
|
58 |
-
# The lexicon file must be the same one that was used for training
|
59 |
-
lexicon:
|
60 |
-
- "t"
|
61 |
-
- "?"
|
62 |
-
- "q"
|
63 |
-
- "j"
|
64 |
-
- "g"
|
65 |
-
- "p"
|
66 |
-
- "x"
|
67 |
-
- "("
|
68 |
-
- "é"
|
69 |
-
- "e"
|
70 |
-
- "z"
|
71 |
-
- ","
|
72 |
-
- "o"
|
73 |
-
- "a"
|
74 |
-
- "m"
|
75 |
-
- "n"
|
76 |
-
- "u"
|
77 |
-
- "d"
|
78 |
-
- ":"
|
79 |
-
- "w"
|
80 |
-
- "à"
|
81 |
-
- "“"
|
82 |
-
- "."
|
83 |
-
- "”"
|
84 |
-
- "’"
|
85 |
-
- "["
|
86 |
-
- "v"
|
87 |
-
- "h"
|
88 |
-
- " "
|
89 |
-
- "ê"
|
90 |
-
- "b"
|
91 |
-
- "'"
|
92 |
-
- "\""
|
93 |
-
- "f"
|
94 |
-
- "â"
|
95 |
-
- "!"
|
96 |
-
- ";"
|
97 |
-
- "l"
|
98 |
-
- "r"
|
99 |
-
- "è"
|
100 |
-
- "i"
|
101 |
-
- "]"
|
102 |
-
- "s"
|
103 |
-
- "k"
|
104 |
-
- "y"
|
105 |
-
- ")"
|
106 |
-
- "c"
|
107 |
-
- "ü"
|
108 |
-
- "-"
|
109 |
-
|
110 |
-
|
111 |
-
input_encoder: !new:speechbrain.dataio.encoder.TextEncoder
|
112 |
-
|
113 |
-
|
114 |
-
modules:
|
115 |
-
model: !ref <model>
|
116 |
-
|
117 |
-
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
|
118 |
-
loadables:
|
119 |
-
model: !ref <model>
|
120 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|