patriotyk committed on
Commit
648aa98
·
verified ·
1 Parent(s): d196075

Create config.yml

Browse files
Files changed (1) hide show
  1. config.yml +52 -0
config.yml ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ plbert_params:
2
+ vocab_size: 171
3
+ hidden_size: 768
4
+ num_attention_heads: 12
5
+ intermediate_size: 2048
6
+ max_position_embeddings: 512
7
+ num_hidden_layers: 12
8
+ dropout: 0.1
9
+
10
+
11
+ model_params:
12
+ multispeaker: true
13
+ vocab: "$;:,.!?¡¿—…\"«»“” ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyzɑɐɒæɓʙβɔɕçɗɖðʤəɘɚɛɜɝɞɟʄɡɠɢʛɦɧħɥʜɨɪʝɭɬɫɮʟɱɯɰŋɳɲɴøɵɸθœɶʘɹɺɾɻʀʁɽʂʃʈʧʉʊʋⱱʌɣɤʍχʎʏʑʐʒʔʡʕʢǀǁǂǃˈˌːˑʼʴʰʱʲʷˠˤ˞↓↑→↗↘'̩'ᵻ"
14
+
15
+ dim_in: 64
16
+ hidden_dim: 512
17
+ max_conv_dim: 512
18
+ n_layer: 3
19
+ n_mels: 80
20
+
21
+ n_token: 171 # number of phoneme tokens
22
+ max_dur: 50 # maximum duration of a single phoneme
23
+ style_dim: 128 # style vector size
24
+
25
+ dropout: 0.0
26
+
27
+ # decoder config
28
+ decoder:
29
+ type: 'hifigan' # either hifigan or istftnet
30
+ resblock_kernel_sizes: [3,7,11]
31
+ upsample_rates : [10,5,3,2]
32
+ upsample_initial_channel: 512
33
+ resblock_dilation_sizes: [[1,3,5], [1,3,5], [1,3,5]]
34
+ upsample_kernel_sizes: [20,10,6,4]
35
+
36
+
37
+ # style diffusion model config
38
+ diffusion:
39
+ embedding_mask_proba: 0.1
40
+ # transformer config
41
+ transformer:
42
+ num_layers: 3
43
+ num_heads: 8
44
+ head_features: 64
45
+ multiplier: 2
46
+
47
+ # diffusion distribution config
48
+ dist:
49
+ sigma_data: 0.19988229232390187
50
+ mean: -4.0
51
+ std: 4.0
52
+