sob111 committed on
Commit
46b2d52
·
verified ·
1 Parent(s): b009c70

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +31 -34
config.json CHANGED
@@ -1,44 +1,41 @@
1
  {
2
- "model": "xtts_v2",
 
3
  "output_path": "./output_model",
4
- "restore_path": null,
5
  "datasets": [
6
  {
7
- "formatter": "coqui",
8
  "meta_file_train": "./voxpopuli_es_500/metadata.json",
9
  "path": "./voxpopuli_es_500/wav_data",
10
  "language": "es"
11
  }
12
  ],
13
- "trainer": {
14
- "max_epochs": 5,
15
- "batch_size": 4,
16
- "save_step": 100,
17
- "log_step": 10,
18
- "eval_step": 100,
19
- "mixed_precision": true,
20
- "num_loader_workers": 4,
21
- "eval_split_max_size": 50,
22
- "run_eval": true
23
- },
24
- "audio": {
25
- "sample_rate": 22050,
26
- "win_length": 1024,
27
- "hop_length": 256,
28
- "fft_size": 1024,
29
- "mel_fmin": 0,
30
- "mel_fmax": 8000
31
- },
32
- "optimizer": {
33
- "type": "adam",
34
- "lr": 0.0001,
35
- "weight_decay": 0.0
36
- },
37
- "lr_scheduler": {
38
- "type": "step",
39
- "step_size": 1000,
40
- "gamma": 0.5
41
- },
42
- "use_cuda": true,
43
- "seed": 42
44
  }
 
1
  {
2
+ "model": "xtts",
3
+ "run_name": "xttsv2_finetune_es",
4
  "output_path": "./output_model",
 
5
  "datasets": [
6
  {
7
+ "formatter": "json",
8
  "meta_file_train": "./voxpopuli_es_500/metadata.json",
9
  "path": "./voxpopuli_es_500/wav_data",
10
  "language": "es"
11
  }
12
  ],
13
+ "batch_size": 4,
14
+ "eval_batch_size": 4,
15
+ "num_loader_workers": 2,
16
+ "num_eval_loader_workers": 1,
17
+ "run_eval": true,
18
+ "test_delay_epochs": 1,
19
+ "epochs": 5,
20
+ "save_step": 100,
21
+ "print_step": 25,
22
+ "eval_step": 100,
23
+ "mixed_precision": true,
24
+ "cudnn_benchmark": true,
25
+ "lr": 1e-4,
26
+ "grad_clip": 5.0,
27
+ "loss_masking": true,
28
+ "use_speaker_embedding": true,
29
+ "compute_input_seq_cache": true,
30
+ "eval_split_size": 0.05,
31
+ "text_cleaner": "multilingual_cleaners",
32
+ "use_phonemes": false,
33
+ "phoneme_language": "es",
34
+ "min_text_len": 1,
35
+ "max_text_len": 200,
36
+ "min_audio_len": 1000,
37
+ "max_audio_len": 160000,
38
+ "output_step": 25,
39
+ "logger": "tensorboard",
40
+ "seed": 1234
 
 
 
41
  }