nonoJDWAOIDAWKDA committed on
Commit
2b74a9d
·
verified ·
1 Parent(s): 0501e17

Upload StyleTTS2 checkpoint epoch_2nd_00005.pth with all inference components

Browse files
README.md CHANGED
@@ -16,16 +16,16 @@ This model is a fine-tuned version of StyleTTS2, containing all necessary compon
16
  - **Base Model:** StyleTTS2-LibriTTS
17
  - **Architecture:** StyleTTS2
18
  - **Task:** Text-to-Speech
19
- - **Last Checkpoint:** epoch_2nd_00001.pth
20
 
21
  ## Training Details
22
  - **Total Epochs:** 6
23
- - **Completed Epochs:** 1
24
- - **Total Iterations:** 648
25
  - **Batch Size:** 2
26
- - **Max Length:** 630
27
  - **Learning Rate:** 0.0001
28
- - **Final Validation Loss:** 0.488410
29
 
30
  ## Model Components
31
  The repository includes all necessary components for inference:
 
16
  - **Base Model:** StyleTTS2-LibriTTS
17
  - **Architecture:** StyleTTS2
18
  - **Task:** Text-to-Speech
19
+ - **Last Checkpoint:** epoch_2nd_00005.pth
20
 
21
  ## Training Details
22
  - **Total Epochs:** 6
23
+ - **Completed Epochs:** 5
24
+ - **Total Iterations:** 1944
25
  - **Batch Size:** 2
26
+ - **Max Length:** 620
27
  - **Learning Rate:** 0.0001
28
+ - **Final Validation Loss:** 0.485287
29
 
30
  ## Model Components
31
  The repository includes all necessary components for inference:
bert.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b086f44bf311f585cf073a52518c20095ba3c090be5af2847f23c976395ce3c
3
  size 25178740
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae20fea5f2d0c5aba00d867f1ed9241e7dc164811917ab06628b1faf65cc4c91
3
  size 25178740
bert_encoder.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba91ded085853bef041882bedfd28074284af14ebaa3e31ce8826987de729303
3
  size 1576502
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31ba9acf684366042536f950897fd51cf210884cedfb27f94498b4859269aff4
3
  size 1576502
checkpoint.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00ef7d7e768fecec6721c5545482b2896bf18a35e782e32bc9501d5b695989ad
3
- size 2026454778
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15f22f7d0b4ebd58ab444ed4e44ff9b9402d36c8b42b9364ecee857cafae75ed
3
+ size 2201837262
config.json CHANGED
@@ -74,7 +74,7 @@
74
  "training_config": {
75
  "epochs": 6,
76
  "batch_size": 2,
77
- "max_len": 630,
78
  "optimizer": {
79
  "bert_lr": 1e-05,
80
  "ft_lr": 0.0001,
@@ -112,9 +112,9 @@
112
  "val_data": "Data/val_list.txt"
113
  },
114
  "model_state": {
115
- "epoch": 1,
116
- "iterations": 648,
117
- "val_loss": 0.48840951919555664
118
  },
119
  "training_metrics": {
120
  "train_loss": [],
@@ -162,7 +162,13 @@
162
  42.0,
163
  16.0,
164
  5.0,
165
- 35.0
 
 
 
 
 
 
166
  ],
167
  "dur_loss": [
168
  0.502,
@@ -208,7 +214,13 @@
208
  0.445,
209
  0.439,
210
  0.524,
211
- 0.488
 
 
 
 
 
 
212
  ],
213
  "F0_loss": [
214
  1.759,
@@ -254,7 +266,13 @@
254
  1.443,
255
  1.441,
256
  1.573,
257
- 1.585
 
 
 
 
 
 
258
  ],
259
  "epochs": [
260
  1,
@@ -300,7 +318,13 @@
300
  41,
301
  42,
302
  43,
303
- 44
 
 
 
 
 
 
304
  ]
305
  }
306
  }
 
74
  "training_config": {
75
  "epochs": 6,
76
  "batch_size": 2,
77
+ "max_len": 620,
78
  "optimizer": {
79
  "bert_lr": 1e-05,
80
  "ft_lr": 0.0001,
 
112
  "val_data": "Data/val_list.txt"
113
  },
114
  "model_state": {
115
+ "epoch": 5,
116
+ "iterations": 1944,
117
+ "val_loss": 0.48528674244880676
118
  },
119
  "training_metrics": {
120
  "train_loss": [],
 
162
  42.0,
163
  16.0,
164
  5.0,
165
+ 35.0,
166
+ 13.0,
167
+ 51.0,
168
+ 4.0,
169
+ 27.0,
170
+ 44.0,
171
+ 16.0
172
  ],
173
  "dur_loss": [
174
  0.502,
 
214
  0.445,
215
  0.439,
216
  0.524,
217
+ 0.488,
218
+ 0.495,
219
+ 0.486,
220
+ 0.488,
221
+ 0.494,
222
+ 0.484,
223
+ 0.485
224
  ],
225
  "F0_loss": [
226
  1.759,
 
266
  1.443,
267
  1.441,
268
  1.573,
269
+ 1.585,
270
+ 1.659,
271
+ 1.654,
272
+ 1.68,
273
+ 1.614,
274
+ 1.596,
275
+ 1.552
276
  ],
277
  "epochs": [
278
  1,
 
318
  41,
319
  42,
320
  43,
321
+ 44,
322
+ 45,
323
+ 46,
324
+ 47,
325
+ 48,
326
+ 49,
327
+ 50
328
  ]
329
  }
330
  }
decoder.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1785d4f41b6cea59ac0830c67d43f9c5a0d91df94f218ac6f4682839b87432da
3
  size 217409318
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a309dff51e689b9cd56001575287ab933de233e7ca777c8ffd6da77dac83da63
3
  size 217409318
diffusion.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8cf771d99fcfdfab7e0c2c905813f6846829d465b7167da29dbbbc267d4793af
3
  size 87699504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bee50db80c722cf72dfc28ce53bd8be86df7bd9d13ae56350587ac89bcc3c97b
3
  size 87699504
mpd.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e62deedbbc57b8bc824a2d0f7765ce106fd58344f7bedbb4c6d93a31d8908f7f
3
  size 164447824
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a59c4b2d4bdaa05a9b64f5b3d67fac6e06dfa91cc2e649f7107ea172a3f50a0e
3
  size 164447824
msd.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fdad23273ae36500d80a90f4ffdf172b145dbb1f2384b1a92b8d470e881d6b53
3
  size 1139020
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85130e48dedb76fa77ece85eea6f7f35420c40e8ff4e894f02ca2c7451d659e6
3
  size 1139020
predictor.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29e5b9ef7a2ac2c286317b86b1626098f8abbe9ad9b2b3caa638711435e10755
3
  size 64813639
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44d1eb7b58570cc0137e4e77a9b2f9cf7c9e0a0a28fb79eea13c0916c12a3e0f
3
  size 64813639
predictor_encoder.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01a28c748d50e14bd662beaecb6a60682559fb6de5778ad5c614fe1fdda7e9bc
3
  size 55547155
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87dd4dd75a97524c1e8fbf8731b91f1e20d9e8546e4b256ccc1fc651941a2a5d
3
  size 55547155
style_encoder.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06b5682a776988c64de0a5d53c7e55f7ac05692cda6006f6596b1648681842f5
3
  size 55546871
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3df89b7cbde89bbc338a27f5688e665bb765dbf80cf1f85135f356d90e36db07
3
  size 55546871
text_aligner.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13ee1d58f1389f969a8035ba762ae656005b2dff7278c87ab59dbcd60a28f448
3
  size 31531315
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3391b0d11ea3cb9e79f17e111fbcac63f7e6e0c192239332fc625ada4b43ba6
3
  size 31531315
text_encoder.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a4817057f30f702acbeae12cac5c0ad3611cd32d62e9ca05e842aaa60e7c35b
3
  size 22432460
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e005aa7145a3231658c7b50932c294d81b8f198ac2591f8f0c3e2429b035ad63
3
  size 22432460
training_metrics.png CHANGED