Upload StyleTTS2 checkpoint epoch_2nd_00005.pth with all inference components
Browse files
- README.md +5 -5
- bert.pth +1 -1
- bert_encoder.pth +1 -1
- checkpoint.pth +2 -2
- config.json +32 -8
- decoder.pth +1 -1
- diffusion.pth +1 -1
- mpd.pth +1 -1
- msd.pth +1 -1
- predictor.pth +1 -1
- predictor_encoder.pth +1 -1
- style_encoder.pth +1 -1
- text_aligner.pth +1 -1
- text_encoder.pth +1 -1
- training_metrics.png +0 -0
README.md
CHANGED
@@ -16,16 +16,16 @@ This model is a fine-tuned version of StyleTTS2, containing all necessary compon
|
|
16 |
- **Base Model:** StyleTTS2-LibriTTS
|
17 |
- **Architecture:** StyleTTS2
|
18 |
- **Task:** Text-to-Speech
|
19 |
-
- **Last Checkpoint:**
|
20 |
|
21 |
## Training Details
|
22 |
- **Total Epochs:** 6
|
23 |
-
- **Completed Epochs:**
|
24 |
-
- **Total Iterations:**
|
25 |
- **Batch Size:** 2
|
26 |
-
- **Max Length:**
|
27 |
- **Learning Rate:** 0.0001
|
28 |
-
- **Final Validation Loss:** 0.
|
29 |
|
30 |
## Model Components
|
31 |
The repository includes all necessary components for inference:
|
|
|
16 |
- **Base Model:** StyleTTS2-LibriTTS
|
17 |
- **Architecture:** StyleTTS2
|
18 |
- **Task:** Text-to-Speech
|
19 |
+
- **Last Checkpoint:** epoch_2nd_00005.pth
|
20 |
|
21 |
## Training Details
|
22 |
- **Total Epochs:** 6
|
23 |
+
- **Completed Epochs:** 5
|
24 |
+
- **Total Iterations:** 1944
|
25 |
- **Batch Size:** 2
|
26 |
+
- **Max Length:** 620
|
27 |
- **Learning Rate:** 0.0001
|
28 |
+
- **Final Validation Loss:** 0.485287
|
29 |
|
30 |
## Model Components
|
31 |
The repository includes all necessary components for inference:
|
bert.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 25178740
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae20fea5f2d0c5aba00d867f1ed9241e7dc164811917ab06628b1faf65cc4c91
|
3 |
size 25178740
|
bert_encoder.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1576502
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31ba9acf684366042536f950897fd51cf210884cedfb27f94498b4859269aff4
|
3 |
size 1576502
|
checkpoint.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15f22f7d0b4ebd58ab444ed4e44ff9b9402d36c8b42b9364ecee857cafae75ed
|
3 |
+
size 2201837262
|
config.json
CHANGED
@@ -74,7 +74,7 @@
|
|
74 |
"training_config": {
|
75 |
"epochs": 6,
|
76 |
"batch_size": 2,
|
77 |
-
"max_len":
|
78 |
"optimizer": {
|
79 |
"bert_lr": 1e-05,
|
80 |
"ft_lr": 0.0001,
|
@@ -112,9 +112,9 @@
|
|
112 |
"val_data": "Data/val_list.txt"
|
113 |
},
|
114 |
"model_state": {
|
115 |
-
"epoch":
|
116 |
-
"iterations":
|
117 |
-
"val_loss": 0.
|
118 |
},
|
119 |
"training_metrics": {
|
120 |
"train_loss": [],
|
@@ -162,7 +162,13 @@
|
|
162 |
42.0,
|
163 |
16.0,
|
164 |
5.0,
|
165 |
-
35.0
|
|
|
|
|
|
|
|
|
|
|
|
|
166 |
],
|
167 |
"dur_loss": [
|
168 |
0.502,
|
@@ -208,7 +214,13 @@
|
|
208 |
0.445,
|
209 |
0.439,
|
210 |
0.524,
|
211 |
-
0.488
|
|
|
|
|
|
|
|
|
|
|
|
|
212 |
],
|
213 |
"F0_loss": [
|
214 |
1.759,
|
@@ -254,7 +266,13 @@
|
|
254 |
1.443,
|
255 |
1.441,
|
256 |
1.573,
|
257 |
-
1.585
|
|
|
|
|
|
|
|
|
|
|
|
|
258 |
],
|
259 |
"epochs": [
|
260 |
1,
|
@@ -300,7 +318,13 @@
|
|
300 |
41,
|
301 |
42,
|
302 |
43,
|
303 |
-
44
|
|
|
|
|
|
|
|
|
|
|
|
|
304 |
]
|
305 |
}
|
306 |
}
|
|
|
74 |
"training_config": {
|
75 |
"epochs": 6,
|
76 |
"batch_size": 2,
|
77 |
+
"max_len": 620,
|
78 |
"optimizer": {
|
79 |
"bert_lr": 1e-05,
|
80 |
"ft_lr": 0.0001,
|
|
|
112 |
"val_data": "Data/val_list.txt"
|
113 |
},
|
114 |
"model_state": {
|
115 |
+
"epoch": 5,
|
116 |
+
"iterations": 1944,
|
117 |
+
"val_loss": 0.48528674244880676
|
118 |
},
|
119 |
"training_metrics": {
|
120 |
"train_loss": [],
|
|
|
162 |
42.0,
|
163 |
16.0,
|
164 |
5.0,
|
165 |
+
35.0,
|
166 |
+
13.0,
|
167 |
+
51.0,
|
168 |
+
4.0,
|
169 |
+
27.0,
|
170 |
+
44.0,
|
171 |
+
16.0
|
172 |
],
|
173 |
"dur_loss": [
|
174 |
0.502,
|
|
|
214 |
0.445,
|
215 |
0.439,
|
216 |
0.524,
|
217 |
+
0.488,
|
218 |
+
0.495,
|
219 |
+
0.486,
|
220 |
+
0.488,
|
221 |
+
0.494,
|
222 |
+
0.484,
|
223 |
+
0.485
|
224 |
],
|
225 |
"F0_loss": [
|
226 |
1.759,
|
|
|
266 |
1.443,
|
267 |
1.441,
|
268 |
1.573,
|
269 |
+
1.585,
|
270 |
+
1.659,
|
271 |
+
1.654,
|
272 |
+
1.68,
|
273 |
+
1.614,
|
274 |
+
1.596,
|
275 |
+
1.552
|
276 |
],
|
277 |
"epochs": [
|
278 |
1,
|
|
|
318 |
41,
|
319 |
42,
|
320 |
43,
|
321 |
+
44,
|
322 |
+
45,
|
323 |
+
46,
|
324 |
+
47,
|
325 |
+
48,
|
326 |
+
49,
|
327 |
+
50
|
328 |
]
|
329 |
}
|
330 |
}
|
decoder.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 217409318
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a309dff51e689b9cd56001575287ab933de233e7ca777c8ffd6da77dac83da63
|
3 |
size 217409318
|
diffusion.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 87699504
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bee50db80c722cf72dfc28ce53bd8be86df7bd9d13ae56350587ac89bcc3c97b
|
3 |
size 87699504
|
mpd.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 164447824
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a59c4b2d4bdaa05a9b64f5b3d67fac6e06dfa91cc2e649f7107ea172a3f50a0e
|
3 |
size 164447824
|
msd.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1139020
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85130e48dedb76fa77ece85eea6f7f35420c40e8ff4e894f02ca2c7451d659e6
|
3 |
size 1139020
|
predictor.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 64813639
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44d1eb7b58570cc0137e4e77a9b2f9cf7c9e0a0a28fb79eea13c0916c12a3e0f
|
3 |
size 64813639
|
predictor_encoder.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 55547155
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87dd4dd75a97524c1e8fbf8731b91f1e20d9e8546e4b256ccc1fc651941a2a5d
|
3 |
size 55547155
|
style_encoder.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 55546871
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3df89b7cbde89bbc338a27f5688e665bb765dbf80cf1f85135f356d90e36db07
|
3 |
size 55546871
|
text_aligner.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 31531315
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3391b0d11ea3cb9e79f17e111fbcac63f7e6e0c192239332fc625ada4b43ba6
|
3 |
size 31531315
|
text_encoder.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 22432460
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e005aa7145a3231658c7b50932c294d81b8f198ac2591f8f0c3e2429b035ad63
|
3 |
size 22432460
|
training_metrics.png
CHANGED
![]() |
![]() |