huseinzol05 committed on
Commit
6aa5bf2
·
verified ·
1 Parent(s): 70040b3

Upload ParlerTTSForConditionalGeneration

Browse files
Files changed (2) hide show
  1. config.json +10 -38
  2. model.safetensors +2 -2
config.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
- "_name_or_path": "output_dir_training-v3/checkpoint-17000-epoch-5",
3
  "architectures": [
4
  "ParlerTTSForConditionalGeneration"
5
  ],
6
  "audio_encoder": {
7
  "_attn_implementation_autoset": false,
8
- "_name_or_path": "ylacombe/dac_44khZ_8kbps",
9
  "add_cross_attention": false,
10
  "architectures": [
11
  "DACModel"
@@ -77,7 +77,7 @@
77
  },
78
  "decoder": {
79
  "_attn_implementation_autoset": false,
80
- "_name_or_path": "/fsx/yoach/tmp/artefacts/decoder_400M/",
81
  "activation_dropout": 0.0,
82
  "activation_function": "gelu",
83
  "add_cross_attention": true,
@@ -170,7 +170,7 @@
170
  "prompt_cross_attention": false,
171
  "text_encoder": {
172
  "_attn_implementation_autoset": false,
173
- "_name_or_path": "google/flan-t5-base",
174
  "add_cross_attention": false,
175
  "architectures": [
176
  "T5ForConditionalGeneration"
@@ -181,9 +181,9 @@
181
  "chunk_size_feed_forward": 0,
182
  "classifier_dropout": 0.0,
183
  "cross_attention_hidden_size": null,
184
- "d_ff": 2048,
185
  "d_kv": 64,
186
- "d_model": 768,
187
  "decoder_start_token_id": 0,
188
  "dense_act_fn": "gelu_new",
189
  "diversity_penalty": 0.0,
@@ -218,9 +218,9 @@
218
  "no_repeat_ngram_size": 0,
219
  "num_beam_groups": 1,
220
  "num_beams": 1,
221
- "num_decoder_layers": 12,
222
- "num_heads": 12,
223
- "num_layers": 12,
224
  "num_return_sequences": 1,
225
  "output_attentions": false,
226
  "output_hidden_states": false,
@@ -238,35 +238,7 @@
238
  "return_dict_in_generate": false,
239
  "sep_token_id": null,
240
  "suppress_tokens": null,
241
- "task_specific_params": {
242
- "summarization": {
243
- "early_stopping": true,
244
- "length_penalty": 2.0,
245
- "max_length": 200,
246
- "min_length": 30,
247
- "no_repeat_ngram_size": 3,
248
- "num_beams": 4,
249
- "prefix": "summarize: "
250
- },
251
- "translation_en_to_de": {
252
- "early_stopping": true,
253
- "max_length": 300,
254
- "num_beams": 4,
255
- "prefix": "translate English to German: "
256
- },
257
- "translation_en_to_fr": {
258
- "early_stopping": true,
259
- "max_length": 300,
260
- "num_beams": 4,
261
- "prefix": "translate English to French: "
262
- },
263
- "translation_en_to_ro": {
264
- "early_stopping": true,
265
- "max_length": 300,
266
- "num_beams": 4,
267
- "prefix": "translate English to Romanian: "
268
- }
269
- },
270
  "temperature": 1.0,
271
  "tf_legacy_loss": false,
272
  "tie_encoder_decoder": false,
 
1
  {
2
+ "_name_or_path": "output_mini/checkpoint-16000-epoch-4",
3
  "architectures": [
4
  "ParlerTTSForConditionalGeneration"
5
  ],
6
  "audio_encoder": {
7
  "_attn_implementation_autoset": false,
8
+ "_name_or_path": "parler-tts/dac_44khZ_8kbps",
9
  "add_cross_attention": false,
10
  "architectures": [
11
  "DACModel"
 
77
  },
78
  "decoder": {
79
  "_attn_implementation_autoset": false,
80
+ "_name_or_path": "/fsx/yoach/tmp/artefacts/parler-tts-mini/decoder",
81
  "activation_dropout": 0.0,
82
  "activation_function": "gelu",
83
  "add_cross_attention": true,
 
170
  "prompt_cross_attention": false,
171
  "text_encoder": {
172
  "_attn_implementation_autoset": false,
173
+ "_name_or_path": "google/flan-t5-large",
174
  "add_cross_attention": false,
175
  "architectures": [
176
  "T5ForConditionalGeneration"
 
181
  "chunk_size_feed_forward": 0,
182
  "classifier_dropout": 0.0,
183
  "cross_attention_hidden_size": null,
184
+ "d_ff": 2816,
185
  "d_kv": 64,
186
+ "d_model": 1024,
187
  "decoder_start_token_id": 0,
188
  "dense_act_fn": "gelu_new",
189
  "diversity_penalty": 0.0,
 
218
  "no_repeat_ngram_size": 0,
219
  "num_beam_groups": 1,
220
  "num_beams": 1,
221
+ "num_decoder_layers": 24,
222
+ "num_heads": 16,
223
+ "num_layers": 24,
224
  "num_return_sequences": 1,
225
  "output_attentions": false,
226
  "output_hidden_states": false,
 
238
  "return_dict_in_generate": false,
239
  "sep_token_id": null,
240
  "suppress_tokens": null,
241
+ "task_specific_params": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
242
  "temperature": 1.0,
243
  "tf_legacy_loss": false,
244
  "tie_encoder_decoder": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7837edd27e2d71b7979cdcb8fa9d00f7dc71d99c40f91595ba1308fef0d0d71
3
- size 2588219296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a1b5b96a4c1232a4420bc95b352067b13000f2673903e8fa09785db77abba79
3
+ size 3511494464