AmitMY committed on
Commit
4525eff
·
verified ·
1 Parent(s): b1f5033

Upload folder using huggingface_hub

Browse files
Files changed (6) hide show
  1. args.yaml +9 -9
  2. config +102 -96
  3. metrics +0 -0
  4. params.best +2 -2
  5. tokenizer.json +0 -0
  6. vocab.src.0.json +0 -0
args.yaml CHANGED
@@ -83,11 +83,11 @@ optimizer_betas:
83
  - 0.9
84
  - 0.999
85
  optimizer_eps: 1.0e-08
86
- output: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-v2/model
87
  overwrite_output: false
88
  pad_vocab_to_multiple_of: 8
89
- params: null
90
- prepared_data: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-v2/train_data
91
  quiet: false
92
  quiet_secondary_workers: false
93
  seed: 1
@@ -152,14 +152,14 @@ transformer_preprocess:
152
  - n
153
  update_interval: 1
154
  use_cpu: false
155
- validation_source: /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/source.txt
156
  validation_source_factors: []
157
- validation_target: /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_0.txt
158
  validation_target_factors:
159
- - /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_1.txt
160
- - /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_2.txt
161
- - /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_3.txt
162
- - /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_4.txt
163
  weight_decay: 0.0
164
  weight_tying_type: trg_softmax
165
  word_min_count:
 
83
  - 0.9
84
  - 0.999
85
  optimizer_eps: 1.0e-08
86
+ output: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-tuned/model
87
  overwrite_output: false
88
  pad_vocab_to_multiple_of: 8
89
+ params: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-v4/model/params.best
90
+ prepared_data: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-tuned/train_data
91
  quiet: false
92
  quiet_secondary_workers: false
93
  seed: 1
 
152
  - n
153
  update_interval: 1
154
  use_cpu: false
155
+ validation_source: /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/source.txt
156
  validation_source_factors: []
157
+ validation_target: /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_0.txt
158
  validation_target_factors:
159
+ - /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_1.txt
160
+ - /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_2.txt
161
+ - /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_3.txt
162
+ - /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_4.txt
163
  weight_decay: 0.0
164
  weight_tying_type: trg_softmax
165
  word_min_count:
config CHANGED
@@ -2,29 +2,30 @@
2
  config_data: !DataConfig
3
  data_statistics: !DataStatistics
4
  average_len_target_per_bucket:
5
- - 6.043404555083469
6
- - 10.519883768009015
7
- - 18.59887856456265
8
- - 26.278671761476776
9
- - 33.190033876079
10
- - 41.83887781695534
11
- - 51.24769950218732
12
- - 59.783405313440575
13
- - 68.16214942257864
14
- - 75.68928386092358
15
- - 82.77250900360164
16
- - 18.47619047619048
17
- - 8.058823529411766
18
- - 5.647058823529413
19
- - 9.5
20
- - 8.499999999999998
21
- - 5.0
22
- - 6.444444444444445
23
- - null
24
- - 5.0
25
- - null
26
- - null
27
- - null
 
28
  - null
29
  - null
30
  - null
@@ -39,7 +40,6 @@ config_data: !DataConfig
39
  - null
40
  - null
41
  - null
42
- - 6.0
43
  - null
44
  - null
45
  - null
@@ -263,67 +263,79 @@ config_data: !DataConfig
263
  - !!python/tuple
264
  - 513
265
  - 513
266
- length_ratio_mean: 1.488763422684226
267
  length_ratio_stats_per_bucket:
268
  - !!python/tuple
269
- - 1.172606268110977
270
- - 0.3198943487302755
271
  - !!python/tuple
272
- - 1.7758876999918463
273
- - 0.6634649712813119
274
  - !!python/tuple
275
- - 2.667916151313991
276
- - 1.011426597835219
277
  - !!python/tuple
278
- - 3.173004208160318
279
- - 1.618051536035044
280
  - !!python/tuple
281
- - 3.3799284759654693
282
- - 2.4421821481902017
283
  - !!python/tuple
284
- - 3.5445340678088186
285
- - 2.377062423666999
286
  - !!python/tuple
287
- - 3.870005889139779
288
- - 2.8520973384152954
289
  - !!python/tuple
290
- - 3.6032825677516436
291
- - 2.6820622916732426
292
  - !!python/tuple
293
- - 3.672787931128752
294
- - 2.7023842818124146
295
  - !!python/tuple
296
- - 3.807871945448423
297
- - 2.9154974163883414
298
  - !!python/tuple
299
- - 3.5339756014008112
300
- - 2.253656007685683
301
  - !!python/tuple
302
- - 0.19909941868381043
303
- - 0.2555613448334357
304
  - !!python/tuple
305
- - 0.08097343381798354
306
- - 0.02276102142801515
307
  - !!python/tuple
308
- - 0.05189939313382113
309
- - 0.014368277929717775
310
  - !!python/tuple
311
- - 0.08091857432628224
312
- - 0.052824789190560516
313
  - !!python/tuple
314
- - 0.06762976914376581
315
- - 0.015451689277268104
316
  - !!python/tuple
317
- - 0.03788218925017831
318
- - 0.0054846792633349494
319
  - !!python/tuple
320
- - 0.0463036569542669
321
- - 0.0098489446540238
 
 
 
322
  - &id001 !!python/tuple
323
  - null
324
  - null
325
  - !!python/tuple
326
- - 0.032679738562091505
 
 
 
 
 
 
 
 
 
327
  - 0.0
328
  - *id001
329
  - *id001
@@ -342,12 +354,6 @@ config_data: !DataConfig
342
  - *id001
343
  - *id001
344
  - *id001
345
- - !!python/tuple
346
- - 0.020066889632107024
347
- - 0.0
348
- - *id001
349
- - *id001
350
- - *id001
351
  - *id001
352
  - *id001
353
  - *id001
@@ -372,32 +378,36 @@ config_data: !DataConfig
372
  - *id001
373
  - *id001
374
  - *id001
375
- length_ratio_std: 0.8554135166970332
376
- max_observed_len_source: 299
377
  max_observed_len_target: 87
378
  num_discarded: 0
379
- num_sents: 1874353
380
  num_sents_per_bucket:
381
- - 1183908
382
- - 558194
383
- - 62420
384
- - 18581
385
- - 9151
386
- - 6523
387
- - 6629
388
- - 7641
389
- - 8486
390
- - 7708
391
- - 4998
392
- - 42
393
- - 17
394
- - 17
395
- - 4
396
- - 12
397
  - 9
398
  - 9
 
 
 
 
 
399
  - 0
 
400
  - 3
 
 
401
  - 0
402
  - 0
403
  - 0
@@ -415,10 +425,6 @@ config_data: !DataConfig
415
  - 0
416
  - 0
417
  - 0
418
- - 1
419
- - 0
420
- - 0
421
- - 0
422
  - 0
423
  - 0
424
  - 0
@@ -443,11 +449,11 @@ config_data: !DataConfig
443
  - 0
444
  - 0
445
  - 0
446
- num_tokens_source: 11815202
447
- num_tokens_target: 17626167
448
  num_unks_source: 0
449
  num_unks_target: 0
450
- size_vocab_source: 46256
451
  size_vocab_target: 656
452
  eop_id: -1
453
  max_seq_len_source: 513
@@ -479,7 +485,7 @@ config_embed_source: !EmbeddingConfig
479
  factor_configs: null
480
  num_embed: 512
481
  num_factors: 1
482
- vocab_size: 46256
483
  config_embed_target: !EmbeddingConfig
484
  allow_sparse_grad: false
485
  dropout: 0.5
@@ -531,6 +537,6 @@ dtype: float32
531
  lhuc: false
532
  neural_vocab_selection: null
533
  neural_vocab_selection_block_loss: false
534
- vocab_source_size: 46256
535
  vocab_target_size: 656
536
  weight_tying_type: trg_softmax
 
2
  config_data: !DataConfig
3
  data_statistics: !DataStatistics
4
  average_len_target_per_bucket:
5
+ - 6.01988730121871
6
+ - 10.49707202236441
7
+ - 18.536005711954232
8
+ - 25.91453940066591
9
+ - 33.44474802671516
10
+ - 41.29017292281736
11
+ - 50.38165137614682
12
+ - 59.57928802588991
13
+ - 67.86491420226359
14
+ - 75.76032388663967
15
+ - 82.68249075215772
16
+ - 12.0
17
+ - 23.333333333333332
18
+ - 24.88888888888889
19
+ - 15.857142857142856
20
+ - 8.6
21
+ - 8.0
22
+ - 6.5
23
+ - 4.5
24
+ - null
25
+ - 6.25
26
+ - 6.0
27
+ - 8.0
28
+ - 10.0
29
  - null
30
  - null
31
  - null
 
40
  - null
41
  - null
42
  - null
 
43
  - null
44
  - null
45
  - null
 
263
  - !!python/tuple
264
  - 513
265
  - 513
266
+ length_ratio_mean: 1.4422861755889766
267
  length_ratio_stats_per_bucket:
268
  - !!python/tuple
269
+ - 1.1255982284370691
270
+ - 0.3093025169709561
271
  - !!python/tuple
272
+ - 1.6064942041128283
273
+ - 0.6417946634210556
274
  - !!python/tuple
275
+ - 2.359196679910085
276
+ - 0.9575904838242857
277
  - !!python/tuple
278
+ - 2.9607196399710274
279
+ - 1.5584344652106463
280
  - !!python/tuple
281
+ - 2.9543389770526325
282
+ - 2.297144978089179
283
  - !!python/tuple
284
+ - 3.002340450312629
285
+ - 2.18681603522054
286
  - !!python/tuple
287
+ - 3.081058473996043
288
+ - 2.5011199006515183
289
  - !!python/tuple
290
+ - 2.9163894753348045
291
+ - 2.2789742432670086
292
  - !!python/tuple
293
+ - 2.9722600022754504
294
+ - 2.230352263818367
295
  - !!python/tuple
296
+ - 3.138369081443168
297
+ - 2.4620594208603235
298
  - !!python/tuple
299
+ - 2.854253034817575
300
+ - 1.6376340581023332
301
  - !!python/tuple
302
+ - 0.12974460739238317
303
+ - 0.160679251677897
304
  - !!python/tuple
305
+ - 0.23436597326420017
306
+ - 0.24015947073924906
307
  - !!python/tuple
308
+ - 0.23457181630569815
309
+ - 0.2675720247460546
310
  - !!python/tuple
311
+ - 0.1366625632624212
312
+ - 0.16557849394412172
313
  - !!python/tuple
314
+ - 0.06941451000342352
315
+ - 0.02389100863634256
316
  - !!python/tuple
317
+ - 0.05970149253731343
318
+ - 0.0
319
  - !!python/tuple
320
+ - 0.04609929078014184
321
+ - 0.017730496453900707
322
+ - !!python/tuple
323
+ - 0.03063680118474639
324
+ - 0.0036097741577193615
325
  - &id001 !!python/tuple
326
  - null
327
  - null
328
  - !!python/tuple
329
+ - 0.038657633805228714
330
+ - 0.010237907973024957
331
+ - !!python/tuple
332
+ - 0.03469146238377008
333
+ - 0.004700847851307781
334
+ - !!python/tuple
335
+ - 0.0446927374301676
336
+ - 0.0
337
+ - !!python/tuple
338
+ - 0.05405405405405406
339
  - 0.0
340
  - *id001
341
  - *id001
 
354
  - *id001
355
  - *id001
356
  - *id001
 
 
 
 
 
 
357
  - *id001
358
  - *id001
359
  - *id001
 
378
  - *id001
379
  - *id001
380
  - *id001
381
+ length_ratio_std: 0.8479651722336846
382
+ max_observed_len_source: 185
383
  max_observed_len_target: 87
384
  num_discarded: 0
385
+ num_sents: 425392
386
  num_sents_per_bucket:
387
+ - 245433
388
+ - 135930
389
+ - 19608
390
+ - 7208
391
+ - 3294
392
+ - 2371
393
+ - 2180
394
+ - 2472
395
+ - 2739
396
+ - 2470
397
+ - 1622
398
+ - 20
 
 
 
 
399
  - 9
400
  - 9
401
+ - 7
402
+ - 5
403
+ - 1
404
+ - 2
405
+ - 2
406
  - 0
407
+ - 4
408
  - 3
409
+ - 1
410
+ - 2
411
  - 0
412
  - 0
413
  - 0
 
425
  - 0
426
  - 0
427
  - 0
 
 
 
 
428
  - 0
429
  - 0
430
  - 0
 
449
  - 0
450
  - 0
451
  - 0
452
+ num_tokens_source: 3056735
453
+ num_tokens_target: 4427820
454
  num_unks_source: 0
455
  num_unks_target: 0
456
+ size_vocab_source: 8016
457
  size_vocab_target: 656
458
  eop_id: -1
459
  max_seq_len_source: 513
 
485
  factor_configs: null
486
  num_embed: 512
487
  num_factors: 1
488
+ vocab_size: 8016
489
  config_embed_target: !EmbeddingConfig
490
  allow_sparse_grad: false
491
  dropout: 0.5
 
537
  lhuc: false
538
  neural_vocab_selection: null
539
  neural_vocab_selection_block_loss: false
540
+ vocab_source_size: 8016
541
  vocab_target_size: 656
542
  weight_tying_type: trg_softmax
metrics CHANGED
The diff for this file is too large to render. See raw diff
 
params.best CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c57f2a6fd2b40d982a122389c2fdd52c8d3bf1b2527fbd673cb75302803153fa
3
- size 279564030
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbc40d947ce0a1c03679cc4c62a4a94c11b179a485637727fc1b491a063042c4
3
+ size 201248510
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
vocab.src.0.json CHANGED
The diff for this file is too large to render. See raw diff