Upload folder using huggingface_hub
Browse files- args.yaml +9 -9
- config +102 -96
- metrics +0 -0
- params.best +2 -2
- tokenizer.json +0 -0
- vocab.src.0.json +0 -0
args.yaml
CHANGED
@@ -83,11 +83,11 @@ optimizer_betas:
|
|
83 |
- 0.9
|
84 |
- 0.999
|
85 |
optimizer_eps: 1.0e-08
|
86 |
-
output: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-
|
87 |
overwrite_output: false
|
88 |
pad_vocab_to_multiple_of: 8
|
89 |
-
params:
|
90 |
-
prepared_data: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-
|
91 |
quiet: false
|
92 |
quiet_secondary_workers: false
|
93 |
seed: 1
|
@@ -152,14 +152,14 @@ transformer_preprocess:
|
|
152 |
- n
|
153 |
update_interval: 1
|
154 |
use_cpu: false
|
155 |
-
validation_source: /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/source.txt
|
156 |
validation_source_factors: []
|
157 |
-
validation_target: /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_0.txt
|
158 |
validation_target_factors:
|
159 |
-
- /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_1.txt
|
160 |
-
- /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_2.txt
|
161 |
-
- /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_3.txt
|
162 |
-
- /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_4.txt
|
163 |
weight_decay: 0.0
|
164 |
weight_tying_type: trg_softmax
|
165 |
word_min_count:
|
|
|
83 |
- 0.9
|
84 |
- 0.999
|
85 |
optimizer_eps: 1.0e-08
|
86 |
+
output: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-tuned/model
|
87 |
overwrite_output: false
|
88 |
pad_vocab_to_multiple_of: 8
|
89 |
+
params: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-v4/model/params.best
|
90 |
+
prepared_data: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-tuned/train_data
|
91 |
quiet: false
|
92 |
quiet_secondary_workers: false
|
93 |
seed: 1
|
|
|
152 |
- n
|
153 |
update_interval: 1
|
154 |
use_cpu: false
|
155 |
+
validation_source: /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/source.txt
|
156 |
validation_source_factors: []
|
157 |
+
validation_target: /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_0.txt
|
158 |
validation_target_factors:
|
159 |
+
- /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_1.txt
|
160 |
+
- /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_2.txt
|
161 |
+
- /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_3.txt
|
162 |
+
- /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_4.txt
|
163 |
weight_decay: 0.0
|
164 |
weight_tying_type: trg_softmax
|
165 |
word_min_count:
|
config
CHANGED
@@ -2,29 +2,30 @@
|
|
2 |
config_data: !DataConfig
|
3 |
data_statistics: !DataStatistics
|
4 |
average_len_target_per_bucket:
|
5 |
-
- 6.
|
6 |
-
- 10.
|
7 |
-
- 18.
|
8 |
-
-
|
9 |
-
- 33.
|
10 |
-
- 41.
|
11 |
-
-
|
12 |
-
- 59.
|
13 |
-
-
|
14 |
-
- 75.
|
15 |
-
- 82.
|
16 |
-
-
|
17 |
-
-
|
18 |
-
-
|
19 |
-
-
|
20 |
-
- 8.
|
21 |
-
-
|
22 |
-
- 6.
|
23 |
-
-
|
24 |
-
-
|
25 |
-
-
|
26 |
-
-
|
27 |
-
-
|
|
|
28 |
- null
|
29 |
- null
|
30 |
- null
|
@@ -39,7 +40,6 @@ config_data: !DataConfig
|
|
39 |
- null
|
40 |
- null
|
41 |
- null
|
42 |
-
- 6.0
|
43 |
- null
|
44 |
- null
|
45 |
- null
|
@@ -263,67 +263,79 @@ config_data: !DataConfig
|
|
263 |
- !!python/tuple
|
264 |
- 513
|
265 |
- 513
|
266 |
-
length_ratio_mean: 1.
|
267 |
length_ratio_stats_per_bucket:
|
268 |
- !!python/tuple
|
269 |
-
- 1.
|
270 |
-
- 0.
|
271 |
- !!python/tuple
|
272 |
-
- 1.
|
273 |
-
- 0.
|
274 |
- !!python/tuple
|
275 |
-
- 2.
|
276 |
-
-
|
277 |
- !!python/tuple
|
278 |
-
-
|
279 |
-
- 1.
|
280 |
- !!python/tuple
|
281 |
-
-
|
282 |
-
- 2.
|
283 |
- !!python/tuple
|
284 |
-
- 3.
|
285 |
-
- 2.
|
286 |
- !!python/tuple
|
287 |
-
- 3.
|
288 |
-
- 2.
|
289 |
- !!python/tuple
|
290 |
-
-
|
291 |
-
- 2.
|
292 |
- !!python/tuple
|
293 |
-
-
|
294 |
-
- 2.
|
295 |
- !!python/tuple
|
296 |
-
- 3.
|
297 |
-
- 2.
|
298 |
- !!python/tuple
|
299 |
-
-
|
300 |
-
-
|
301 |
- !!python/tuple
|
302 |
-
- 0.
|
303 |
-
- 0.
|
304 |
- !!python/tuple
|
305 |
-
- 0.
|
306 |
-
- 0.
|
307 |
- !!python/tuple
|
308 |
-
- 0.
|
309 |
-
- 0.
|
310 |
- !!python/tuple
|
311 |
-
- 0.
|
312 |
-
- 0.
|
313 |
- !!python/tuple
|
314 |
-
- 0.
|
315 |
-
- 0.
|
316 |
- !!python/tuple
|
317 |
-
- 0.
|
318 |
-
- 0.
|
319 |
- !!python/tuple
|
320 |
-
- 0.
|
321 |
-
- 0.
|
|
|
|
|
|
|
322 |
- &id001 !!python/tuple
|
323 |
- null
|
324 |
- null
|
325 |
- !!python/tuple
|
326 |
-
- 0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
327 |
- 0.0
|
328 |
- *id001
|
329 |
- *id001
|
@@ -342,12 +354,6 @@ config_data: !DataConfig
|
|
342 |
- *id001
|
343 |
- *id001
|
344 |
- *id001
|
345 |
-
- !!python/tuple
|
346 |
-
- 0.020066889632107024
|
347 |
-
- 0.0
|
348 |
-
- *id001
|
349 |
-
- *id001
|
350 |
-
- *id001
|
351 |
- *id001
|
352 |
- *id001
|
353 |
- *id001
|
@@ -372,32 +378,36 @@ config_data: !DataConfig
|
|
372 |
- *id001
|
373 |
- *id001
|
374 |
- *id001
|
375 |
-
length_ratio_std: 0.
|
376 |
-
max_observed_len_source:
|
377 |
max_observed_len_target: 87
|
378 |
num_discarded: 0
|
379 |
-
num_sents:
|
380 |
num_sents_per_bucket:
|
381 |
-
-
|
382 |
-
-
|
383 |
-
-
|
384 |
-
-
|
385 |
-
-
|
386 |
-
-
|
387 |
-
-
|
388 |
-
-
|
389 |
-
-
|
390 |
-
-
|
391 |
-
-
|
392 |
-
-
|
393 |
-
- 17
|
394 |
-
- 17
|
395 |
-
- 4
|
396 |
-
- 12
|
397 |
- 9
|
398 |
- 9
|
|
|
|
|
|
|
|
|
|
|
399 |
- 0
|
|
|
400 |
- 3
|
|
|
|
|
401 |
- 0
|
402 |
- 0
|
403 |
- 0
|
@@ -415,10 +425,6 @@ config_data: !DataConfig
|
|
415 |
- 0
|
416 |
- 0
|
417 |
- 0
|
418 |
-
- 1
|
419 |
-
- 0
|
420 |
-
- 0
|
421 |
-
- 0
|
422 |
- 0
|
423 |
- 0
|
424 |
- 0
|
@@ -443,11 +449,11 @@ config_data: !DataConfig
|
|
443 |
- 0
|
444 |
- 0
|
445 |
- 0
|
446 |
-
num_tokens_source:
|
447 |
-
num_tokens_target:
|
448 |
num_unks_source: 0
|
449 |
num_unks_target: 0
|
450 |
-
size_vocab_source:
|
451 |
size_vocab_target: 656
|
452 |
eop_id: -1
|
453 |
max_seq_len_source: 513
|
@@ -479,7 +485,7 @@ config_embed_source: !EmbeddingConfig
|
|
479 |
factor_configs: null
|
480 |
num_embed: 512
|
481 |
num_factors: 1
|
482 |
-
vocab_size:
|
483 |
config_embed_target: !EmbeddingConfig
|
484 |
allow_sparse_grad: false
|
485 |
dropout: 0.5
|
@@ -531,6 +537,6 @@ dtype: float32
|
|
531 |
lhuc: false
|
532 |
neural_vocab_selection: null
|
533 |
neural_vocab_selection_block_loss: false
|
534 |
-
vocab_source_size:
|
535 |
vocab_target_size: 656
|
536 |
weight_tying_type: trg_softmax
|
|
|
2 |
config_data: !DataConfig
|
3 |
data_statistics: !DataStatistics
|
4 |
average_len_target_per_bucket:
|
5 |
+
- 6.01988730121871
|
6 |
+
- 10.49707202236441
|
7 |
+
- 18.536005711954232
|
8 |
+
- 25.91453940066591
|
9 |
+
- 33.44474802671516
|
10 |
+
- 41.29017292281736
|
11 |
+
- 50.38165137614682
|
12 |
+
- 59.57928802588991
|
13 |
+
- 67.86491420226359
|
14 |
+
- 75.76032388663967
|
15 |
+
- 82.68249075215772
|
16 |
+
- 12.0
|
17 |
+
- 23.333333333333332
|
18 |
+
- 24.88888888888889
|
19 |
+
- 15.857142857142856
|
20 |
+
- 8.6
|
21 |
+
- 8.0
|
22 |
+
- 6.5
|
23 |
+
- 4.5
|
24 |
+
- null
|
25 |
+
- 6.25
|
26 |
+
- 6.0
|
27 |
+
- 8.0
|
28 |
+
- 10.0
|
29 |
- null
|
30 |
- null
|
31 |
- null
|
|
|
40 |
- null
|
41 |
- null
|
42 |
- null
|
|
|
43 |
- null
|
44 |
- null
|
45 |
- null
|
|
|
263 |
- !!python/tuple
|
264 |
- 513
|
265 |
- 513
|
266 |
+
length_ratio_mean: 1.4422861755889766
|
267 |
length_ratio_stats_per_bucket:
|
268 |
- !!python/tuple
|
269 |
+
- 1.1255982284370691
|
270 |
+
- 0.3093025169709561
|
271 |
- !!python/tuple
|
272 |
+
- 1.6064942041128283
|
273 |
+
- 0.6417946634210556
|
274 |
- !!python/tuple
|
275 |
+
- 2.359196679910085
|
276 |
+
- 0.9575904838242857
|
277 |
- !!python/tuple
|
278 |
+
- 2.9607196399710274
|
279 |
+
- 1.5584344652106463
|
280 |
- !!python/tuple
|
281 |
+
- 2.9543389770526325
|
282 |
+
- 2.297144978089179
|
283 |
- !!python/tuple
|
284 |
+
- 3.002340450312629
|
285 |
+
- 2.18681603522054
|
286 |
- !!python/tuple
|
287 |
+
- 3.081058473996043
|
288 |
+
- 2.5011199006515183
|
289 |
- !!python/tuple
|
290 |
+
- 2.9163894753348045
|
291 |
+
- 2.2789742432670086
|
292 |
- !!python/tuple
|
293 |
+
- 2.9722600022754504
|
294 |
+
- 2.230352263818367
|
295 |
- !!python/tuple
|
296 |
+
- 3.138369081443168
|
297 |
+
- 2.4620594208603235
|
298 |
- !!python/tuple
|
299 |
+
- 2.854253034817575
|
300 |
+
- 1.6376340581023332
|
301 |
- !!python/tuple
|
302 |
+
- 0.12974460739238317
|
303 |
+
- 0.160679251677897
|
304 |
- !!python/tuple
|
305 |
+
- 0.23436597326420017
|
306 |
+
- 0.24015947073924906
|
307 |
- !!python/tuple
|
308 |
+
- 0.23457181630569815
|
309 |
+
- 0.2675720247460546
|
310 |
- !!python/tuple
|
311 |
+
- 0.1366625632624212
|
312 |
+
- 0.16557849394412172
|
313 |
- !!python/tuple
|
314 |
+
- 0.06941451000342352
|
315 |
+
- 0.02389100863634256
|
316 |
- !!python/tuple
|
317 |
+
- 0.05970149253731343
|
318 |
+
- 0.0
|
319 |
- !!python/tuple
|
320 |
+
- 0.04609929078014184
|
321 |
+
- 0.017730496453900707
|
322 |
+
- !!python/tuple
|
323 |
+
- 0.03063680118474639
|
324 |
+
- 0.0036097741577193615
|
325 |
- &id001 !!python/tuple
|
326 |
- null
|
327 |
- null
|
328 |
- !!python/tuple
|
329 |
+
- 0.038657633805228714
|
330 |
+
- 0.010237907973024957
|
331 |
+
- !!python/tuple
|
332 |
+
- 0.03469146238377008
|
333 |
+
- 0.004700847851307781
|
334 |
+
- !!python/tuple
|
335 |
+
- 0.0446927374301676
|
336 |
+
- 0.0
|
337 |
+
- !!python/tuple
|
338 |
+
- 0.05405405405405406
|
339 |
- 0.0
|
340 |
- *id001
|
341 |
- *id001
|
|
|
354 |
- *id001
|
355 |
- *id001
|
356 |
- *id001
|
|
|
|
|
|
|
|
|
|
|
|
|
357 |
- *id001
|
358 |
- *id001
|
359 |
- *id001
|
|
|
378 |
- *id001
|
379 |
- *id001
|
380 |
- *id001
|
381 |
+
length_ratio_std: 0.8479651722336846
|
382 |
+
max_observed_len_source: 185
|
383 |
max_observed_len_target: 87
|
384 |
num_discarded: 0
|
385 |
+
num_sents: 425392
|
386 |
num_sents_per_bucket:
|
387 |
+
- 245433
|
388 |
+
- 135930
|
389 |
+
- 19608
|
390 |
+
- 7208
|
391 |
+
- 3294
|
392 |
+
- 2371
|
393 |
+
- 2180
|
394 |
+
- 2472
|
395 |
+
- 2739
|
396 |
+
- 2470
|
397 |
+
- 1622
|
398 |
+
- 20
|
|
|
|
|
|
|
|
|
399 |
- 9
|
400 |
- 9
|
401 |
+
- 7
|
402 |
+
- 5
|
403 |
+
- 1
|
404 |
+
- 2
|
405 |
+
- 2
|
406 |
- 0
|
407 |
+
- 4
|
408 |
- 3
|
409 |
+
- 1
|
410 |
+
- 2
|
411 |
- 0
|
412 |
- 0
|
413 |
- 0
|
|
|
425 |
- 0
|
426 |
- 0
|
427 |
- 0
|
|
|
|
|
|
|
|
|
428 |
- 0
|
429 |
- 0
|
430 |
- 0
|
|
|
449 |
- 0
|
450 |
- 0
|
451 |
- 0
|
452 |
+
num_tokens_source: 3056735
|
453 |
+
num_tokens_target: 4427820
|
454 |
num_unks_source: 0
|
455 |
num_unks_target: 0
|
456 |
+
size_vocab_source: 8016
|
457 |
size_vocab_target: 656
|
458 |
eop_id: -1
|
459 |
max_seq_len_source: 513
|
|
|
485 |
factor_configs: null
|
486 |
num_embed: 512
|
487 |
num_factors: 1
|
488 |
+
vocab_size: 8016
|
489 |
config_embed_target: !EmbeddingConfig
|
490 |
allow_sparse_grad: false
|
491 |
dropout: 0.5
|
|
|
537 |
lhuc: false
|
538 |
neural_vocab_selection: null
|
539 |
neural_vocab_selection_block_loss: false
|
540 |
+
vocab_source_size: 8016
|
541 |
vocab_target_size: 656
|
542 |
weight_tying_type: trg_softmax
|
metrics
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
params.best
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbc40d947ce0a1c03679cc4c62a4a94c11b179a485637727fc1b491a063042c4
|
3 |
+
size 201248510
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vocab.src.0.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|