diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/adapter_config.json b/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c700a5d161022cf91737dcca4d31f37c02bb25 --- /dev/null +++ b/adapter_config.json @@ -0,0 +1,19 @@ +{ + "base_model_name_or_path": "chatglm2-6b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "query_key_value" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/adapter_model.bin b/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..251e9262fdd365e11c9c97fe4d5371525fa47cd7 --- /dev/null +++ b/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c6758d97d365c10604d10e27b6be873c3ad2e83a9785463a6ba10bfe630d8e +size 7819417 diff --git a/all_results.json b/all_results.json new file mode 100644 index 0000000000000000000000000000000000000000..3b709b03c3ec85d406b36c7012506ade625a1842 --- /dev/null +++ b/all_results.json @@ -0,0 +1,7 @@ +{ + "epoch": 2.0, + "train_loss": 1.978195481530868, + "train_runtime": 26343.521, + "train_samples_per_second": 26.232, + "train_steps_per_second": 0.41 +} \ No newline at end of file diff --git a/checkpoint-1000/README.md b/checkpoint-1000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/checkpoint-1000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/checkpoint-1000/adapter_config.json b/checkpoint-1000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c700a5d161022cf91737dcca4d31f37c02bb25 --- /dev/null +++ b/checkpoint-1000/adapter_config.json @@ -0,0 +1,19 @@ +{ + "base_model_name_or_path": "chatglm2-6b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "query_key_value" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/checkpoint-1000/adapter_model.bin b/checkpoint-1000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..dfcabda4ad6a2d8beec46a1a4b457fde83fc854c --- /dev/null +++ b/checkpoint-1000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d168ef0b419dc788a731c7120dada236c6fbae4d8e809d70c45f93f345fa67ab +size 7819417 diff --git a/checkpoint-1000/finetuning_args.json b/checkpoint-1000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f28e18016479196fd772d484c058dd17ca8c6a --- /dev/null +++ b/checkpoint-1000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "query_key_value" + ], + "name_module_trainable": "mlp", + "num_layer_trainable": 3, + "pre_seq_len": 64, + "prefix_projection": false +} diff --git a/checkpoint-1000/optimizer.pt b/checkpoint-1000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..c09c5689929370718c5d5335e93f67a64b08aae7 --- /dev/null +++ b/checkpoint-1000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:207da355524f4452d88bdbb9d13f0ed7b4aa02f827dc0adeaa53dd3c4a1d13a1 +size 15644485 diff --git a/checkpoint-1000/rng_state_0.pth b/checkpoint-1000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..c1af3f61fa646759f0f8f38bc63c0d23f4a42288 --- /dev/null +++ b/checkpoint-1000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a2684ce62e8d7c210c23c57d059a952c18a26260da209f1d6ebe314693e4974 +size 18679 diff --git a/checkpoint-1000/rng_state_1.pth b/checkpoint-1000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..6cae49dc265b58f60475d0fc4e1e38d842646bb7 --- /dev/null +++ b/checkpoint-1000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de719cf6845a3b19b96284a78513c960a388c70f13766d1ea991700b32e79d53 +size 18679 diff --git a/checkpoint-1000/rng_state_2.pth b/checkpoint-1000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..80f2a1ed793565069a4491a3e20380424ea13a38 --- /dev/null +++ b/checkpoint-1000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58e0772c04da6662579787b6678d4d2795a96e4da23118d565f8dd6c2e25617b +size 18679 diff --git a/checkpoint-1000/rng_state_3.pth b/checkpoint-1000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..28788ae13947c0f4517719ea43d53fbf5e987b6d --- /dev/null +++ b/checkpoint-1000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f40b16d80d11c0cf20f8dc79b69affdfca686fdae7995161a0db1c59c9ceed +size 18679 diff --git a/checkpoint-1000/scheduler.pt b/checkpoint-1000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab66859aada790b8b5182894bb8bf5c69f11709f --- /dev/null +++ b/checkpoint-1000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f01619e7f8d789aa01ef80c209d2e88c5d1080670973e05d35c732aa495fa39 +size 627 diff --git a/checkpoint-1000/trainer_state.json b/checkpoint-1000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..a38a10b7d592500e2106904ab9292e744929d4ef --- /dev/null +++ b/checkpoint-1000/trainer_state.json @@ -0,0 +1,616 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.18521948508983144, + "global_step": 1000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0009999978838190456, + "loss": 2.9794, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0009999915352940948, + "loss": 2.3885, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999980954478887, + "loss": 2.3057, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999966141462985, + "loss": 2.2692, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999947096371777, + "loss": 2.2576, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009999238193664748, + "loss": 2.2388, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998963106441117, + "loss": 2.2523, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998645704375414, + "loss": 2.218, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999828599015436, + "loss": 2.2457, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997883966822835, + "loss": 2.198, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997439637783859, + "loss": 2.2013, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999695300679855, + "loss": 2.1765, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009996424077986109, + "loss": 2.1741, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999585285582377, + "loss": 2.1898, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009995239345146772, + "loss": 2.1466, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009994583551148314, + "loss": 2.1423, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009993885479379506, + "loss": 2.1451, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999314513574934, + "loss": 2.202, + "step": 180 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009992362526524616, + "loss": 2.1208, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009991537658329906, + "loss": 2.1591, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 0.000999067053814749, + "loss": 2.1788, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009989761173317304, + "loss": 2.147, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998880957153687, + "loss": 2.1249, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998781574086123, + "loss": 2.165, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 0.000998677968970289, + "loss": 2.1428, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009985701426831735, + "loss": 2.1384, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009984580961374964, + "loss": 2.1585, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009983418302817008, + "loss": 2.1156, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009982213460999448, + "loss": 2.0811, + "step": 290 + }, + { + "epoch": 0.06, + "learning_rate": 0.000998096644612094, + "loss": 2.1081, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009979677268737118, + "loss": 2.1246, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009978345939760515, + "loss": 2.1229, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997697247046046, + "loss": 2.1033, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009975556872462994, + "loss": 2.0931, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997409915775076, + "loss": 2.1206, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009972599338662915, + "loss": 2.0537, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009971057427895012, + "loss": 2.0762, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009969473438498897, + "loss": 2.0883, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009967847383882604, + "loss": 2.1174, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009966179277810239, + "loss": 2.1111, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009964469134401855, + "loss": 2.1288, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009962716968133346, + "loss": 2.0967, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009960922793836318, + "loss": 2.1216, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009959086626697955, + "loss": 2.0924, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009957208482260908, + "loss": 2.0809, + "step": 450 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009955288376423152, + "loss": 2.1082, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009953326325437852, + "loss": 2.0885, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009951322345913224, + "loss": 2.1133, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009949276454812408, + "loss": 2.0844, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00099471886694533, + "loss": 2.0796, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009945059007508434, + "loss": 2.1255, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009942887487004804, + "loss": 2.0913, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009940674126323733, + "loss": 2.1003, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009938418944200709, + "loss": 2.0541, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009936121959725223, + "loss": 2.0523, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009933783192340618, + "loss": 2.1225, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009931402661843911, + "loss": 2.0446, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 0.000992898038838564, + "loss": 2.0921, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009926516392469674, + "loss": 2.1081, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009924010694953064, + "loss": 2.0734, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009921463317045843, + "loss": 2.0652, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009918874280310862, + "loss": 2.0818, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009916243606663605, + "loss": 2.0776, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009913571318371994, + "loss": 2.1025, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009910857438056215, + "loss": 2.066, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009908101988688512, + "loss": 2.0575, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009905304993593008, + "loss": 2.1269, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009902466476445486, + "loss": 2.0518, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009899586461273218, + "loss": 2.0698, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 0.000989666497245473, + "loss": 2.0988, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009893702034719624, + "loss": 2.0986, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009890697673148345, + "loss": 2.0237, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009887651913171986, + "loss": 2.0027, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009884564780572064, + "loss": 2.0563, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009881436301480305, + "loss": 2.0624, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987826650237842, + "loss": 2.0926, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987505541009788, + "loss": 2.0585, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009871803051819696, + "loss": 2.0494, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009868509455074183, + "loss": 2.0106, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009865174647740729, + "loss": 2.0861, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009861798658047556, + "loss": 2.0478, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009858381514571484, + "loss": 2.0469, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 0.000985492324623769, + "loss": 2.0671, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009851423882319458, + "loss": 2.0808, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009847883452437937, + "loss": 2.0331, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009844301986561893, + "loss": 2.0295, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 0.000984067951500744, + "loss": 2.0873, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 0.00098370160684378, + "loss": 2.1038, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009833311677863042, + "loss": 2.0337, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009829566374639801, + "loss": 2.0407, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009825780190471042, + "loss": 2.1049, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 0.000982195315740576, + "loss": 2.0475, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009818085307838741, + "loss": 2.0624, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 0.000981417667451026, + "loss": 2.0714, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009810227290505816, + "loss": 2.0947, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009806237189255859, + "loss": 2.0591, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009802206404535489, + "loss": 2.0301, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 0.000979813497046419, + "loss": 2.0556, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009794022921505523, + "loss": 2.0753, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 0.000978987029246685, + "loss": 2.0898, + "step": 1000 + } + ], + "max_steps": 10798, + "num_train_epochs": 2, + "total_flos": 9.498667895656284e+17, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-1000/training_args.bin b/checkpoint-1000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b097aab2293da043bc99abba38a0ed7c4525140a --- /dev/null +++ b/checkpoint-1000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8813832b030b0a678cb3ad0abd28db5000bdb8bb1708e45ba10cfda908fcc38 +size 3305 diff --git a/checkpoint-10000/README.md b/checkpoint-10000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/checkpoint-10000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/checkpoint-10000/adapter_config.json b/checkpoint-10000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c700a5d161022cf91737dcca4d31f37c02bb25 --- /dev/null +++ b/checkpoint-10000/adapter_config.json @@ -0,0 +1,19 @@ +{ + "base_model_name_or_path": "chatglm2-6b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "query_key_value" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/checkpoint-10000/adapter_model.bin b/checkpoint-10000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad5f1001a916b5e2000a718ac5b672ebdb07c475 --- /dev/null +++ b/checkpoint-10000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9903abff597676a5d85a3f42ba3f950256d00e4aa93564c8ebb5fd5f4a0ebbbe +size 7819417 diff --git a/checkpoint-10000/finetuning_args.json b/checkpoint-10000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f28e18016479196fd772d484c058dd17ca8c6a --- /dev/null +++ b/checkpoint-10000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "query_key_value" + ], + "name_module_trainable": "mlp", + "num_layer_trainable": 3, + "pre_seq_len": 64, + "prefix_projection": false +} diff --git a/checkpoint-10000/optimizer.pt b/checkpoint-10000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..051cf4241cb461c0d0eb20ef2c63940af3d65bef --- /dev/null +++ b/checkpoint-10000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9986fb97ca3fa48e2015b70aa583802fa73acc98d578bb5ac096548c91c4f424 +size 15644485 diff --git a/checkpoint-10000/rng_state_0.pth b/checkpoint-10000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..cd5674f85ccaa628647ff7ec5256d2bd525ae51c --- /dev/null +++ b/checkpoint-10000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37fd716397629e3be922b426ba94f12d00c46352e66dbe11b85822a76d3e35e1 +size 18679 diff --git a/checkpoint-10000/rng_state_1.pth b/checkpoint-10000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..095431b9d2c56cfc944208c81ff9f7779a523589 --- /dev/null +++ b/checkpoint-10000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74bfb7ea10ec3e65f8eca160d3bf18eef130d179b66b4138138d46fceab4daca +size 18679 diff --git a/checkpoint-10000/rng_state_2.pth b/checkpoint-10000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..7015ad5b64da5179837794be3661edc090a2aaed --- /dev/null +++ b/checkpoint-10000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:488534d9a95b06aeefe2b45dfed265600bde02bf26605bfacb8ea0bca14920a4 +size 18679 diff --git a/checkpoint-10000/rng_state_3.pth b/checkpoint-10000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..2b49645f09d6a512da14b377e3d6997e9b7bd977 --- /dev/null +++ b/checkpoint-10000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9edad9c0f7873d58b81e886e6d846f91293545f6932489450d12b86cf6e02700 +size 18679 diff --git a/checkpoint-10000/scheduler.pt b/checkpoint-10000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8e983271bf8a59f15071047b0ce17d6721d846e --- /dev/null +++ b/checkpoint-10000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d31ab5731d5270c6c302ae9dc8c05030cf9f832744fe07067f6bed6ea7d85df0 +size 627 diff --git a/checkpoint-10000/trainer_state.json b/checkpoint-10000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..8eb5b03bda6fcb828ba110d349e03b797bcff471 --- /dev/null +++ b/checkpoint-10000/trainer_state.json @@ -0,0 +1,6016 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.8521948508983144, + "global_step": 10000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0009999978838190456, + "loss": 2.9794, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0009999915352940948, + "loss": 2.3885, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999980954478887, + "loss": 2.3057, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999966141462985, + "loss": 2.2692, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999947096371777, + "loss": 2.2576, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009999238193664748, + "loss": 2.2388, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998963106441117, + "loss": 2.2523, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998645704375414, + "loss": 2.218, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999828599015436, + "loss": 2.2457, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997883966822835, + "loss": 2.198, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997439637783859, + "loss": 2.2013, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999695300679855, + "loss": 2.1765, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009996424077986109, + "loss": 2.1741, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999585285582377, + "loss": 2.1898, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009995239345146772, + "loss": 2.1466, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009994583551148314, + "loss": 2.1423, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009993885479379506, + "loss": 2.1451, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999314513574934, + "loss": 2.202, + "step": 180 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009992362526524616, + "loss": 2.1208, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009991537658329906, + "loss": 2.1591, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 0.000999067053814749, + "loss": 2.1788, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009989761173317304, + "loss": 2.147, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998880957153687, + "loss": 2.1249, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998781574086123, + "loss": 2.165, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 0.000998677968970289, + "loss": 2.1428, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009985701426831735, + "loss": 2.1384, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009984580961374964, + "loss": 2.1585, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009983418302817008, + "loss": 2.1156, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009982213460999448, + "loss": 2.0811, + "step": 290 + }, + { + "epoch": 0.06, + "learning_rate": 0.000998096644612094, + "loss": 2.1081, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009979677268737118, + "loss": 2.1246, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009978345939760515, + "loss": 2.1229, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997697247046046, + "loss": 2.1033, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009975556872462994, + "loss": 2.0931, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997409915775076, + "loss": 2.1206, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009972599338662915, + "loss": 2.0537, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009971057427895012, + "loss": 2.0762, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009969473438498897, + "loss": 2.0883, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009967847383882604, + "loss": 2.1174, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009966179277810239, + "loss": 2.1111, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009964469134401855, + "loss": 2.1288, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009962716968133346, + "loss": 2.0967, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009960922793836318, + "loss": 2.1216, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009959086626697955, + "loss": 2.0924, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009957208482260908, + "loss": 2.0809, + "step": 450 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009955288376423152, + "loss": 2.1082, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009953326325437852, + "loss": 2.0885, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009951322345913224, + "loss": 2.1133, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009949276454812408, + "loss": 2.0844, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00099471886694533, + "loss": 2.0796, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009945059007508434, + "loss": 2.1255, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009942887487004804, + "loss": 2.0913, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009940674126323733, + "loss": 2.1003, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009938418944200709, + "loss": 2.0541, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009936121959725223, + "loss": 2.0523, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009933783192340618, + "loss": 2.1225, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009931402661843911, + "loss": 2.0446, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 0.000992898038838564, + "loss": 2.0921, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009926516392469674, + "loss": 2.1081, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009924010694953064, + "loss": 2.0734, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009921463317045843, + "loss": 2.0652, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009918874280310862, + "loss": 2.0818, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009916243606663605, + "loss": 2.0776, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009913571318371994, + "loss": 2.1025, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009910857438056215, + "loss": 2.066, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009908101988688512, + "loss": 2.0575, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009905304993593008, + "loss": 2.1269, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009902466476445486, + "loss": 2.0518, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009899586461273218, + "loss": 2.0698, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 0.000989666497245473, + "loss": 2.0988, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009893702034719624, + "loss": 2.0986, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009890697673148345, + "loss": 2.0237, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009887651913171986, + "loss": 2.0027, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009884564780572064, + "loss": 2.0563, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009881436301480305, + "loss": 2.0624, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987826650237842, + "loss": 2.0926, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987505541009788, + "loss": 2.0585, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009871803051819696, + "loss": 2.0494, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009868509455074183, + "loss": 2.0106, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009865174647740729, + "loss": 2.0861, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009861798658047556, + "loss": 2.0478, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009858381514571484, + "loss": 2.0469, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 0.000985492324623769, + "loss": 2.0671, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009851423882319458, + "loss": 2.0808, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009847883452437937, + "loss": 2.0331, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009844301986561893, + "loss": 2.0295, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 0.000984067951500744, + "loss": 2.0873, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 0.00098370160684378, + "loss": 2.1038, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009833311677863042, + "loss": 2.0337, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009829566374639801, + "loss": 2.0407, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009825780190471042, + "loss": 2.1049, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 0.000982195315740576, + "loss": 2.0475, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009818085307838741, + "loss": 2.0624, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 0.000981417667451026, + "loss": 2.0714, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009810227290505816, + "loss": 2.0947, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009806237189255859, + "loss": 2.0591, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009802206404535489, + "loss": 2.0301, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 0.000979813497046419, + "loss": 2.0556, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009794022921505523, + "loss": 2.0753, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 0.000978987029246685, + "loss": 2.0898, + "step": 1000 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009785677118499029, + "loss": 2.0464, + "step": 1010 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009781443435096116, + "loss": 2.0828, + "step": 1020 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009777169278095074, + "loss": 2.1137, + "step": 1030 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009772854683675462, + "loss": 2.0167, + "step": 1040 + }, + { + "epoch": 0.19, + "learning_rate": 0.000976849968835913, + "loss": 2.07, + "step": 1050 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009764104329009909, + "loss": 2.0409, + "step": 1060 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009759668642833304, + "loss": 2.015, + "step": 1070 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009755192667376173, + "loss": 2.0175, + "step": 1080 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009750676440526411, + "loss": 2.0773, + "step": 1090 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009746120000512632, + "loss": 2.0245, + "step": 1100 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009741523385903841, + "loss": 2.094, + "step": 1110 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009736886635609112, + "loss": 2.0506, + "step": 1120 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009732209788877258, + "loss": 2.0287, + "step": 1130 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009727492885296489, + "loss": 2.1162, + "step": 1140 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009722735964794099, + "loss": 2.1096, + "step": 1150 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009717939067636099, + "loss": 2.0621, + "step": 1160 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009713102234426903, + "loss": 2.0796, + "step": 1170 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009708225506108965, + "loss": 2.0565, + "step": 1180 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009703308923962447, + "loss": 2.0669, + "step": 1190 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009698352529604857, + "loss": 2.0638, + "step": 1200 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009693356364990705, + "loss": 2.0358, + "step": 1210 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009688320472411143, + "loss": 2.0859, + "step": 1220 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009683244894493613, + "loss": 2.0932, + "step": 1230 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009678129674201479, + "loss": 2.0129, + "step": 1240 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009672974854833669, + "loss": 2.055, + "step": 1250 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009667780480024304, + "loss": 2.0665, + "step": 1260 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009662546593742334, + "loss": 2.0488, + "step": 1270 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009657273240291159, + "loss": 2.0543, + "step": 1280 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009651960464308261, + "loss": 2.0418, + "step": 1290 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009646608310764819, + "loss": 2.033, + "step": 1300 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009641216824965338, + "loss": 2.1034, + "step": 1310 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009635786052547253, + "loss": 2.0866, + "step": 1320 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009630316039480556, + "loss": 2.0607, + "step": 1330 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009624806832067394, + "loss": 2.0457, + "step": 1340 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009619258476941686, + "loss": 2.032, + "step": 1350 + }, + { + "epoch": 0.25, + "learning_rate": 0.000961367102106873, + "loss": 2.0519, + "step": 1360 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009608044511744791, + "loss": 2.0449, + "step": 1370 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009602378996596721, + "loss": 1.9949, + "step": 1380 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009596674523581539, + "loss": 2.0394, + "step": 1390 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009590931140986035, + "loss": 2.0386, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009585148897426354, + "loss": 2.0254, + "step": 1410 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009579327841847593, + "loss": 2.0238, + "step": 1420 + }, + { + "epoch": 0.26, + "learning_rate": 0.000957346802352338, + "loss": 2.0509, + "step": 1430 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009567569492055456, + "loss": 2.0004, + "step": 1440 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009561632297373263, + "loss": 2.0203, + "step": 1450 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009555656489733513, + "loss": 2.0182, + "step": 1460 + }, + { + "epoch": 0.27, + "learning_rate": 0.000954964211971977, + "loss": 1.9754, + "step": 1470 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009543589238242012, + "loss": 2.0374, + "step": 1480 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953749789653621, + "loss": 2.0367, + "step": 1490 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953136814616389, + "loss": 2.0866, + "step": 1500 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009525200039011694, + "loss": 2.0083, + "step": 1510 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009518993627290948, + "loss": 2.0525, + "step": 1520 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009512748963537212, + "loss": 2.0636, + "step": 1530 + }, + { + "epoch": 0.29, + "learning_rate": 0.000950646610060984, + "loss": 2.0522, + "step": 1540 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009500145091691532, + "loss": 2.05, + "step": 1550 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009493785990287882, + "loss": 1.9887, + "step": 1560 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009487388850226926, + "loss": 2.0309, + "step": 1570 + }, + { + "epoch": 0.29, + "learning_rate": 0.000948095372565869, + "loss": 1.9954, + "step": 1580 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009474480671054726, + "loss": 2.0078, + "step": 1590 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009467969741207652, + "loss": 2.0395, + "step": 1600 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009461420991230693, + "loss": 2.0415, + "step": 1610 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009454834476557207, + "loss": 2.0308, + "step": 1620 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009448210252940223, + "loss": 2.0826, + "step": 1630 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009441548376451963, + "loss": 2.0424, + "step": 1640 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009434848903483373, + "loss": 2.0125, + "step": 1650 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009428111890743639, + "loss": 2.0139, + "step": 1660 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009421337395259717, + "loss": 2.0682, + "step": 1670 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009414525474375837, + "loss": 2.0577, + "step": 1680 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009407676185753029, + "loss": 2.0262, + "step": 1690 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009400789587368632, + "loss": 2.0515, + "step": 1700 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009393865737515794, + "loss": 2.0398, + "step": 1710 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009386904694802997, + "loss": 2.0146, + "step": 1720 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009379906518153543, + "loss": 2.0438, + "step": 1730 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009372871266805063, + "loss": 2.0377, + "step": 1740 + }, + { + "epoch": 0.32, + "learning_rate": 0.000936579900030902, + "loss": 2.0789, + "step": 1750 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009358689778530193, + "loss": 2.0201, + "step": 1760 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009351543661646185, + "loss": 2.0114, + "step": 1770 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009344360710146898, + "loss": 2.0242, + "step": 1780 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009337140984834034, + "loss": 2.0436, + "step": 1790 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009329884546820572, + "loss": 2.0452, + "step": 1800 + }, + { + "epoch": 0.34, + "learning_rate": 0.000932259145753026, + "loss": 2.0254, + "step": 1810 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009315261778697083, + "loss": 2.0409, + "step": 1820 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009307895572364746, + "loss": 2.0301, + "step": 1830 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009300492900886154, + "loss": 2.0078, + "step": 1840 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009293053826922873, + "loss": 1.9851, + "step": 1850 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009285578413444613, + "loss": 1.9947, + "step": 1860 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009278066723728682, + "loss": 2.0331, + "step": 1870 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009270518821359461, + "loss": 2.0058, + "step": 1880 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009262934770227858, + "loss": 2.05, + "step": 1890 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009255314634530771, + "loss": 2.0444, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009247658478770543, + "loss": 2.0045, + "step": 1910 + }, + { + "epoch": 0.36, + "learning_rate": 0.000923996636775442, + "loss": 2.0211, + "step": 1920 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009232238366593997, + "loss": 2.0124, + "step": 1930 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009224474540704671, + "loss": 2.0067, + "step": 1940 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009216674955805079, + "loss": 2.0247, + "step": 1950 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009208839677916557, + "loss": 2.0314, + "step": 1960 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009200968773362568, + "loss": 2.067, + "step": 1970 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009193062308768145, + "loss": 2.0168, + "step": 1980 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009185120351059326, + "loss": 2.0649, + "step": 1990 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009177142967462591, + "loss": 2.0208, + "step": 2000 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009169130225504289, + "loss": 2.016, + "step": 2010 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009161082193010066, + "loss": 2.0331, + "step": 2020 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009152998938104296, + "loss": 2.0757, + "step": 2030 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009144880529209498, + "loss": 2.0093, + "step": 2040 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009136727035045765, + "loss": 1.954, + "step": 2050 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009128538524630167, + "loss": 2.0062, + "step": 2060 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009120315067276187, + "loss": 2.0179, + "step": 2070 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009112056732593119, + "loss": 2.0301, + "step": 2080 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009103763590485488, + "loss": 2.0223, + "step": 2090 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009095435711152449, + "loss": 2.0208, + "step": 2100 + }, + { + "epoch": 0.39, + "learning_rate": 0.00090870731650872, + "loss": 2.0492, + "step": 2110 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009078676023076385, + "loss": 1.9917, + "step": 2120 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009070244356199492, + "loss": 2.0235, + "step": 2130 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009061778235828253, + "loss": 2.01, + "step": 2140 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009054129328980229, + "loss": 1.9999, + "step": 2150 + }, + { + "epoch": 0.4, + "learning_rate": 0.000904559794464287, + "loss": 2.0022, + "step": 2160 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009037032315436229, + "loss": 2.0004, + "step": 2170 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009028432513865994, + "loss": 1.9936, + "step": 2180 + }, + { + "epoch": 0.41, + "learning_rate": 0.000901979861272711, + "loss": 2.0098, + "step": 2190 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009011130685103166, + "loss": 1.9829, + "step": 2200 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009002428804365775, + "loss": 2.0135, + "step": 2210 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008993693044173954, + "loss": 2.0526, + "step": 2220 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008984923478473499, + "loss": 2.0145, + "step": 2230 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008976120181496365, + "loss": 2.0364, + "step": 2240 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008967283227760028, + "loss": 2.019, + "step": 2250 + }, + { + "epoch": 0.42, + "learning_rate": 0.000895841269206686, + "loss": 1.9874, + "step": 2260 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008949508649503495, + "loss": 2.0699, + "step": 2270 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008940571175440196, + "loss": 2.0407, + "step": 2280 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008931600345530213, + "loss": 2.0176, + "step": 2290 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008922596235709142, + "loss": 2.0235, + "step": 2300 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008913558922194287, + "loss": 2.0268, + "step": 2310 + }, + { + "epoch": 0.43, + "learning_rate": 0.000890448848148401, + "loss": 2.0279, + "step": 2320 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008895384990357087, + "loss": 2.0073, + "step": 2330 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008886248525872056, + "loss": 2.0262, + "step": 2340 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008877079165366566, + "loss": 2.0112, + "step": 2350 + }, + { + "epoch": 0.44, + "learning_rate": 0.000886787698645672, + "loss": 2.042, + "step": 2360 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008858642067036424, + "loss": 2.0129, + "step": 2370 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008849374485276715, + "loss": 2.0264, + "step": 2380 + }, + { + "epoch": 0.44, + "learning_rate": 0.000884007431962512, + "loss": 2.0211, + "step": 2390 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008830741648804967, + "loss": 2.0175, + "step": 2400 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008821376551814739, + "loss": 2.0423, + "step": 2410 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008811979107927396, + "loss": 2.0112, + "step": 2420 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008802549396689705, + "loss": 2.0422, + "step": 2430 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008793087497921566, + "loss": 2.0075, + "step": 2440 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008784544334882426, + "loss": 1.9958, + "step": 2450 + }, + { + "epoch": 0.46, + "learning_rate": 0.000877502150068553, + "loss": 2.0348, + "step": 2460 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008765466711974225, + "loss": 2.0232, + "step": 2470 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008755880049627157, + "loss": 1.9953, + "step": 2480 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008746261594792776, + "loss": 2.0223, + "step": 2490 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008736611428888644, + "loss": 2.0332, + "step": 2500 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008726929633600753, + "loss": 2.0075, + "step": 2510 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008717216290882824, + "loss": 2.002, + "step": 2520 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008707471482955622, + "loss": 2.0594, + "step": 2530 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008697695292306253, + "loss": 2.0214, + "step": 2540 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008687887801687473, + "loss": 1.994, + "step": 2550 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008678049094116979, + "loss": 2.0338, + "step": 2560 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008668179252876714, + "loss": 2.0176, + "step": 2570 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008658278361512161, + "loss": 2.0013, + "step": 2580 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008648346503831627, + "loss": 2.0141, + "step": 2590 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008638383763905546, + "loss": 1.9655, + "step": 2600 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008628390226065761, + "loss": 2.039, + "step": 2610 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008618365974904808, + "loss": 1.9418, + "step": 2620 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008608311095275205, + "loss": 2.011, + "step": 2630 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008598225672288731, + "loss": 2.0174, + "step": 2640 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008588109791315707, + "loss": 1.984, + "step": 2650 + }, + { + "epoch": 0.49, + "learning_rate": 0.000857796353798427, + "loss": 2.0437, + "step": 2660 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008567786998179654, + "loss": 2.0255, + "step": 2670 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008557580258043459, + "loss": 2.0067, + "step": 2680 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008547343403972918, + "loss": 2.0201, + "step": 2690 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008537076522620175, + "loss": 2.0258, + "step": 2700 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008526779700891545, + "loss": 1.9977, + "step": 2710 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008516453025946781, + "loss": 1.9835, + "step": 2720 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008506096585198333, + "loss": 2.0428, + "step": 2730 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008495710466310613, + "loss": 1.9554, + "step": 2740 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008485294757199248, + "loss": 2.0497, + "step": 2750 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008474849546030339, + "loss": 2.001, + "step": 2760 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008464374921219714, + "loss": 1.9824, + "step": 2770 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008453870971432179, + "loss": 2.0378, + "step": 2780 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008443337785580769, + "loss": 1.9756, + "step": 2790 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008432775452825992, + "loss": 2.0563, + "step": 2800 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008422184062575077, + "loss": 2.0115, + "step": 2810 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008411563704481217, + "loss": 2.0301, + "step": 2820 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008400914468442814, + "loss": 1.9912, + "step": 2830 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008390236444602706, + "loss": 2.0669, + "step": 2840 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008379529723347417, + "loss": 2.0138, + "step": 2850 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008368794395306386, + "loss": 2.0486, + "step": 2860 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008358030551351199, + "loss": 2.0342, + "step": 2870 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008347238282594823, + "loss": 2.0474, + "step": 2880 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008336417680390829, + "loss": 2.006, + "step": 2890 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008325568836332633, + "loss": 1.99, + "step": 2900 + }, + { + "epoch": 0.54, + "learning_rate": 0.00083146918422527, + "loss": 2.0148, + "step": 2910 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008303786790221778, + "loss": 2.0381, + "step": 2920 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008292853772548126, + "loss": 2.0591, + "step": 2930 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008281892881776714, + "loss": 2.0238, + "step": 2940 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008270904210688459, + "loss": 1.9939, + "step": 2950 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008259887852299427, + "loss": 1.9941, + "step": 2960 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008248843899860045, + "loss": 2.0193, + "step": 2970 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008237772446854325, + "loss": 2.0166, + "step": 2980 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008226673586999058, + "loss": 2.0219, + "step": 2990 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008215547414243025, + "loss": 2.0078, + "step": 3000 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008204394022766208, + "loss": 2.0022, + "step": 3010 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008193213506978983, + "loss": 2.0009, + "step": 3020 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008182005961521331, + "loss": 2.0197, + "step": 3030 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008170771481262027, + "loss": 2.0101, + "step": 3040 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008159510161297846, + "loss": 2.0307, + "step": 3050 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008148222096952748, + "loss": 2.0075, + "step": 3060 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008136907383777081, + "loss": 2.0415, + "step": 3070 + }, + { + "epoch": 0.57, + "learning_rate": 0.000812556611754677, + "loss": 2.0031, + "step": 3080 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008114198394262497, + "loss": 2.0025, + "step": 3090 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008102804310148905, + "loss": 1.983, + "step": 3100 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008091383961653765, + "loss": 2.0056, + "step": 3110 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008079937445447175, + "loss": 1.9679, + "step": 3120 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008068464858420732, + "loss": 1.9897, + "step": 3130 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008056966297686717, + "loss": 1.9833, + "step": 3140 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008045441860577273, + "loss": 2.0088, + "step": 3150 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008033891644643576, + "loss": 1.9985, + "step": 3160 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008022315747655011, + "loss": 2.013, + "step": 3170 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008010714267598354, + "loss": 1.9902, + "step": 3180 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007999087302676926, + "loss": 2.0133, + "step": 3190 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007987434951309774, + "loss": 2.0092, + "step": 3200 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007975757312130836, + "loss": 1.9894, + "step": 3210 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007964054483988103, + "loss": 1.9742, + "step": 3220 + }, + { + "epoch": 0.6, + "learning_rate": 0.000795232656594278, + "loss": 2.016, + "step": 3230 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007940573657268458, + "loss": 2.0386, + "step": 3240 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007928795857450259, + "loss": 1.9602, + "step": 3250 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007916993266184007, + "loss": 1.9681, + "step": 3260 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007905165983375379, + "loss": 2.0326, + "step": 3270 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007893314109139058, + "loss": 1.9958, + "step": 3280 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007881437743797882, + "loss": 2.0077, + "step": 3290 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007869536987882008, + "loss": 1.9813, + "step": 3300 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007857611942128044, + "loss": 1.9538, + "step": 3310 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007845662707478214, + "loss": 1.9919, + "step": 3320 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007833689385079485, + "loss": 1.9922, + "step": 3330 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007821692076282725, + "loss": 1.9973, + "step": 3340 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007809670882641842, + "loss": 2.0231, + "step": 3350 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007797625905912915, + "loss": 1.9971, + "step": 3360 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007785557248053351, + "loss": 1.9934, + "step": 3370 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007773465011221002, + "loss": 1.9855, + "step": 3380 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007761349297773315, + "loss": 2.0421, + "step": 3390 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007749210210266457, + "loss": 1.9795, + "step": 3400 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007737047851454451, + "loss": 2.0006, + "step": 3410 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007724862324288309, + "loss": 2.011, + "step": 3420 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007712653731915147, + "loss": 1.9969, + "step": 3430 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007700422177677331, + "loss": 1.9581, + "step": 3440 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007688167765111592, + "loss": 1.9858, + "step": 3450 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007675890597948141, + "loss": 1.9945, + "step": 3460 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007663590780109814, + "loss": 2.0116, + "step": 3470 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007651268415711168, + "loss": 1.9831, + "step": 3480 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007638923609057616, + "loss": 2.0113, + "step": 3490 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007626556464644538, + "loss": 1.9927, + "step": 3500 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007614167087156393, + "loss": 2.0209, + "step": 3510 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007601755581465844, + "loss": 1.9941, + "step": 3520 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007589322052632855, + "loss": 2.0443, + "step": 3530 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007576866605903812, + "loss": 1.975, + "step": 3540 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007564389346710638, + "loss": 1.9655, + "step": 3550 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007551890380669879, + "loss": 2.0034, + "step": 3560 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007539369813581836, + "loss": 1.953, + "step": 3570 + }, + { + "epoch": 0.66, + "learning_rate": 0.000752682775142965, + "loss": 2.0162, + "step": 3580 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007514264300378411, + "loss": 2.0096, + "step": 3590 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007501679566774267, + "loss": 2.0431, + "step": 3600 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007489073657143506, + "loss": 1.961, + "step": 3610 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007476446678191676, + "loss": 2.0179, + "step": 3620 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007463798736802665, + "loss": 1.9885, + "step": 3630 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007451129940037804, + "loss": 1.9955, + "step": 3640 + }, + { + "epoch": 0.68, + "learning_rate": 0.000743844039513496, + "loss": 1.9671, + "step": 3650 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007425730209507622, + "loss": 1.9866, + "step": 3660 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007412999490744008, + "loss": 1.9508, + "step": 3670 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007400248346606129, + "loss": 2.0261, + "step": 3680 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007387476885028902, + "loss": 1.9946, + "step": 3690 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007374685214119221, + "loss": 1.969, + "step": 3700 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007361873442155049, + "loss": 1.9802, + "step": 3710 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007349041677584496, + "loss": 1.9739, + "step": 3720 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007336190029024907, + "loss": 1.964, + "step": 3730 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007323318605261933, + "loss": 2.0009, + "step": 3740 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007310427515248626, + "loss": 1.9825, + "step": 3750 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007297516868104501, + "loss": 1.9744, + "step": 3760 + }, + { + "epoch": 0.7, + "learning_rate": 0.000728458677311462, + "loss": 2.0197, + "step": 3770 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007271637339728667, + "loss": 2.0016, + "step": 3780 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007258668677560019, + "loss": 1.9721, + "step": 3790 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007245680896384818, + "loss": 1.9591, + "step": 3800 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007232674106141048, + "loss": 1.9762, + "step": 3810 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007219648416927592, + "loss": 2.0026, + "step": 3820 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007206603939003314, + "loss": 1.9876, + "step": 3830 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007193540782786117, + "loss": 1.9991, + "step": 3840 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007180459058852011, + "loss": 1.9897, + "step": 3850 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007167358877934176, + "loss": 2.0581, + "step": 3860 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007154240350922025, + "loss": 1.9588, + "step": 3870 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007141103588860265, + "loss": 2.0151, + "step": 3880 + }, + { + "epoch": 0.72, + "learning_rate": 0.000712794870294796, + "loss": 1.9494, + "step": 3890 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007114775804537586, + "loss": 1.9936, + "step": 3900 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007101585005134088, + "loss": 2.0016, + "step": 3910 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007088376416393944, + "loss": 1.9628, + "step": 3920 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007075150150124208, + "loss": 1.9955, + "step": 3930 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007061906318281568, + "loss": 1.9731, + "step": 3940 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007048645032971407, + "loss": 1.9554, + "step": 3950 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007035366406446839, + "loss": 1.985, + "step": 3960 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007022070551107774, + "loss": 1.9961, + "step": 3970 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007008757579499954, + "loss": 2.0112, + "step": 3980 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006995427604314004, + "loss": 2.0086, + "step": 3990 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006982080738384487, + "loss": 2.019, + "step": 4000 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006968717094688933, + "loss": 1.9983, + "step": 4010 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006955336786346898, + "loss": 1.981, + "step": 4020 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006941939926618997, + "loss": 1.9878, + "step": 4030 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006928526628905942, + "loss": 2.0067, + "step": 4040 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006915097006747601, + "loss": 2.035, + "step": 4050 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006901651173822013, + "loss": 1.9614, + "step": 4060 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006888189243944439, + "loss": 1.9655, + "step": 4070 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006874711331066401, + "loss": 1.9692, + "step": 4080 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006861217549274705, + "loss": 1.9791, + "step": 4090 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006847708012790492, + "loss": 1.9804, + "step": 4100 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006834182835968253, + "loss": 1.9973, + "step": 4110 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006820642133294876, + "loss": 2.0153, + "step": 4120 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006807086019388669, + "loss": 1.9639, + "step": 4130 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006793514608998393, + "loss": 2.0162, + "step": 4140 + }, + { + "epoch": 0.77, + "learning_rate": 0.000677992801700229, + "loss": 1.994, + "step": 4150 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006766326358407104, + "loss": 1.9992, + "step": 4160 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006752709748347125, + "loss": 1.976, + "step": 4170 + }, + { + "epoch": 0.77, + "learning_rate": 0.000673907830208319, + "loss": 1.9452, + "step": 4180 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006725432135001732, + "loss": 1.9982, + "step": 4190 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006711771362613785, + "loss": 1.9766, + "step": 4200 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006698096100554014, + "loss": 1.9838, + "step": 4210 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006684406464579735, + "loss": 1.9746, + "step": 4220 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006670702570569937, + "loss": 1.9838, + "step": 4230 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006656984534524296, + "loss": 1.9747, + "step": 4240 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006643252472562201, + "loss": 1.9896, + "step": 4250 + }, + { + "epoch": 0.79, + "learning_rate": 0.000662950650092176, + "loss": 1.9607, + "step": 4260 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006615746735958832, + "loss": 2.0075, + "step": 4270 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006603351250463683, + "loss": 1.9918, + "step": 4280 + }, + { + "epoch": 0.79, + "learning_rate": 0.000658956559916577, + "loss": 1.9669, + "step": 4290 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006575766492634068, + "loss": 1.9645, + "step": 4300 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006561954047674206, + "loss": 1.9511, + "step": 4310 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006548128381204714, + "loss": 1.9934, + "step": 4320 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006534289610256039, + "loss": 1.9973, + "step": 4330 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006520437851969557, + "loss": 1.9983, + "step": 4340 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006506573223596575, + "loss": 1.9906, + "step": 4350 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006492695842497347, + "loss": 1.9392, + "step": 4360 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006478805826140066, + "loss": 2.0015, + "step": 4370 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006464903292099886, + "loss": 2.0168, + "step": 4380 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006450988358057919, + "loss": 1.9676, + "step": 4390 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006437061141800238, + "loss": 1.9798, + "step": 4400 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006423121761216881, + "loss": 1.9753, + "step": 4410 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006409170334300858, + "loss": 1.9965, + "step": 4420 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006395206979147141, + "loss": 1.9532, + "step": 4430 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006381231813951678, + "loss": 1.9962, + "step": 4440 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006367244957010379, + "loss": 1.9758, + "step": 4450 + }, + { + "epoch": 0.83, + "learning_rate": 0.000635324652671813, + "loss": 1.9606, + "step": 4460 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006339236641567774, + "loss": 1.9785, + "step": 4470 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006325215420149119, + "loss": 1.9334, + "step": 4480 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006311182981147935, + "loss": 1.9829, + "step": 4490 + }, + { + "epoch": 0.83, + "learning_rate": 0.000629713944334494, + "loss": 1.9671, + "step": 4500 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006283084925614805, + "loss": 2.0108, + "step": 4510 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006269019546925139, + "loss": 1.9341, + "step": 4520 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006254943426335488, + "loss": 1.9378, + "step": 4530 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006240856682996326, + "loss": 1.9619, + "step": 4540 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006226759436148044, + "loss": 1.9516, + "step": 4550 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006212651805119946, + "loss": 1.9882, + "step": 4560 + }, + { + "epoch": 0.85, + "learning_rate": 0.000619853390932923, + "loss": 1.9636, + "step": 4570 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006184405868279985, + "loss": 1.9894, + "step": 4580 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006170267801562176, + "loss": 1.9365, + "step": 4590 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006156119828850633, + "loss": 2.0264, + "step": 4600 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006141962069904041, + "loss": 1.9659, + "step": 4610 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006127794644563915, + "loss": 1.9368, + "step": 4620 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006113617672753598, + "loss": 1.959, + "step": 4630 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006099431274477245, + "loss": 1.9832, + "step": 4640 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006085235569818795, + "loss": 1.9572, + "step": 4650 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006071030678940969, + "loss": 1.99, + "step": 4660 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006056816722084248, + "loss": 1.9963, + "step": 4670 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006042593819565846, + "loss": 1.9997, + "step": 4680 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006028362091778706, + "loss": 1.9221, + "step": 4690 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006014121659190476, + "loss": 1.9623, + "step": 4700 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005999872642342484, + "loss": 1.9949, + "step": 4710 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005985615161848721, + "loss": 1.9688, + "step": 4720 + }, + { + "epoch": 0.88, + "learning_rate": 0.000597134933839482, + "loss": 1.975, + "step": 4730 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005957075292737042, + "loss": 2.0048, + "step": 4740 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005942793145701235, + "loss": 1.9591, + "step": 4750 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005928503018181833, + "loss": 1.9957, + "step": 4760 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005914205031140819, + "loss": 1.9823, + "step": 4770 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005899899305606703, + "loss": 2.0032, + "step": 4780 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005885585962673501, + "loss": 1.9722, + "step": 4790 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005871265123499708, + "loss": 1.9903, + "step": 4800 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005856936909307273, + "loss": 2.0258, + "step": 4810 + }, + { + "epoch": 0.89, + "learning_rate": 0.000584260144138057, + "loss": 2.0444, + "step": 4820 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005828258841065377, + "loss": 1.968, + "step": 4830 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005813909229767846, + "loss": 1.9598, + "step": 4840 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005799552728953472, + "loss": 2.0047, + "step": 4850 + }, + { + "epoch": 0.9, + "learning_rate": 0.000578518946014607, + "loss": 1.939, + "step": 4860 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005770819544926741, + "loss": 1.9835, + "step": 4870 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005756443104932852, + "loss": 2.028, + "step": 4880 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005742060261856996, + "loss": 1.973, + "step": 4890 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005727671137445967, + "loss": 1.9734, + "step": 4900 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005713275853499729, + "loss": 1.9921, + "step": 4910 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005698874531870386, + "loss": 1.9607, + "step": 4920 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005684467294461146, + "loss": 1.9468, + "step": 4930 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005670054263225297, + "loss": 1.9524, + "step": 4940 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005655635560165166, + "loss": 1.9737, + "step": 4950 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005641211307331093, + "loss": 1.9532, + "step": 4960 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005626781626820395, + "loss": 2.0048, + "step": 4970 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005612346640776331, + "loss": 2.0276, + "step": 4980 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005597906471387074, + "loss": 1.9476, + "step": 4990 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005583461240884666, + "loss": 1.943, + "step": 5000 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005569011071543997, + "loss": 1.9859, + "step": 5010 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005554556085681757, + "loss": 1.9607, + "step": 5020 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005540096405655409, + "loss": 1.9825, + "step": 5030 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005525632153862152, + "loss": 1.9875, + "step": 5040 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005511163452737884, + "loss": 2.0051, + "step": 5050 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005496690424756164, + "loss": 2.0089, + "step": 5060 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005482213192427174, + "loss": 1.9495, + "step": 5070 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005467731878296688, + "loss": 1.9701, + "step": 5080 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005453246604945034, + "loss": 1.9588, + "step": 5090 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005438757494986044, + "loss": 1.9833, + "step": 5100 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005424264671066038, + "loss": 1.9974, + "step": 5110 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005409768255862766, + "loss": 1.9746, + "step": 5120 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005395268372084378, + "loss": 1.9757, + "step": 5130 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005380765142468387, + "loss": 1.9908, + "step": 5140 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005366258689780625, + "loss": 2.006, + "step": 5150 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005351749136814208, + "loss": 1.9957, + "step": 5160 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005337236606388495, + "loss": 1.959, + "step": 5170 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005322721221348047, + "loss": 2.0027, + "step": 5180 + }, + { + "epoch": 0.96, + "learning_rate": 0.000530820310456159, + "loss": 1.9248, + "step": 5190 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005293682378920974, + "loss": 1.9742, + "step": 5200 + }, + { + "epoch": 0.96, + "learning_rate": 0.000527915916734013, + "loss": 1.9844, + "step": 5210 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005264633592754035, + "loss": 1.9985, + "step": 5220 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005250105778117661, + "loss": 2.0074, + "step": 5230 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005235575846404952, + "loss": 1.9901, + "step": 5240 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005221043920607763, + "loss": 1.9861, + "step": 5250 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005206510123734837, + "loss": 1.9576, + "step": 5260 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005191974578810746, + "loss": 1.9741, + "step": 5270 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005177437408874868, + "loss": 1.9794, + "step": 5280 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005162898736980327, + "loss": 1.9883, + "step": 5290 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005148358686192967, + "loss": 1.969, + "step": 5300 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005133817379590302, + "loss": 2.0018, + "step": 5310 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005119274940260476, + "loss": 1.971, + "step": 5320 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005104731491301225, + "loss": 1.9564, + "step": 5330 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005090187155818823, + "loss": 1.9798, + "step": 5340 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005075642056927057, + "loss": 2.0331, + "step": 5350 + }, + { + "epoch": 0.99, + "learning_rate": 0.000506109631774617, + "loss": 1.9505, + "step": 5360 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005046550061401825, + "loss": 1.9348, + "step": 5370 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005032003411024067, + "loss": 2.0099, + "step": 5380 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005017456489746275, + "loss": 1.9756, + "step": 5390 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005002909420704116, + "loss": 1.9444, + "step": 5400 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004988362327034516, + "loss": 1.976, + "step": 5410 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004973815331874603, + "loss": 1.9593, + "step": 5420 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004959268558360675, + "loss": 1.9251, + "step": 5430 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004944722129627151, + "loss": 1.972, + "step": 5440 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004930176168805531, + "loss": 1.9307, + "step": 5450 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004915630799023359, + "loss": 1.9541, + "step": 5460 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004901086143403172, + "loss": 1.9212, + "step": 5470 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004886542325061464, + "loss": 1.965, + "step": 5480 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004871999467107639, + "loss": 2.0083, + "step": 5490 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004857457692642974, + "loss": 1.9676, + "step": 5500 + }, + { + "epoch": 1.02, + "learning_rate": 0.000484291712475957, + "loss": 1.9384, + "step": 5510 + }, + { + "epoch": 1.02, + "learning_rate": 0.00048283778865393243, + "loss": 1.9339, + "step": 5520 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004813840101052869, + "loss": 2.0182, + "step": 5530 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004799303891358545, + "loss": 1.9262, + "step": 5540 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004784769380501352, + "loss": 1.9397, + "step": 5550 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004770236691511908, + "loss": 1.9404, + "step": 5560 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004755705947405417, + "loss": 1.9415, + "step": 5570 + }, + { + "epoch": 1.03, + "learning_rate": 0.00047411772711806105, + "loss": 1.9292, + "step": 5580 + }, + { + "epoch": 1.04, + "learning_rate": 0.000472665078581872, + "loss": 1.9487, + "step": 5590 + }, + { + "epoch": 1.04, + "learning_rate": 0.00047121266142824354, + "loss": 1.9435, + "step": 5600 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004697604879514853, + "loss": 1.9145, + "step": 5610 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004683085704438451, + "loss": 1.9975, + "step": 5620 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046685692119540357, + "loss": 1.9696, + "step": 5630 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046540555249397056, + "loss": 1.9598, + "step": 5640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046395447662498117, + "loss": 1.9366, + "step": 5650 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046250370587139206, + "loss": 1.9748, + "step": 5660 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046105325251357695, + "loss": 1.9125, + "step": 5670 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045960312882922306, + "loss": 1.9595, + "step": 5680 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045815334709322665, + "loss": 1.9369, + "step": 5690 + }, + { + "epoch": 1.06, + "learning_rate": 0.0004567039195775899, + "loss": 1.9564, + "step": 5700 + }, + { + "epoch": 1.06, + "learning_rate": 0.000455254858551316, + "loss": 1.9274, + "step": 5710 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045380617628030693, + "loss": 1.9366, + "step": 5720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045235788502725777, + "loss": 1.9446, + "step": 5730 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045090999705155383, + "loss": 1.9236, + "step": 5740 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004494625246091672, + "loss": 1.9397, + "step": 5750 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044801547995255194, + "loss": 1.9849, + "step": 5760 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044656887533054193, + "loss": 1.9367, + "step": 5770 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004451227229882455, + "loss": 1.9451, + "step": 5780 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004436770351669429, + "loss": 1.9578, + "step": 5790 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004422318241039821, + "loss": 1.9095, + "step": 5800 + }, + { + "epoch": 1.08, + "learning_rate": 0.00044078710203267576, + "loss": 1.9337, + "step": 5810 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004393428811821971, + "loss": 1.9904, + "step": 5820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043789917377747695, + "loss": 1.9569, + "step": 5830 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004364559920390996, + "loss": 1.9423, + "step": 5840 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043501334818320004, + "loss": 2.0013, + "step": 5850 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004335712544213597, + "loss": 1.9585, + "step": 5860 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004321297229605044, + "loss": 1.9148, + "step": 5870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00043068876600279964, + "loss": 1.9558, + "step": 5880 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004292483957455482, + "loss": 1.9899, + "step": 5890 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042780862438108655, + "loss": 1.9597, + "step": 5900 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042636946409668123, + "loss": 1.9603, + "step": 5910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042493092707442717, + "loss": 1.9771, + "step": 5920 + }, + { + "epoch": 1.1, + "learning_rate": 0.0004234930254911427, + "loss": 1.9416, + "step": 5930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042205577151826747, + "loss": 1.9417, + "step": 5940 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042061917732175966, + "loss": 1.9636, + "step": 5950 + }, + { + "epoch": 1.1, + "learning_rate": 0.000419183255061992, + "loss": 1.966, + "step": 5960 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004177480168936504, + "loss": 1.9885, + "step": 5970 + }, + { + "epoch": 1.11, + "learning_rate": 0.00041631347496562913, + "loss": 1.9525, + "step": 5980 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004148796414209297, + "loss": 1.9809, + "step": 5990 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004134465283965568, + "loss": 1.8982, + "step": 6000 + }, + { + "epoch": 1.11, + "learning_rate": 0.00041201414802341643, + "loss": 1.8978, + "step": 6010 + }, + { + "epoch": 1.12, + "learning_rate": 0.00041058251242621295, + "loss": 1.9406, + "step": 6020 + }, + { + "epoch": 1.12, + "learning_rate": 0.0004091516337233464, + "loss": 1.919, + "step": 6030 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040772152402680973, + "loss": 1.9897, + "step": 6040 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040629219544208644, + "loss": 1.9473, + "step": 6050 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040486366006804817, + "loss": 1.9589, + "step": 6060 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040343592999685264, + "loss": 1.8972, + "step": 6070 + }, + { + "epoch": 1.13, + "learning_rate": 0.0004020090173138404, + "loss": 1.9611, + "step": 6080 + }, + { + "epoch": 1.13, + "learning_rate": 0.00040058293409743316, + "loss": 1.9164, + "step": 6090 + }, + { + "epoch": 1.13, + "learning_rate": 0.00039915769241903175, + "loss": 1.939, + "step": 6100 + }, + { + "epoch": 1.13, + "learning_rate": 0.0003977333043429129, + "loss": 1.9233, + "step": 6110 + }, + { + "epoch": 1.13, + "learning_rate": 0.0003963097819261288, + "loss": 1.9742, + "step": 6120 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003948871372184033, + "loss": 1.9719, + "step": 6130 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003934653822620309, + "loss": 1.9861, + "step": 6140 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003920445290917747, + "loss": 1.9514, + "step": 6150 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003906245897347643, + "loss": 2.0047, + "step": 6160 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003892055762103943, + "loss": 1.934, + "step": 6170 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003877875005302223, + "loss": 1.9619, + "step": 6180 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038637037469786727, + "loss": 1.9085, + "step": 6190 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038495421070890796, + "loss": 1.9222, + "step": 6200 + }, + { + "epoch": 1.15, + "learning_rate": 0.0003835390205507812, + "loss": 1.9409, + "step": 6210 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038212481620268125, + "loss": 1.9439, + "step": 6220 + }, + { + "epoch": 1.15, + "learning_rate": 0.000380711609635457, + "loss": 1.974, + "step": 6230 + }, + { + "epoch": 1.16, + "learning_rate": 0.000379299412811512, + "loss": 1.9141, + "step": 6240 + }, + { + "epoch": 1.16, + "learning_rate": 0.00037788823768470227, + "loss": 1.8982, + "step": 6250 + }, + { + "epoch": 1.16, + "learning_rate": 0.0003764780962002352, + "loss": 1.9384, + "step": 6260 + }, + { + "epoch": 1.16, + "learning_rate": 0.0003750690002945695, + "loss": 1.9174, + "step": 6270 + }, + { + "epoch": 1.16, + "learning_rate": 0.00037366096189531253, + "loss": 1.927, + "step": 6280 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003722539929211205, + "loss": 1.9449, + "step": 6290 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003708481052815973, + "loss": 2.008, + "step": 6300 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003694433108771933, + "loss": 1.9345, + "step": 6310 + }, + { + "epoch": 1.17, + "learning_rate": 0.00036803962159910543, + "loss": 1.8619, + "step": 6320 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003666370493291757, + "loss": 1.9612, + "step": 6330 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003652356059397909, + "loss": 1.9371, + "step": 6340 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036383530329378225, + "loss": 1.9193, + "step": 6350 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036243615324432494, + "loss": 1.9509, + "step": 6360 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036103816763483775, + "loss": 1.9517, + "step": 6370 + }, + { + "epoch": 1.18, + "learning_rate": 0.00035964135829888287, + "loss": 1.9141, + "step": 6380 + }, + { + "epoch": 1.18, + "learning_rate": 0.00035824573706006547, + "loss": 1.9985, + "step": 6390 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035685131573193386, + "loss": 1.9791, + "step": 6400 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035545810611787925, + "loss": 1.8865, + "step": 6410 + }, + { + "epoch": 1.19, + "learning_rate": 0.0003540661200110367, + "loss": 1.9409, + "step": 6420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035267536919418395, + "loss": 1.9928, + "step": 6430 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035128586543964243, + "loss": 1.9149, + "step": 6440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00034989762050917784, + "loss": 1.9837, + "step": 6450 + }, + { + "epoch": 1.2, + "learning_rate": 0.0003485106461538999, + "loss": 1.9142, + "step": 6460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034712495411416385, + "loss": 1.9284, + "step": 6470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034574055611946984, + "loss": 1.8848, + "step": 6480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034435746388836457, + "loss": 1.9295, + "step": 6490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034297568912834177, + "loss": 1.9635, + "step": 6500 + }, + { + "epoch": 1.21, + "learning_rate": 0.0003415952435357431, + "loss": 1.9794, + "step": 6510 + }, + { + "epoch": 1.21, + "learning_rate": 0.00034021613879565944, + "loss": 1.9347, + "step": 6520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00033883838658183154, + "loss": 1.9282, + "step": 6530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00033746199855655125, + "loss": 1.9973, + "step": 6540 + }, + { + "epoch": 1.21, + "learning_rate": 0.000336086986370563, + "loss": 1.9718, + "step": 6550 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003347133616629652, + "loss": 1.9157, + "step": 6560 + }, + { + "epoch": 1.22, + "learning_rate": 0.00033334113606111194, + "loss": 1.9528, + "step": 6570 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003319703211805135, + "loss": 1.9369, + "step": 6580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00033060092862473967, + "loss": 1.9552, + "step": 6590 + }, + { + "epoch": 1.22, + "learning_rate": 0.00032923296998532003, + "loss": 1.9581, + "step": 6600 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003278664568416465, + "loss": 1.9406, + "step": 6610 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003265014007608758, + "loss": 1.9672, + "step": 6620 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003251378132978304, + "loss": 1.9166, + "step": 6630 + }, + { + "epoch": 1.23, + "learning_rate": 0.00032377570599490164, + "loss": 1.9356, + "step": 6640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00032241509038195165, + "loss": 1.9092, + "step": 6650 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003210559779762157, + "loss": 1.9343, + "step": 6660 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031969838028220513, + "loss": 1.9796, + "step": 6670 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031834230879160947, + "loss": 1.8932, + "step": 6680 + }, + { + "epoch": 1.24, + "learning_rate": 0.0003169877749831993, + "loss": 1.9279, + "step": 6690 + }, + { + "epoch": 1.24, + "learning_rate": 0.000315634790322729, + "loss": 1.9444, + "step": 6700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031428336626284037, + "loss": 1.9296, + "step": 6710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031293351424296467, + "loss": 1.9341, + "step": 6720 + }, + { + "epoch": 1.25, + "learning_rate": 0.00031158524568922663, + "loss": 1.9589, + "step": 6730 + }, + { + "epoch": 1.25, + "learning_rate": 0.00031023857201434703, + "loss": 1.8997, + "step": 6740 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003088935046175466, + "loss": 1.9417, + "step": 6750 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003075500548844492, + "loss": 1.9058, + "step": 6760 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003062082341869862, + "loss": 1.9511, + "step": 6770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00030486805388329894, + "loss": 1.922, + "step": 6780 + }, + { + "epoch": 1.26, + "learning_rate": 0.00030352952531764363, + "loss": 1.9634, + "step": 6790 + }, + { + "epoch": 1.26, + "learning_rate": 0.0003021926598202949, + "loss": 1.9555, + "step": 6800 + }, + { + "epoch": 1.26, + "learning_rate": 0.0003008574687074498, + "loss": 1.9254, + "step": 6810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00029952396328113265, + "loss": 1.9211, + "step": 6820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029819215482909846, + "loss": 1.9504, + "step": 6830 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029686205462473784, + "loss": 1.9174, + "step": 6840 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029553367392698177, + "loss": 1.9368, + "step": 6850 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029420702398020595, + "loss": 1.8939, + "step": 6860 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029288211601413586, + "loss": 1.9097, + "step": 6870 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029155896124375156, + "loss": 1.9885, + "step": 6880 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002902375708691925, + "loss": 1.9752, + "step": 6890 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002889179560756634, + "loss": 1.9321, + "step": 6900 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002876001280333391, + "loss": 1.9345, + "step": 6910 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002862840978972698, + "loss": 1.9192, + "step": 6920 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002849698768072877, + "loss": 1.9499, + "step": 6930 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002836574758879107, + "loss": 1.9217, + "step": 6940 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002823469062482503, + "loss": 1.9318, + "step": 6950 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002810381789819167, + "loss": 1.9422, + "step": 6960 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002797313051669247, + "loss": 1.9562, + "step": 6970 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002784262958656003, + "loss": 1.9189, + "step": 6980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00027712316212448663, + "loss": 1.9453, + "step": 6990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027582191497425114, + "loss": 1.9335, + "step": 7000 + }, + { + "epoch": 1.3, + "learning_rate": 0.000274522565429591, + "loss": 1.9724, + "step": 7010 + }, + { + "epoch": 1.3, + "learning_rate": 0.0002732251244891421, + "loss": 1.9236, + "step": 7020 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027192960313538307, + "loss": 1.9407, + "step": 7030 + }, + { + "epoch": 1.3, + "learning_rate": 0.0002706360123345445, + "loss": 1.8948, + "step": 7040 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026934436303651554, + "loss": 1.9354, + "step": 7050 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026805466617475007, + "loss": 1.955, + "step": 7060 + }, + { + "epoch": 1.31, + "learning_rate": 0.0002667669326661767, + "loss": 1.9595, + "step": 7070 + }, + { + "epoch": 1.31, + "learning_rate": 0.0002654811734111033, + "loss": 1.9766, + "step": 7080 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026419739929312713, + "loss": 1.9626, + "step": 7090 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002629156211790417, + "loss": 1.9096, + "step": 7100 + }, + { + "epoch": 1.32, + "learning_rate": 0.00026163584991874413, + "loss": 1.9522, + "step": 7110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00026035809634514543, + "loss": 1.9387, + "step": 7120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00025908237127407626, + "loss": 1.8788, + "step": 7130 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002578086855041973, + "loss": 1.9326, + "step": 7140 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002565370498169064, + "loss": 1.92, + "step": 7150 + }, + { + "epoch": 1.33, + "learning_rate": 0.0002552674749762487, + "loss": 1.9131, + "step": 7160 + }, + { + "epoch": 1.33, + "learning_rate": 0.0002539999717288246, + "loss": 1.9263, + "step": 7170 + }, + { + "epoch": 1.33, + "learning_rate": 0.00025286099888629365, + "loss": 1.919, + "step": 7180 + }, + { + "epoch": 1.33, + "learning_rate": 0.000251597461210021, + "loss": 1.9281, + "step": 7190 + }, + { + "epoch": 1.33, + "learning_rate": 0.00025033602619263507, + "loss": 1.9831, + "step": 7200 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024907670451183454, + "loss": 1.9535, + "step": 7210 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024781950682742983, + "loss": 1.8798, + "step": 7220 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024656444378125204, + "loss": 1.9124, + "step": 7230 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024531152599706346, + "loss": 1.9472, + "step": 7240 + }, + { + "epoch": 1.34, + "learning_rate": 0.0002440607640804668, + "loss": 1.9697, + "step": 7250 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024281216861881633, + "loss": 1.938, + "step": 7260 + }, + { + "epoch": 1.35, + "learning_rate": 0.00024156575018112787, + "loss": 1.9035, + "step": 7270 + }, + { + "epoch": 1.35, + "learning_rate": 0.00024032151931798918, + "loss": 1.9379, + "step": 7280 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002390794865614711, + "loss": 1.9176, + "step": 7290 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002378396624250375, + "loss": 1.9392, + "step": 7300 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002366020574034576, + "loss": 1.9235, + "step": 7310 + }, + { + "epoch": 1.36, + "learning_rate": 0.00023536668197271588, + "loss": 1.939, + "step": 7320 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002341335465899243, + "loss": 1.889, + "step": 7330 + }, + { + "epoch": 1.36, + "learning_rate": 0.00023290266169323354, + "loss": 1.9247, + "step": 7340 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002316740377017438, + "loss": 1.935, + "step": 7350 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002304476850154183, + "loss": 1.9198, + "step": 7360 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022922361401499325, + "loss": 1.9068, + "step": 7370 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022800183506189238, + "loss": 1.9505, + "step": 7380 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022678235849813645, + "loss": 1.9459, + "step": 7390 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022556519464625807, + "loss": 1.9302, + "step": 7400 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022435035380921321, + "loss": 1.9345, + "step": 7410 + }, + { + "epoch": 1.37, + "learning_rate": 0.0002231378462702935, + "loss": 1.9304, + "step": 7420 + }, + { + "epoch": 1.38, + "learning_rate": 0.00022192768229304107, + "loss": 1.9457, + "step": 7430 + }, + { + "epoch": 1.38, + "learning_rate": 0.0002207198721211593, + "loss": 1.9395, + "step": 7440 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021951442597842785, + "loss": 1.9867, + "step": 7450 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021831135406861558, + "loss": 1.9217, + "step": 7460 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021711066657539342, + "loss": 1.991, + "step": 7470 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021591237366225008, + "loss": 1.9492, + "step": 7480 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021471648547240365, + "loss": 1.9376, + "step": 7490 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021352301212871762, + "loss": 1.9436, + "step": 7500 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021233196373361397, + "loss": 1.9267, + "step": 7510 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021114335036898852, + "loss": 1.9483, + "step": 7520 + }, + { + "epoch": 1.39, + "learning_rate": 0.0002099571820961252, + "loss": 1.9485, + "step": 7530 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020877346895561082, + "loss": 1.9607, + "step": 7540 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020759222096725034, + "loss": 1.9665, + "step": 7550 + }, + { + "epoch": 1.4, + "learning_rate": 0.0002064134481299814, + "loss": 1.9202, + "step": 7560 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020523716042179075, + "loss": 1.9375, + "step": 7570 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020406336779962888, + "loss": 1.9406, + "step": 7580 + }, + { + "epoch": 1.41, + "learning_rate": 0.00020289208019932635, + "loss": 1.9357, + "step": 7590 + }, + { + "epoch": 1.41, + "learning_rate": 0.0002017233075355089, + "loss": 1.9432, + "step": 7600 + }, + { + "epoch": 1.41, + "learning_rate": 0.0002005570597015145, + "loss": 1.962, + "step": 7610 + }, + { + "epoch": 1.41, + "learning_rate": 0.00019939334656930892, + "loss": 1.9237, + "step": 7620 + }, + { + "epoch": 1.41, + "learning_rate": 0.00019823217798940247, + "loss": 1.9688, + "step": 7630 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019707356379076668, + "loss": 1.9524, + "step": 7640 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019591751378075035, + "loss": 1.981, + "step": 7650 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019476403774499774, + "loss": 1.9405, + "step": 7660 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001936131454473649, + "loss": 1.9, + "step": 7670 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019246484662983733, + "loss": 1.8852, + "step": 7680 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019131915101244752, + "loss": 1.9447, + "step": 7690 + }, + { + "epoch": 1.43, + "learning_rate": 0.00019017606829319205, + "loss": 1.9221, + "step": 7700 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018903560814795086, + "loss": 1.9481, + "step": 7710 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018789778023040355, + "loss": 1.8919, + "step": 7720 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001867625941719499, + "loss": 1.94, + "step": 7730 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018563005958162587, + "loss": 1.9089, + "step": 7740 + }, + { + "epoch": 1.44, + "learning_rate": 0.00018450018604602414, + "loss": 1.9105, + "step": 7750 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001833729831292123, + "loss": 1.9568, + "step": 7760 + }, + { + "epoch": 1.44, + "learning_rate": 0.00018224846037265125, + "loss": 1.9156, + "step": 7770 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001811266272951162, + "loss": 1.9445, + "step": 7780 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001800074933926138, + "loss": 1.8871, + "step": 7790 + }, + { + "epoch": 1.44, + "learning_rate": 0.00017889106813830363, + "loss": 1.9684, + "step": 7800 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001777773609824173, + "loss": 1.9411, + "step": 7810 + }, + { + "epoch": 1.45, + "learning_rate": 0.00017666638135217783, + "loss": 1.9295, + "step": 7820 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001755581386517216, + "loss": 1.9499, + "step": 7830 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001744526422620165, + "loss": 1.9499, + "step": 7840 + }, + { + "epoch": 1.45, + "learning_rate": 0.00017334990154078446, + "loss": 1.9262, + "step": 7850 + }, + { + "epoch": 1.46, + "learning_rate": 0.00017224992582242076, + "loss": 1.9554, + "step": 7860 + }, + { + "epoch": 1.46, + "learning_rate": 0.00017115272441791635, + "loss": 1.9685, + "step": 7870 + }, + { + "epoch": 1.46, + "learning_rate": 0.000170058306614778, + "loss": 1.9021, + "step": 7880 + }, + { + "epoch": 1.46, + "learning_rate": 0.00016896668167695018, + "loss": 1.8804, + "step": 7890 + }, + { + "epoch": 1.46, + "learning_rate": 0.00016787785884473665, + "loss": 1.9164, + "step": 7900 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016679184733472163, + "loss": 1.9409, + "step": 7910 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016570865633969283, + "loss": 1.9329, + "step": 7920 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016462829502856286, + "loss": 1.9518, + "step": 7930 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016355077254629196, + "loss": 1.9494, + "step": 7940 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016247609801381003, + "loss": 1.9376, + "step": 7950 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016140428052794042, + "loss": 1.9312, + "step": 7960 + }, + { + "epoch": 1.48, + "learning_rate": 0.00016033532916132203, + "loss": 1.9528, + "step": 7970 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015926925296233296, + "loss": 1.9698, + "step": 7980 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015820606095501405, + "loss": 1.936, + "step": 7990 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015714576213899167, + "loss": 1.962, + "step": 8000 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015608836548940252, + "loss": 1.9439, + "step": 8010 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015503387995681732, + "loss": 1.9274, + "step": 8020 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001539823144671648, + "loss": 1.9029, + "step": 8030 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015293367792165664, + "loss": 1.928, + "step": 8040 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015188797919671115, + "loss": 1.9405, + "step": 8050 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015084522714387967, + "loss": 1.909, + "step": 8060 + }, + { + "epoch": 1.49, + "learning_rate": 0.00014980543058976977, + "loss": 1.9286, + "step": 8070 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014876859833597278, + "loss": 1.9358, + "step": 8080 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014773473915898695, + "loss": 1.9073, + "step": 8090 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014670386181014477, + "loss": 1.9044, + "step": 8100 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014567597501553847, + "loss": 1.9133, + "step": 8110 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001446510874759454, + "loss": 1.9583, + "step": 8120 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014362920786675616, + "loss": 1.9381, + "step": 8130 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014261034483789892, + "loss": 1.951, + "step": 8140 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014159450701376803, + "loss": 1.9806, + "step": 8150 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014058170299315027, + "loss": 1.9101, + "step": 8160 + }, + { + "epoch": 1.51, + "learning_rate": 0.00013957194134915147, + "loss": 1.9122, + "step": 8170 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013856523062912569, + "loss": 1.91, + "step": 8180 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001375615793546006, + "loss": 1.9182, + "step": 8190 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013656099602120752, + "loss": 1.9312, + "step": 8200 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013556348909860762, + "loss": 1.9327, + "step": 8210 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013456906703042165, + "loss": 1.9184, + "step": 8220 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013357773823415782, + "loss": 1.8876, + "step": 8230 + }, + { + "epoch": 1.53, + "learning_rate": 0.00013258951110114054, + "loss": 1.927, + "step": 8240 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001316043939964398, + "loss": 1.9525, + "step": 8250 + }, + { + "epoch": 1.53, + "learning_rate": 0.00013062239525879943, + "loss": 1.8933, + "step": 8260 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001296435232005677, + "loss": 1.9433, + "step": 8270 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001286677861076263, + "loss": 1.9306, + "step": 8280 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012769519223932034, + "loss": 1.8962, + "step": 8290 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012672574982838802, + "loss": 1.9322, + "step": 8300 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012575946708089176, + "loss": 1.9191, + "step": 8310 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001247963521761481, + "loss": 1.9308, + "step": 8320 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012383641326665874, + "loss": 1.8876, + "step": 8330 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012287965847804162, + "loss": 1.9103, + "step": 8340 + }, + { + "epoch": 1.55, + "learning_rate": 0.00012192609590896142, + "loss": 1.8804, + "step": 8350 + }, + { + "epoch": 1.55, + "learning_rate": 0.00012097573363106218, + "loss": 1.944, + "step": 8360 + }, + { + "epoch": 1.55, + "learning_rate": 0.00012002857968889797, + "loss": 1.9259, + "step": 8370 + }, + { + "epoch": 1.55, + "learning_rate": 0.00011908464209986541, + "loss": 1.9421, + "step": 8380 + }, + { + "epoch": 1.55, + "learning_rate": 0.00011814392885413567, + "loss": 1.9251, + "step": 8390 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011720644791458623, + "loss": 1.9106, + "step": 8400 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011627220721673459, + "loss": 1.8928, + "step": 8410 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011534121466866986, + "loss": 1.9323, + "step": 8420 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011441347815098735, + "loss": 1.9238, + "step": 8430 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001134890055167201, + "loss": 1.9831, + "step": 8440 + }, + { + "epoch": 1.57, + "learning_rate": 0.00011256780459127374, + "loss": 1.85, + "step": 8450 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001116498831723598, + "loss": 1.9391, + "step": 8460 + }, + { + "epoch": 1.57, + "learning_rate": 0.00011073524902992921, + "loss": 1.9071, + "step": 8470 + }, + { + "epoch": 1.57, + "learning_rate": 0.00010982390990610791, + "loss": 1.9538, + "step": 8480 + }, + { + "epoch": 1.57, + "learning_rate": 0.00010891587351512949, + "loss": 1.8972, + "step": 8490 + }, + { + "epoch": 1.57, + "learning_rate": 0.00010801114754327135, + "loss": 1.9184, + "step": 8500 + }, + { + "epoch": 1.58, + "learning_rate": 0.00010710973964878906, + "loss": 1.9567, + "step": 8510 + }, + { + "epoch": 1.58, + "learning_rate": 0.00010621165746185113, + "loss": 1.9755, + "step": 8520 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001053169085844758, + "loss": 1.9256, + "step": 8530 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001044255005904648, + "loss": 1.9742, + "step": 8540 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001035374410253408, + "loss": 1.9562, + "step": 8550 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001026527374062825, + "loss": 1.9432, + "step": 8560 + }, + { + "epoch": 1.59, + "learning_rate": 0.00010177139722206191, + "loss": 1.9007, + "step": 8570 + }, + { + "epoch": 1.59, + "learning_rate": 0.00010089342793298028, + "loss": 1.9834, + "step": 8580 + }, + { + "epoch": 1.59, + "learning_rate": 0.00010001883697080504, + "loss": 1.9063, + "step": 8590 + }, + { + "epoch": 1.59, + "learning_rate": 9.914763173870738e-05, + "loss": 1.9063, + "step": 8600 + }, + { + "epoch": 1.59, + "learning_rate": 9.827981961119869e-05, + "loss": 1.9149, + "step": 8610 + }, + { + "epoch": 1.6, + "learning_rate": 9.741540793406911e-05, + "loss": 1.9096, + "step": 8620 + }, + { + "epoch": 1.6, + "learning_rate": 9.655440402432464e-05, + "loss": 1.8657, + "step": 8630 + }, + { + "epoch": 1.6, + "learning_rate": 9.569681517012585e-05, + "loss": 1.9237, + "step": 8640 + }, + { + "epoch": 1.6, + "learning_rate": 9.484264863072523e-05, + "loss": 1.9739, + "step": 8650 + }, + { + "epoch": 1.6, + "learning_rate": 9.399191163640675e-05, + "loss": 1.9199, + "step": 8660 + }, + { + "epoch": 1.61, + "learning_rate": 9.314461138842406e-05, + "loss": 1.9639, + "step": 8670 + }, + { + "epoch": 1.61, + "learning_rate": 9.230075505893987e-05, + "loss": 1.9391, + "step": 8680 + }, + { + "epoch": 1.61, + "learning_rate": 9.146034979096496e-05, + "loss": 1.9326, + "step": 8690 + }, + { + "epoch": 1.61, + "learning_rate": 9.06234026982976e-05, + "loss": 1.9501, + "step": 8700 + }, + { + "epoch": 1.61, + "learning_rate": 8.9789920865464e-05, + "loss": 1.9041, + "step": 8710 + }, + { + "epoch": 1.62, + "learning_rate": 8.895991134765758e-05, + "loss": 1.931, + "step": 8720 + }, + { + "epoch": 1.62, + "learning_rate": 8.813338117067965e-05, + "loss": 1.9589, + "step": 8730 + }, + { + "epoch": 1.62, + "learning_rate": 8.731033733088012e-05, + "loss": 1.9226, + "step": 8740 + }, + { + "epoch": 1.62, + "learning_rate": 8.649078679509742e-05, + "loss": 1.911, + "step": 8750 + }, + { + "epoch": 1.62, + "learning_rate": 8.567473650060082e-05, + "loss": 1.9641, + "step": 8760 + }, + { + "epoch": 1.62, + "learning_rate": 8.486219335503026e-05, + "loss": 1.8924, + "step": 8770 + }, + { + "epoch": 1.63, + "learning_rate": 8.405316423633958e-05, + "loss": 1.9583, + "step": 8780 + }, + { + "epoch": 1.63, + "learning_rate": 8.324765599273649e-05, + "loss": 1.9399, + "step": 8790 + }, + { + "epoch": 1.63, + "learning_rate": 8.244567544262588e-05, + "loss": 1.9362, + "step": 8800 + }, + { + "epoch": 1.63, + "learning_rate": 8.164722937455177e-05, + "loss": 1.9283, + "step": 8810 + }, + { + "epoch": 1.63, + "learning_rate": 8.08523245471392e-05, + "loss": 1.9588, + "step": 8820 + }, + { + "epoch": 1.64, + "learning_rate": 8.006096768903848e-05, + "loss": 1.9126, + "step": 8830 + }, + { + "epoch": 1.64, + "learning_rate": 7.927316549886659e-05, + "loss": 1.9331, + "step": 8840 + }, + { + "epoch": 1.64, + "learning_rate": 7.84889246451515e-05, + "loss": 1.8967, + "step": 8850 + }, + { + "epoch": 1.64, + "learning_rate": 7.77082517662756e-05, + "loss": 1.927, + "step": 8860 + }, + { + "epoch": 1.64, + "learning_rate": 7.693115347041884e-05, + "loss": 1.8978, + "step": 8870 + }, + { + "epoch": 1.64, + "learning_rate": 7.615763633550421e-05, + "loss": 1.9142, + "step": 8880 + }, + { + "epoch": 1.65, + "learning_rate": 7.538770690914015e-05, + "loss": 1.9001, + "step": 8890 + }, + { + "epoch": 1.65, + "learning_rate": 7.462137170856698e-05, + "loss": 1.8979, + "step": 8900 + }, + { + "epoch": 1.65, + "learning_rate": 7.385863722060022e-05, + "loss": 1.892, + "step": 8910 + }, + { + "epoch": 1.65, + "learning_rate": 7.309950990157677e-05, + "loss": 1.9496, + "step": 8920 + }, + { + "epoch": 1.65, + "learning_rate": 7.234399617729976e-05, + "loss": 1.8879, + "step": 8930 + }, + { + "epoch": 1.66, + "learning_rate": 7.159210244298414e-05, + "loss": 1.921, + "step": 8940 + }, + { + "epoch": 1.66, + "learning_rate": 7.084383506320291e-05, + "loss": 1.9408, + "step": 8950 + }, + { + "epoch": 1.66, + "learning_rate": 7.009920037183248e-05, + "loss": 1.9258, + "step": 8960 + }, + { + "epoch": 1.66, + "learning_rate": 6.935820467200005e-05, + "loss": 1.9182, + "step": 8970 + }, + { + "epoch": 1.66, + "learning_rate": 6.862085423602955e-05, + "loss": 1.9668, + "step": 8980 + }, + { + "epoch": 1.67, + "learning_rate": 6.78871553053888e-05, + "loss": 1.898, + "step": 8990 + }, + { + "epoch": 1.67, + "learning_rate": 6.715711409063652e-05, + "loss": 1.9261, + "step": 9000 + }, + { + "epoch": 1.67, + "learning_rate": 6.643073677136996e-05, + "loss": 1.9167, + "step": 9010 + }, + { + "epoch": 1.67, + "learning_rate": 6.570802949617261e-05, + "loss": 1.9066, + "step": 9020 + }, + { + "epoch": 1.67, + "learning_rate": 6.49889983825619e-05, + "loss": 1.9091, + "step": 9030 + }, + { + "epoch": 1.67, + "learning_rate": 6.427364951693776e-05, + "loss": 1.8853, + "step": 9040 + }, + { + "epoch": 1.68, + "learning_rate": 6.356198895453053e-05, + "loss": 1.9459, + "step": 9050 + }, + { + "epoch": 1.68, + "learning_rate": 6.285402271935048e-05, + "loss": 1.9073, + "step": 9060 + }, + { + "epoch": 1.68, + "learning_rate": 6.214975680413621e-05, + "loss": 1.902, + "step": 9070 + }, + { + "epoch": 1.68, + "learning_rate": 6.144919717030417e-05, + "loss": 1.8812, + "step": 9080 + }, + { + "epoch": 1.68, + "learning_rate": 6.075234974789839e-05, + "loss": 1.8672, + "step": 9090 + }, + { + "epoch": 1.69, + "learning_rate": 6.005922043553952e-05, + "loss": 1.9297, + "step": 9100 + }, + { + "epoch": 1.69, + "learning_rate": 5.9369815100376037e-05, + "loss": 1.8775, + "step": 9110 + }, + { + "epoch": 1.69, + "learning_rate": 5.868413957803331e-05, + "loss": 1.8831, + "step": 9120 + }, + { + "epoch": 1.69, + "learning_rate": 5.800219967256576e-05, + "loss": 1.9026, + "step": 9130 + }, + { + "epoch": 1.69, + "learning_rate": 5.7324001156406014e-05, + "loss": 1.8944, + "step": 9140 + }, + { + "epoch": 1.69, + "learning_rate": 5.664954977031733e-05, + "loss": 1.9154, + "step": 9150 + }, + { + "epoch": 1.7, + "learning_rate": 5.5978851223344455e-05, + "loss": 1.8994, + "step": 9160 + }, + { + "epoch": 1.7, + "learning_rate": 5.531191119276513e-05, + "loss": 1.9397, + "step": 9170 + }, + { + "epoch": 1.7, + "learning_rate": 5.4648735324042855e-05, + "loss": 1.9416, + "step": 9180 + }, + { + "epoch": 1.7, + "learning_rate": 5.398932923077793e-05, + "loss": 1.9207, + "step": 9190 + }, + { + "epoch": 1.7, + "learning_rate": 5.333369849466091e-05, + "loss": 1.9061, + "step": 9200 + }, + { + "epoch": 1.71, + "learning_rate": 5.268184866542502e-05, + "loss": 1.8861, + "step": 9210 + }, + { + "epoch": 1.71, + "learning_rate": 5.2033785260798716e-05, + "loss": 1.9433, + "step": 9220 + }, + { + "epoch": 1.71, + "learning_rate": 5.138951376646012e-05, + "loss": 1.9158, + "step": 9230 + }, + { + "epoch": 1.71, + "learning_rate": 5.074903963598926e-05, + "loss": 1.8898, + "step": 9240 + }, + { + "epoch": 1.71, + "learning_rate": 5.0112368290822885e-05, + "loss": 1.9041, + "step": 9250 + }, + { + "epoch": 1.72, + "learning_rate": 4.9479505120207934e-05, + "loss": 1.9605, + "step": 9260 + }, + { + "epoch": 1.72, + "learning_rate": 4.885045548115646e-05, + "loss": 1.8975, + "step": 9270 + }, + { + "epoch": 1.72, + "learning_rate": 4.822522469839996e-05, + "loss": 1.9396, + "step": 9280 + }, + { + "epoch": 1.72, + "learning_rate": 4.760381806434427e-05, + "loss": 1.9263, + "step": 9290 + }, + { + "epoch": 1.72, + "learning_rate": 4.698624083902503e-05, + "loss": 1.948, + "step": 9300 + }, + { + "epoch": 1.72, + "learning_rate": 4.637249825006273e-05, + "loss": 1.9206, + "step": 9310 + }, + { + "epoch": 1.73, + "learning_rate": 4.5762595492618906e-05, + "loss": 1.9129, + "step": 9320 + }, + { + "epoch": 1.73, + "learning_rate": 4.515653772935207e-05, + "loss": 1.9036, + "step": 9330 + }, + { + "epoch": 1.73, + "learning_rate": 4.455433009037385e-05, + "loss": 1.928, + "step": 9340 + }, + { + "epoch": 1.73, + "learning_rate": 4.395597767320536e-05, + "loss": 1.9427, + "step": 9350 + }, + { + "epoch": 1.73, + "learning_rate": 4.336148554273467e-05, + "loss": 1.8882, + "step": 9360 + }, + { + "epoch": 1.74, + "learning_rate": 4.277085873117354e-05, + "loss": 1.9412, + "step": 9370 + }, + { + "epoch": 1.74, + "learning_rate": 4.218410223801472e-05, + "loss": 1.9014, + "step": 9380 + }, + { + "epoch": 1.74, + "learning_rate": 4.1601221029989976e-05, + "loss": 1.9056, + "step": 9390 + }, + { + "epoch": 1.74, + "learning_rate": 4.102222004102768e-05, + "loss": 1.9665, + "step": 9400 + }, + { + "epoch": 1.74, + "learning_rate": 4.04471041722112e-05, + "loss": 1.8911, + "step": 9410 + }, + { + "epoch": 1.74, + "learning_rate": 3.987587829173772e-05, + "loss": 1.885, + "step": 9420 + }, + { + "epoch": 1.75, + "learning_rate": 3.930854723487642e-05, + "loss": 1.8958, + "step": 9430 + }, + { + "epoch": 1.75, + "learning_rate": 3.874511580392814e-05, + "loss": 1.9197, + "step": 9440 + }, + { + "epoch": 1.75, + "learning_rate": 3.818558876818418e-05, + "loss": 1.9174, + "step": 9450 + }, + { + "epoch": 1.75, + "learning_rate": 3.762997086388653e-05, + "loss": 1.9321, + "step": 9460 + }, + { + "epoch": 1.75, + "learning_rate": 3.707826679418702e-05, + "loss": 1.8835, + "step": 9470 + }, + { + "epoch": 1.76, + "learning_rate": 3.653048122910862e-05, + "loss": 1.9083, + "step": 9480 + }, + { + "epoch": 1.76, + "learning_rate": 3.598661880550452e-05, + "loss": 1.9082, + "step": 9490 + }, + { + "epoch": 1.76, + "learning_rate": 3.544668412702007e-05, + "loss": 1.9696, + "step": 9500 + }, + { + "epoch": 1.76, + "learning_rate": 3.491068176405326e-05, + "loss": 1.9232, + "step": 9510 + }, + { + "epoch": 1.76, + "learning_rate": 3.43786162537158e-05, + "loss": 1.8944, + "step": 9520 + }, + { + "epoch": 1.77, + "learning_rate": 3.385049209979568e-05, + "loss": 1.9341, + "step": 9530 + }, + { + "epoch": 1.77, + "learning_rate": 3.3326313772717667e-05, + "loss": 1.9, + "step": 9540 + }, + { + "epoch": 1.77, + "learning_rate": 3.2806085709506716e-05, + "loss": 1.9157, + "step": 9550 + }, + { + "epoch": 1.77, + "learning_rate": 3.228981231374972e-05, + "loss": 1.9287, + "step": 9560 + }, + { + "epoch": 1.77, + "learning_rate": 3.177749795555812e-05, + "loss": 1.9375, + "step": 9570 + }, + { + "epoch": 1.77, + "learning_rate": 3.126914697153182e-05, + "loss": 1.9171, + "step": 9580 + }, + { + "epoch": 1.78, + "learning_rate": 3.076476366472131e-05, + "loss": 1.8778, + "step": 9590 + }, + { + "epoch": 1.78, + "learning_rate": 3.0264352304592123e-05, + "loss": 1.919, + "step": 9600 + }, + { + "epoch": 1.78, + "learning_rate": 2.9767917126987952e-05, + "loss": 1.891, + "step": 9610 + }, + { + "epoch": 1.78, + "learning_rate": 2.927546233409567e-05, + "loss": 1.921, + "step": 9620 + }, + { + "epoch": 1.78, + "learning_rate": 2.8786992094409102e-05, + "loss": 1.9178, + "step": 9630 + }, + { + "epoch": 1.79, + "learning_rate": 2.8302510542693782e-05, + "loss": 1.8917, + "step": 9640 + }, + { + "epoch": 1.79, + "learning_rate": 2.7822021779952467e-05, + "loss": 1.9141, + "step": 9650 + }, + { + "epoch": 1.79, + "learning_rate": 2.7345529873389618e-05, + "loss": 1.8737, + "step": 9660 + }, + { + "epoch": 1.79, + "learning_rate": 2.687303885637765e-05, + "loss": 1.9349, + "step": 9670 + }, + { + "epoch": 1.79, + "learning_rate": 2.6404552728422625e-05, + "loss": 1.919, + "step": 9680 + }, + { + "epoch": 1.79, + "learning_rate": 2.5940075455130217e-05, + "loss": 1.9411, + "step": 9690 + }, + { + "epoch": 1.8, + "learning_rate": 2.547961096817214e-05, + "loss": 1.9616, + "step": 9700 + }, + { + "epoch": 1.8, + "learning_rate": 2.5023163165253272e-05, + "loss": 1.9431, + "step": 9710 + }, + { + "epoch": 1.8, + "learning_rate": 2.4570735910078078e-05, + "loss": 1.9488, + "step": 9720 + }, + { + "epoch": 1.8, + "learning_rate": 2.4122333032318367e-05, + "loss": 1.9376, + "step": 9730 + }, + { + "epoch": 1.8, + "learning_rate": 2.3677958327580683e-05, + "loss": 1.9038, + "step": 9740 + }, + { + "epoch": 1.81, + "learning_rate": 2.3237615557374137e-05, + "loss": 1.91, + "step": 9750 + }, + { + "epoch": 1.81, + "learning_rate": 2.2801308449078684e-05, + "loss": 1.9058, + "step": 9760 + }, + { + "epoch": 1.81, + "learning_rate": 2.2369040695913445e-05, + "loss": 1.9275, + "step": 9770 + }, + { + "epoch": 1.81, + "learning_rate": 2.1940815956905612e-05, + "loss": 1.9646, + "step": 9780 + }, + { + "epoch": 1.81, + "learning_rate": 2.1516637856859422e-05, + "loss": 1.9127, + "step": 9790 + }, + { + "epoch": 1.82, + "learning_rate": 2.109650998632512e-05, + "loss": 1.9564, + "step": 9800 + }, + { + "epoch": 1.82, + "learning_rate": 2.068043590156926e-05, + "loss": 1.929, + "step": 9810 + }, + { + "epoch": 1.82, + "learning_rate": 2.0268419124544078e-05, + "loss": 1.9185, + "step": 9820 + }, + { + "epoch": 1.82, + "learning_rate": 1.986046314285772e-05, + "loss": 1.8714, + "step": 9830 + }, + { + "epoch": 1.82, + "learning_rate": 1.9456571409744938e-05, + "loss": 1.9149, + "step": 9840 + }, + { + "epoch": 1.82, + "learning_rate": 1.9056747344037616e-05, + "loss": 1.8945, + "step": 9850 + }, + { + "epoch": 1.83, + "learning_rate": 1.8660994330136184e-05, + "loss": 1.9634, + "step": 9860 + }, + { + "epoch": 1.83, + "learning_rate": 1.8269315717980518e-05, + "loss": 1.9449, + "step": 9870 + }, + { + "epoch": 1.83, + "learning_rate": 1.7881714823021976e-05, + "loss": 1.8911, + "step": 9880 + }, + { + "epoch": 1.83, + "learning_rate": 1.7498194926194978e-05, + "loss": 1.9169, + "step": 9890 + }, + { + "epoch": 1.83, + "learning_rate": 1.7118759273889615e-05, + "loss": 1.8699, + "step": 9900 + }, + { + "epoch": 1.84, + "learning_rate": 1.674341107792382e-05, + "loss": 1.9187, + "step": 9910 + }, + { + "epoch": 1.84, + "learning_rate": 1.6372153515516463e-05, + "loss": 1.8754, + "step": 9920 + }, + { + "epoch": 1.84, + "learning_rate": 1.600498972926029e-05, + "loss": 1.9913, + "step": 9930 + }, + { + "epoch": 1.84, + "learning_rate": 1.5641922827095256e-05, + "loss": 1.9162, + "step": 9940 + }, + { + "epoch": 1.84, + "learning_rate": 1.528295588228251e-05, + "loss": 1.9475, + "step": 9950 + }, + { + "epoch": 1.84, + "learning_rate": 1.4928091933378018e-05, + "loss": 1.8907, + "step": 9960 + }, + { + "epoch": 1.85, + "learning_rate": 1.4577333984207186e-05, + "loss": 1.9031, + "step": 9970 + }, + { + "epoch": 1.85, + "learning_rate": 1.4230685003839117e-05, + "loss": 1.8969, + "step": 9980 + }, + { + "epoch": 1.85, + "learning_rate": 1.3888147926561733e-05, + "loss": 1.9272, + "step": 9990 + }, + { + "epoch": 1.85, + "learning_rate": 1.3549725651856804e-05, + "loss": 1.9313, + "step": 10000 + } + ], + "max_steps": 10798, + "num_train_epochs": 2, + "total_flos": 9.488737619882803e+18, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-10000/training_args.bin b/checkpoint-10000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b097aab2293da043bc99abba38a0ed7c4525140a --- /dev/null +++ b/checkpoint-10000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8813832b030b0a678cb3ad0abd28db5000bdb8bb1708e45ba10cfda908fcc38 +size 3305 diff --git a/checkpoint-2000/README.md b/checkpoint-2000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/checkpoint-2000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/checkpoint-2000/adapter_config.json b/checkpoint-2000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c700a5d161022cf91737dcca4d31f37c02bb25 --- /dev/null +++ b/checkpoint-2000/adapter_config.json @@ -0,0 +1,19 @@ +{ + "base_model_name_or_path": "chatglm2-6b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "query_key_value" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/checkpoint-2000/adapter_model.bin b/checkpoint-2000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..28bfc2abb2b3a097244b044b9b0c8b5e26e4c536 --- /dev/null +++ b/checkpoint-2000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f081bbdfbb5e387ee0824fff7f0f47949ffa6e68e7943ffa59134934c4cc853 +size 7819417 diff --git a/checkpoint-2000/finetuning_args.json b/checkpoint-2000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f28e18016479196fd772d484c058dd17ca8c6a --- /dev/null +++ b/checkpoint-2000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "query_key_value" + ], + "name_module_trainable": "mlp", + "num_layer_trainable": 3, + "pre_seq_len": 64, + "prefix_projection": false +} diff --git a/checkpoint-2000/optimizer.pt b/checkpoint-2000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..4508d60f9b5aa253343f8b470a4d8cb1a3fa941a --- /dev/null +++ b/checkpoint-2000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f9fe37c01b31ebef944ca17d10d8d5aaacb5798001799c604caf3846715c32d +size 15644485 diff --git a/checkpoint-2000/rng_state_0.pth b/checkpoint-2000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..56095a7d4934b269e9ec771400d32ef5ba253829 --- /dev/null +++ b/checkpoint-2000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d8cb970e4ced27f56008fda1204003f4d92bee7bbcb658b1d95feeb1ee2d9c9 +size 18679 diff --git a/checkpoint-2000/rng_state_1.pth b/checkpoint-2000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..3434ac1cc42a275b957439b041b97af51cdb75fd --- /dev/null +++ b/checkpoint-2000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc409f2fff3209bb2720c94bd3a28d16c2aea229945134be8dfd24bd233b555a +size 18679 diff --git a/checkpoint-2000/rng_state_2.pth b/checkpoint-2000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..67482342f839e71489eadbc81e18336be9879b32 --- /dev/null +++ b/checkpoint-2000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:994276963fc670cf27a5b4003c9939fb3694b73e3468dcf68c44d82388fb664e +size 18679 diff --git a/checkpoint-2000/rng_state_3.pth b/checkpoint-2000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..7ad7b228d96895f19c586bb748c8e2880be8ec50 --- /dev/null +++ b/checkpoint-2000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19db02794e617e7615491a559802b701bc18a3aebaf0b383447ebdfcb7a6c4ca +size 18679 diff --git a/checkpoint-2000/scheduler.pt b/checkpoint-2000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8ba5a6dec6574075b40475fba435ec179b4492e --- /dev/null +++ b/checkpoint-2000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b5152c9a31debe910da86a00a4ef326dfa0b3a55c019894c4686f1176be2b3 +size 627 diff --git a/checkpoint-2000/trainer_state.json b/checkpoint-2000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..3780287455d122c88de45eb437ca1300ebe80d7d --- /dev/null +++ b/checkpoint-2000/trainer_state.json @@ -0,0 +1,1216 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.3704389701796629, + "global_step": 2000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0009999978838190456, + "loss": 2.9794, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0009999915352940948, + "loss": 2.3885, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999980954478887, + "loss": 2.3057, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999966141462985, + "loss": 2.2692, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999947096371777, + "loss": 2.2576, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009999238193664748, + "loss": 2.2388, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998963106441117, + "loss": 2.2523, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998645704375414, + "loss": 2.218, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999828599015436, + "loss": 2.2457, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997883966822835, + "loss": 2.198, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997439637783859, + "loss": 2.2013, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999695300679855, + "loss": 2.1765, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009996424077986109, + "loss": 2.1741, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999585285582377, + "loss": 2.1898, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009995239345146772, + "loss": 2.1466, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009994583551148314, + "loss": 2.1423, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009993885479379506, + "loss": 2.1451, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999314513574934, + "loss": 2.202, + "step": 180 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009992362526524616, + "loss": 2.1208, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009991537658329906, + "loss": 2.1591, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 0.000999067053814749, + "loss": 2.1788, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009989761173317304, + "loss": 2.147, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998880957153687, + "loss": 2.1249, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998781574086123, + "loss": 2.165, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 0.000998677968970289, + "loss": 2.1428, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009985701426831735, + "loss": 2.1384, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009984580961374964, + "loss": 2.1585, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009983418302817008, + "loss": 2.1156, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009982213460999448, + "loss": 2.0811, + "step": 290 + }, + { + "epoch": 0.06, + "learning_rate": 0.000998096644612094, + "loss": 2.1081, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009979677268737118, + "loss": 2.1246, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009978345939760515, + "loss": 2.1229, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997697247046046, + "loss": 2.1033, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009975556872462994, + "loss": 2.0931, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997409915775076, + "loss": 2.1206, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009972599338662915, + "loss": 2.0537, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009971057427895012, + "loss": 2.0762, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009969473438498897, + "loss": 2.0883, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009967847383882604, + "loss": 2.1174, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009966179277810239, + "loss": 2.1111, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009964469134401855, + "loss": 2.1288, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009962716968133346, + "loss": 2.0967, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009960922793836318, + "loss": 2.1216, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009959086626697955, + "loss": 2.0924, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009957208482260908, + "loss": 2.0809, + "step": 450 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009955288376423152, + "loss": 2.1082, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009953326325437852, + "loss": 2.0885, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009951322345913224, + "loss": 2.1133, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009949276454812408, + "loss": 2.0844, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00099471886694533, + "loss": 2.0796, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009945059007508434, + "loss": 2.1255, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009942887487004804, + "loss": 2.0913, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009940674126323733, + "loss": 2.1003, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009938418944200709, + "loss": 2.0541, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009936121959725223, + "loss": 2.0523, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009933783192340618, + "loss": 2.1225, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009931402661843911, + "loss": 2.0446, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 0.000992898038838564, + "loss": 2.0921, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009926516392469674, + "loss": 2.1081, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009924010694953064, + "loss": 2.0734, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009921463317045843, + "loss": 2.0652, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009918874280310862, + "loss": 2.0818, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009916243606663605, + "loss": 2.0776, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009913571318371994, + "loss": 2.1025, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009910857438056215, + "loss": 2.066, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009908101988688512, + "loss": 2.0575, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009905304993593008, + "loss": 2.1269, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009902466476445486, + "loss": 2.0518, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009899586461273218, + "loss": 2.0698, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 0.000989666497245473, + "loss": 2.0988, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009893702034719624, + "loss": 2.0986, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009890697673148345, + "loss": 2.0237, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009887651913171986, + "loss": 2.0027, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009884564780572064, + "loss": 2.0563, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009881436301480305, + "loss": 2.0624, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987826650237842, + "loss": 2.0926, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987505541009788, + "loss": 2.0585, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009871803051819696, + "loss": 2.0494, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009868509455074183, + "loss": 2.0106, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009865174647740729, + "loss": 2.0861, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009861798658047556, + "loss": 2.0478, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009858381514571484, + "loss": 2.0469, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 0.000985492324623769, + "loss": 2.0671, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009851423882319458, + "loss": 2.0808, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009847883452437937, + "loss": 2.0331, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009844301986561893, + "loss": 2.0295, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 0.000984067951500744, + "loss": 2.0873, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 0.00098370160684378, + "loss": 2.1038, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009833311677863042, + "loss": 2.0337, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009829566374639801, + "loss": 2.0407, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009825780190471042, + "loss": 2.1049, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 0.000982195315740576, + "loss": 2.0475, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009818085307838741, + "loss": 2.0624, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 0.000981417667451026, + "loss": 2.0714, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009810227290505816, + "loss": 2.0947, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009806237189255859, + "loss": 2.0591, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009802206404535489, + "loss": 2.0301, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 0.000979813497046419, + "loss": 2.0556, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009794022921505523, + "loss": 2.0753, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 0.000978987029246685, + "loss": 2.0898, + "step": 1000 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009785677118499029, + "loss": 2.0464, + "step": 1010 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009781443435096116, + "loss": 2.0828, + "step": 1020 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009777169278095074, + "loss": 2.1137, + "step": 1030 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009772854683675462, + "loss": 2.0167, + "step": 1040 + }, + { + "epoch": 0.19, + "learning_rate": 0.000976849968835913, + "loss": 2.07, + "step": 1050 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009764104329009909, + "loss": 2.0409, + "step": 1060 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009759668642833304, + "loss": 2.015, + "step": 1070 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009755192667376173, + "loss": 2.0175, + "step": 1080 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009750676440526411, + "loss": 2.0773, + "step": 1090 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009746120000512632, + "loss": 2.0245, + "step": 1100 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009741523385903841, + "loss": 2.094, + "step": 1110 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009736886635609112, + "loss": 2.0506, + "step": 1120 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009732209788877258, + "loss": 2.0287, + "step": 1130 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009727492885296489, + "loss": 2.1162, + "step": 1140 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009722735964794099, + "loss": 2.1096, + "step": 1150 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009717939067636099, + "loss": 2.0621, + "step": 1160 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009713102234426903, + "loss": 2.0796, + "step": 1170 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009708225506108965, + "loss": 2.0565, + "step": 1180 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009703308923962447, + "loss": 2.0669, + "step": 1190 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009698352529604857, + "loss": 2.0638, + "step": 1200 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009693356364990705, + "loss": 2.0358, + "step": 1210 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009688320472411143, + "loss": 2.0859, + "step": 1220 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009683244894493613, + "loss": 2.0932, + "step": 1230 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009678129674201479, + "loss": 2.0129, + "step": 1240 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009672974854833669, + "loss": 2.055, + "step": 1250 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009667780480024304, + "loss": 2.0665, + "step": 1260 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009662546593742334, + "loss": 2.0488, + "step": 1270 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009657273240291159, + "loss": 2.0543, + "step": 1280 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009651960464308261, + "loss": 2.0418, + "step": 1290 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009646608310764819, + "loss": 2.033, + "step": 1300 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009641216824965338, + "loss": 2.1034, + "step": 1310 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009635786052547253, + "loss": 2.0866, + "step": 1320 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009630316039480556, + "loss": 2.0607, + "step": 1330 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009624806832067394, + "loss": 2.0457, + "step": 1340 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009619258476941686, + "loss": 2.032, + "step": 1350 + }, + { + "epoch": 0.25, + "learning_rate": 0.000961367102106873, + "loss": 2.0519, + "step": 1360 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009608044511744791, + "loss": 2.0449, + "step": 1370 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009602378996596721, + "loss": 1.9949, + "step": 1380 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009596674523581539, + "loss": 2.0394, + "step": 1390 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009590931140986035, + "loss": 2.0386, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009585148897426354, + "loss": 2.0254, + "step": 1410 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009579327841847593, + "loss": 2.0238, + "step": 1420 + }, + { + "epoch": 0.26, + "learning_rate": 0.000957346802352338, + "loss": 2.0509, + "step": 1430 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009567569492055456, + "loss": 2.0004, + "step": 1440 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009561632297373263, + "loss": 2.0203, + "step": 1450 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009555656489733513, + "loss": 2.0182, + "step": 1460 + }, + { + "epoch": 0.27, + "learning_rate": 0.000954964211971977, + "loss": 1.9754, + "step": 1470 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009543589238242012, + "loss": 2.0374, + "step": 1480 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953749789653621, + "loss": 2.0367, + "step": 1490 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953136814616389, + "loss": 2.0866, + "step": 1500 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009525200039011694, + "loss": 2.0083, + "step": 1510 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009518993627290948, + "loss": 2.0525, + "step": 1520 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009512748963537212, + "loss": 2.0636, + "step": 1530 + }, + { + "epoch": 0.29, + "learning_rate": 0.000950646610060984, + "loss": 2.0522, + "step": 1540 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009500145091691532, + "loss": 2.05, + "step": 1550 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009493785990287882, + "loss": 1.9887, + "step": 1560 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009487388850226926, + "loss": 2.0309, + "step": 1570 + }, + { + "epoch": 0.29, + "learning_rate": 0.000948095372565869, + "loss": 1.9954, + "step": 1580 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009474480671054726, + "loss": 2.0078, + "step": 1590 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009467969741207652, + "loss": 2.0395, + "step": 1600 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009461420991230693, + "loss": 2.0415, + "step": 1610 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009454834476557207, + "loss": 2.0308, + "step": 1620 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009448210252940223, + "loss": 2.0826, + "step": 1630 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009441548376451963, + "loss": 2.0424, + "step": 1640 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009434848903483373, + "loss": 2.0125, + "step": 1650 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009428111890743639, + "loss": 2.0139, + "step": 1660 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009421337395259717, + "loss": 2.0682, + "step": 1670 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009414525474375837, + "loss": 2.0577, + "step": 1680 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009407676185753029, + "loss": 2.0262, + "step": 1690 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009400789587368632, + "loss": 2.0515, + "step": 1700 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009393865737515794, + "loss": 2.0398, + "step": 1710 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009386904694802997, + "loss": 2.0146, + "step": 1720 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009379906518153543, + "loss": 2.0438, + "step": 1730 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009372871266805063, + "loss": 2.0377, + "step": 1740 + }, + { + "epoch": 0.32, + "learning_rate": 0.000936579900030902, + "loss": 2.0789, + "step": 1750 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009358689778530193, + "loss": 2.0201, + "step": 1760 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009351543661646185, + "loss": 2.0114, + "step": 1770 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009344360710146898, + "loss": 2.0242, + "step": 1780 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009337140984834034, + "loss": 2.0436, + "step": 1790 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009329884546820572, + "loss": 2.0452, + "step": 1800 + }, + { + "epoch": 0.34, + "learning_rate": 0.000932259145753026, + "loss": 2.0254, + "step": 1810 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009315261778697083, + "loss": 2.0409, + "step": 1820 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009307895572364746, + "loss": 2.0301, + "step": 1830 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009300492900886154, + "loss": 2.0078, + "step": 1840 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009293053826922873, + "loss": 1.9851, + "step": 1850 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009285578413444613, + "loss": 1.9947, + "step": 1860 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009278066723728682, + "loss": 2.0331, + "step": 1870 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009270518821359461, + "loss": 2.0058, + "step": 1880 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009262934770227858, + "loss": 2.05, + "step": 1890 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009255314634530771, + "loss": 2.0444, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009247658478770543, + "loss": 2.0045, + "step": 1910 + }, + { + "epoch": 0.36, + "learning_rate": 0.000923996636775442, + "loss": 2.0211, + "step": 1920 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009232238366593997, + "loss": 2.0124, + "step": 1930 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009224474540704671, + "loss": 2.0067, + "step": 1940 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009216674955805079, + "loss": 2.0247, + "step": 1950 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009208839677916557, + "loss": 2.0314, + "step": 1960 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009200968773362568, + "loss": 2.067, + "step": 1970 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009193062308768145, + "loss": 2.0168, + "step": 1980 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009185120351059326, + "loss": 2.0649, + "step": 1990 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009177142967462591, + "loss": 2.0208, + "step": 2000 + } + ], + "max_steps": 10798, + "num_train_epochs": 2, + "total_flos": 1.8983090426321306e+18, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-2000/training_args.bin b/checkpoint-2000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b097aab2293da043bc99abba38a0ed7c4525140a --- /dev/null +++ b/checkpoint-2000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8813832b030b0a678cb3ad0abd28db5000bdb8bb1708e45ba10cfda908fcc38 +size 3305 diff --git a/checkpoint-3000/README.md b/checkpoint-3000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/checkpoint-3000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/checkpoint-3000/adapter_config.json b/checkpoint-3000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c700a5d161022cf91737dcca4d31f37c02bb25 --- /dev/null +++ b/checkpoint-3000/adapter_config.json @@ -0,0 +1,19 @@ +{ + "base_model_name_or_path": "chatglm2-6b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "query_key_value" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/checkpoint-3000/adapter_model.bin b/checkpoint-3000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..11d11c7130354f39baabefe2f2f090241614b113 --- /dev/null +++ b/checkpoint-3000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3cd0c710c3e6e522341f9bc18338a3a5d364603e39d5a7138ce0ece693cada4 +size 7819417 diff --git a/checkpoint-3000/finetuning_args.json b/checkpoint-3000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f28e18016479196fd772d484c058dd17ca8c6a --- /dev/null +++ b/checkpoint-3000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "query_key_value" + ], + "name_module_trainable": "mlp", + "num_layer_trainable": 3, + "pre_seq_len": 64, + "prefix_projection": false +} diff --git a/checkpoint-3000/optimizer.pt b/checkpoint-3000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ba47f20dff206940b167b29c42a0b419a94f9bd --- /dev/null +++ b/checkpoint-3000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2286a7eb891d1c724b052fc718f53e053668dd120909c7d17063e0b11f1046c7 +size 15644485 diff --git a/checkpoint-3000/rng_state_0.pth b/checkpoint-3000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3fb13afc66bd8d20dce41ffb24055f4273761822 --- /dev/null +++ b/checkpoint-3000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28df0ebee892c2cd596ed2d9c3c1b1bce8aacce528339850151675cb3e979e11 +size 18679 diff --git a/checkpoint-3000/rng_state_1.pth b/checkpoint-3000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..1a7526a3f9401955d5ef21d6eb230e56787a6d8e --- /dev/null +++ b/checkpoint-3000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff24f859606279e5f5564c5772b357bdf34d74d1fb9f644a200359edb9d5a2bb +size 18679 diff --git a/checkpoint-3000/rng_state_2.pth b/checkpoint-3000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..91beefe99ddf22a58462841a38266359d8018df5 --- /dev/null +++ b/checkpoint-3000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cf19f9e07dfb1c6a4f9b043721d057abeb2a702aa4992a0d2dab15224d64805 +size 18679 diff --git a/checkpoint-3000/rng_state_3.pth b/checkpoint-3000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..615d9845a6ed022039378fe2ae49bce2de6433ff --- /dev/null +++ b/checkpoint-3000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:723718e2b5b73a3d4bfee55008ffbae341c90ae5f2480575806ffc1134c69a8e +size 18679 diff --git a/checkpoint-3000/scheduler.pt b/checkpoint-3000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..55a8dd866db1778b2d757189aedf7365ce0d1d90 --- /dev/null +++ b/checkpoint-3000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cf9b363bf12cc68bc5c1a58285c6f89fc38fb83c9837ee26212120079972ec5 +size 627 diff --git a/checkpoint-3000/trainer_state.json b/checkpoint-3000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..0c1430685bd4028718c3f7e22a2e9722619ce299 --- /dev/null +++ b/checkpoint-3000/trainer_state.json @@ -0,0 +1,1816 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.5556584552694943, + "global_step": 3000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0009999978838190456, + "loss": 2.9794, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0009999915352940948, + "loss": 2.3885, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999980954478887, + "loss": 2.3057, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999966141462985, + "loss": 2.2692, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999947096371777, + "loss": 2.2576, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009999238193664748, + "loss": 2.2388, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998963106441117, + "loss": 2.2523, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998645704375414, + "loss": 2.218, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999828599015436, + "loss": 2.2457, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997883966822835, + "loss": 2.198, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997439637783859, + "loss": 2.2013, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999695300679855, + "loss": 2.1765, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009996424077986109, + "loss": 2.1741, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999585285582377, + "loss": 2.1898, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009995239345146772, + "loss": 2.1466, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009994583551148314, + "loss": 2.1423, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009993885479379506, + "loss": 2.1451, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999314513574934, + "loss": 2.202, + "step": 180 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009992362526524616, + "loss": 2.1208, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009991537658329906, + "loss": 2.1591, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 0.000999067053814749, + "loss": 2.1788, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009989761173317304, + "loss": 2.147, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998880957153687, + "loss": 2.1249, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998781574086123, + "loss": 2.165, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 0.000998677968970289, + "loss": 2.1428, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009985701426831735, + "loss": 2.1384, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009984580961374964, + "loss": 2.1585, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009983418302817008, + "loss": 2.1156, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009982213460999448, + "loss": 2.0811, + "step": 290 + }, + { + "epoch": 0.06, + "learning_rate": 0.000998096644612094, + "loss": 2.1081, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009979677268737118, + "loss": 2.1246, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009978345939760515, + "loss": 2.1229, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997697247046046, + "loss": 2.1033, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009975556872462994, + "loss": 2.0931, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997409915775076, + "loss": 2.1206, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009972599338662915, + "loss": 2.0537, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009971057427895012, + "loss": 2.0762, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009969473438498897, + "loss": 2.0883, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009967847383882604, + "loss": 2.1174, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009966179277810239, + "loss": 2.1111, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009964469134401855, + "loss": 2.1288, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009962716968133346, + "loss": 2.0967, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009960922793836318, + "loss": 2.1216, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009959086626697955, + "loss": 2.0924, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009957208482260908, + "loss": 2.0809, + "step": 450 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009955288376423152, + "loss": 2.1082, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009953326325437852, + "loss": 2.0885, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009951322345913224, + "loss": 2.1133, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009949276454812408, + "loss": 2.0844, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00099471886694533, + "loss": 2.0796, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009945059007508434, + "loss": 2.1255, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009942887487004804, + "loss": 2.0913, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009940674126323733, + "loss": 2.1003, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009938418944200709, + "loss": 2.0541, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009936121959725223, + "loss": 2.0523, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009933783192340618, + "loss": 2.1225, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009931402661843911, + "loss": 2.0446, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 0.000992898038838564, + "loss": 2.0921, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009926516392469674, + "loss": 2.1081, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009924010694953064, + "loss": 2.0734, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009921463317045843, + "loss": 2.0652, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009918874280310862, + "loss": 2.0818, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009916243606663605, + "loss": 2.0776, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009913571318371994, + "loss": 2.1025, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009910857438056215, + "loss": 2.066, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009908101988688512, + "loss": 2.0575, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009905304993593008, + "loss": 2.1269, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009902466476445486, + "loss": 2.0518, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009899586461273218, + "loss": 2.0698, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 0.000989666497245473, + "loss": 2.0988, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009893702034719624, + "loss": 2.0986, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009890697673148345, + "loss": 2.0237, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009887651913171986, + "loss": 2.0027, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009884564780572064, + "loss": 2.0563, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009881436301480305, + "loss": 2.0624, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987826650237842, + "loss": 2.0926, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987505541009788, + "loss": 2.0585, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009871803051819696, + "loss": 2.0494, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009868509455074183, + "loss": 2.0106, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009865174647740729, + "loss": 2.0861, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009861798658047556, + "loss": 2.0478, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009858381514571484, + "loss": 2.0469, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 0.000985492324623769, + "loss": 2.0671, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009851423882319458, + "loss": 2.0808, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009847883452437937, + "loss": 2.0331, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009844301986561893, + "loss": 2.0295, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 0.000984067951500744, + "loss": 2.0873, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 0.00098370160684378, + "loss": 2.1038, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009833311677863042, + "loss": 2.0337, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009829566374639801, + "loss": 2.0407, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009825780190471042, + "loss": 2.1049, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 0.000982195315740576, + "loss": 2.0475, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009818085307838741, + "loss": 2.0624, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 0.000981417667451026, + "loss": 2.0714, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009810227290505816, + "loss": 2.0947, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009806237189255859, + "loss": 2.0591, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009802206404535489, + "loss": 2.0301, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 0.000979813497046419, + "loss": 2.0556, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009794022921505523, + "loss": 2.0753, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 0.000978987029246685, + "loss": 2.0898, + "step": 1000 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009785677118499029, + "loss": 2.0464, + "step": 1010 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009781443435096116, + "loss": 2.0828, + "step": 1020 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009777169278095074, + "loss": 2.1137, + "step": 1030 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009772854683675462, + "loss": 2.0167, + "step": 1040 + }, + { + "epoch": 0.19, + "learning_rate": 0.000976849968835913, + "loss": 2.07, + "step": 1050 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009764104329009909, + "loss": 2.0409, + "step": 1060 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009759668642833304, + "loss": 2.015, + "step": 1070 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009755192667376173, + "loss": 2.0175, + "step": 1080 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009750676440526411, + "loss": 2.0773, + "step": 1090 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009746120000512632, + "loss": 2.0245, + "step": 1100 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009741523385903841, + "loss": 2.094, + "step": 1110 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009736886635609112, + "loss": 2.0506, + "step": 1120 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009732209788877258, + "loss": 2.0287, + "step": 1130 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009727492885296489, + "loss": 2.1162, + "step": 1140 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009722735964794099, + "loss": 2.1096, + "step": 1150 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009717939067636099, + "loss": 2.0621, + "step": 1160 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009713102234426903, + "loss": 2.0796, + "step": 1170 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009708225506108965, + "loss": 2.0565, + "step": 1180 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009703308923962447, + "loss": 2.0669, + "step": 1190 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009698352529604857, + "loss": 2.0638, + "step": 1200 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009693356364990705, + "loss": 2.0358, + "step": 1210 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009688320472411143, + "loss": 2.0859, + "step": 1220 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009683244894493613, + "loss": 2.0932, + "step": 1230 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009678129674201479, + "loss": 2.0129, + "step": 1240 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009672974854833669, + "loss": 2.055, + "step": 1250 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009667780480024304, + "loss": 2.0665, + "step": 1260 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009662546593742334, + "loss": 2.0488, + "step": 1270 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009657273240291159, + "loss": 2.0543, + "step": 1280 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009651960464308261, + "loss": 2.0418, + "step": 1290 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009646608310764819, + "loss": 2.033, + "step": 1300 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009641216824965338, + "loss": 2.1034, + "step": 1310 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009635786052547253, + "loss": 2.0866, + "step": 1320 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009630316039480556, + "loss": 2.0607, + "step": 1330 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009624806832067394, + "loss": 2.0457, + "step": 1340 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009619258476941686, + "loss": 2.032, + "step": 1350 + }, + { + "epoch": 0.25, + "learning_rate": 0.000961367102106873, + "loss": 2.0519, + "step": 1360 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009608044511744791, + "loss": 2.0449, + "step": 1370 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009602378996596721, + "loss": 1.9949, + "step": 1380 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009596674523581539, + "loss": 2.0394, + "step": 1390 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009590931140986035, + "loss": 2.0386, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009585148897426354, + "loss": 2.0254, + "step": 1410 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009579327841847593, + "loss": 2.0238, + "step": 1420 + }, + { + "epoch": 0.26, + "learning_rate": 0.000957346802352338, + "loss": 2.0509, + "step": 1430 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009567569492055456, + "loss": 2.0004, + "step": 1440 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009561632297373263, + "loss": 2.0203, + "step": 1450 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009555656489733513, + "loss": 2.0182, + "step": 1460 + }, + { + "epoch": 0.27, + "learning_rate": 0.000954964211971977, + "loss": 1.9754, + "step": 1470 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009543589238242012, + "loss": 2.0374, + "step": 1480 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953749789653621, + "loss": 2.0367, + "step": 1490 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953136814616389, + "loss": 2.0866, + "step": 1500 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009525200039011694, + "loss": 2.0083, + "step": 1510 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009518993627290948, + "loss": 2.0525, + "step": 1520 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009512748963537212, + "loss": 2.0636, + "step": 1530 + }, + { + "epoch": 0.29, + "learning_rate": 0.000950646610060984, + "loss": 2.0522, + "step": 1540 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009500145091691532, + "loss": 2.05, + "step": 1550 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009493785990287882, + "loss": 1.9887, + "step": 1560 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009487388850226926, + "loss": 2.0309, + "step": 1570 + }, + { + "epoch": 0.29, + "learning_rate": 0.000948095372565869, + "loss": 1.9954, + "step": 1580 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009474480671054726, + "loss": 2.0078, + "step": 1590 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009467969741207652, + "loss": 2.0395, + "step": 1600 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009461420991230693, + "loss": 2.0415, + "step": 1610 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009454834476557207, + "loss": 2.0308, + "step": 1620 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009448210252940223, + "loss": 2.0826, + "step": 1630 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009441548376451963, + "loss": 2.0424, + "step": 1640 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009434848903483373, + "loss": 2.0125, + "step": 1650 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009428111890743639, + "loss": 2.0139, + "step": 1660 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009421337395259717, + "loss": 2.0682, + "step": 1670 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009414525474375837, + "loss": 2.0577, + "step": 1680 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009407676185753029, + "loss": 2.0262, + "step": 1690 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009400789587368632, + "loss": 2.0515, + "step": 1700 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009393865737515794, + "loss": 2.0398, + "step": 1710 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009386904694802997, + "loss": 2.0146, + "step": 1720 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009379906518153543, + "loss": 2.0438, + "step": 1730 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009372871266805063, + "loss": 2.0377, + "step": 1740 + }, + { + "epoch": 0.32, + "learning_rate": 0.000936579900030902, + "loss": 2.0789, + "step": 1750 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009358689778530193, + "loss": 2.0201, + "step": 1760 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009351543661646185, + "loss": 2.0114, + "step": 1770 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009344360710146898, + "loss": 2.0242, + "step": 1780 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009337140984834034, + "loss": 2.0436, + "step": 1790 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009329884546820572, + "loss": 2.0452, + "step": 1800 + }, + { + "epoch": 0.34, + "learning_rate": 0.000932259145753026, + "loss": 2.0254, + "step": 1810 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009315261778697083, + "loss": 2.0409, + "step": 1820 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009307895572364746, + "loss": 2.0301, + "step": 1830 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009300492900886154, + "loss": 2.0078, + "step": 1840 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009293053826922873, + "loss": 1.9851, + "step": 1850 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009285578413444613, + "loss": 1.9947, + "step": 1860 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009278066723728682, + "loss": 2.0331, + "step": 1870 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009270518821359461, + "loss": 2.0058, + "step": 1880 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009262934770227858, + "loss": 2.05, + "step": 1890 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009255314634530771, + "loss": 2.0444, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009247658478770543, + "loss": 2.0045, + "step": 1910 + }, + { + "epoch": 0.36, + "learning_rate": 0.000923996636775442, + "loss": 2.0211, + "step": 1920 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009232238366593997, + "loss": 2.0124, + "step": 1930 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009224474540704671, + "loss": 2.0067, + "step": 1940 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009216674955805079, + "loss": 2.0247, + "step": 1950 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009208839677916557, + "loss": 2.0314, + "step": 1960 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009200968773362568, + "loss": 2.067, + "step": 1970 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009193062308768145, + "loss": 2.0168, + "step": 1980 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009185120351059326, + "loss": 2.0649, + "step": 1990 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009177142967462591, + "loss": 2.0208, + "step": 2000 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009169130225504289, + "loss": 2.016, + "step": 2010 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009161082193010066, + "loss": 2.0331, + "step": 2020 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009152998938104296, + "loss": 2.0757, + "step": 2030 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009144880529209498, + "loss": 2.0093, + "step": 2040 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009136727035045765, + "loss": 1.954, + "step": 2050 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009128538524630167, + "loss": 2.0062, + "step": 2060 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009120315067276187, + "loss": 2.0179, + "step": 2070 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009112056732593119, + "loss": 2.0301, + "step": 2080 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009103763590485488, + "loss": 2.0223, + "step": 2090 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009095435711152449, + "loss": 2.0208, + "step": 2100 + }, + { + "epoch": 0.39, + "learning_rate": 0.00090870731650872, + "loss": 2.0492, + "step": 2110 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009078676023076385, + "loss": 1.9917, + "step": 2120 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009070244356199492, + "loss": 2.0235, + "step": 2130 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009061778235828253, + "loss": 2.01, + "step": 2140 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009054129328980229, + "loss": 1.9999, + "step": 2150 + }, + { + "epoch": 0.4, + "learning_rate": 0.000904559794464287, + "loss": 2.0022, + "step": 2160 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009037032315436229, + "loss": 2.0004, + "step": 2170 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009028432513865994, + "loss": 1.9936, + "step": 2180 + }, + { + "epoch": 0.41, + "learning_rate": 0.000901979861272711, + "loss": 2.0098, + "step": 2190 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009011130685103166, + "loss": 1.9829, + "step": 2200 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009002428804365775, + "loss": 2.0135, + "step": 2210 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008993693044173954, + "loss": 2.0526, + "step": 2220 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008984923478473499, + "loss": 2.0145, + "step": 2230 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008976120181496365, + "loss": 2.0364, + "step": 2240 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008967283227760028, + "loss": 2.019, + "step": 2250 + }, + { + "epoch": 0.42, + "learning_rate": 0.000895841269206686, + "loss": 1.9874, + "step": 2260 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008949508649503495, + "loss": 2.0699, + "step": 2270 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008940571175440196, + "loss": 2.0407, + "step": 2280 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008931600345530213, + "loss": 2.0176, + "step": 2290 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008922596235709142, + "loss": 2.0235, + "step": 2300 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008913558922194287, + "loss": 2.0268, + "step": 2310 + }, + { + "epoch": 0.43, + "learning_rate": 0.000890448848148401, + "loss": 2.0279, + "step": 2320 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008895384990357087, + "loss": 2.0073, + "step": 2330 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008886248525872056, + "loss": 2.0262, + "step": 2340 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008877079165366566, + "loss": 2.0112, + "step": 2350 + }, + { + "epoch": 0.44, + "learning_rate": 0.000886787698645672, + "loss": 2.042, + "step": 2360 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008858642067036424, + "loss": 2.0129, + "step": 2370 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008849374485276715, + "loss": 2.0264, + "step": 2380 + }, + { + "epoch": 0.44, + "learning_rate": 0.000884007431962512, + "loss": 2.0211, + "step": 2390 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008830741648804967, + "loss": 2.0175, + "step": 2400 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008821376551814739, + "loss": 2.0423, + "step": 2410 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008811979107927396, + "loss": 2.0112, + "step": 2420 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008802549396689705, + "loss": 2.0422, + "step": 2430 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008793087497921566, + "loss": 2.0075, + "step": 2440 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008784544334882426, + "loss": 1.9958, + "step": 2450 + }, + { + "epoch": 0.46, + "learning_rate": 0.000877502150068553, + "loss": 2.0348, + "step": 2460 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008765466711974225, + "loss": 2.0232, + "step": 2470 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008755880049627157, + "loss": 1.9953, + "step": 2480 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008746261594792776, + "loss": 2.0223, + "step": 2490 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008736611428888644, + "loss": 2.0332, + "step": 2500 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008726929633600753, + "loss": 2.0075, + "step": 2510 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008717216290882824, + "loss": 2.002, + "step": 2520 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008707471482955622, + "loss": 2.0594, + "step": 2530 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008697695292306253, + "loss": 2.0214, + "step": 2540 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008687887801687473, + "loss": 1.994, + "step": 2550 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008678049094116979, + "loss": 2.0338, + "step": 2560 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008668179252876714, + "loss": 2.0176, + "step": 2570 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008658278361512161, + "loss": 2.0013, + "step": 2580 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008648346503831627, + "loss": 2.0141, + "step": 2590 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008638383763905546, + "loss": 1.9655, + "step": 2600 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008628390226065761, + "loss": 2.039, + "step": 2610 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008618365974904808, + "loss": 1.9418, + "step": 2620 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008608311095275205, + "loss": 2.011, + "step": 2630 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008598225672288731, + "loss": 2.0174, + "step": 2640 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008588109791315707, + "loss": 1.984, + "step": 2650 + }, + { + "epoch": 0.49, + "learning_rate": 0.000857796353798427, + "loss": 2.0437, + "step": 2660 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008567786998179654, + "loss": 2.0255, + "step": 2670 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008557580258043459, + "loss": 2.0067, + "step": 2680 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008547343403972918, + "loss": 2.0201, + "step": 2690 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008537076522620175, + "loss": 2.0258, + "step": 2700 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008526779700891545, + "loss": 1.9977, + "step": 2710 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008516453025946781, + "loss": 1.9835, + "step": 2720 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008506096585198333, + "loss": 2.0428, + "step": 2730 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008495710466310613, + "loss": 1.9554, + "step": 2740 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008485294757199248, + "loss": 2.0497, + "step": 2750 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008474849546030339, + "loss": 2.001, + "step": 2760 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008464374921219714, + "loss": 1.9824, + "step": 2770 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008453870971432179, + "loss": 2.0378, + "step": 2780 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008443337785580769, + "loss": 1.9756, + "step": 2790 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008432775452825992, + "loss": 2.0563, + "step": 2800 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008422184062575077, + "loss": 2.0115, + "step": 2810 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008411563704481217, + "loss": 2.0301, + "step": 2820 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008400914468442814, + "loss": 1.9912, + "step": 2830 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008390236444602706, + "loss": 2.0669, + "step": 2840 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008379529723347417, + "loss": 2.0138, + "step": 2850 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008368794395306386, + "loss": 2.0486, + "step": 2860 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008358030551351199, + "loss": 2.0342, + "step": 2870 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008347238282594823, + "loss": 2.0474, + "step": 2880 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008336417680390829, + "loss": 2.006, + "step": 2890 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008325568836332633, + "loss": 1.99, + "step": 2900 + }, + { + "epoch": 0.54, + "learning_rate": 0.00083146918422527, + "loss": 2.0148, + "step": 2910 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008303786790221778, + "loss": 2.0381, + "step": 2920 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008292853772548126, + "loss": 2.0591, + "step": 2930 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008281892881776714, + "loss": 2.0238, + "step": 2940 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008270904210688459, + "loss": 1.9939, + "step": 2950 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008259887852299427, + "loss": 1.9941, + "step": 2960 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008248843899860045, + "loss": 2.0193, + "step": 2970 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008237772446854325, + "loss": 2.0166, + "step": 2980 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008226673586999058, + "loss": 2.0219, + "step": 2990 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008215547414243025, + "loss": 2.0078, + "step": 3000 + } + ], + "max_steps": 10798, + "num_train_epochs": 2, + "total_flos": 2.8455634151187415e+18, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-3000/training_args.bin b/checkpoint-3000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b097aab2293da043bc99abba38a0ed7c4525140a --- /dev/null +++ b/checkpoint-3000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8813832b030b0a678cb3ad0abd28db5000bdb8bb1708e45ba10cfda908fcc38 +size 3305 diff --git a/checkpoint-4000/README.md b/checkpoint-4000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/checkpoint-4000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/checkpoint-4000/adapter_config.json b/checkpoint-4000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c700a5d161022cf91737dcca4d31f37c02bb25 --- /dev/null +++ b/checkpoint-4000/adapter_config.json @@ -0,0 +1,19 @@ +{ + "base_model_name_or_path": "chatglm2-6b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "query_key_value" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/checkpoint-4000/adapter_model.bin b/checkpoint-4000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..5023e88e22e9a4e6e32aa0c0709d6f1d891af32e --- /dev/null +++ b/checkpoint-4000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a83c28c7acc51529c2fcfdb8bacb82a4609ba2705fe99c2a2ea57056d2be6bff +size 7819417 diff --git a/checkpoint-4000/finetuning_args.json b/checkpoint-4000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f28e18016479196fd772d484c058dd17ca8c6a --- /dev/null +++ b/checkpoint-4000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "query_key_value" + ], + "name_module_trainable": "mlp", + "num_layer_trainable": 3, + "pre_seq_len": 64, + "prefix_projection": false +} diff --git a/checkpoint-4000/optimizer.pt b/checkpoint-4000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..73479b35b60a6c827520a22b6224998be6fc117e --- /dev/null +++ b/checkpoint-4000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebe31188d0586f5d0a6c0537efea87615e85aea72c2ad5168252a5468fc548e7 +size 15644485 diff --git a/checkpoint-4000/rng_state_0.pth b/checkpoint-4000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..1629aea1cb21998dcf7ad33aadc95dc40a9c1d54 --- /dev/null +++ b/checkpoint-4000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015c277ea438ae1dc89ffd34cfe428587a4214b50dc61918c058dab30123aa1d +size 18679 diff --git a/checkpoint-4000/rng_state_1.pth b/checkpoint-4000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..db66a98c02dd265071df8cd304d057c76f8b1eba --- /dev/null +++ b/checkpoint-4000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8cf1e697a865a04e2f48b31f6c2728bcc5769483eefaee3df5e8acdd57afddd +size 18679 diff --git a/checkpoint-4000/rng_state_2.pth b/checkpoint-4000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..73a0bb4b126cd45cc92b6051486ed866264359f3 --- /dev/null +++ b/checkpoint-4000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fc9cd6a77be4099fe9a1479d42e7bb360a23e7daada4131ad9fcc394e33848c +size 18679 diff --git a/checkpoint-4000/rng_state_3.pth b/checkpoint-4000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..c810c88157c544e13ce877fbf9624d865256572b --- /dev/null +++ b/checkpoint-4000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa6c072d3c5aaed34f62adddd27365923b4acc572f08dc643d4b56666b49e43 +size 18679 diff --git a/checkpoint-4000/scheduler.pt b/checkpoint-4000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d0487adfce05c7d7ffb21b3b1f440ddfb75fb6 --- /dev/null +++ b/checkpoint-4000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa0415e4285466aa8bf5cb07c9fc689721748234e4b7fd1e6f7615253b2a67c9 +size 627 diff --git a/checkpoint-4000/trainer_state.json b/checkpoint-4000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..5306cd8f4045d6810b239e47d1e78a099d7c9a04 --- /dev/null +++ b/checkpoint-4000/trainer_state.json @@ -0,0 +1,2416 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.7408779403593257, + "global_step": 4000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0009999978838190456, + "loss": 2.9794, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0009999915352940948, + "loss": 2.3885, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999980954478887, + "loss": 2.3057, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999966141462985, + "loss": 2.2692, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999947096371777, + "loss": 2.2576, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009999238193664748, + "loss": 2.2388, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998963106441117, + "loss": 2.2523, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998645704375414, + "loss": 2.218, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999828599015436, + "loss": 2.2457, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997883966822835, + "loss": 2.198, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997439637783859, + "loss": 2.2013, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999695300679855, + "loss": 2.1765, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009996424077986109, + "loss": 2.1741, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999585285582377, + "loss": 2.1898, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009995239345146772, + "loss": 2.1466, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009994583551148314, + "loss": 2.1423, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009993885479379506, + "loss": 2.1451, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999314513574934, + "loss": 2.202, + "step": 180 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009992362526524616, + "loss": 2.1208, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009991537658329906, + "loss": 2.1591, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 0.000999067053814749, + "loss": 2.1788, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009989761173317304, + "loss": 2.147, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998880957153687, + "loss": 2.1249, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998781574086123, + "loss": 2.165, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 0.000998677968970289, + "loss": 2.1428, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009985701426831735, + "loss": 2.1384, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009984580961374964, + "loss": 2.1585, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009983418302817008, + "loss": 2.1156, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009982213460999448, + "loss": 2.0811, + "step": 290 + }, + { + "epoch": 0.06, + "learning_rate": 0.000998096644612094, + "loss": 2.1081, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009979677268737118, + "loss": 2.1246, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009978345939760515, + "loss": 2.1229, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997697247046046, + "loss": 2.1033, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009975556872462994, + "loss": 2.0931, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997409915775076, + "loss": 2.1206, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009972599338662915, + "loss": 2.0537, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009971057427895012, + "loss": 2.0762, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009969473438498897, + "loss": 2.0883, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009967847383882604, + "loss": 2.1174, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009966179277810239, + "loss": 2.1111, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009964469134401855, + "loss": 2.1288, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009962716968133346, + "loss": 2.0967, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009960922793836318, + "loss": 2.1216, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009959086626697955, + "loss": 2.0924, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009957208482260908, + "loss": 2.0809, + "step": 450 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009955288376423152, + "loss": 2.1082, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009953326325437852, + "loss": 2.0885, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009951322345913224, + "loss": 2.1133, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009949276454812408, + "loss": 2.0844, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00099471886694533, + "loss": 2.0796, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009945059007508434, + "loss": 2.1255, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009942887487004804, + "loss": 2.0913, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009940674126323733, + "loss": 2.1003, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009938418944200709, + "loss": 2.0541, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009936121959725223, + "loss": 2.0523, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009933783192340618, + "loss": 2.1225, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009931402661843911, + "loss": 2.0446, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 0.000992898038838564, + "loss": 2.0921, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009926516392469674, + "loss": 2.1081, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009924010694953064, + "loss": 2.0734, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009921463317045843, + "loss": 2.0652, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009918874280310862, + "loss": 2.0818, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009916243606663605, + "loss": 2.0776, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009913571318371994, + "loss": 2.1025, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009910857438056215, + "loss": 2.066, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009908101988688512, + "loss": 2.0575, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009905304993593008, + "loss": 2.1269, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009902466476445486, + "loss": 2.0518, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009899586461273218, + "loss": 2.0698, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 0.000989666497245473, + "loss": 2.0988, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009893702034719624, + "loss": 2.0986, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009890697673148345, + "loss": 2.0237, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009887651913171986, + "loss": 2.0027, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009884564780572064, + "loss": 2.0563, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009881436301480305, + "loss": 2.0624, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987826650237842, + "loss": 2.0926, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987505541009788, + "loss": 2.0585, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009871803051819696, + "loss": 2.0494, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009868509455074183, + "loss": 2.0106, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009865174647740729, + "loss": 2.0861, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009861798658047556, + "loss": 2.0478, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009858381514571484, + "loss": 2.0469, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 0.000985492324623769, + "loss": 2.0671, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009851423882319458, + "loss": 2.0808, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009847883452437937, + "loss": 2.0331, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009844301986561893, + "loss": 2.0295, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 0.000984067951500744, + "loss": 2.0873, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 0.00098370160684378, + "loss": 2.1038, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009833311677863042, + "loss": 2.0337, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009829566374639801, + "loss": 2.0407, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009825780190471042, + "loss": 2.1049, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 0.000982195315740576, + "loss": 2.0475, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009818085307838741, + "loss": 2.0624, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 0.000981417667451026, + "loss": 2.0714, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009810227290505816, + "loss": 2.0947, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009806237189255859, + "loss": 2.0591, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009802206404535489, + "loss": 2.0301, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 0.000979813497046419, + "loss": 2.0556, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009794022921505523, + "loss": 2.0753, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 0.000978987029246685, + "loss": 2.0898, + "step": 1000 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009785677118499029, + "loss": 2.0464, + "step": 1010 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009781443435096116, + "loss": 2.0828, + "step": 1020 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009777169278095074, + "loss": 2.1137, + "step": 1030 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009772854683675462, + "loss": 2.0167, + "step": 1040 + }, + { + "epoch": 0.19, + "learning_rate": 0.000976849968835913, + "loss": 2.07, + "step": 1050 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009764104329009909, + "loss": 2.0409, + "step": 1060 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009759668642833304, + "loss": 2.015, + "step": 1070 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009755192667376173, + "loss": 2.0175, + "step": 1080 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009750676440526411, + "loss": 2.0773, + "step": 1090 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009746120000512632, + "loss": 2.0245, + "step": 1100 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009741523385903841, + "loss": 2.094, + "step": 1110 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009736886635609112, + "loss": 2.0506, + "step": 1120 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009732209788877258, + "loss": 2.0287, + "step": 1130 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009727492885296489, + "loss": 2.1162, + "step": 1140 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009722735964794099, + "loss": 2.1096, + "step": 1150 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009717939067636099, + "loss": 2.0621, + "step": 1160 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009713102234426903, + "loss": 2.0796, + "step": 1170 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009708225506108965, + "loss": 2.0565, + "step": 1180 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009703308923962447, + "loss": 2.0669, + "step": 1190 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009698352529604857, + "loss": 2.0638, + "step": 1200 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009693356364990705, + "loss": 2.0358, + "step": 1210 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009688320472411143, + "loss": 2.0859, + "step": 1220 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009683244894493613, + "loss": 2.0932, + "step": 1230 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009678129674201479, + "loss": 2.0129, + "step": 1240 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009672974854833669, + "loss": 2.055, + "step": 1250 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009667780480024304, + "loss": 2.0665, + "step": 1260 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009662546593742334, + "loss": 2.0488, + "step": 1270 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009657273240291159, + "loss": 2.0543, + "step": 1280 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009651960464308261, + "loss": 2.0418, + "step": 1290 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009646608310764819, + "loss": 2.033, + "step": 1300 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009641216824965338, + "loss": 2.1034, + "step": 1310 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009635786052547253, + "loss": 2.0866, + "step": 1320 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009630316039480556, + "loss": 2.0607, + "step": 1330 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009624806832067394, + "loss": 2.0457, + "step": 1340 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009619258476941686, + "loss": 2.032, + "step": 1350 + }, + { + "epoch": 0.25, + "learning_rate": 0.000961367102106873, + "loss": 2.0519, + "step": 1360 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009608044511744791, + "loss": 2.0449, + "step": 1370 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009602378996596721, + "loss": 1.9949, + "step": 1380 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009596674523581539, + "loss": 2.0394, + "step": 1390 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009590931140986035, + "loss": 2.0386, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009585148897426354, + "loss": 2.0254, + "step": 1410 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009579327841847593, + "loss": 2.0238, + "step": 1420 + }, + { + "epoch": 0.26, + "learning_rate": 0.000957346802352338, + "loss": 2.0509, + "step": 1430 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009567569492055456, + "loss": 2.0004, + "step": 1440 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009561632297373263, + "loss": 2.0203, + "step": 1450 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009555656489733513, + "loss": 2.0182, + "step": 1460 + }, + { + "epoch": 0.27, + "learning_rate": 0.000954964211971977, + "loss": 1.9754, + "step": 1470 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009543589238242012, + "loss": 2.0374, + "step": 1480 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953749789653621, + "loss": 2.0367, + "step": 1490 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953136814616389, + "loss": 2.0866, + "step": 1500 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009525200039011694, + "loss": 2.0083, + "step": 1510 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009518993627290948, + "loss": 2.0525, + "step": 1520 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009512748963537212, + "loss": 2.0636, + "step": 1530 + }, + { + "epoch": 0.29, + "learning_rate": 0.000950646610060984, + "loss": 2.0522, + "step": 1540 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009500145091691532, + "loss": 2.05, + "step": 1550 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009493785990287882, + "loss": 1.9887, + "step": 1560 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009487388850226926, + "loss": 2.0309, + "step": 1570 + }, + { + "epoch": 0.29, + "learning_rate": 0.000948095372565869, + "loss": 1.9954, + "step": 1580 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009474480671054726, + "loss": 2.0078, + "step": 1590 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009467969741207652, + "loss": 2.0395, + "step": 1600 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009461420991230693, + "loss": 2.0415, + "step": 1610 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009454834476557207, + "loss": 2.0308, + "step": 1620 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009448210252940223, + "loss": 2.0826, + "step": 1630 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009441548376451963, + "loss": 2.0424, + "step": 1640 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009434848903483373, + "loss": 2.0125, + "step": 1650 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009428111890743639, + "loss": 2.0139, + "step": 1660 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009421337395259717, + "loss": 2.0682, + "step": 1670 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009414525474375837, + "loss": 2.0577, + "step": 1680 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009407676185753029, + "loss": 2.0262, + "step": 1690 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009400789587368632, + "loss": 2.0515, + "step": 1700 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009393865737515794, + "loss": 2.0398, + "step": 1710 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009386904694802997, + "loss": 2.0146, + "step": 1720 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009379906518153543, + "loss": 2.0438, + "step": 1730 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009372871266805063, + "loss": 2.0377, + "step": 1740 + }, + { + "epoch": 0.32, + "learning_rate": 0.000936579900030902, + "loss": 2.0789, + "step": 1750 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009358689778530193, + "loss": 2.0201, + "step": 1760 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009351543661646185, + "loss": 2.0114, + "step": 1770 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009344360710146898, + "loss": 2.0242, + "step": 1780 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009337140984834034, + "loss": 2.0436, + "step": 1790 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009329884546820572, + "loss": 2.0452, + "step": 1800 + }, + { + "epoch": 0.34, + "learning_rate": 0.000932259145753026, + "loss": 2.0254, + "step": 1810 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009315261778697083, + "loss": 2.0409, + "step": 1820 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009307895572364746, + "loss": 2.0301, + "step": 1830 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009300492900886154, + "loss": 2.0078, + "step": 1840 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009293053826922873, + "loss": 1.9851, + "step": 1850 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009285578413444613, + "loss": 1.9947, + "step": 1860 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009278066723728682, + "loss": 2.0331, + "step": 1870 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009270518821359461, + "loss": 2.0058, + "step": 1880 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009262934770227858, + "loss": 2.05, + "step": 1890 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009255314634530771, + "loss": 2.0444, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009247658478770543, + "loss": 2.0045, + "step": 1910 + }, + { + "epoch": 0.36, + "learning_rate": 0.000923996636775442, + "loss": 2.0211, + "step": 1920 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009232238366593997, + "loss": 2.0124, + "step": 1930 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009224474540704671, + "loss": 2.0067, + "step": 1940 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009216674955805079, + "loss": 2.0247, + "step": 1950 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009208839677916557, + "loss": 2.0314, + "step": 1960 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009200968773362568, + "loss": 2.067, + "step": 1970 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009193062308768145, + "loss": 2.0168, + "step": 1980 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009185120351059326, + "loss": 2.0649, + "step": 1990 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009177142967462591, + "loss": 2.0208, + "step": 2000 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009169130225504289, + "loss": 2.016, + "step": 2010 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009161082193010066, + "loss": 2.0331, + "step": 2020 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009152998938104296, + "loss": 2.0757, + "step": 2030 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009144880529209498, + "loss": 2.0093, + "step": 2040 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009136727035045765, + "loss": 1.954, + "step": 2050 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009128538524630167, + "loss": 2.0062, + "step": 2060 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009120315067276187, + "loss": 2.0179, + "step": 2070 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009112056732593119, + "loss": 2.0301, + "step": 2080 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009103763590485488, + "loss": 2.0223, + "step": 2090 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009095435711152449, + "loss": 2.0208, + "step": 2100 + }, + { + "epoch": 0.39, + "learning_rate": 0.00090870731650872, + "loss": 2.0492, + "step": 2110 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009078676023076385, + "loss": 1.9917, + "step": 2120 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009070244356199492, + "loss": 2.0235, + "step": 2130 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009061778235828253, + "loss": 2.01, + "step": 2140 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009054129328980229, + "loss": 1.9999, + "step": 2150 + }, + { + "epoch": 0.4, + "learning_rate": 0.000904559794464287, + "loss": 2.0022, + "step": 2160 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009037032315436229, + "loss": 2.0004, + "step": 2170 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009028432513865994, + "loss": 1.9936, + "step": 2180 + }, + { + "epoch": 0.41, + "learning_rate": 0.000901979861272711, + "loss": 2.0098, + "step": 2190 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009011130685103166, + "loss": 1.9829, + "step": 2200 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009002428804365775, + "loss": 2.0135, + "step": 2210 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008993693044173954, + "loss": 2.0526, + "step": 2220 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008984923478473499, + "loss": 2.0145, + "step": 2230 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008976120181496365, + "loss": 2.0364, + "step": 2240 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008967283227760028, + "loss": 2.019, + "step": 2250 + }, + { + "epoch": 0.42, + "learning_rate": 0.000895841269206686, + "loss": 1.9874, + "step": 2260 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008949508649503495, + "loss": 2.0699, + "step": 2270 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008940571175440196, + "loss": 2.0407, + "step": 2280 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008931600345530213, + "loss": 2.0176, + "step": 2290 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008922596235709142, + "loss": 2.0235, + "step": 2300 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008913558922194287, + "loss": 2.0268, + "step": 2310 + }, + { + "epoch": 0.43, + "learning_rate": 0.000890448848148401, + "loss": 2.0279, + "step": 2320 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008895384990357087, + "loss": 2.0073, + "step": 2330 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008886248525872056, + "loss": 2.0262, + "step": 2340 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008877079165366566, + "loss": 2.0112, + "step": 2350 + }, + { + "epoch": 0.44, + "learning_rate": 0.000886787698645672, + "loss": 2.042, + "step": 2360 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008858642067036424, + "loss": 2.0129, + "step": 2370 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008849374485276715, + "loss": 2.0264, + "step": 2380 + }, + { + "epoch": 0.44, + "learning_rate": 0.000884007431962512, + "loss": 2.0211, + "step": 2390 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008830741648804967, + "loss": 2.0175, + "step": 2400 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008821376551814739, + "loss": 2.0423, + "step": 2410 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008811979107927396, + "loss": 2.0112, + "step": 2420 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008802549396689705, + "loss": 2.0422, + "step": 2430 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008793087497921566, + "loss": 2.0075, + "step": 2440 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008784544334882426, + "loss": 1.9958, + "step": 2450 + }, + { + "epoch": 0.46, + "learning_rate": 0.000877502150068553, + "loss": 2.0348, + "step": 2460 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008765466711974225, + "loss": 2.0232, + "step": 2470 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008755880049627157, + "loss": 1.9953, + "step": 2480 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008746261594792776, + "loss": 2.0223, + "step": 2490 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008736611428888644, + "loss": 2.0332, + "step": 2500 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008726929633600753, + "loss": 2.0075, + "step": 2510 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008717216290882824, + "loss": 2.002, + "step": 2520 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008707471482955622, + "loss": 2.0594, + "step": 2530 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008697695292306253, + "loss": 2.0214, + "step": 2540 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008687887801687473, + "loss": 1.994, + "step": 2550 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008678049094116979, + "loss": 2.0338, + "step": 2560 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008668179252876714, + "loss": 2.0176, + "step": 2570 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008658278361512161, + "loss": 2.0013, + "step": 2580 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008648346503831627, + "loss": 2.0141, + "step": 2590 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008638383763905546, + "loss": 1.9655, + "step": 2600 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008628390226065761, + "loss": 2.039, + "step": 2610 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008618365974904808, + "loss": 1.9418, + "step": 2620 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008608311095275205, + "loss": 2.011, + "step": 2630 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008598225672288731, + "loss": 2.0174, + "step": 2640 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008588109791315707, + "loss": 1.984, + "step": 2650 + }, + { + "epoch": 0.49, + "learning_rate": 0.000857796353798427, + "loss": 2.0437, + "step": 2660 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008567786998179654, + "loss": 2.0255, + "step": 2670 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008557580258043459, + "loss": 2.0067, + "step": 2680 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008547343403972918, + "loss": 2.0201, + "step": 2690 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008537076522620175, + "loss": 2.0258, + "step": 2700 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008526779700891545, + "loss": 1.9977, + "step": 2710 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008516453025946781, + "loss": 1.9835, + "step": 2720 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008506096585198333, + "loss": 2.0428, + "step": 2730 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008495710466310613, + "loss": 1.9554, + "step": 2740 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008485294757199248, + "loss": 2.0497, + "step": 2750 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008474849546030339, + "loss": 2.001, + "step": 2760 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008464374921219714, + "loss": 1.9824, + "step": 2770 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008453870971432179, + "loss": 2.0378, + "step": 2780 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008443337785580769, + "loss": 1.9756, + "step": 2790 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008432775452825992, + "loss": 2.0563, + "step": 2800 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008422184062575077, + "loss": 2.0115, + "step": 2810 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008411563704481217, + "loss": 2.0301, + "step": 2820 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008400914468442814, + "loss": 1.9912, + "step": 2830 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008390236444602706, + "loss": 2.0669, + "step": 2840 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008379529723347417, + "loss": 2.0138, + "step": 2850 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008368794395306386, + "loss": 2.0486, + "step": 2860 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008358030551351199, + "loss": 2.0342, + "step": 2870 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008347238282594823, + "loss": 2.0474, + "step": 2880 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008336417680390829, + "loss": 2.006, + "step": 2890 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008325568836332633, + "loss": 1.99, + "step": 2900 + }, + { + "epoch": 0.54, + "learning_rate": 0.00083146918422527, + "loss": 2.0148, + "step": 2910 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008303786790221778, + "loss": 2.0381, + "step": 2920 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008292853772548126, + "loss": 2.0591, + "step": 2930 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008281892881776714, + "loss": 2.0238, + "step": 2940 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008270904210688459, + "loss": 1.9939, + "step": 2950 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008259887852299427, + "loss": 1.9941, + "step": 2960 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008248843899860045, + "loss": 2.0193, + "step": 2970 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008237772446854325, + "loss": 2.0166, + "step": 2980 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008226673586999058, + "loss": 2.0219, + "step": 2990 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008215547414243025, + "loss": 2.0078, + "step": 3000 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008204394022766208, + "loss": 2.0022, + "step": 3010 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008193213506978983, + "loss": 2.0009, + "step": 3020 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008182005961521331, + "loss": 2.0197, + "step": 3030 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008170771481262027, + "loss": 2.0101, + "step": 3040 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008159510161297846, + "loss": 2.0307, + "step": 3050 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008148222096952748, + "loss": 2.0075, + "step": 3060 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008136907383777081, + "loss": 2.0415, + "step": 3070 + }, + { + "epoch": 0.57, + "learning_rate": 0.000812556611754677, + "loss": 2.0031, + "step": 3080 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008114198394262497, + "loss": 2.0025, + "step": 3090 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008102804310148905, + "loss": 1.983, + "step": 3100 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008091383961653765, + "loss": 2.0056, + "step": 3110 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008079937445447175, + "loss": 1.9679, + "step": 3120 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008068464858420732, + "loss": 1.9897, + "step": 3130 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008056966297686717, + "loss": 1.9833, + "step": 3140 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008045441860577273, + "loss": 2.0088, + "step": 3150 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008033891644643576, + "loss": 1.9985, + "step": 3160 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008022315747655011, + "loss": 2.013, + "step": 3170 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008010714267598354, + "loss": 1.9902, + "step": 3180 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007999087302676926, + "loss": 2.0133, + "step": 3190 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007987434951309774, + "loss": 2.0092, + "step": 3200 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007975757312130836, + "loss": 1.9894, + "step": 3210 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007964054483988103, + "loss": 1.9742, + "step": 3220 + }, + { + "epoch": 0.6, + "learning_rate": 0.000795232656594278, + "loss": 2.016, + "step": 3230 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007940573657268458, + "loss": 2.0386, + "step": 3240 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007928795857450259, + "loss": 1.9602, + "step": 3250 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007916993266184007, + "loss": 1.9681, + "step": 3260 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007905165983375379, + "loss": 2.0326, + "step": 3270 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007893314109139058, + "loss": 1.9958, + "step": 3280 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007881437743797882, + "loss": 2.0077, + "step": 3290 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007869536987882008, + "loss": 1.9813, + "step": 3300 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007857611942128044, + "loss": 1.9538, + "step": 3310 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007845662707478214, + "loss": 1.9919, + "step": 3320 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007833689385079485, + "loss": 1.9922, + "step": 3330 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007821692076282725, + "loss": 1.9973, + "step": 3340 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007809670882641842, + "loss": 2.0231, + "step": 3350 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007797625905912915, + "loss": 1.9971, + "step": 3360 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007785557248053351, + "loss": 1.9934, + "step": 3370 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007773465011221002, + "loss": 1.9855, + "step": 3380 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007761349297773315, + "loss": 2.0421, + "step": 3390 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007749210210266457, + "loss": 1.9795, + "step": 3400 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007737047851454451, + "loss": 2.0006, + "step": 3410 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007724862324288309, + "loss": 2.011, + "step": 3420 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007712653731915147, + "loss": 1.9969, + "step": 3430 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007700422177677331, + "loss": 1.9581, + "step": 3440 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007688167765111592, + "loss": 1.9858, + "step": 3450 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007675890597948141, + "loss": 1.9945, + "step": 3460 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007663590780109814, + "loss": 2.0116, + "step": 3470 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007651268415711168, + "loss": 1.9831, + "step": 3480 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007638923609057616, + "loss": 2.0113, + "step": 3490 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007626556464644538, + "loss": 1.9927, + "step": 3500 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007614167087156393, + "loss": 2.0209, + "step": 3510 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007601755581465844, + "loss": 1.9941, + "step": 3520 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007589322052632855, + "loss": 2.0443, + "step": 3530 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007576866605903812, + "loss": 1.975, + "step": 3540 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007564389346710638, + "loss": 1.9655, + "step": 3550 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007551890380669879, + "loss": 2.0034, + "step": 3560 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007539369813581836, + "loss": 1.953, + "step": 3570 + }, + { + "epoch": 0.66, + "learning_rate": 0.000752682775142965, + "loss": 2.0162, + "step": 3580 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007514264300378411, + "loss": 2.0096, + "step": 3590 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007501679566774267, + "loss": 2.0431, + "step": 3600 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007489073657143506, + "loss": 1.961, + "step": 3610 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007476446678191676, + "loss": 2.0179, + "step": 3620 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007463798736802665, + "loss": 1.9885, + "step": 3630 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007451129940037804, + "loss": 1.9955, + "step": 3640 + }, + { + "epoch": 0.68, + "learning_rate": 0.000743844039513496, + "loss": 1.9671, + "step": 3650 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007425730209507622, + "loss": 1.9866, + "step": 3660 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007412999490744008, + "loss": 1.9508, + "step": 3670 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007400248346606129, + "loss": 2.0261, + "step": 3680 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007387476885028902, + "loss": 1.9946, + "step": 3690 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007374685214119221, + "loss": 1.969, + "step": 3700 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007361873442155049, + "loss": 1.9802, + "step": 3710 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007349041677584496, + "loss": 1.9739, + "step": 3720 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007336190029024907, + "loss": 1.964, + "step": 3730 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007323318605261933, + "loss": 2.0009, + "step": 3740 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007310427515248626, + "loss": 1.9825, + "step": 3750 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007297516868104501, + "loss": 1.9744, + "step": 3760 + }, + { + "epoch": 0.7, + "learning_rate": 0.000728458677311462, + "loss": 2.0197, + "step": 3770 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007271637339728667, + "loss": 2.0016, + "step": 3780 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007258668677560019, + "loss": 1.9721, + "step": 3790 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007245680896384818, + "loss": 1.9591, + "step": 3800 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007232674106141048, + "loss": 1.9762, + "step": 3810 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007219648416927592, + "loss": 2.0026, + "step": 3820 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007206603939003314, + "loss": 1.9876, + "step": 3830 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007193540782786117, + "loss": 1.9991, + "step": 3840 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007180459058852011, + "loss": 1.9897, + "step": 3850 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007167358877934176, + "loss": 2.0581, + "step": 3860 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007154240350922025, + "loss": 1.9588, + "step": 3870 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007141103588860265, + "loss": 2.0151, + "step": 3880 + }, + { + "epoch": 0.72, + "learning_rate": 0.000712794870294796, + "loss": 1.9494, + "step": 3890 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007114775804537586, + "loss": 1.9936, + "step": 3900 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007101585005134088, + "loss": 2.0016, + "step": 3910 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007088376416393944, + "loss": 1.9628, + "step": 3920 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007075150150124208, + "loss": 1.9955, + "step": 3930 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007061906318281568, + "loss": 1.9731, + "step": 3940 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007048645032971407, + "loss": 1.9554, + "step": 3950 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007035366406446839, + "loss": 1.985, + "step": 3960 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007022070551107774, + "loss": 1.9961, + "step": 3970 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007008757579499954, + "loss": 2.0112, + "step": 3980 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006995427604314004, + "loss": 2.0086, + "step": 3990 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006982080738384487, + "loss": 2.019, + "step": 4000 + } + ], + "max_steps": 10798, + "num_train_epochs": 2, + "total_flos": 3.794844442012156e+18, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-4000/training_args.bin b/checkpoint-4000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b097aab2293da043bc99abba38a0ed7c4525140a --- /dev/null +++ b/checkpoint-4000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8813832b030b0a678cb3ad0abd28db5000bdb8bb1708e45ba10cfda908fcc38 +size 3305 diff --git a/checkpoint-5000/README.md b/checkpoint-5000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/checkpoint-5000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/checkpoint-5000/adapter_config.json b/checkpoint-5000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c700a5d161022cf91737dcca4d31f37c02bb25 --- /dev/null +++ b/checkpoint-5000/adapter_config.json @@ -0,0 +1,19 @@ +{ + "base_model_name_or_path": "chatglm2-6b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "query_key_value" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/checkpoint-5000/adapter_model.bin b/checkpoint-5000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..ca1d5d6168fe118a91122aad14c617a3f0e48ba9 --- /dev/null +++ b/checkpoint-5000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc5d8db5b4f643e46c88553b1f5114a9ab8addbaa3e64d15bec61d77d67b3111 +size 7819417 diff --git a/checkpoint-5000/finetuning_args.json b/checkpoint-5000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f28e18016479196fd772d484c058dd17ca8c6a --- /dev/null +++ b/checkpoint-5000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "query_key_value" + ], + "name_module_trainable": "mlp", + "num_layer_trainable": 3, + "pre_seq_len": 64, + "prefix_projection": false +} diff --git a/checkpoint-5000/optimizer.pt b/checkpoint-5000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..362544914814302e195723b57e192c1b5d3bc1b5 --- /dev/null +++ b/checkpoint-5000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ec02adc57096b48b938f74b3714f4d29bae0f99ae539d729cbf37a89637562 +size 15644485 diff --git a/checkpoint-5000/rng_state_0.pth b/checkpoint-5000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..8140020d6e671b0642470951d86fe146dbc630fb --- /dev/null +++ b/checkpoint-5000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b782b8dbde946b3332327e532def6d0d0df0f933e880345ab43801588cf28f91 +size 18679 diff --git a/checkpoint-5000/rng_state_1.pth b/checkpoint-5000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..8e8b5dfe6817990159897e1ea832b235153067f3 --- /dev/null +++ b/checkpoint-5000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64a980aa66153b14a465ebfdd75b81c4540513a522fc44abfcd7a7876aae1f51 +size 18679 diff --git a/checkpoint-5000/rng_state_2.pth b/checkpoint-5000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a97abd679b6be17c7fce0b602a02d9d0e2f7a5bb --- /dev/null +++ b/checkpoint-5000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33f75c94763d262d4d94cf9237ac9d8b05846f520d53e872c618144ec1d552f6 +size 18679 diff --git a/checkpoint-5000/rng_state_3.pth b/checkpoint-5000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..1c52ee93049b612c1deb18b615b4f2a65e4338d5 --- /dev/null +++ b/checkpoint-5000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b4cb7fb77fa909f4a6fc60da635e6f393ec6c66e581b4c064d08a766067e15 +size 18679 diff --git a/checkpoint-5000/scheduler.pt b/checkpoint-5000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..60accdad98ff963f3ba612a860c29388a708e6c9 --- /dev/null +++ b/checkpoint-5000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0288a93a721a1a39ec39deee58b3a168f5fd23543ea06051f9e633c304ce07cc +size 627 diff --git a/checkpoint-5000/trainer_state.json b/checkpoint-5000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..2d09464d2ccc46da84215b965a01cf39dea86357 --- /dev/null +++ b/checkpoint-5000/trainer_state.json @@ -0,0 +1,3016 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.9260974254491573, + "global_step": 5000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0009999978838190456, + "loss": 2.9794, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0009999915352940948, + "loss": 2.3885, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999980954478887, + "loss": 2.3057, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999966141462985, + "loss": 2.2692, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999947096371777, + "loss": 2.2576, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009999238193664748, + "loss": 2.2388, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998963106441117, + "loss": 2.2523, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998645704375414, + "loss": 2.218, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999828599015436, + "loss": 2.2457, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997883966822835, + "loss": 2.198, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997439637783859, + "loss": 2.2013, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999695300679855, + "loss": 2.1765, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009996424077986109, + "loss": 2.1741, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999585285582377, + "loss": 2.1898, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009995239345146772, + "loss": 2.1466, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009994583551148314, + "loss": 2.1423, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009993885479379506, + "loss": 2.1451, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999314513574934, + "loss": 2.202, + "step": 180 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009992362526524616, + "loss": 2.1208, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009991537658329906, + "loss": 2.1591, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 0.000999067053814749, + "loss": 2.1788, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009989761173317304, + "loss": 2.147, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998880957153687, + "loss": 2.1249, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998781574086123, + "loss": 2.165, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 0.000998677968970289, + "loss": 2.1428, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009985701426831735, + "loss": 2.1384, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009984580961374964, + "loss": 2.1585, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009983418302817008, + "loss": 2.1156, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009982213460999448, + "loss": 2.0811, + "step": 290 + }, + { + "epoch": 0.06, + "learning_rate": 0.000998096644612094, + "loss": 2.1081, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009979677268737118, + "loss": 2.1246, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009978345939760515, + "loss": 2.1229, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997697247046046, + "loss": 2.1033, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009975556872462994, + "loss": 2.0931, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997409915775076, + "loss": 2.1206, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009972599338662915, + "loss": 2.0537, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009971057427895012, + "loss": 2.0762, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009969473438498897, + "loss": 2.0883, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009967847383882604, + "loss": 2.1174, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009966179277810239, + "loss": 2.1111, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009964469134401855, + "loss": 2.1288, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009962716968133346, + "loss": 2.0967, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009960922793836318, + "loss": 2.1216, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009959086626697955, + "loss": 2.0924, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009957208482260908, + "loss": 2.0809, + "step": 450 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009955288376423152, + "loss": 2.1082, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009953326325437852, + "loss": 2.0885, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009951322345913224, + "loss": 2.1133, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009949276454812408, + "loss": 2.0844, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00099471886694533, + "loss": 2.0796, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009945059007508434, + "loss": 2.1255, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009942887487004804, + "loss": 2.0913, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009940674126323733, + "loss": 2.1003, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009938418944200709, + "loss": 2.0541, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009936121959725223, + "loss": 2.0523, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009933783192340618, + "loss": 2.1225, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009931402661843911, + "loss": 2.0446, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 0.000992898038838564, + "loss": 2.0921, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009926516392469674, + "loss": 2.1081, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009924010694953064, + "loss": 2.0734, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009921463317045843, + "loss": 2.0652, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009918874280310862, + "loss": 2.0818, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009916243606663605, + "loss": 2.0776, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009913571318371994, + "loss": 2.1025, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009910857438056215, + "loss": 2.066, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009908101988688512, + "loss": 2.0575, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009905304993593008, + "loss": 2.1269, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009902466476445486, + "loss": 2.0518, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009899586461273218, + "loss": 2.0698, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 0.000989666497245473, + "loss": 2.0988, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009893702034719624, + "loss": 2.0986, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009890697673148345, + "loss": 2.0237, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009887651913171986, + "loss": 2.0027, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009884564780572064, + "loss": 2.0563, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009881436301480305, + "loss": 2.0624, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987826650237842, + "loss": 2.0926, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987505541009788, + "loss": 2.0585, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009871803051819696, + "loss": 2.0494, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009868509455074183, + "loss": 2.0106, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009865174647740729, + "loss": 2.0861, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009861798658047556, + "loss": 2.0478, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009858381514571484, + "loss": 2.0469, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 0.000985492324623769, + "loss": 2.0671, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009851423882319458, + "loss": 2.0808, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009847883452437937, + "loss": 2.0331, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009844301986561893, + "loss": 2.0295, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 0.000984067951500744, + "loss": 2.0873, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 0.00098370160684378, + "loss": 2.1038, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009833311677863042, + "loss": 2.0337, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009829566374639801, + "loss": 2.0407, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009825780190471042, + "loss": 2.1049, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 0.000982195315740576, + "loss": 2.0475, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009818085307838741, + "loss": 2.0624, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 0.000981417667451026, + "loss": 2.0714, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009810227290505816, + "loss": 2.0947, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009806237189255859, + "loss": 2.0591, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009802206404535489, + "loss": 2.0301, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 0.000979813497046419, + "loss": 2.0556, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009794022921505523, + "loss": 2.0753, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 0.000978987029246685, + "loss": 2.0898, + "step": 1000 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009785677118499029, + "loss": 2.0464, + "step": 1010 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009781443435096116, + "loss": 2.0828, + "step": 1020 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009777169278095074, + "loss": 2.1137, + "step": 1030 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009772854683675462, + "loss": 2.0167, + "step": 1040 + }, + { + "epoch": 0.19, + "learning_rate": 0.000976849968835913, + "loss": 2.07, + "step": 1050 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009764104329009909, + "loss": 2.0409, + "step": 1060 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009759668642833304, + "loss": 2.015, + "step": 1070 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009755192667376173, + "loss": 2.0175, + "step": 1080 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009750676440526411, + "loss": 2.0773, + "step": 1090 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009746120000512632, + "loss": 2.0245, + "step": 1100 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009741523385903841, + "loss": 2.094, + "step": 1110 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009736886635609112, + "loss": 2.0506, + "step": 1120 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009732209788877258, + "loss": 2.0287, + "step": 1130 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009727492885296489, + "loss": 2.1162, + "step": 1140 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009722735964794099, + "loss": 2.1096, + "step": 1150 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009717939067636099, + "loss": 2.0621, + "step": 1160 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009713102234426903, + "loss": 2.0796, + "step": 1170 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009708225506108965, + "loss": 2.0565, + "step": 1180 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009703308923962447, + "loss": 2.0669, + "step": 1190 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009698352529604857, + "loss": 2.0638, + "step": 1200 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009693356364990705, + "loss": 2.0358, + "step": 1210 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009688320472411143, + "loss": 2.0859, + "step": 1220 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009683244894493613, + "loss": 2.0932, + "step": 1230 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009678129674201479, + "loss": 2.0129, + "step": 1240 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009672974854833669, + "loss": 2.055, + "step": 1250 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009667780480024304, + "loss": 2.0665, + "step": 1260 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009662546593742334, + "loss": 2.0488, + "step": 1270 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009657273240291159, + "loss": 2.0543, + "step": 1280 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009651960464308261, + "loss": 2.0418, + "step": 1290 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009646608310764819, + "loss": 2.033, + "step": 1300 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009641216824965338, + "loss": 2.1034, + "step": 1310 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009635786052547253, + "loss": 2.0866, + "step": 1320 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009630316039480556, + "loss": 2.0607, + "step": 1330 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009624806832067394, + "loss": 2.0457, + "step": 1340 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009619258476941686, + "loss": 2.032, + "step": 1350 + }, + { + "epoch": 0.25, + "learning_rate": 0.000961367102106873, + "loss": 2.0519, + "step": 1360 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009608044511744791, + "loss": 2.0449, + "step": 1370 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009602378996596721, + "loss": 1.9949, + "step": 1380 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009596674523581539, + "loss": 2.0394, + "step": 1390 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009590931140986035, + "loss": 2.0386, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009585148897426354, + "loss": 2.0254, + "step": 1410 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009579327841847593, + "loss": 2.0238, + "step": 1420 + }, + { + "epoch": 0.26, + "learning_rate": 0.000957346802352338, + "loss": 2.0509, + "step": 1430 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009567569492055456, + "loss": 2.0004, + "step": 1440 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009561632297373263, + "loss": 2.0203, + "step": 1450 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009555656489733513, + "loss": 2.0182, + "step": 1460 + }, + { + "epoch": 0.27, + "learning_rate": 0.000954964211971977, + "loss": 1.9754, + "step": 1470 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009543589238242012, + "loss": 2.0374, + "step": 1480 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953749789653621, + "loss": 2.0367, + "step": 1490 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953136814616389, + "loss": 2.0866, + "step": 1500 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009525200039011694, + "loss": 2.0083, + "step": 1510 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009518993627290948, + "loss": 2.0525, + "step": 1520 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009512748963537212, + "loss": 2.0636, + "step": 1530 + }, + { + "epoch": 0.29, + "learning_rate": 0.000950646610060984, + "loss": 2.0522, + "step": 1540 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009500145091691532, + "loss": 2.05, + "step": 1550 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009493785990287882, + "loss": 1.9887, + "step": 1560 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009487388850226926, + "loss": 2.0309, + "step": 1570 + }, + { + "epoch": 0.29, + "learning_rate": 0.000948095372565869, + "loss": 1.9954, + "step": 1580 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009474480671054726, + "loss": 2.0078, + "step": 1590 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009467969741207652, + "loss": 2.0395, + "step": 1600 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009461420991230693, + "loss": 2.0415, + "step": 1610 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009454834476557207, + "loss": 2.0308, + "step": 1620 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009448210252940223, + "loss": 2.0826, + "step": 1630 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009441548376451963, + "loss": 2.0424, + "step": 1640 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009434848903483373, + "loss": 2.0125, + "step": 1650 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009428111890743639, + "loss": 2.0139, + "step": 1660 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009421337395259717, + "loss": 2.0682, + "step": 1670 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009414525474375837, + "loss": 2.0577, + "step": 1680 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009407676185753029, + "loss": 2.0262, + "step": 1690 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009400789587368632, + "loss": 2.0515, + "step": 1700 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009393865737515794, + "loss": 2.0398, + "step": 1710 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009386904694802997, + "loss": 2.0146, + "step": 1720 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009379906518153543, + "loss": 2.0438, + "step": 1730 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009372871266805063, + "loss": 2.0377, + "step": 1740 + }, + { + "epoch": 0.32, + "learning_rate": 0.000936579900030902, + "loss": 2.0789, + "step": 1750 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009358689778530193, + "loss": 2.0201, + "step": 1760 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009351543661646185, + "loss": 2.0114, + "step": 1770 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009344360710146898, + "loss": 2.0242, + "step": 1780 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009337140984834034, + "loss": 2.0436, + "step": 1790 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009329884546820572, + "loss": 2.0452, + "step": 1800 + }, + { + "epoch": 0.34, + "learning_rate": 0.000932259145753026, + "loss": 2.0254, + "step": 1810 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009315261778697083, + "loss": 2.0409, + "step": 1820 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009307895572364746, + "loss": 2.0301, + "step": 1830 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009300492900886154, + "loss": 2.0078, + "step": 1840 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009293053826922873, + "loss": 1.9851, + "step": 1850 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009285578413444613, + "loss": 1.9947, + "step": 1860 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009278066723728682, + "loss": 2.0331, + "step": 1870 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009270518821359461, + "loss": 2.0058, + "step": 1880 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009262934770227858, + "loss": 2.05, + "step": 1890 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009255314634530771, + "loss": 2.0444, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009247658478770543, + "loss": 2.0045, + "step": 1910 + }, + { + "epoch": 0.36, + "learning_rate": 0.000923996636775442, + "loss": 2.0211, + "step": 1920 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009232238366593997, + "loss": 2.0124, + "step": 1930 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009224474540704671, + "loss": 2.0067, + "step": 1940 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009216674955805079, + "loss": 2.0247, + "step": 1950 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009208839677916557, + "loss": 2.0314, + "step": 1960 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009200968773362568, + "loss": 2.067, + "step": 1970 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009193062308768145, + "loss": 2.0168, + "step": 1980 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009185120351059326, + "loss": 2.0649, + "step": 1990 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009177142967462591, + "loss": 2.0208, + "step": 2000 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009169130225504289, + "loss": 2.016, + "step": 2010 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009161082193010066, + "loss": 2.0331, + "step": 2020 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009152998938104296, + "loss": 2.0757, + "step": 2030 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009144880529209498, + "loss": 2.0093, + "step": 2040 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009136727035045765, + "loss": 1.954, + "step": 2050 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009128538524630167, + "loss": 2.0062, + "step": 2060 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009120315067276187, + "loss": 2.0179, + "step": 2070 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009112056732593119, + "loss": 2.0301, + "step": 2080 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009103763590485488, + "loss": 2.0223, + "step": 2090 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009095435711152449, + "loss": 2.0208, + "step": 2100 + }, + { + "epoch": 0.39, + "learning_rate": 0.00090870731650872, + "loss": 2.0492, + "step": 2110 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009078676023076385, + "loss": 1.9917, + "step": 2120 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009070244356199492, + "loss": 2.0235, + "step": 2130 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009061778235828253, + "loss": 2.01, + "step": 2140 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009054129328980229, + "loss": 1.9999, + "step": 2150 + }, + { + "epoch": 0.4, + "learning_rate": 0.000904559794464287, + "loss": 2.0022, + "step": 2160 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009037032315436229, + "loss": 2.0004, + "step": 2170 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009028432513865994, + "loss": 1.9936, + "step": 2180 + }, + { + "epoch": 0.41, + "learning_rate": 0.000901979861272711, + "loss": 2.0098, + "step": 2190 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009011130685103166, + "loss": 1.9829, + "step": 2200 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009002428804365775, + "loss": 2.0135, + "step": 2210 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008993693044173954, + "loss": 2.0526, + "step": 2220 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008984923478473499, + "loss": 2.0145, + "step": 2230 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008976120181496365, + "loss": 2.0364, + "step": 2240 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008967283227760028, + "loss": 2.019, + "step": 2250 + }, + { + "epoch": 0.42, + "learning_rate": 0.000895841269206686, + "loss": 1.9874, + "step": 2260 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008949508649503495, + "loss": 2.0699, + "step": 2270 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008940571175440196, + "loss": 2.0407, + "step": 2280 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008931600345530213, + "loss": 2.0176, + "step": 2290 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008922596235709142, + "loss": 2.0235, + "step": 2300 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008913558922194287, + "loss": 2.0268, + "step": 2310 + }, + { + "epoch": 0.43, + "learning_rate": 0.000890448848148401, + "loss": 2.0279, + "step": 2320 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008895384990357087, + "loss": 2.0073, + "step": 2330 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008886248525872056, + "loss": 2.0262, + "step": 2340 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008877079165366566, + "loss": 2.0112, + "step": 2350 + }, + { + "epoch": 0.44, + "learning_rate": 0.000886787698645672, + "loss": 2.042, + "step": 2360 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008858642067036424, + "loss": 2.0129, + "step": 2370 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008849374485276715, + "loss": 2.0264, + "step": 2380 + }, + { + "epoch": 0.44, + "learning_rate": 0.000884007431962512, + "loss": 2.0211, + "step": 2390 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008830741648804967, + "loss": 2.0175, + "step": 2400 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008821376551814739, + "loss": 2.0423, + "step": 2410 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008811979107927396, + "loss": 2.0112, + "step": 2420 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008802549396689705, + "loss": 2.0422, + "step": 2430 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008793087497921566, + "loss": 2.0075, + "step": 2440 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008784544334882426, + "loss": 1.9958, + "step": 2450 + }, + { + "epoch": 0.46, + "learning_rate": 0.000877502150068553, + "loss": 2.0348, + "step": 2460 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008765466711974225, + "loss": 2.0232, + "step": 2470 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008755880049627157, + "loss": 1.9953, + "step": 2480 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008746261594792776, + "loss": 2.0223, + "step": 2490 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008736611428888644, + "loss": 2.0332, + "step": 2500 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008726929633600753, + "loss": 2.0075, + "step": 2510 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008717216290882824, + "loss": 2.002, + "step": 2520 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008707471482955622, + "loss": 2.0594, + "step": 2530 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008697695292306253, + "loss": 2.0214, + "step": 2540 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008687887801687473, + "loss": 1.994, + "step": 2550 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008678049094116979, + "loss": 2.0338, + "step": 2560 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008668179252876714, + "loss": 2.0176, + "step": 2570 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008658278361512161, + "loss": 2.0013, + "step": 2580 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008648346503831627, + "loss": 2.0141, + "step": 2590 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008638383763905546, + "loss": 1.9655, + "step": 2600 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008628390226065761, + "loss": 2.039, + "step": 2610 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008618365974904808, + "loss": 1.9418, + "step": 2620 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008608311095275205, + "loss": 2.011, + "step": 2630 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008598225672288731, + "loss": 2.0174, + "step": 2640 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008588109791315707, + "loss": 1.984, + "step": 2650 + }, + { + "epoch": 0.49, + "learning_rate": 0.000857796353798427, + "loss": 2.0437, + "step": 2660 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008567786998179654, + "loss": 2.0255, + "step": 2670 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008557580258043459, + "loss": 2.0067, + "step": 2680 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008547343403972918, + "loss": 2.0201, + "step": 2690 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008537076522620175, + "loss": 2.0258, + "step": 2700 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008526779700891545, + "loss": 1.9977, + "step": 2710 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008516453025946781, + "loss": 1.9835, + "step": 2720 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008506096585198333, + "loss": 2.0428, + "step": 2730 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008495710466310613, + "loss": 1.9554, + "step": 2740 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008485294757199248, + "loss": 2.0497, + "step": 2750 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008474849546030339, + "loss": 2.001, + "step": 2760 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008464374921219714, + "loss": 1.9824, + "step": 2770 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008453870971432179, + "loss": 2.0378, + "step": 2780 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008443337785580769, + "loss": 1.9756, + "step": 2790 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008432775452825992, + "loss": 2.0563, + "step": 2800 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008422184062575077, + "loss": 2.0115, + "step": 2810 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008411563704481217, + "loss": 2.0301, + "step": 2820 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008400914468442814, + "loss": 1.9912, + "step": 2830 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008390236444602706, + "loss": 2.0669, + "step": 2840 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008379529723347417, + "loss": 2.0138, + "step": 2850 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008368794395306386, + "loss": 2.0486, + "step": 2860 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008358030551351199, + "loss": 2.0342, + "step": 2870 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008347238282594823, + "loss": 2.0474, + "step": 2880 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008336417680390829, + "loss": 2.006, + "step": 2890 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008325568836332633, + "loss": 1.99, + "step": 2900 + }, + { + "epoch": 0.54, + "learning_rate": 0.00083146918422527, + "loss": 2.0148, + "step": 2910 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008303786790221778, + "loss": 2.0381, + "step": 2920 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008292853772548126, + "loss": 2.0591, + "step": 2930 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008281892881776714, + "loss": 2.0238, + "step": 2940 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008270904210688459, + "loss": 1.9939, + "step": 2950 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008259887852299427, + "loss": 1.9941, + "step": 2960 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008248843899860045, + "loss": 2.0193, + "step": 2970 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008237772446854325, + "loss": 2.0166, + "step": 2980 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008226673586999058, + "loss": 2.0219, + "step": 2990 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008215547414243025, + "loss": 2.0078, + "step": 3000 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008204394022766208, + "loss": 2.0022, + "step": 3010 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008193213506978983, + "loss": 2.0009, + "step": 3020 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008182005961521331, + "loss": 2.0197, + "step": 3030 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008170771481262027, + "loss": 2.0101, + "step": 3040 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008159510161297846, + "loss": 2.0307, + "step": 3050 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008148222096952748, + "loss": 2.0075, + "step": 3060 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008136907383777081, + "loss": 2.0415, + "step": 3070 + }, + { + "epoch": 0.57, + "learning_rate": 0.000812556611754677, + "loss": 2.0031, + "step": 3080 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008114198394262497, + "loss": 2.0025, + "step": 3090 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008102804310148905, + "loss": 1.983, + "step": 3100 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008091383961653765, + "loss": 2.0056, + "step": 3110 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008079937445447175, + "loss": 1.9679, + "step": 3120 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008068464858420732, + "loss": 1.9897, + "step": 3130 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008056966297686717, + "loss": 1.9833, + "step": 3140 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008045441860577273, + "loss": 2.0088, + "step": 3150 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008033891644643576, + "loss": 1.9985, + "step": 3160 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008022315747655011, + "loss": 2.013, + "step": 3170 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008010714267598354, + "loss": 1.9902, + "step": 3180 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007999087302676926, + "loss": 2.0133, + "step": 3190 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007987434951309774, + "loss": 2.0092, + "step": 3200 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007975757312130836, + "loss": 1.9894, + "step": 3210 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007964054483988103, + "loss": 1.9742, + "step": 3220 + }, + { + "epoch": 0.6, + "learning_rate": 0.000795232656594278, + "loss": 2.016, + "step": 3230 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007940573657268458, + "loss": 2.0386, + "step": 3240 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007928795857450259, + "loss": 1.9602, + "step": 3250 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007916993266184007, + "loss": 1.9681, + "step": 3260 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007905165983375379, + "loss": 2.0326, + "step": 3270 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007893314109139058, + "loss": 1.9958, + "step": 3280 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007881437743797882, + "loss": 2.0077, + "step": 3290 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007869536987882008, + "loss": 1.9813, + "step": 3300 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007857611942128044, + "loss": 1.9538, + "step": 3310 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007845662707478214, + "loss": 1.9919, + "step": 3320 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007833689385079485, + "loss": 1.9922, + "step": 3330 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007821692076282725, + "loss": 1.9973, + "step": 3340 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007809670882641842, + "loss": 2.0231, + "step": 3350 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007797625905912915, + "loss": 1.9971, + "step": 3360 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007785557248053351, + "loss": 1.9934, + "step": 3370 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007773465011221002, + "loss": 1.9855, + "step": 3380 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007761349297773315, + "loss": 2.0421, + "step": 3390 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007749210210266457, + "loss": 1.9795, + "step": 3400 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007737047851454451, + "loss": 2.0006, + "step": 3410 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007724862324288309, + "loss": 2.011, + "step": 3420 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007712653731915147, + "loss": 1.9969, + "step": 3430 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007700422177677331, + "loss": 1.9581, + "step": 3440 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007688167765111592, + "loss": 1.9858, + "step": 3450 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007675890597948141, + "loss": 1.9945, + "step": 3460 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007663590780109814, + "loss": 2.0116, + "step": 3470 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007651268415711168, + "loss": 1.9831, + "step": 3480 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007638923609057616, + "loss": 2.0113, + "step": 3490 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007626556464644538, + "loss": 1.9927, + "step": 3500 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007614167087156393, + "loss": 2.0209, + "step": 3510 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007601755581465844, + "loss": 1.9941, + "step": 3520 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007589322052632855, + "loss": 2.0443, + "step": 3530 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007576866605903812, + "loss": 1.975, + "step": 3540 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007564389346710638, + "loss": 1.9655, + "step": 3550 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007551890380669879, + "loss": 2.0034, + "step": 3560 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007539369813581836, + "loss": 1.953, + "step": 3570 + }, + { + "epoch": 0.66, + "learning_rate": 0.000752682775142965, + "loss": 2.0162, + "step": 3580 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007514264300378411, + "loss": 2.0096, + "step": 3590 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007501679566774267, + "loss": 2.0431, + "step": 3600 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007489073657143506, + "loss": 1.961, + "step": 3610 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007476446678191676, + "loss": 2.0179, + "step": 3620 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007463798736802665, + "loss": 1.9885, + "step": 3630 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007451129940037804, + "loss": 1.9955, + "step": 3640 + }, + { + "epoch": 0.68, + "learning_rate": 0.000743844039513496, + "loss": 1.9671, + "step": 3650 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007425730209507622, + "loss": 1.9866, + "step": 3660 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007412999490744008, + "loss": 1.9508, + "step": 3670 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007400248346606129, + "loss": 2.0261, + "step": 3680 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007387476885028902, + "loss": 1.9946, + "step": 3690 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007374685214119221, + "loss": 1.969, + "step": 3700 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007361873442155049, + "loss": 1.9802, + "step": 3710 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007349041677584496, + "loss": 1.9739, + "step": 3720 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007336190029024907, + "loss": 1.964, + "step": 3730 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007323318605261933, + "loss": 2.0009, + "step": 3740 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007310427515248626, + "loss": 1.9825, + "step": 3750 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007297516868104501, + "loss": 1.9744, + "step": 3760 + }, + { + "epoch": 0.7, + "learning_rate": 0.000728458677311462, + "loss": 2.0197, + "step": 3770 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007271637339728667, + "loss": 2.0016, + "step": 3780 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007258668677560019, + "loss": 1.9721, + "step": 3790 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007245680896384818, + "loss": 1.9591, + "step": 3800 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007232674106141048, + "loss": 1.9762, + "step": 3810 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007219648416927592, + "loss": 2.0026, + "step": 3820 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007206603939003314, + "loss": 1.9876, + "step": 3830 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007193540782786117, + "loss": 1.9991, + "step": 3840 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007180459058852011, + "loss": 1.9897, + "step": 3850 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007167358877934176, + "loss": 2.0581, + "step": 3860 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007154240350922025, + "loss": 1.9588, + "step": 3870 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007141103588860265, + "loss": 2.0151, + "step": 3880 + }, + { + "epoch": 0.72, + "learning_rate": 0.000712794870294796, + "loss": 1.9494, + "step": 3890 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007114775804537586, + "loss": 1.9936, + "step": 3900 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007101585005134088, + "loss": 2.0016, + "step": 3910 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007088376416393944, + "loss": 1.9628, + "step": 3920 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007075150150124208, + "loss": 1.9955, + "step": 3930 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007061906318281568, + "loss": 1.9731, + "step": 3940 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007048645032971407, + "loss": 1.9554, + "step": 3950 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007035366406446839, + "loss": 1.985, + "step": 3960 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007022070551107774, + "loss": 1.9961, + "step": 3970 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007008757579499954, + "loss": 2.0112, + "step": 3980 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006995427604314004, + "loss": 2.0086, + "step": 3990 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006982080738384487, + "loss": 2.019, + "step": 4000 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006968717094688933, + "loss": 1.9983, + "step": 4010 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006955336786346898, + "loss": 1.981, + "step": 4020 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006941939926618997, + "loss": 1.9878, + "step": 4030 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006928526628905942, + "loss": 2.0067, + "step": 4040 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006915097006747601, + "loss": 2.035, + "step": 4050 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006901651173822013, + "loss": 1.9614, + "step": 4060 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006888189243944439, + "loss": 1.9655, + "step": 4070 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006874711331066401, + "loss": 1.9692, + "step": 4080 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006861217549274705, + "loss": 1.9791, + "step": 4090 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006847708012790492, + "loss": 1.9804, + "step": 4100 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006834182835968253, + "loss": 1.9973, + "step": 4110 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006820642133294876, + "loss": 2.0153, + "step": 4120 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006807086019388669, + "loss": 1.9639, + "step": 4130 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006793514608998393, + "loss": 2.0162, + "step": 4140 + }, + { + "epoch": 0.77, + "learning_rate": 0.000677992801700229, + "loss": 1.994, + "step": 4150 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006766326358407104, + "loss": 1.9992, + "step": 4160 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006752709748347125, + "loss": 1.976, + "step": 4170 + }, + { + "epoch": 0.77, + "learning_rate": 0.000673907830208319, + "loss": 1.9452, + "step": 4180 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006725432135001732, + "loss": 1.9982, + "step": 4190 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006711771362613785, + "loss": 1.9766, + "step": 4200 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006698096100554014, + "loss": 1.9838, + "step": 4210 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006684406464579735, + "loss": 1.9746, + "step": 4220 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006670702570569937, + "loss": 1.9838, + "step": 4230 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006656984534524296, + "loss": 1.9747, + "step": 4240 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006643252472562201, + "loss": 1.9896, + "step": 4250 + }, + { + "epoch": 0.79, + "learning_rate": 0.000662950650092176, + "loss": 1.9607, + "step": 4260 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006615746735958832, + "loss": 2.0075, + "step": 4270 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006603351250463683, + "loss": 1.9918, + "step": 4280 + }, + { + "epoch": 0.79, + "learning_rate": 0.000658956559916577, + "loss": 1.9669, + "step": 4290 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006575766492634068, + "loss": 1.9645, + "step": 4300 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006561954047674206, + "loss": 1.9511, + "step": 4310 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006548128381204714, + "loss": 1.9934, + "step": 4320 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006534289610256039, + "loss": 1.9973, + "step": 4330 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006520437851969557, + "loss": 1.9983, + "step": 4340 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006506573223596575, + "loss": 1.9906, + "step": 4350 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006492695842497347, + "loss": 1.9392, + "step": 4360 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006478805826140066, + "loss": 2.0015, + "step": 4370 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006464903292099886, + "loss": 2.0168, + "step": 4380 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006450988358057919, + "loss": 1.9676, + "step": 4390 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006437061141800238, + "loss": 1.9798, + "step": 4400 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006423121761216881, + "loss": 1.9753, + "step": 4410 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006409170334300858, + "loss": 1.9965, + "step": 4420 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006395206979147141, + "loss": 1.9532, + "step": 4430 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006381231813951678, + "loss": 1.9962, + "step": 4440 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006367244957010379, + "loss": 1.9758, + "step": 4450 + }, + { + "epoch": 0.83, + "learning_rate": 0.000635324652671813, + "loss": 1.9606, + "step": 4460 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006339236641567774, + "loss": 1.9785, + "step": 4470 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006325215420149119, + "loss": 1.9334, + "step": 4480 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006311182981147935, + "loss": 1.9829, + "step": 4490 + }, + { + "epoch": 0.83, + "learning_rate": 0.000629713944334494, + "loss": 1.9671, + "step": 4500 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006283084925614805, + "loss": 2.0108, + "step": 4510 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006269019546925139, + "loss": 1.9341, + "step": 4520 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006254943426335488, + "loss": 1.9378, + "step": 4530 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006240856682996326, + "loss": 1.9619, + "step": 4540 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006226759436148044, + "loss": 1.9516, + "step": 4550 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006212651805119946, + "loss": 1.9882, + "step": 4560 + }, + { + "epoch": 0.85, + "learning_rate": 0.000619853390932923, + "loss": 1.9636, + "step": 4570 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006184405868279985, + "loss": 1.9894, + "step": 4580 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006170267801562176, + "loss": 1.9365, + "step": 4590 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006156119828850633, + "loss": 2.0264, + "step": 4600 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006141962069904041, + "loss": 1.9659, + "step": 4610 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006127794644563915, + "loss": 1.9368, + "step": 4620 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006113617672753598, + "loss": 1.959, + "step": 4630 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006099431274477245, + "loss": 1.9832, + "step": 4640 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006085235569818795, + "loss": 1.9572, + "step": 4650 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006071030678940969, + "loss": 1.99, + "step": 4660 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006056816722084248, + "loss": 1.9963, + "step": 4670 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006042593819565846, + "loss": 1.9997, + "step": 4680 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006028362091778706, + "loss": 1.9221, + "step": 4690 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006014121659190476, + "loss": 1.9623, + "step": 4700 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005999872642342484, + "loss": 1.9949, + "step": 4710 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005985615161848721, + "loss": 1.9688, + "step": 4720 + }, + { + "epoch": 0.88, + "learning_rate": 0.000597134933839482, + "loss": 1.975, + "step": 4730 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005957075292737042, + "loss": 2.0048, + "step": 4740 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005942793145701235, + "loss": 1.9591, + "step": 4750 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005928503018181833, + "loss": 1.9957, + "step": 4760 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005914205031140819, + "loss": 1.9823, + "step": 4770 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005899899305606703, + "loss": 2.0032, + "step": 4780 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005885585962673501, + "loss": 1.9722, + "step": 4790 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005871265123499708, + "loss": 1.9903, + "step": 4800 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005856936909307273, + "loss": 2.0258, + "step": 4810 + }, + { + "epoch": 0.89, + "learning_rate": 0.000584260144138057, + "loss": 2.0444, + "step": 4820 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005828258841065377, + "loss": 1.968, + "step": 4830 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005813909229767846, + "loss": 1.9598, + "step": 4840 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005799552728953472, + "loss": 2.0047, + "step": 4850 + }, + { + "epoch": 0.9, + "learning_rate": 0.000578518946014607, + "loss": 1.939, + "step": 4860 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005770819544926741, + "loss": 1.9835, + "step": 4870 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005756443104932852, + "loss": 2.028, + "step": 4880 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005742060261856996, + "loss": 1.973, + "step": 4890 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005727671137445967, + "loss": 1.9734, + "step": 4900 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005713275853499729, + "loss": 1.9921, + "step": 4910 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005698874531870386, + "loss": 1.9607, + "step": 4920 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005684467294461146, + "loss": 1.9468, + "step": 4930 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005670054263225297, + "loss": 1.9524, + "step": 4940 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005655635560165166, + "loss": 1.9737, + "step": 4950 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005641211307331093, + "loss": 1.9532, + "step": 4960 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005626781626820395, + "loss": 2.0048, + "step": 4970 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005612346640776331, + "loss": 2.0276, + "step": 4980 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005597906471387074, + "loss": 1.9476, + "step": 4990 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005583461240884666, + "loss": 1.943, + "step": 5000 + } + ], + "max_steps": 10798, + "num_train_epochs": 2, + "total_flos": 4.745478246164857e+18, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-5000/training_args.bin b/checkpoint-5000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b097aab2293da043bc99abba38a0ed7c4525140a --- /dev/null +++ b/checkpoint-5000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8813832b030b0a678cb3ad0abd28db5000bdb8bb1708e45ba10cfda908fcc38 +size 3305 diff --git a/checkpoint-6000/README.md b/checkpoint-6000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/checkpoint-6000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/checkpoint-6000/adapter_config.json b/checkpoint-6000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c700a5d161022cf91737dcca4d31f37c02bb25 --- /dev/null +++ b/checkpoint-6000/adapter_config.json @@ -0,0 +1,19 @@ +{ + "base_model_name_or_path": "chatglm2-6b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "query_key_value" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/checkpoint-6000/adapter_model.bin b/checkpoint-6000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..6e0235ae2d4c50205ab5c08a409af17a45183d61 --- /dev/null +++ b/checkpoint-6000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdb424b3742beb6722b24f39dabe187b6a521916bcd5199ec99b47e9b03012b7 +size 7819417 diff --git a/checkpoint-6000/finetuning_args.json b/checkpoint-6000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f28e18016479196fd772d484c058dd17ca8c6a --- /dev/null +++ b/checkpoint-6000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "query_key_value" + ], + "name_module_trainable": "mlp", + "num_layer_trainable": 3, + "pre_seq_len": 64, + "prefix_projection": false +} diff --git a/checkpoint-6000/optimizer.pt b/checkpoint-6000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..a99b54c8d28599c0c86a78257dc7ae027d7e6535 --- /dev/null +++ b/checkpoint-6000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47a53e7954cdacd508bb532719784406b4c59d019729868c2d0dc4cf5870ecfb +size 15644485 diff --git a/checkpoint-6000/rng_state_0.pth b/checkpoint-6000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..7e48904bf092087a164ad4bb35342c3166b9ad91 --- /dev/null +++ b/checkpoint-6000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d82f3c47df4c878687fd4e3dab1556abe1108f96acd0000174fe768521c14da4 +size 18679 diff --git a/checkpoint-6000/rng_state_1.pth b/checkpoint-6000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..1ed25d5a42ae083c0d3ccc5adcc24de2cfbb85fb --- /dev/null +++ b/checkpoint-6000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8320c50ab31e682336a70fc992d94efd77210f27e90bda7d0fd46e4ef08d8e90 +size 18679 diff --git a/checkpoint-6000/rng_state_2.pth b/checkpoint-6000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..cbab159810bcf174e034d099b8500efaba740152 --- /dev/null +++ b/checkpoint-6000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c6ef674a400c820a8c278cc54395d37eef5237091ebabd729595fe26db881cd +size 18679 diff --git a/checkpoint-6000/rng_state_3.pth b/checkpoint-6000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc8b601cf6b762a81a4b72c9b814e35bcdb081ae --- /dev/null +++ b/checkpoint-6000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:137f81f8dced1134e5e5078524f916aac5328eef01067ad7fce3b983ec8fab43 +size 18679 diff --git a/checkpoint-6000/scheduler.pt b/checkpoint-6000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d83222009cc48bd77634fb83833e64efdeafd82 --- /dev/null +++ b/checkpoint-6000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f91adbbcde4202523704e5a2ae3486ef81737f8bf719683367a5c4c98d7060d1 +size 627 diff --git a/checkpoint-6000/trainer_state.json b/checkpoint-6000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..30531438867afb78c768a2b915c1c0bc9554098a --- /dev/null +++ b/checkpoint-6000/trainer_state.json @@ -0,0 +1,3616 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.1113169105389886, + "global_step": 6000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0009999978838190456, + "loss": 2.9794, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0009999915352940948, + "loss": 2.3885, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999980954478887, + "loss": 2.3057, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999966141462985, + "loss": 2.2692, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999947096371777, + "loss": 2.2576, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009999238193664748, + "loss": 2.2388, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998963106441117, + "loss": 2.2523, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998645704375414, + "loss": 2.218, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999828599015436, + "loss": 2.2457, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997883966822835, + "loss": 2.198, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997439637783859, + "loss": 2.2013, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999695300679855, + "loss": 2.1765, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009996424077986109, + "loss": 2.1741, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999585285582377, + "loss": 2.1898, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009995239345146772, + "loss": 2.1466, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009994583551148314, + "loss": 2.1423, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009993885479379506, + "loss": 2.1451, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999314513574934, + "loss": 2.202, + "step": 180 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009992362526524616, + "loss": 2.1208, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009991537658329906, + "loss": 2.1591, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 0.000999067053814749, + "loss": 2.1788, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009989761173317304, + "loss": 2.147, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998880957153687, + "loss": 2.1249, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998781574086123, + "loss": 2.165, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 0.000998677968970289, + "loss": 2.1428, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009985701426831735, + "loss": 2.1384, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009984580961374964, + "loss": 2.1585, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009983418302817008, + "loss": 2.1156, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009982213460999448, + "loss": 2.0811, + "step": 290 + }, + { + "epoch": 0.06, + "learning_rate": 0.000998096644612094, + "loss": 2.1081, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009979677268737118, + "loss": 2.1246, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009978345939760515, + "loss": 2.1229, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997697247046046, + "loss": 2.1033, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009975556872462994, + "loss": 2.0931, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997409915775076, + "loss": 2.1206, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009972599338662915, + "loss": 2.0537, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009971057427895012, + "loss": 2.0762, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009969473438498897, + "loss": 2.0883, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009967847383882604, + "loss": 2.1174, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009966179277810239, + "loss": 2.1111, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009964469134401855, + "loss": 2.1288, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009962716968133346, + "loss": 2.0967, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009960922793836318, + "loss": 2.1216, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009959086626697955, + "loss": 2.0924, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009957208482260908, + "loss": 2.0809, + "step": 450 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009955288376423152, + "loss": 2.1082, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009953326325437852, + "loss": 2.0885, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009951322345913224, + "loss": 2.1133, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009949276454812408, + "loss": 2.0844, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00099471886694533, + "loss": 2.0796, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009945059007508434, + "loss": 2.1255, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009942887487004804, + "loss": 2.0913, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009940674126323733, + "loss": 2.1003, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009938418944200709, + "loss": 2.0541, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009936121959725223, + "loss": 2.0523, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009933783192340618, + "loss": 2.1225, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009931402661843911, + "loss": 2.0446, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 0.000992898038838564, + "loss": 2.0921, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009926516392469674, + "loss": 2.1081, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009924010694953064, + "loss": 2.0734, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009921463317045843, + "loss": 2.0652, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009918874280310862, + "loss": 2.0818, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009916243606663605, + "loss": 2.0776, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009913571318371994, + "loss": 2.1025, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009910857438056215, + "loss": 2.066, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009908101988688512, + "loss": 2.0575, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009905304993593008, + "loss": 2.1269, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009902466476445486, + "loss": 2.0518, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009899586461273218, + "loss": 2.0698, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 0.000989666497245473, + "loss": 2.0988, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009893702034719624, + "loss": 2.0986, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009890697673148345, + "loss": 2.0237, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009887651913171986, + "loss": 2.0027, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009884564780572064, + "loss": 2.0563, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009881436301480305, + "loss": 2.0624, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987826650237842, + "loss": 2.0926, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987505541009788, + "loss": 2.0585, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009871803051819696, + "loss": 2.0494, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009868509455074183, + "loss": 2.0106, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009865174647740729, + "loss": 2.0861, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009861798658047556, + "loss": 2.0478, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009858381514571484, + "loss": 2.0469, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 0.000985492324623769, + "loss": 2.0671, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009851423882319458, + "loss": 2.0808, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009847883452437937, + "loss": 2.0331, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009844301986561893, + "loss": 2.0295, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 0.000984067951500744, + "loss": 2.0873, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 0.00098370160684378, + "loss": 2.1038, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009833311677863042, + "loss": 2.0337, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009829566374639801, + "loss": 2.0407, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009825780190471042, + "loss": 2.1049, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 0.000982195315740576, + "loss": 2.0475, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009818085307838741, + "loss": 2.0624, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 0.000981417667451026, + "loss": 2.0714, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009810227290505816, + "loss": 2.0947, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009806237189255859, + "loss": 2.0591, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009802206404535489, + "loss": 2.0301, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 0.000979813497046419, + "loss": 2.0556, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009794022921505523, + "loss": 2.0753, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 0.000978987029246685, + "loss": 2.0898, + "step": 1000 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009785677118499029, + "loss": 2.0464, + "step": 1010 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009781443435096116, + "loss": 2.0828, + "step": 1020 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009777169278095074, + "loss": 2.1137, + "step": 1030 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009772854683675462, + "loss": 2.0167, + "step": 1040 + }, + { + "epoch": 0.19, + "learning_rate": 0.000976849968835913, + "loss": 2.07, + "step": 1050 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009764104329009909, + "loss": 2.0409, + "step": 1060 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009759668642833304, + "loss": 2.015, + "step": 1070 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009755192667376173, + "loss": 2.0175, + "step": 1080 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009750676440526411, + "loss": 2.0773, + "step": 1090 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009746120000512632, + "loss": 2.0245, + "step": 1100 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009741523385903841, + "loss": 2.094, + "step": 1110 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009736886635609112, + "loss": 2.0506, + "step": 1120 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009732209788877258, + "loss": 2.0287, + "step": 1130 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009727492885296489, + "loss": 2.1162, + "step": 1140 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009722735964794099, + "loss": 2.1096, + "step": 1150 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009717939067636099, + "loss": 2.0621, + "step": 1160 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009713102234426903, + "loss": 2.0796, + "step": 1170 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009708225506108965, + "loss": 2.0565, + "step": 1180 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009703308923962447, + "loss": 2.0669, + "step": 1190 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009698352529604857, + "loss": 2.0638, + "step": 1200 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009693356364990705, + "loss": 2.0358, + "step": 1210 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009688320472411143, + "loss": 2.0859, + "step": 1220 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009683244894493613, + "loss": 2.0932, + "step": 1230 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009678129674201479, + "loss": 2.0129, + "step": 1240 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009672974854833669, + "loss": 2.055, + "step": 1250 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009667780480024304, + "loss": 2.0665, + "step": 1260 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009662546593742334, + "loss": 2.0488, + "step": 1270 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009657273240291159, + "loss": 2.0543, + "step": 1280 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009651960464308261, + "loss": 2.0418, + "step": 1290 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009646608310764819, + "loss": 2.033, + "step": 1300 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009641216824965338, + "loss": 2.1034, + "step": 1310 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009635786052547253, + "loss": 2.0866, + "step": 1320 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009630316039480556, + "loss": 2.0607, + "step": 1330 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009624806832067394, + "loss": 2.0457, + "step": 1340 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009619258476941686, + "loss": 2.032, + "step": 1350 + }, + { + "epoch": 0.25, + "learning_rate": 0.000961367102106873, + "loss": 2.0519, + "step": 1360 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009608044511744791, + "loss": 2.0449, + "step": 1370 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009602378996596721, + "loss": 1.9949, + "step": 1380 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009596674523581539, + "loss": 2.0394, + "step": 1390 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009590931140986035, + "loss": 2.0386, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009585148897426354, + "loss": 2.0254, + "step": 1410 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009579327841847593, + "loss": 2.0238, + "step": 1420 + }, + { + "epoch": 0.26, + "learning_rate": 0.000957346802352338, + "loss": 2.0509, + "step": 1430 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009567569492055456, + "loss": 2.0004, + "step": 1440 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009561632297373263, + "loss": 2.0203, + "step": 1450 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009555656489733513, + "loss": 2.0182, + "step": 1460 + }, + { + "epoch": 0.27, + "learning_rate": 0.000954964211971977, + "loss": 1.9754, + "step": 1470 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009543589238242012, + "loss": 2.0374, + "step": 1480 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953749789653621, + "loss": 2.0367, + "step": 1490 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953136814616389, + "loss": 2.0866, + "step": 1500 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009525200039011694, + "loss": 2.0083, + "step": 1510 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009518993627290948, + "loss": 2.0525, + "step": 1520 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009512748963537212, + "loss": 2.0636, + "step": 1530 + }, + { + "epoch": 0.29, + "learning_rate": 0.000950646610060984, + "loss": 2.0522, + "step": 1540 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009500145091691532, + "loss": 2.05, + "step": 1550 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009493785990287882, + "loss": 1.9887, + "step": 1560 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009487388850226926, + "loss": 2.0309, + "step": 1570 + }, + { + "epoch": 0.29, + "learning_rate": 0.000948095372565869, + "loss": 1.9954, + "step": 1580 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009474480671054726, + "loss": 2.0078, + "step": 1590 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009467969741207652, + "loss": 2.0395, + "step": 1600 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009461420991230693, + "loss": 2.0415, + "step": 1610 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009454834476557207, + "loss": 2.0308, + "step": 1620 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009448210252940223, + "loss": 2.0826, + "step": 1630 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009441548376451963, + "loss": 2.0424, + "step": 1640 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009434848903483373, + "loss": 2.0125, + "step": 1650 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009428111890743639, + "loss": 2.0139, + "step": 1660 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009421337395259717, + "loss": 2.0682, + "step": 1670 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009414525474375837, + "loss": 2.0577, + "step": 1680 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009407676185753029, + "loss": 2.0262, + "step": 1690 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009400789587368632, + "loss": 2.0515, + "step": 1700 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009393865737515794, + "loss": 2.0398, + "step": 1710 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009386904694802997, + "loss": 2.0146, + "step": 1720 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009379906518153543, + "loss": 2.0438, + "step": 1730 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009372871266805063, + "loss": 2.0377, + "step": 1740 + }, + { + "epoch": 0.32, + "learning_rate": 0.000936579900030902, + "loss": 2.0789, + "step": 1750 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009358689778530193, + "loss": 2.0201, + "step": 1760 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009351543661646185, + "loss": 2.0114, + "step": 1770 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009344360710146898, + "loss": 2.0242, + "step": 1780 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009337140984834034, + "loss": 2.0436, + "step": 1790 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009329884546820572, + "loss": 2.0452, + "step": 1800 + }, + { + "epoch": 0.34, + "learning_rate": 0.000932259145753026, + "loss": 2.0254, + "step": 1810 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009315261778697083, + "loss": 2.0409, + "step": 1820 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009307895572364746, + "loss": 2.0301, + "step": 1830 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009300492900886154, + "loss": 2.0078, + "step": 1840 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009293053826922873, + "loss": 1.9851, + "step": 1850 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009285578413444613, + "loss": 1.9947, + "step": 1860 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009278066723728682, + "loss": 2.0331, + "step": 1870 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009270518821359461, + "loss": 2.0058, + "step": 1880 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009262934770227858, + "loss": 2.05, + "step": 1890 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009255314634530771, + "loss": 2.0444, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009247658478770543, + "loss": 2.0045, + "step": 1910 + }, + { + "epoch": 0.36, + "learning_rate": 0.000923996636775442, + "loss": 2.0211, + "step": 1920 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009232238366593997, + "loss": 2.0124, + "step": 1930 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009224474540704671, + "loss": 2.0067, + "step": 1940 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009216674955805079, + "loss": 2.0247, + "step": 1950 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009208839677916557, + "loss": 2.0314, + "step": 1960 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009200968773362568, + "loss": 2.067, + "step": 1970 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009193062308768145, + "loss": 2.0168, + "step": 1980 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009185120351059326, + "loss": 2.0649, + "step": 1990 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009177142967462591, + "loss": 2.0208, + "step": 2000 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009169130225504289, + "loss": 2.016, + "step": 2010 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009161082193010066, + "loss": 2.0331, + "step": 2020 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009152998938104296, + "loss": 2.0757, + "step": 2030 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009144880529209498, + "loss": 2.0093, + "step": 2040 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009136727035045765, + "loss": 1.954, + "step": 2050 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009128538524630167, + "loss": 2.0062, + "step": 2060 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009120315067276187, + "loss": 2.0179, + "step": 2070 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009112056732593119, + "loss": 2.0301, + "step": 2080 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009103763590485488, + "loss": 2.0223, + "step": 2090 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009095435711152449, + "loss": 2.0208, + "step": 2100 + }, + { + "epoch": 0.39, + "learning_rate": 0.00090870731650872, + "loss": 2.0492, + "step": 2110 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009078676023076385, + "loss": 1.9917, + "step": 2120 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009070244356199492, + "loss": 2.0235, + "step": 2130 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009061778235828253, + "loss": 2.01, + "step": 2140 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009054129328980229, + "loss": 1.9999, + "step": 2150 + }, + { + "epoch": 0.4, + "learning_rate": 0.000904559794464287, + "loss": 2.0022, + "step": 2160 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009037032315436229, + "loss": 2.0004, + "step": 2170 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009028432513865994, + "loss": 1.9936, + "step": 2180 + }, + { + "epoch": 0.41, + "learning_rate": 0.000901979861272711, + "loss": 2.0098, + "step": 2190 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009011130685103166, + "loss": 1.9829, + "step": 2200 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009002428804365775, + "loss": 2.0135, + "step": 2210 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008993693044173954, + "loss": 2.0526, + "step": 2220 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008984923478473499, + "loss": 2.0145, + "step": 2230 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008976120181496365, + "loss": 2.0364, + "step": 2240 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008967283227760028, + "loss": 2.019, + "step": 2250 + }, + { + "epoch": 0.42, + "learning_rate": 0.000895841269206686, + "loss": 1.9874, + "step": 2260 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008949508649503495, + "loss": 2.0699, + "step": 2270 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008940571175440196, + "loss": 2.0407, + "step": 2280 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008931600345530213, + "loss": 2.0176, + "step": 2290 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008922596235709142, + "loss": 2.0235, + "step": 2300 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008913558922194287, + "loss": 2.0268, + "step": 2310 + }, + { + "epoch": 0.43, + "learning_rate": 0.000890448848148401, + "loss": 2.0279, + "step": 2320 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008895384990357087, + "loss": 2.0073, + "step": 2330 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008886248525872056, + "loss": 2.0262, + "step": 2340 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008877079165366566, + "loss": 2.0112, + "step": 2350 + }, + { + "epoch": 0.44, + "learning_rate": 0.000886787698645672, + "loss": 2.042, + "step": 2360 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008858642067036424, + "loss": 2.0129, + "step": 2370 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008849374485276715, + "loss": 2.0264, + "step": 2380 + }, + { + "epoch": 0.44, + "learning_rate": 0.000884007431962512, + "loss": 2.0211, + "step": 2390 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008830741648804967, + "loss": 2.0175, + "step": 2400 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008821376551814739, + "loss": 2.0423, + "step": 2410 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008811979107927396, + "loss": 2.0112, + "step": 2420 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008802549396689705, + "loss": 2.0422, + "step": 2430 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008793087497921566, + "loss": 2.0075, + "step": 2440 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008784544334882426, + "loss": 1.9958, + "step": 2450 + }, + { + "epoch": 0.46, + "learning_rate": 0.000877502150068553, + "loss": 2.0348, + "step": 2460 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008765466711974225, + "loss": 2.0232, + "step": 2470 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008755880049627157, + "loss": 1.9953, + "step": 2480 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008746261594792776, + "loss": 2.0223, + "step": 2490 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008736611428888644, + "loss": 2.0332, + "step": 2500 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008726929633600753, + "loss": 2.0075, + "step": 2510 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008717216290882824, + "loss": 2.002, + "step": 2520 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008707471482955622, + "loss": 2.0594, + "step": 2530 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008697695292306253, + "loss": 2.0214, + "step": 2540 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008687887801687473, + "loss": 1.994, + "step": 2550 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008678049094116979, + "loss": 2.0338, + "step": 2560 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008668179252876714, + "loss": 2.0176, + "step": 2570 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008658278361512161, + "loss": 2.0013, + "step": 2580 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008648346503831627, + "loss": 2.0141, + "step": 2590 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008638383763905546, + "loss": 1.9655, + "step": 2600 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008628390226065761, + "loss": 2.039, + "step": 2610 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008618365974904808, + "loss": 1.9418, + "step": 2620 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008608311095275205, + "loss": 2.011, + "step": 2630 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008598225672288731, + "loss": 2.0174, + "step": 2640 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008588109791315707, + "loss": 1.984, + "step": 2650 + }, + { + "epoch": 0.49, + "learning_rate": 0.000857796353798427, + "loss": 2.0437, + "step": 2660 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008567786998179654, + "loss": 2.0255, + "step": 2670 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008557580258043459, + "loss": 2.0067, + "step": 2680 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008547343403972918, + "loss": 2.0201, + "step": 2690 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008537076522620175, + "loss": 2.0258, + "step": 2700 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008526779700891545, + "loss": 1.9977, + "step": 2710 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008516453025946781, + "loss": 1.9835, + "step": 2720 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008506096585198333, + "loss": 2.0428, + "step": 2730 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008495710466310613, + "loss": 1.9554, + "step": 2740 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008485294757199248, + "loss": 2.0497, + "step": 2750 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008474849546030339, + "loss": 2.001, + "step": 2760 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008464374921219714, + "loss": 1.9824, + "step": 2770 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008453870971432179, + "loss": 2.0378, + "step": 2780 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008443337785580769, + "loss": 1.9756, + "step": 2790 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008432775452825992, + "loss": 2.0563, + "step": 2800 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008422184062575077, + "loss": 2.0115, + "step": 2810 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008411563704481217, + "loss": 2.0301, + "step": 2820 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008400914468442814, + "loss": 1.9912, + "step": 2830 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008390236444602706, + "loss": 2.0669, + "step": 2840 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008379529723347417, + "loss": 2.0138, + "step": 2850 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008368794395306386, + "loss": 2.0486, + "step": 2860 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008358030551351199, + "loss": 2.0342, + "step": 2870 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008347238282594823, + "loss": 2.0474, + "step": 2880 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008336417680390829, + "loss": 2.006, + "step": 2890 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008325568836332633, + "loss": 1.99, + "step": 2900 + }, + { + "epoch": 0.54, + "learning_rate": 0.00083146918422527, + "loss": 2.0148, + "step": 2910 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008303786790221778, + "loss": 2.0381, + "step": 2920 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008292853772548126, + "loss": 2.0591, + "step": 2930 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008281892881776714, + "loss": 2.0238, + "step": 2940 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008270904210688459, + "loss": 1.9939, + "step": 2950 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008259887852299427, + "loss": 1.9941, + "step": 2960 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008248843899860045, + "loss": 2.0193, + "step": 2970 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008237772446854325, + "loss": 2.0166, + "step": 2980 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008226673586999058, + "loss": 2.0219, + "step": 2990 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008215547414243025, + "loss": 2.0078, + "step": 3000 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008204394022766208, + "loss": 2.0022, + "step": 3010 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008193213506978983, + "loss": 2.0009, + "step": 3020 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008182005961521331, + "loss": 2.0197, + "step": 3030 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008170771481262027, + "loss": 2.0101, + "step": 3040 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008159510161297846, + "loss": 2.0307, + "step": 3050 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008148222096952748, + "loss": 2.0075, + "step": 3060 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008136907383777081, + "loss": 2.0415, + "step": 3070 + }, + { + "epoch": 0.57, + "learning_rate": 0.000812556611754677, + "loss": 2.0031, + "step": 3080 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008114198394262497, + "loss": 2.0025, + "step": 3090 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008102804310148905, + "loss": 1.983, + "step": 3100 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008091383961653765, + "loss": 2.0056, + "step": 3110 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008079937445447175, + "loss": 1.9679, + "step": 3120 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008068464858420732, + "loss": 1.9897, + "step": 3130 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008056966297686717, + "loss": 1.9833, + "step": 3140 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008045441860577273, + "loss": 2.0088, + "step": 3150 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008033891644643576, + "loss": 1.9985, + "step": 3160 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008022315747655011, + "loss": 2.013, + "step": 3170 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008010714267598354, + "loss": 1.9902, + "step": 3180 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007999087302676926, + "loss": 2.0133, + "step": 3190 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007987434951309774, + "loss": 2.0092, + "step": 3200 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007975757312130836, + "loss": 1.9894, + "step": 3210 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007964054483988103, + "loss": 1.9742, + "step": 3220 + }, + { + "epoch": 0.6, + "learning_rate": 0.000795232656594278, + "loss": 2.016, + "step": 3230 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007940573657268458, + "loss": 2.0386, + "step": 3240 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007928795857450259, + "loss": 1.9602, + "step": 3250 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007916993266184007, + "loss": 1.9681, + "step": 3260 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007905165983375379, + "loss": 2.0326, + "step": 3270 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007893314109139058, + "loss": 1.9958, + "step": 3280 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007881437743797882, + "loss": 2.0077, + "step": 3290 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007869536987882008, + "loss": 1.9813, + "step": 3300 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007857611942128044, + "loss": 1.9538, + "step": 3310 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007845662707478214, + "loss": 1.9919, + "step": 3320 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007833689385079485, + "loss": 1.9922, + "step": 3330 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007821692076282725, + "loss": 1.9973, + "step": 3340 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007809670882641842, + "loss": 2.0231, + "step": 3350 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007797625905912915, + "loss": 1.9971, + "step": 3360 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007785557248053351, + "loss": 1.9934, + "step": 3370 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007773465011221002, + "loss": 1.9855, + "step": 3380 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007761349297773315, + "loss": 2.0421, + "step": 3390 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007749210210266457, + "loss": 1.9795, + "step": 3400 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007737047851454451, + "loss": 2.0006, + "step": 3410 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007724862324288309, + "loss": 2.011, + "step": 3420 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007712653731915147, + "loss": 1.9969, + "step": 3430 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007700422177677331, + "loss": 1.9581, + "step": 3440 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007688167765111592, + "loss": 1.9858, + "step": 3450 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007675890597948141, + "loss": 1.9945, + "step": 3460 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007663590780109814, + "loss": 2.0116, + "step": 3470 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007651268415711168, + "loss": 1.9831, + "step": 3480 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007638923609057616, + "loss": 2.0113, + "step": 3490 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007626556464644538, + "loss": 1.9927, + "step": 3500 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007614167087156393, + "loss": 2.0209, + "step": 3510 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007601755581465844, + "loss": 1.9941, + "step": 3520 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007589322052632855, + "loss": 2.0443, + "step": 3530 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007576866605903812, + "loss": 1.975, + "step": 3540 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007564389346710638, + "loss": 1.9655, + "step": 3550 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007551890380669879, + "loss": 2.0034, + "step": 3560 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007539369813581836, + "loss": 1.953, + "step": 3570 + }, + { + "epoch": 0.66, + "learning_rate": 0.000752682775142965, + "loss": 2.0162, + "step": 3580 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007514264300378411, + "loss": 2.0096, + "step": 3590 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007501679566774267, + "loss": 2.0431, + "step": 3600 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007489073657143506, + "loss": 1.961, + "step": 3610 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007476446678191676, + "loss": 2.0179, + "step": 3620 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007463798736802665, + "loss": 1.9885, + "step": 3630 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007451129940037804, + "loss": 1.9955, + "step": 3640 + }, + { + "epoch": 0.68, + "learning_rate": 0.000743844039513496, + "loss": 1.9671, + "step": 3650 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007425730209507622, + "loss": 1.9866, + "step": 3660 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007412999490744008, + "loss": 1.9508, + "step": 3670 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007400248346606129, + "loss": 2.0261, + "step": 3680 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007387476885028902, + "loss": 1.9946, + "step": 3690 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007374685214119221, + "loss": 1.969, + "step": 3700 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007361873442155049, + "loss": 1.9802, + "step": 3710 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007349041677584496, + "loss": 1.9739, + "step": 3720 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007336190029024907, + "loss": 1.964, + "step": 3730 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007323318605261933, + "loss": 2.0009, + "step": 3740 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007310427515248626, + "loss": 1.9825, + "step": 3750 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007297516868104501, + "loss": 1.9744, + "step": 3760 + }, + { + "epoch": 0.7, + "learning_rate": 0.000728458677311462, + "loss": 2.0197, + "step": 3770 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007271637339728667, + "loss": 2.0016, + "step": 3780 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007258668677560019, + "loss": 1.9721, + "step": 3790 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007245680896384818, + "loss": 1.9591, + "step": 3800 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007232674106141048, + "loss": 1.9762, + "step": 3810 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007219648416927592, + "loss": 2.0026, + "step": 3820 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007206603939003314, + "loss": 1.9876, + "step": 3830 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007193540782786117, + "loss": 1.9991, + "step": 3840 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007180459058852011, + "loss": 1.9897, + "step": 3850 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007167358877934176, + "loss": 2.0581, + "step": 3860 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007154240350922025, + "loss": 1.9588, + "step": 3870 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007141103588860265, + "loss": 2.0151, + "step": 3880 + }, + { + "epoch": 0.72, + "learning_rate": 0.000712794870294796, + "loss": 1.9494, + "step": 3890 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007114775804537586, + "loss": 1.9936, + "step": 3900 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007101585005134088, + "loss": 2.0016, + "step": 3910 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007088376416393944, + "loss": 1.9628, + "step": 3920 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007075150150124208, + "loss": 1.9955, + "step": 3930 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007061906318281568, + "loss": 1.9731, + "step": 3940 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007048645032971407, + "loss": 1.9554, + "step": 3950 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007035366406446839, + "loss": 1.985, + "step": 3960 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007022070551107774, + "loss": 1.9961, + "step": 3970 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007008757579499954, + "loss": 2.0112, + "step": 3980 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006995427604314004, + "loss": 2.0086, + "step": 3990 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006982080738384487, + "loss": 2.019, + "step": 4000 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006968717094688933, + "loss": 1.9983, + "step": 4010 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006955336786346898, + "loss": 1.981, + "step": 4020 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006941939926618997, + "loss": 1.9878, + "step": 4030 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006928526628905942, + "loss": 2.0067, + "step": 4040 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006915097006747601, + "loss": 2.035, + "step": 4050 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006901651173822013, + "loss": 1.9614, + "step": 4060 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006888189243944439, + "loss": 1.9655, + "step": 4070 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006874711331066401, + "loss": 1.9692, + "step": 4080 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006861217549274705, + "loss": 1.9791, + "step": 4090 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006847708012790492, + "loss": 1.9804, + "step": 4100 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006834182835968253, + "loss": 1.9973, + "step": 4110 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006820642133294876, + "loss": 2.0153, + "step": 4120 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006807086019388669, + "loss": 1.9639, + "step": 4130 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006793514608998393, + "loss": 2.0162, + "step": 4140 + }, + { + "epoch": 0.77, + "learning_rate": 0.000677992801700229, + "loss": 1.994, + "step": 4150 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006766326358407104, + "loss": 1.9992, + "step": 4160 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006752709748347125, + "loss": 1.976, + "step": 4170 + }, + { + "epoch": 0.77, + "learning_rate": 0.000673907830208319, + "loss": 1.9452, + "step": 4180 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006725432135001732, + "loss": 1.9982, + "step": 4190 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006711771362613785, + "loss": 1.9766, + "step": 4200 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006698096100554014, + "loss": 1.9838, + "step": 4210 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006684406464579735, + "loss": 1.9746, + "step": 4220 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006670702570569937, + "loss": 1.9838, + "step": 4230 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006656984534524296, + "loss": 1.9747, + "step": 4240 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006643252472562201, + "loss": 1.9896, + "step": 4250 + }, + { + "epoch": 0.79, + "learning_rate": 0.000662950650092176, + "loss": 1.9607, + "step": 4260 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006615746735958832, + "loss": 2.0075, + "step": 4270 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006603351250463683, + "loss": 1.9918, + "step": 4280 + }, + { + "epoch": 0.79, + "learning_rate": 0.000658956559916577, + "loss": 1.9669, + "step": 4290 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006575766492634068, + "loss": 1.9645, + "step": 4300 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006561954047674206, + "loss": 1.9511, + "step": 4310 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006548128381204714, + "loss": 1.9934, + "step": 4320 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006534289610256039, + "loss": 1.9973, + "step": 4330 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006520437851969557, + "loss": 1.9983, + "step": 4340 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006506573223596575, + "loss": 1.9906, + "step": 4350 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006492695842497347, + "loss": 1.9392, + "step": 4360 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006478805826140066, + "loss": 2.0015, + "step": 4370 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006464903292099886, + "loss": 2.0168, + "step": 4380 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006450988358057919, + "loss": 1.9676, + "step": 4390 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006437061141800238, + "loss": 1.9798, + "step": 4400 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006423121761216881, + "loss": 1.9753, + "step": 4410 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006409170334300858, + "loss": 1.9965, + "step": 4420 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006395206979147141, + "loss": 1.9532, + "step": 4430 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006381231813951678, + "loss": 1.9962, + "step": 4440 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006367244957010379, + "loss": 1.9758, + "step": 4450 + }, + { + "epoch": 0.83, + "learning_rate": 0.000635324652671813, + "loss": 1.9606, + "step": 4460 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006339236641567774, + "loss": 1.9785, + "step": 4470 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006325215420149119, + "loss": 1.9334, + "step": 4480 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006311182981147935, + "loss": 1.9829, + "step": 4490 + }, + { + "epoch": 0.83, + "learning_rate": 0.000629713944334494, + "loss": 1.9671, + "step": 4500 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006283084925614805, + "loss": 2.0108, + "step": 4510 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006269019546925139, + "loss": 1.9341, + "step": 4520 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006254943426335488, + "loss": 1.9378, + "step": 4530 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006240856682996326, + "loss": 1.9619, + "step": 4540 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006226759436148044, + "loss": 1.9516, + "step": 4550 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006212651805119946, + "loss": 1.9882, + "step": 4560 + }, + { + "epoch": 0.85, + "learning_rate": 0.000619853390932923, + "loss": 1.9636, + "step": 4570 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006184405868279985, + "loss": 1.9894, + "step": 4580 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006170267801562176, + "loss": 1.9365, + "step": 4590 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006156119828850633, + "loss": 2.0264, + "step": 4600 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006141962069904041, + "loss": 1.9659, + "step": 4610 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006127794644563915, + "loss": 1.9368, + "step": 4620 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006113617672753598, + "loss": 1.959, + "step": 4630 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006099431274477245, + "loss": 1.9832, + "step": 4640 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006085235569818795, + "loss": 1.9572, + "step": 4650 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006071030678940969, + "loss": 1.99, + "step": 4660 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006056816722084248, + "loss": 1.9963, + "step": 4670 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006042593819565846, + "loss": 1.9997, + "step": 4680 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006028362091778706, + "loss": 1.9221, + "step": 4690 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006014121659190476, + "loss": 1.9623, + "step": 4700 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005999872642342484, + "loss": 1.9949, + "step": 4710 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005985615161848721, + "loss": 1.9688, + "step": 4720 + }, + { + "epoch": 0.88, + "learning_rate": 0.000597134933839482, + "loss": 1.975, + "step": 4730 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005957075292737042, + "loss": 2.0048, + "step": 4740 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005942793145701235, + "loss": 1.9591, + "step": 4750 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005928503018181833, + "loss": 1.9957, + "step": 4760 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005914205031140819, + "loss": 1.9823, + "step": 4770 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005899899305606703, + "loss": 2.0032, + "step": 4780 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005885585962673501, + "loss": 1.9722, + "step": 4790 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005871265123499708, + "loss": 1.9903, + "step": 4800 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005856936909307273, + "loss": 2.0258, + "step": 4810 + }, + { + "epoch": 0.89, + "learning_rate": 0.000584260144138057, + "loss": 2.0444, + "step": 4820 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005828258841065377, + "loss": 1.968, + "step": 4830 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005813909229767846, + "loss": 1.9598, + "step": 4840 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005799552728953472, + "loss": 2.0047, + "step": 4850 + }, + { + "epoch": 0.9, + "learning_rate": 0.000578518946014607, + "loss": 1.939, + "step": 4860 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005770819544926741, + "loss": 1.9835, + "step": 4870 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005756443104932852, + "loss": 2.028, + "step": 4880 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005742060261856996, + "loss": 1.973, + "step": 4890 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005727671137445967, + "loss": 1.9734, + "step": 4900 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005713275853499729, + "loss": 1.9921, + "step": 4910 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005698874531870386, + "loss": 1.9607, + "step": 4920 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005684467294461146, + "loss": 1.9468, + "step": 4930 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005670054263225297, + "loss": 1.9524, + "step": 4940 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005655635560165166, + "loss": 1.9737, + "step": 4950 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005641211307331093, + "loss": 1.9532, + "step": 4960 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005626781626820395, + "loss": 2.0048, + "step": 4970 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005612346640776331, + "loss": 2.0276, + "step": 4980 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005597906471387074, + "loss": 1.9476, + "step": 4990 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005583461240884666, + "loss": 1.943, + "step": 5000 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005569011071543997, + "loss": 1.9859, + "step": 5010 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005554556085681757, + "loss": 1.9607, + "step": 5020 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005540096405655409, + "loss": 1.9825, + "step": 5030 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005525632153862152, + "loss": 1.9875, + "step": 5040 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005511163452737884, + "loss": 2.0051, + "step": 5050 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005496690424756164, + "loss": 2.0089, + "step": 5060 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005482213192427174, + "loss": 1.9495, + "step": 5070 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005467731878296688, + "loss": 1.9701, + "step": 5080 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005453246604945034, + "loss": 1.9588, + "step": 5090 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005438757494986044, + "loss": 1.9833, + "step": 5100 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005424264671066038, + "loss": 1.9974, + "step": 5110 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005409768255862766, + "loss": 1.9746, + "step": 5120 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005395268372084378, + "loss": 1.9757, + "step": 5130 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005380765142468387, + "loss": 1.9908, + "step": 5140 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005366258689780625, + "loss": 2.006, + "step": 5150 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005351749136814208, + "loss": 1.9957, + "step": 5160 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005337236606388495, + "loss": 1.959, + "step": 5170 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005322721221348047, + "loss": 2.0027, + "step": 5180 + }, + { + "epoch": 0.96, + "learning_rate": 0.000530820310456159, + "loss": 1.9248, + "step": 5190 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005293682378920974, + "loss": 1.9742, + "step": 5200 + }, + { + "epoch": 0.96, + "learning_rate": 0.000527915916734013, + "loss": 1.9844, + "step": 5210 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005264633592754035, + "loss": 1.9985, + "step": 5220 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005250105778117661, + "loss": 2.0074, + "step": 5230 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005235575846404952, + "loss": 1.9901, + "step": 5240 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005221043920607763, + "loss": 1.9861, + "step": 5250 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005206510123734837, + "loss": 1.9576, + "step": 5260 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005191974578810746, + "loss": 1.9741, + "step": 5270 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005177437408874868, + "loss": 1.9794, + "step": 5280 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005162898736980327, + "loss": 1.9883, + "step": 5290 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005148358686192967, + "loss": 1.969, + "step": 5300 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005133817379590302, + "loss": 2.0018, + "step": 5310 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005119274940260476, + "loss": 1.971, + "step": 5320 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005104731491301225, + "loss": 1.9564, + "step": 5330 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005090187155818823, + "loss": 1.9798, + "step": 5340 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005075642056927057, + "loss": 2.0331, + "step": 5350 + }, + { + "epoch": 0.99, + "learning_rate": 0.000506109631774617, + "loss": 1.9505, + "step": 5360 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005046550061401825, + "loss": 1.9348, + "step": 5370 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005032003411024067, + "loss": 2.0099, + "step": 5380 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005017456489746275, + "loss": 1.9756, + "step": 5390 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005002909420704116, + "loss": 1.9444, + "step": 5400 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004988362327034516, + "loss": 1.976, + "step": 5410 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004973815331874603, + "loss": 1.9593, + "step": 5420 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004959268558360675, + "loss": 1.9251, + "step": 5430 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004944722129627151, + "loss": 1.972, + "step": 5440 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004930176168805531, + "loss": 1.9307, + "step": 5450 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004915630799023359, + "loss": 1.9541, + "step": 5460 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004901086143403172, + "loss": 1.9212, + "step": 5470 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004886542325061464, + "loss": 1.965, + "step": 5480 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004871999467107639, + "loss": 2.0083, + "step": 5490 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004857457692642974, + "loss": 1.9676, + "step": 5500 + }, + { + "epoch": 1.02, + "learning_rate": 0.000484291712475957, + "loss": 1.9384, + "step": 5510 + }, + { + "epoch": 1.02, + "learning_rate": 0.00048283778865393243, + "loss": 1.9339, + "step": 5520 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004813840101052869, + "loss": 2.0182, + "step": 5530 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004799303891358545, + "loss": 1.9262, + "step": 5540 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004784769380501352, + "loss": 1.9397, + "step": 5550 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004770236691511908, + "loss": 1.9404, + "step": 5560 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004755705947405417, + "loss": 1.9415, + "step": 5570 + }, + { + "epoch": 1.03, + "learning_rate": 0.00047411772711806105, + "loss": 1.9292, + "step": 5580 + }, + { + "epoch": 1.04, + "learning_rate": 0.000472665078581872, + "loss": 1.9487, + "step": 5590 + }, + { + "epoch": 1.04, + "learning_rate": 0.00047121266142824354, + "loss": 1.9435, + "step": 5600 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004697604879514853, + "loss": 1.9145, + "step": 5610 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004683085704438451, + "loss": 1.9975, + "step": 5620 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046685692119540357, + "loss": 1.9696, + "step": 5630 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046540555249397056, + "loss": 1.9598, + "step": 5640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046395447662498117, + "loss": 1.9366, + "step": 5650 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046250370587139206, + "loss": 1.9748, + "step": 5660 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046105325251357695, + "loss": 1.9125, + "step": 5670 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045960312882922306, + "loss": 1.9595, + "step": 5680 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045815334709322665, + "loss": 1.9369, + "step": 5690 + }, + { + "epoch": 1.06, + "learning_rate": 0.0004567039195775899, + "loss": 1.9564, + "step": 5700 + }, + { + "epoch": 1.06, + "learning_rate": 0.000455254858551316, + "loss": 1.9274, + "step": 5710 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045380617628030693, + "loss": 1.9366, + "step": 5720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045235788502725777, + "loss": 1.9446, + "step": 5730 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045090999705155383, + "loss": 1.9236, + "step": 5740 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004494625246091672, + "loss": 1.9397, + "step": 5750 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044801547995255194, + "loss": 1.9849, + "step": 5760 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044656887533054193, + "loss": 1.9367, + "step": 5770 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004451227229882455, + "loss": 1.9451, + "step": 5780 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004436770351669429, + "loss": 1.9578, + "step": 5790 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004422318241039821, + "loss": 1.9095, + "step": 5800 + }, + { + "epoch": 1.08, + "learning_rate": 0.00044078710203267576, + "loss": 1.9337, + "step": 5810 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004393428811821971, + "loss": 1.9904, + "step": 5820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043789917377747695, + "loss": 1.9569, + "step": 5830 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004364559920390996, + "loss": 1.9423, + "step": 5840 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043501334818320004, + "loss": 2.0013, + "step": 5850 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004335712544213597, + "loss": 1.9585, + "step": 5860 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004321297229605044, + "loss": 1.9148, + "step": 5870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00043068876600279964, + "loss": 1.9558, + "step": 5880 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004292483957455482, + "loss": 1.9899, + "step": 5890 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042780862438108655, + "loss": 1.9597, + "step": 5900 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042636946409668123, + "loss": 1.9603, + "step": 5910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042493092707442717, + "loss": 1.9771, + "step": 5920 + }, + { + "epoch": 1.1, + "learning_rate": 0.0004234930254911427, + "loss": 1.9416, + "step": 5930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042205577151826747, + "loss": 1.9417, + "step": 5940 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042061917732175966, + "loss": 1.9636, + "step": 5950 + }, + { + "epoch": 1.1, + "learning_rate": 0.000419183255061992, + "loss": 1.966, + "step": 5960 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004177480168936504, + "loss": 1.9885, + "step": 5970 + }, + { + "epoch": 1.11, + "learning_rate": 0.00041631347496562913, + "loss": 1.9525, + "step": 5980 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004148796414209297, + "loss": 1.9809, + "step": 5990 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004134465283965568, + "loss": 1.8982, + "step": 6000 + } + ], + "max_steps": 10798, + "num_train_epochs": 2, + "total_flos": 5.693111667768951e+18, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-6000/training_args.bin b/checkpoint-6000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b097aab2293da043bc99abba38a0ed7c4525140a --- /dev/null +++ b/checkpoint-6000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8813832b030b0a678cb3ad0abd28db5000bdb8bb1708e45ba10cfda908fcc38 +size 3305 diff --git a/checkpoint-7000/README.md b/checkpoint-7000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/checkpoint-7000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/checkpoint-7000/adapter_config.json b/checkpoint-7000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c700a5d161022cf91737dcca4d31f37c02bb25 --- /dev/null +++ b/checkpoint-7000/adapter_config.json @@ -0,0 +1,19 @@ +{ + "base_model_name_or_path": "chatglm2-6b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "query_key_value" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/checkpoint-7000/adapter_model.bin b/checkpoint-7000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a909a3b27506abecd4d395ef9d94f532015465c --- /dev/null +++ b/checkpoint-7000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea269ac3ab9dd0426746da50d0b2d67b41aaec93957ae21627b7f4353bd1a79a +size 7819417 diff --git a/checkpoint-7000/finetuning_args.json b/checkpoint-7000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f28e18016479196fd772d484c058dd17ca8c6a --- /dev/null +++ b/checkpoint-7000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "query_key_value" + ], + "name_module_trainable": "mlp", + "num_layer_trainable": 3, + "pre_seq_len": 64, + "prefix_projection": false +} diff --git a/checkpoint-7000/optimizer.pt b/checkpoint-7000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..9928cd5f6912e12ad746cd484d204141ff1b5c93 --- /dev/null +++ b/checkpoint-7000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf3332174a372f6b7093ac01816f0144597f5367c9958a65af11ec5dd97db95a +size 15644485 diff --git a/checkpoint-7000/rng_state_0.pth b/checkpoint-7000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..a65c522f6194f2777086acf9cbc9d675a89ad2c4 --- /dev/null +++ b/checkpoint-7000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05bb33129498e599dd13f7d01121f0a9b1c866f16d8b4d9b8ff79df607cfae8a +size 18679 diff --git a/checkpoint-7000/rng_state_1.pth b/checkpoint-7000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..81e7c788a00f590e7d0c3c3291d313b2417c05d5 --- /dev/null +++ b/checkpoint-7000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa58058633b27efd1a8e0970f4770c742adccd1a5b30e1e8aaa8e05a61f8516 +size 18679 diff --git a/checkpoint-7000/rng_state_2.pth b/checkpoint-7000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7008aabbba0f534682de370960626c6cd2f0cc8 --- /dev/null +++ b/checkpoint-7000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d602e6d4371bacfc4d5c0d547815e244632c06ed02997b3f64503ff944e6f8b3 +size 18679 diff --git a/checkpoint-7000/rng_state_3.pth b/checkpoint-7000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..883b8c100f7a1c71c8359f0e932bd1c99d14fee9 --- /dev/null +++ b/checkpoint-7000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0200b65d6e51ebf8f243c883c47dec4a3316c3942bc124ecff5b126b42cbede8 +size 18679 diff --git a/checkpoint-7000/scheduler.pt b/checkpoint-7000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..c807b10927767ad5e585fc9eae0c4ef9cbf77fb9 --- /dev/null +++ b/checkpoint-7000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1156ef2323b023466187426932639c600c3d200ad5610ea37f6f38534683f0e4 +size 627 diff --git a/checkpoint-7000/trainer_state.json b/checkpoint-7000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..276e46368772abe9609d7a455676583be43f4566 --- /dev/null +++ b/checkpoint-7000/trainer_state.json @@ -0,0 +1,4216 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.29653639562882, + "global_step": 7000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0009999978838190456, + "loss": 2.9794, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0009999915352940948, + "loss": 2.3885, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999980954478887, + "loss": 2.3057, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999966141462985, + "loss": 2.2692, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999947096371777, + "loss": 2.2576, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009999238193664748, + "loss": 2.2388, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998963106441117, + "loss": 2.2523, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998645704375414, + "loss": 2.218, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999828599015436, + "loss": 2.2457, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997883966822835, + "loss": 2.198, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997439637783859, + "loss": 2.2013, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999695300679855, + "loss": 2.1765, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009996424077986109, + "loss": 2.1741, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999585285582377, + "loss": 2.1898, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009995239345146772, + "loss": 2.1466, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009994583551148314, + "loss": 2.1423, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009993885479379506, + "loss": 2.1451, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999314513574934, + "loss": 2.202, + "step": 180 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009992362526524616, + "loss": 2.1208, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009991537658329906, + "loss": 2.1591, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 0.000999067053814749, + "loss": 2.1788, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009989761173317304, + "loss": 2.147, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998880957153687, + "loss": 2.1249, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998781574086123, + "loss": 2.165, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 0.000998677968970289, + "loss": 2.1428, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009985701426831735, + "loss": 2.1384, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009984580961374964, + "loss": 2.1585, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009983418302817008, + "loss": 2.1156, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009982213460999448, + "loss": 2.0811, + "step": 290 + }, + { + "epoch": 0.06, + "learning_rate": 0.000998096644612094, + "loss": 2.1081, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009979677268737118, + "loss": 2.1246, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009978345939760515, + "loss": 2.1229, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997697247046046, + "loss": 2.1033, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009975556872462994, + "loss": 2.0931, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997409915775076, + "loss": 2.1206, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009972599338662915, + "loss": 2.0537, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009971057427895012, + "loss": 2.0762, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009969473438498897, + "loss": 2.0883, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009967847383882604, + "loss": 2.1174, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009966179277810239, + "loss": 2.1111, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009964469134401855, + "loss": 2.1288, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009962716968133346, + "loss": 2.0967, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009960922793836318, + "loss": 2.1216, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009959086626697955, + "loss": 2.0924, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009957208482260908, + "loss": 2.0809, + "step": 450 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009955288376423152, + "loss": 2.1082, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009953326325437852, + "loss": 2.0885, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009951322345913224, + "loss": 2.1133, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009949276454812408, + "loss": 2.0844, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00099471886694533, + "loss": 2.0796, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009945059007508434, + "loss": 2.1255, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009942887487004804, + "loss": 2.0913, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009940674126323733, + "loss": 2.1003, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009938418944200709, + "loss": 2.0541, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009936121959725223, + "loss": 2.0523, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009933783192340618, + "loss": 2.1225, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009931402661843911, + "loss": 2.0446, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 0.000992898038838564, + "loss": 2.0921, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009926516392469674, + "loss": 2.1081, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009924010694953064, + "loss": 2.0734, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009921463317045843, + "loss": 2.0652, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009918874280310862, + "loss": 2.0818, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009916243606663605, + "loss": 2.0776, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009913571318371994, + "loss": 2.1025, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009910857438056215, + "loss": 2.066, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009908101988688512, + "loss": 2.0575, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009905304993593008, + "loss": 2.1269, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009902466476445486, + "loss": 2.0518, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009899586461273218, + "loss": 2.0698, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 0.000989666497245473, + "loss": 2.0988, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009893702034719624, + "loss": 2.0986, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009890697673148345, + "loss": 2.0237, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009887651913171986, + "loss": 2.0027, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009884564780572064, + "loss": 2.0563, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009881436301480305, + "loss": 2.0624, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987826650237842, + "loss": 2.0926, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987505541009788, + "loss": 2.0585, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009871803051819696, + "loss": 2.0494, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009868509455074183, + "loss": 2.0106, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009865174647740729, + "loss": 2.0861, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009861798658047556, + "loss": 2.0478, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009858381514571484, + "loss": 2.0469, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 0.000985492324623769, + "loss": 2.0671, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009851423882319458, + "loss": 2.0808, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009847883452437937, + "loss": 2.0331, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009844301986561893, + "loss": 2.0295, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 0.000984067951500744, + "loss": 2.0873, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 0.00098370160684378, + "loss": 2.1038, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009833311677863042, + "loss": 2.0337, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009829566374639801, + "loss": 2.0407, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009825780190471042, + "loss": 2.1049, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 0.000982195315740576, + "loss": 2.0475, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009818085307838741, + "loss": 2.0624, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 0.000981417667451026, + "loss": 2.0714, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009810227290505816, + "loss": 2.0947, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009806237189255859, + "loss": 2.0591, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009802206404535489, + "loss": 2.0301, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 0.000979813497046419, + "loss": 2.0556, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009794022921505523, + "loss": 2.0753, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 0.000978987029246685, + "loss": 2.0898, + "step": 1000 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009785677118499029, + "loss": 2.0464, + "step": 1010 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009781443435096116, + "loss": 2.0828, + "step": 1020 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009777169278095074, + "loss": 2.1137, + "step": 1030 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009772854683675462, + "loss": 2.0167, + "step": 1040 + }, + { + "epoch": 0.19, + "learning_rate": 0.000976849968835913, + "loss": 2.07, + "step": 1050 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009764104329009909, + "loss": 2.0409, + "step": 1060 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009759668642833304, + "loss": 2.015, + "step": 1070 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009755192667376173, + "loss": 2.0175, + "step": 1080 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009750676440526411, + "loss": 2.0773, + "step": 1090 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009746120000512632, + "loss": 2.0245, + "step": 1100 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009741523385903841, + "loss": 2.094, + "step": 1110 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009736886635609112, + "loss": 2.0506, + "step": 1120 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009732209788877258, + "loss": 2.0287, + "step": 1130 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009727492885296489, + "loss": 2.1162, + "step": 1140 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009722735964794099, + "loss": 2.1096, + "step": 1150 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009717939067636099, + "loss": 2.0621, + "step": 1160 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009713102234426903, + "loss": 2.0796, + "step": 1170 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009708225506108965, + "loss": 2.0565, + "step": 1180 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009703308923962447, + "loss": 2.0669, + "step": 1190 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009698352529604857, + "loss": 2.0638, + "step": 1200 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009693356364990705, + "loss": 2.0358, + "step": 1210 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009688320472411143, + "loss": 2.0859, + "step": 1220 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009683244894493613, + "loss": 2.0932, + "step": 1230 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009678129674201479, + "loss": 2.0129, + "step": 1240 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009672974854833669, + "loss": 2.055, + "step": 1250 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009667780480024304, + "loss": 2.0665, + "step": 1260 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009662546593742334, + "loss": 2.0488, + "step": 1270 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009657273240291159, + "loss": 2.0543, + "step": 1280 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009651960464308261, + "loss": 2.0418, + "step": 1290 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009646608310764819, + "loss": 2.033, + "step": 1300 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009641216824965338, + "loss": 2.1034, + "step": 1310 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009635786052547253, + "loss": 2.0866, + "step": 1320 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009630316039480556, + "loss": 2.0607, + "step": 1330 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009624806832067394, + "loss": 2.0457, + "step": 1340 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009619258476941686, + "loss": 2.032, + "step": 1350 + }, + { + "epoch": 0.25, + "learning_rate": 0.000961367102106873, + "loss": 2.0519, + "step": 1360 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009608044511744791, + "loss": 2.0449, + "step": 1370 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009602378996596721, + "loss": 1.9949, + "step": 1380 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009596674523581539, + "loss": 2.0394, + "step": 1390 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009590931140986035, + "loss": 2.0386, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009585148897426354, + "loss": 2.0254, + "step": 1410 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009579327841847593, + "loss": 2.0238, + "step": 1420 + }, + { + "epoch": 0.26, + "learning_rate": 0.000957346802352338, + "loss": 2.0509, + "step": 1430 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009567569492055456, + "loss": 2.0004, + "step": 1440 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009561632297373263, + "loss": 2.0203, + "step": 1450 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009555656489733513, + "loss": 2.0182, + "step": 1460 + }, + { + "epoch": 0.27, + "learning_rate": 0.000954964211971977, + "loss": 1.9754, + "step": 1470 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009543589238242012, + "loss": 2.0374, + "step": 1480 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953749789653621, + "loss": 2.0367, + "step": 1490 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953136814616389, + "loss": 2.0866, + "step": 1500 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009525200039011694, + "loss": 2.0083, + "step": 1510 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009518993627290948, + "loss": 2.0525, + "step": 1520 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009512748963537212, + "loss": 2.0636, + "step": 1530 + }, + { + "epoch": 0.29, + "learning_rate": 0.000950646610060984, + "loss": 2.0522, + "step": 1540 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009500145091691532, + "loss": 2.05, + "step": 1550 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009493785990287882, + "loss": 1.9887, + "step": 1560 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009487388850226926, + "loss": 2.0309, + "step": 1570 + }, + { + "epoch": 0.29, + "learning_rate": 0.000948095372565869, + "loss": 1.9954, + "step": 1580 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009474480671054726, + "loss": 2.0078, + "step": 1590 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009467969741207652, + "loss": 2.0395, + "step": 1600 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009461420991230693, + "loss": 2.0415, + "step": 1610 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009454834476557207, + "loss": 2.0308, + "step": 1620 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009448210252940223, + "loss": 2.0826, + "step": 1630 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009441548376451963, + "loss": 2.0424, + "step": 1640 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009434848903483373, + "loss": 2.0125, + "step": 1650 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009428111890743639, + "loss": 2.0139, + "step": 1660 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009421337395259717, + "loss": 2.0682, + "step": 1670 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009414525474375837, + "loss": 2.0577, + "step": 1680 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009407676185753029, + "loss": 2.0262, + "step": 1690 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009400789587368632, + "loss": 2.0515, + "step": 1700 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009393865737515794, + "loss": 2.0398, + "step": 1710 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009386904694802997, + "loss": 2.0146, + "step": 1720 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009379906518153543, + "loss": 2.0438, + "step": 1730 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009372871266805063, + "loss": 2.0377, + "step": 1740 + }, + { + "epoch": 0.32, + "learning_rate": 0.000936579900030902, + "loss": 2.0789, + "step": 1750 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009358689778530193, + "loss": 2.0201, + "step": 1760 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009351543661646185, + "loss": 2.0114, + "step": 1770 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009344360710146898, + "loss": 2.0242, + "step": 1780 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009337140984834034, + "loss": 2.0436, + "step": 1790 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009329884546820572, + "loss": 2.0452, + "step": 1800 + }, + { + "epoch": 0.34, + "learning_rate": 0.000932259145753026, + "loss": 2.0254, + "step": 1810 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009315261778697083, + "loss": 2.0409, + "step": 1820 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009307895572364746, + "loss": 2.0301, + "step": 1830 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009300492900886154, + "loss": 2.0078, + "step": 1840 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009293053826922873, + "loss": 1.9851, + "step": 1850 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009285578413444613, + "loss": 1.9947, + "step": 1860 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009278066723728682, + "loss": 2.0331, + "step": 1870 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009270518821359461, + "loss": 2.0058, + "step": 1880 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009262934770227858, + "loss": 2.05, + "step": 1890 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009255314634530771, + "loss": 2.0444, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009247658478770543, + "loss": 2.0045, + "step": 1910 + }, + { + "epoch": 0.36, + "learning_rate": 0.000923996636775442, + "loss": 2.0211, + "step": 1920 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009232238366593997, + "loss": 2.0124, + "step": 1930 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009224474540704671, + "loss": 2.0067, + "step": 1940 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009216674955805079, + "loss": 2.0247, + "step": 1950 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009208839677916557, + "loss": 2.0314, + "step": 1960 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009200968773362568, + "loss": 2.067, + "step": 1970 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009193062308768145, + "loss": 2.0168, + "step": 1980 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009185120351059326, + "loss": 2.0649, + "step": 1990 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009177142967462591, + "loss": 2.0208, + "step": 2000 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009169130225504289, + "loss": 2.016, + "step": 2010 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009161082193010066, + "loss": 2.0331, + "step": 2020 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009152998938104296, + "loss": 2.0757, + "step": 2030 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009144880529209498, + "loss": 2.0093, + "step": 2040 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009136727035045765, + "loss": 1.954, + "step": 2050 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009128538524630167, + "loss": 2.0062, + "step": 2060 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009120315067276187, + "loss": 2.0179, + "step": 2070 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009112056732593119, + "loss": 2.0301, + "step": 2080 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009103763590485488, + "loss": 2.0223, + "step": 2090 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009095435711152449, + "loss": 2.0208, + "step": 2100 + }, + { + "epoch": 0.39, + "learning_rate": 0.00090870731650872, + "loss": 2.0492, + "step": 2110 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009078676023076385, + "loss": 1.9917, + "step": 2120 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009070244356199492, + "loss": 2.0235, + "step": 2130 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009061778235828253, + "loss": 2.01, + "step": 2140 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009054129328980229, + "loss": 1.9999, + "step": 2150 + }, + { + "epoch": 0.4, + "learning_rate": 0.000904559794464287, + "loss": 2.0022, + "step": 2160 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009037032315436229, + "loss": 2.0004, + "step": 2170 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009028432513865994, + "loss": 1.9936, + "step": 2180 + }, + { + "epoch": 0.41, + "learning_rate": 0.000901979861272711, + "loss": 2.0098, + "step": 2190 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009011130685103166, + "loss": 1.9829, + "step": 2200 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009002428804365775, + "loss": 2.0135, + "step": 2210 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008993693044173954, + "loss": 2.0526, + "step": 2220 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008984923478473499, + "loss": 2.0145, + "step": 2230 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008976120181496365, + "loss": 2.0364, + "step": 2240 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008967283227760028, + "loss": 2.019, + "step": 2250 + }, + { + "epoch": 0.42, + "learning_rate": 0.000895841269206686, + "loss": 1.9874, + "step": 2260 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008949508649503495, + "loss": 2.0699, + "step": 2270 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008940571175440196, + "loss": 2.0407, + "step": 2280 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008931600345530213, + "loss": 2.0176, + "step": 2290 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008922596235709142, + "loss": 2.0235, + "step": 2300 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008913558922194287, + "loss": 2.0268, + "step": 2310 + }, + { + "epoch": 0.43, + "learning_rate": 0.000890448848148401, + "loss": 2.0279, + "step": 2320 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008895384990357087, + "loss": 2.0073, + "step": 2330 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008886248525872056, + "loss": 2.0262, + "step": 2340 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008877079165366566, + "loss": 2.0112, + "step": 2350 + }, + { + "epoch": 0.44, + "learning_rate": 0.000886787698645672, + "loss": 2.042, + "step": 2360 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008858642067036424, + "loss": 2.0129, + "step": 2370 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008849374485276715, + "loss": 2.0264, + "step": 2380 + }, + { + "epoch": 0.44, + "learning_rate": 0.000884007431962512, + "loss": 2.0211, + "step": 2390 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008830741648804967, + "loss": 2.0175, + "step": 2400 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008821376551814739, + "loss": 2.0423, + "step": 2410 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008811979107927396, + "loss": 2.0112, + "step": 2420 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008802549396689705, + "loss": 2.0422, + "step": 2430 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008793087497921566, + "loss": 2.0075, + "step": 2440 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008784544334882426, + "loss": 1.9958, + "step": 2450 + }, + { + "epoch": 0.46, + "learning_rate": 0.000877502150068553, + "loss": 2.0348, + "step": 2460 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008765466711974225, + "loss": 2.0232, + "step": 2470 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008755880049627157, + "loss": 1.9953, + "step": 2480 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008746261594792776, + "loss": 2.0223, + "step": 2490 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008736611428888644, + "loss": 2.0332, + "step": 2500 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008726929633600753, + "loss": 2.0075, + "step": 2510 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008717216290882824, + "loss": 2.002, + "step": 2520 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008707471482955622, + "loss": 2.0594, + "step": 2530 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008697695292306253, + "loss": 2.0214, + "step": 2540 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008687887801687473, + "loss": 1.994, + "step": 2550 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008678049094116979, + "loss": 2.0338, + "step": 2560 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008668179252876714, + "loss": 2.0176, + "step": 2570 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008658278361512161, + "loss": 2.0013, + "step": 2580 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008648346503831627, + "loss": 2.0141, + "step": 2590 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008638383763905546, + "loss": 1.9655, + "step": 2600 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008628390226065761, + "loss": 2.039, + "step": 2610 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008618365974904808, + "loss": 1.9418, + "step": 2620 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008608311095275205, + "loss": 2.011, + "step": 2630 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008598225672288731, + "loss": 2.0174, + "step": 2640 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008588109791315707, + "loss": 1.984, + "step": 2650 + }, + { + "epoch": 0.49, + "learning_rate": 0.000857796353798427, + "loss": 2.0437, + "step": 2660 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008567786998179654, + "loss": 2.0255, + "step": 2670 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008557580258043459, + "loss": 2.0067, + "step": 2680 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008547343403972918, + "loss": 2.0201, + "step": 2690 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008537076522620175, + "loss": 2.0258, + "step": 2700 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008526779700891545, + "loss": 1.9977, + "step": 2710 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008516453025946781, + "loss": 1.9835, + "step": 2720 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008506096585198333, + "loss": 2.0428, + "step": 2730 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008495710466310613, + "loss": 1.9554, + "step": 2740 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008485294757199248, + "loss": 2.0497, + "step": 2750 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008474849546030339, + "loss": 2.001, + "step": 2760 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008464374921219714, + "loss": 1.9824, + "step": 2770 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008453870971432179, + "loss": 2.0378, + "step": 2780 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008443337785580769, + "loss": 1.9756, + "step": 2790 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008432775452825992, + "loss": 2.0563, + "step": 2800 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008422184062575077, + "loss": 2.0115, + "step": 2810 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008411563704481217, + "loss": 2.0301, + "step": 2820 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008400914468442814, + "loss": 1.9912, + "step": 2830 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008390236444602706, + "loss": 2.0669, + "step": 2840 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008379529723347417, + "loss": 2.0138, + "step": 2850 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008368794395306386, + "loss": 2.0486, + "step": 2860 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008358030551351199, + "loss": 2.0342, + "step": 2870 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008347238282594823, + "loss": 2.0474, + "step": 2880 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008336417680390829, + "loss": 2.006, + "step": 2890 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008325568836332633, + "loss": 1.99, + "step": 2900 + }, + { + "epoch": 0.54, + "learning_rate": 0.00083146918422527, + "loss": 2.0148, + "step": 2910 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008303786790221778, + "loss": 2.0381, + "step": 2920 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008292853772548126, + "loss": 2.0591, + "step": 2930 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008281892881776714, + "loss": 2.0238, + "step": 2940 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008270904210688459, + "loss": 1.9939, + "step": 2950 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008259887852299427, + "loss": 1.9941, + "step": 2960 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008248843899860045, + "loss": 2.0193, + "step": 2970 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008237772446854325, + "loss": 2.0166, + "step": 2980 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008226673586999058, + "loss": 2.0219, + "step": 2990 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008215547414243025, + "loss": 2.0078, + "step": 3000 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008204394022766208, + "loss": 2.0022, + "step": 3010 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008193213506978983, + "loss": 2.0009, + "step": 3020 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008182005961521331, + "loss": 2.0197, + "step": 3030 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008170771481262027, + "loss": 2.0101, + "step": 3040 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008159510161297846, + "loss": 2.0307, + "step": 3050 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008148222096952748, + "loss": 2.0075, + "step": 3060 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008136907383777081, + "loss": 2.0415, + "step": 3070 + }, + { + "epoch": 0.57, + "learning_rate": 0.000812556611754677, + "loss": 2.0031, + "step": 3080 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008114198394262497, + "loss": 2.0025, + "step": 3090 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008102804310148905, + "loss": 1.983, + "step": 3100 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008091383961653765, + "loss": 2.0056, + "step": 3110 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008079937445447175, + "loss": 1.9679, + "step": 3120 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008068464858420732, + "loss": 1.9897, + "step": 3130 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008056966297686717, + "loss": 1.9833, + "step": 3140 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008045441860577273, + "loss": 2.0088, + "step": 3150 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008033891644643576, + "loss": 1.9985, + "step": 3160 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008022315747655011, + "loss": 2.013, + "step": 3170 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008010714267598354, + "loss": 1.9902, + "step": 3180 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007999087302676926, + "loss": 2.0133, + "step": 3190 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007987434951309774, + "loss": 2.0092, + "step": 3200 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007975757312130836, + "loss": 1.9894, + "step": 3210 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007964054483988103, + "loss": 1.9742, + "step": 3220 + }, + { + "epoch": 0.6, + "learning_rate": 0.000795232656594278, + "loss": 2.016, + "step": 3230 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007940573657268458, + "loss": 2.0386, + "step": 3240 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007928795857450259, + "loss": 1.9602, + "step": 3250 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007916993266184007, + "loss": 1.9681, + "step": 3260 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007905165983375379, + "loss": 2.0326, + "step": 3270 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007893314109139058, + "loss": 1.9958, + "step": 3280 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007881437743797882, + "loss": 2.0077, + "step": 3290 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007869536987882008, + "loss": 1.9813, + "step": 3300 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007857611942128044, + "loss": 1.9538, + "step": 3310 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007845662707478214, + "loss": 1.9919, + "step": 3320 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007833689385079485, + "loss": 1.9922, + "step": 3330 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007821692076282725, + "loss": 1.9973, + "step": 3340 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007809670882641842, + "loss": 2.0231, + "step": 3350 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007797625905912915, + "loss": 1.9971, + "step": 3360 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007785557248053351, + "loss": 1.9934, + "step": 3370 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007773465011221002, + "loss": 1.9855, + "step": 3380 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007761349297773315, + "loss": 2.0421, + "step": 3390 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007749210210266457, + "loss": 1.9795, + "step": 3400 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007737047851454451, + "loss": 2.0006, + "step": 3410 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007724862324288309, + "loss": 2.011, + "step": 3420 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007712653731915147, + "loss": 1.9969, + "step": 3430 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007700422177677331, + "loss": 1.9581, + "step": 3440 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007688167765111592, + "loss": 1.9858, + "step": 3450 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007675890597948141, + "loss": 1.9945, + "step": 3460 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007663590780109814, + "loss": 2.0116, + "step": 3470 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007651268415711168, + "loss": 1.9831, + "step": 3480 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007638923609057616, + "loss": 2.0113, + "step": 3490 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007626556464644538, + "loss": 1.9927, + "step": 3500 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007614167087156393, + "loss": 2.0209, + "step": 3510 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007601755581465844, + "loss": 1.9941, + "step": 3520 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007589322052632855, + "loss": 2.0443, + "step": 3530 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007576866605903812, + "loss": 1.975, + "step": 3540 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007564389346710638, + "loss": 1.9655, + "step": 3550 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007551890380669879, + "loss": 2.0034, + "step": 3560 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007539369813581836, + "loss": 1.953, + "step": 3570 + }, + { + "epoch": 0.66, + "learning_rate": 0.000752682775142965, + "loss": 2.0162, + "step": 3580 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007514264300378411, + "loss": 2.0096, + "step": 3590 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007501679566774267, + "loss": 2.0431, + "step": 3600 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007489073657143506, + "loss": 1.961, + "step": 3610 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007476446678191676, + "loss": 2.0179, + "step": 3620 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007463798736802665, + "loss": 1.9885, + "step": 3630 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007451129940037804, + "loss": 1.9955, + "step": 3640 + }, + { + "epoch": 0.68, + "learning_rate": 0.000743844039513496, + "loss": 1.9671, + "step": 3650 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007425730209507622, + "loss": 1.9866, + "step": 3660 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007412999490744008, + "loss": 1.9508, + "step": 3670 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007400248346606129, + "loss": 2.0261, + "step": 3680 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007387476885028902, + "loss": 1.9946, + "step": 3690 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007374685214119221, + "loss": 1.969, + "step": 3700 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007361873442155049, + "loss": 1.9802, + "step": 3710 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007349041677584496, + "loss": 1.9739, + "step": 3720 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007336190029024907, + "loss": 1.964, + "step": 3730 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007323318605261933, + "loss": 2.0009, + "step": 3740 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007310427515248626, + "loss": 1.9825, + "step": 3750 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007297516868104501, + "loss": 1.9744, + "step": 3760 + }, + { + "epoch": 0.7, + "learning_rate": 0.000728458677311462, + "loss": 2.0197, + "step": 3770 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007271637339728667, + "loss": 2.0016, + "step": 3780 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007258668677560019, + "loss": 1.9721, + "step": 3790 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007245680896384818, + "loss": 1.9591, + "step": 3800 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007232674106141048, + "loss": 1.9762, + "step": 3810 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007219648416927592, + "loss": 2.0026, + "step": 3820 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007206603939003314, + "loss": 1.9876, + "step": 3830 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007193540782786117, + "loss": 1.9991, + "step": 3840 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007180459058852011, + "loss": 1.9897, + "step": 3850 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007167358877934176, + "loss": 2.0581, + "step": 3860 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007154240350922025, + "loss": 1.9588, + "step": 3870 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007141103588860265, + "loss": 2.0151, + "step": 3880 + }, + { + "epoch": 0.72, + "learning_rate": 0.000712794870294796, + "loss": 1.9494, + "step": 3890 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007114775804537586, + "loss": 1.9936, + "step": 3900 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007101585005134088, + "loss": 2.0016, + "step": 3910 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007088376416393944, + "loss": 1.9628, + "step": 3920 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007075150150124208, + "loss": 1.9955, + "step": 3930 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007061906318281568, + "loss": 1.9731, + "step": 3940 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007048645032971407, + "loss": 1.9554, + "step": 3950 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007035366406446839, + "loss": 1.985, + "step": 3960 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007022070551107774, + "loss": 1.9961, + "step": 3970 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007008757579499954, + "loss": 2.0112, + "step": 3980 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006995427604314004, + "loss": 2.0086, + "step": 3990 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006982080738384487, + "loss": 2.019, + "step": 4000 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006968717094688933, + "loss": 1.9983, + "step": 4010 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006955336786346898, + "loss": 1.981, + "step": 4020 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006941939926618997, + "loss": 1.9878, + "step": 4030 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006928526628905942, + "loss": 2.0067, + "step": 4040 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006915097006747601, + "loss": 2.035, + "step": 4050 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006901651173822013, + "loss": 1.9614, + "step": 4060 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006888189243944439, + "loss": 1.9655, + "step": 4070 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006874711331066401, + "loss": 1.9692, + "step": 4080 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006861217549274705, + "loss": 1.9791, + "step": 4090 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006847708012790492, + "loss": 1.9804, + "step": 4100 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006834182835968253, + "loss": 1.9973, + "step": 4110 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006820642133294876, + "loss": 2.0153, + "step": 4120 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006807086019388669, + "loss": 1.9639, + "step": 4130 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006793514608998393, + "loss": 2.0162, + "step": 4140 + }, + { + "epoch": 0.77, + "learning_rate": 0.000677992801700229, + "loss": 1.994, + "step": 4150 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006766326358407104, + "loss": 1.9992, + "step": 4160 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006752709748347125, + "loss": 1.976, + "step": 4170 + }, + { + "epoch": 0.77, + "learning_rate": 0.000673907830208319, + "loss": 1.9452, + "step": 4180 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006725432135001732, + "loss": 1.9982, + "step": 4190 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006711771362613785, + "loss": 1.9766, + "step": 4200 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006698096100554014, + "loss": 1.9838, + "step": 4210 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006684406464579735, + "loss": 1.9746, + "step": 4220 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006670702570569937, + "loss": 1.9838, + "step": 4230 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006656984534524296, + "loss": 1.9747, + "step": 4240 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006643252472562201, + "loss": 1.9896, + "step": 4250 + }, + { + "epoch": 0.79, + "learning_rate": 0.000662950650092176, + "loss": 1.9607, + "step": 4260 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006615746735958832, + "loss": 2.0075, + "step": 4270 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006603351250463683, + "loss": 1.9918, + "step": 4280 + }, + { + "epoch": 0.79, + "learning_rate": 0.000658956559916577, + "loss": 1.9669, + "step": 4290 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006575766492634068, + "loss": 1.9645, + "step": 4300 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006561954047674206, + "loss": 1.9511, + "step": 4310 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006548128381204714, + "loss": 1.9934, + "step": 4320 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006534289610256039, + "loss": 1.9973, + "step": 4330 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006520437851969557, + "loss": 1.9983, + "step": 4340 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006506573223596575, + "loss": 1.9906, + "step": 4350 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006492695842497347, + "loss": 1.9392, + "step": 4360 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006478805826140066, + "loss": 2.0015, + "step": 4370 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006464903292099886, + "loss": 2.0168, + "step": 4380 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006450988358057919, + "loss": 1.9676, + "step": 4390 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006437061141800238, + "loss": 1.9798, + "step": 4400 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006423121761216881, + "loss": 1.9753, + "step": 4410 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006409170334300858, + "loss": 1.9965, + "step": 4420 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006395206979147141, + "loss": 1.9532, + "step": 4430 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006381231813951678, + "loss": 1.9962, + "step": 4440 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006367244957010379, + "loss": 1.9758, + "step": 4450 + }, + { + "epoch": 0.83, + "learning_rate": 0.000635324652671813, + "loss": 1.9606, + "step": 4460 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006339236641567774, + "loss": 1.9785, + "step": 4470 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006325215420149119, + "loss": 1.9334, + "step": 4480 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006311182981147935, + "loss": 1.9829, + "step": 4490 + }, + { + "epoch": 0.83, + "learning_rate": 0.000629713944334494, + "loss": 1.9671, + "step": 4500 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006283084925614805, + "loss": 2.0108, + "step": 4510 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006269019546925139, + "loss": 1.9341, + "step": 4520 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006254943426335488, + "loss": 1.9378, + "step": 4530 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006240856682996326, + "loss": 1.9619, + "step": 4540 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006226759436148044, + "loss": 1.9516, + "step": 4550 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006212651805119946, + "loss": 1.9882, + "step": 4560 + }, + { + "epoch": 0.85, + "learning_rate": 0.000619853390932923, + "loss": 1.9636, + "step": 4570 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006184405868279985, + "loss": 1.9894, + "step": 4580 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006170267801562176, + "loss": 1.9365, + "step": 4590 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006156119828850633, + "loss": 2.0264, + "step": 4600 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006141962069904041, + "loss": 1.9659, + "step": 4610 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006127794644563915, + "loss": 1.9368, + "step": 4620 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006113617672753598, + "loss": 1.959, + "step": 4630 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006099431274477245, + "loss": 1.9832, + "step": 4640 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006085235569818795, + "loss": 1.9572, + "step": 4650 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006071030678940969, + "loss": 1.99, + "step": 4660 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006056816722084248, + "loss": 1.9963, + "step": 4670 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006042593819565846, + "loss": 1.9997, + "step": 4680 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006028362091778706, + "loss": 1.9221, + "step": 4690 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006014121659190476, + "loss": 1.9623, + "step": 4700 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005999872642342484, + "loss": 1.9949, + "step": 4710 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005985615161848721, + "loss": 1.9688, + "step": 4720 + }, + { + "epoch": 0.88, + "learning_rate": 0.000597134933839482, + "loss": 1.975, + "step": 4730 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005957075292737042, + "loss": 2.0048, + "step": 4740 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005942793145701235, + "loss": 1.9591, + "step": 4750 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005928503018181833, + "loss": 1.9957, + "step": 4760 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005914205031140819, + "loss": 1.9823, + "step": 4770 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005899899305606703, + "loss": 2.0032, + "step": 4780 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005885585962673501, + "loss": 1.9722, + "step": 4790 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005871265123499708, + "loss": 1.9903, + "step": 4800 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005856936909307273, + "loss": 2.0258, + "step": 4810 + }, + { + "epoch": 0.89, + "learning_rate": 0.000584260144138057, + "loss": 2.0444, + "step": 4820 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005828258841065377, + "loss": 1.968, + "step": 4830 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005813909229767846, + "loss": 1.9598, + "step": 4840 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005799552728953472, + "loss": 2.0047, + "step": 4850 + }, + { + "epoch": 0.9, + "learning_rate": 0.000578518946014607, + "loss": 1.939, + "step": 4860 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005770819544926741, + "loss": 1.9835, + "step": 4870 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005756443104932852, + "loss": 2.028, + "step": 4880 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005742060261856996, + "loss": 1.973, + "step": 4890 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005727671137445967, + "loss": 1.9734, + "step": 4900 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005713275853499729, + "loss": 1.9921, + "step": 4910 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005698874531870386, + "loss": 1.9607, + "step": 4920 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005684467294461146, + "loss": 1.9468, + "step": 4930 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005670054263225297, + "loss": 1.9524, + "step": 4940 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005655635560165166, + "loss": 1.9737, + "step": 4950 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005641211307331093, + "loss": 1.9532, + "step": 4960 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005626781626820395, + "loss": 2.0048, + "step": 4970 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005612346640776331, + "loss": 2.0276, + "step": 4980 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005597906471387074, + "loss": 1.9476, + "step": 4990 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005583461240884666, + "loss": 1.943, + "step": 5000 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005569011071543997, + "loss": 1.9859, + "step": 5010 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005554556085681757, + "loss": 1.9607, + "step": 5020 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005540096405655409, + "loss": 1.9825, + "step": 5030 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005525632153862152, + "loss": 1.9875, + "step": 5040 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005511163452737884, + "loss": 2.0051, + "step": 5050 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005496690424756164, + "loss": 2.0089, + "step": 5060 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005482213192427174, + "loss": 1.9495, + "step": 5070 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005467731878296688, + "loss": 1.9701, + "step": 5080 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005453246604945034, + "loss": 1.9588, + "step": 5090 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005438757494986044, + "loss": 1.9833, + "step": 5100 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005424264671066038, + "loss": 1.9974, + "step": 5110 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005409768255862766, + "loss": 1.9746, + "step": 5120 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005395268372084378, + "loss": 1.9757, + "step": 5130 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005380765142468387, + "loss": 1.9908, + "step": 5140 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005366258689780625, + "loss": 2.006, + "step": 5150 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005351749136814208, + "loss": 1.9957, + "step": 5160 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005337236606388495, + "loss": 1.959, + "step": 5170 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005322721221348047, + "loss": 2.0027, + "step": 5180 + }, + { + "epoch": 0.96, + "learning_rate": 0.000530820310456159, + "loss": 1.9248, + "step": 5190 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005293682378920974, + "loss": 1.9742, + "step": 5200 + }, + { + "epoch": 0.96, + "learning_rate": 0.000527915916734013, + "loss": 1.9844, + "step": 5210 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005264633592754035, + "loss": 1.9985, + "step": 5220 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005250105778117661, + "loss": 2.0074, + "step": 5230 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005235575846404952, + "loss": 1.9901, + "step": 5240 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005221043920607763, + "loss": 1.9861, + "step": 5250 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005206510123734837, + "loss": 1.9576, + "step": 5260 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005191974578810746, + "loss": 1.9741, + "step": 5270 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005177437408874868, + "loss": 1.9794, + "step": 5280 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005162898736980327, + "loss": 1.9883, + "step": 5290 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005148358686192967, + "loss": 1.969, + "step": 5300 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005133817379590302, + "loss": 2.0018, + "step": 5310 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005119274940260476, + "loss": 1.971, + "step": 5320 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005104731491301225, + "loss": 1.9564, + "step": 5330 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005090187155818823, + "loss": 1.9798, + "step": 5340 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005075642056927057, + "loss": 2.0331, + "step": 5350 + }, + { + "epoch": 0.99, + "learning_rate": 0.000506109631774617, + "loss": 1.9505, + "step": 5360 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005046550061401825, + "loss": 1.9348, + "step": 5370 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005032003411024067, + "loss": 2.0099, + "step": 5380 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005017456489746275, + "loss": 1.9756, + "step": 5390 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005002909420704116, + "loss": 1.9444, + "step": 5400 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004988362327034516, + "loss": 1.976, + "step": 5410 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004973815331874603, + "loss": 1.9593, + "step": 5420 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004959268558360675, + "loss": 1.9251, + "step": 5430 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004944722129627151, + "loss": 1.972, + "step": 5440 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004930176168805531, + "loss": 1.9307, + "step": 5450 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004915630799023359, + "loss": 1.9541, + "step": 5460 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004901086143403172, + "loss": 1.9212, + "step": 5470 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004886542325061464, + "loss": 1.965, + "step": 5480 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004871999467107639, + "loss": 2.0083, + "step": 5490 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004857457692642974, + "loss": 1.9676, + "step": 5500 + }, + { + "epoch": 1.02, + "learning_rate": 0.000484291712475957, + "loss": 1.9384, + "step": 5510 + }, + { + "epoch": 1.02, + "learning_rate": 0.00048283778865393243, + "loss": 1.9339, + "step": 5520 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004813840101052869, + "loss": 2.0182, + "step": 5530 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004799303891358545, + "loss": 1.9262, + "step": 5540 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004784769380501352, + "loss": 1.9397, + "step": 5550 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004770236691511908, + "loss": 1.9404, + "step": 5560 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004755705947405417, + "loss": 1.9415, + "step": 5570 + }, + { + "epoch": 1.03, + "learning_rate": 0.00047411772711806105, + "loss": 1.9292, + "step": 5580 + }, + { + "epoch": 1.04, + "learning_rate": 0.000472665078581872, + "loss": 1.9487, + "step": 5590 + }, + { + "epoch": 1.04, + "learning_rate": 0.00047121266142824354, + "loss": 1.9435, + "step": 5600 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004697604879514853, + "loss": 1.9145, + "step": 5610 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004683085704438451, + "loss": 1.9975, + "step": 5620 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046685692119540357, + "loss": 1.9696, + "step": 5630 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046540555249397056, + "loss": 1.9598, + "step": 5640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046395447662498117, + "loss": 1.9366, + "step": 5650 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046250370587139206, + "loss": 1.9748, + "step": 5660 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046105325251357695, + "loss": 1.9125, + "step": 5670 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045960312882922306, + "loss": 1.9595, + "step": 5680 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045815334709322665, + "loss": 1.9369, + "step": 5690 + }, + { + "epoch": 1.06, + "learning_rate": 0.0004567039195775899, + "loss": 1.9564, + "step": 5700 + }, + { + "epoch": 1.06, + "learning_rate": 0.000455254858551316, + "loss": 1.9274, + "step": 5710 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045380617628030693, + "loss": 1.9366, + "step": 5720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045235788502725777, + "loss": 1.9446, + "step": 5730 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045090999705155383, + "loss": 1.9236, + "step": 5740 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004494625246091672, + "loss": 1.9397, + "step": 5750 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044801547995255194, + "loss": 1.9849, + "step": 5760 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044656887533054193, + "loss": 1.9367, + "step": 5770 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004451227229882455, + "loss": 1.9451, + "step": 5780 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004436770351669429, + "loss": 1.9578, + "step": 5790 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004422318241039821, + "loss": 1.9095, + "step": 5800 + }, + { + "epoch": 1.08, + "learning_rate": 0.00044078710203267576, + "loss": 1.9337, + "step": 5810 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004393428811821971, + "loss": 1.9904, + "step": 5820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043789917377747695, + "loss": 1.9569, + "step": 5830 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004364559920390996, + "loss": 1.9423, + "step": 5840 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043501334818320004, + "loss": 2.0013, + "step": 5850 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004335712544213597, + "loss": 1.9585, + "step": 5860 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004321297229605044, + "loss": 1.9148, + "step": 5870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00043068876600279964, + "loss": 1.9558, + "step": 5880 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004292483957455482, + "loss": 1.9899, + "step": 5890 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042780862438108655, + "loss": 1.9597, + "step": 5900 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042636946409668123, + "loss": 1.9603, + "step": 5910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042493092707442717, + "loss": 1.9771, + "step": 5920 + }, + { + "epoch": 1.1, + "learning_rate": 0.0004234930254911427, + "loss": 1.9416, + "step": 5930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042205577151826747, + "loss": 1.9417, + "step": 5940 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042061917732175966, + "loss": 1.9636, + "step": 5950 + }, + { + "epoch": 1.1, + "learning_rate": 0.000419183255061992, + "loss": 1.966, + "step": 5960 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004177480168936504, + "loss": 1.9885, + "step": 5970 + }, + { + "epoch": 1.11, + "learning_rate": 0.00041631347496562913, + "loss": 1.9525, + "step": 5980 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004148796414209297, + "loss": 1.9809, + "step": 5990 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004134465283965568, + "loss": 1.8982, + "step": 6000 + }, + { + "epoch": 1.11, + "learning_rate": 0.00041201414802341643, + "loss": 1.8978, + "step": 6010 + }, + { + "epoch": 1.12, + "learning_rate": 0.00041058251242621295, + "loss": 1.9406, + "step": 6020 + }, + { + "epoch": 1.12, + "learning_rate": 0.0004091516337233464, + "loss": 1.919, + "step": 6030 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040772152402680973, + "loss": 1.9897, + "step": 6040 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040629219544208644, + "loss": 1.9473, + "step": 6050 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040486366006804817, + "loss": 1.9589, + "step": 6060 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040343592999685264, + "loss": 1.8972, + "step": 6070 + }, + { + "epoch": 1.13, + "learning_rate": 0.0004020090173138404, + "loss": 1.9611, + "step": 6080 + }, + { + "epoch": 1.13, + "learning_rate": 0.00040058293409743316, + "loss": 1.9164, + "step": 6090 + }, + { + "epoch": 1.13, + "learning_rate": 0.00039915769241903175, + "loss": 1.939, + "step": 6100 + }, + { + "epoch": 1.13, + "learning_rate": 0.0003977333043429129, + "loss": 1.9233, + "step": 6110 + }, + { + "epoch": 1.13, + "learning_rate": 0.0003963097819261288, + "loss": 1.9742, + "step": 6120 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003948871372184033, + "loss": 1.9719, + "step": 6130 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003934653822620309, + "loss": 1.9861, + "step": 6140 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003920445290917747, + "loss": 1.9514, + "step": 6150 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003906245897347643, + "loss": 2.0047, + "step": 6160 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003892055762103943, + "loss": 1.934, + "step": 6170 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003877875005302223, + "loss": 1.9619, + "step": 6180 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038637037469786727, + "loss": 1.9085, + "step": 6190 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038495421070890796, + "loss": 1.9222, + "step": 6200 + }, + { + "epoch": 1.15, + "learning_rate": 0.0003835390205507812, + "loss": 1.9409, + "step": 6210 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038212481620268125, + "loss": 1.9439, + "step": 6220 + }, + { + "epoch": 1.15, + "learning_rate": 0.000380711609635457, + "loss": 1.974, + "step": 6230 + }, + { + "epoch": 1.16, + "learning_rate": 0.000379299412811512, + "loss": 1.9141, + "step": 6240 + }, + { + "epoch": 1.16, + "learning_rate": 0.00037788823768470227, + "loss": 1.8982, + "step": 6250 + }, + { + "epoch": 1.16, + "learning_rate": 0.0003764780962002352, + "loss": 1.9384, + "step": 6260 + }, + { + "epoch": 1.16, + "learning_rate": 0.0003750690002945695, + "loss": 1.9174, + "step": 6270 + }, + { + "epoch": 1.16, + "learning_rate": 0.00037366096189531253, + "loss": 1.927, + "step": 6280 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003722539929211205, + "loss": 1.9449, + "step": 6290 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003708481052815973, + "loss": 2.008, + "step": 6300 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003694433108771933, + "loss": 1.9345, + "step": 6310 + }, + { + "epoch": 1.17, + "learning_rate": 0.00036803962159910543, + "loss": 1.8619, + "step": 6320 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003666370493291757, + "loss": 1.9612, + "step": 6330 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003652356059397909, + "loss": 1.9371, + "step": 6340 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036383530329378225, + "loss": 1.9193, + "step": 6350 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036243615324432494, + "loss": 1.9509, + "step": 6360 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036103816763483775, + "loss": 1.9517, + "step": 6370 + }, + { + "epoch": 1.18, + "learning_rate": 0.00035964135829888287, + "loss": 1.9141, + "step": 6380 + }, + { + "epoch": 1.18, + "learning_rate": 0.00035824573706006547, + "loss": 1.9985, + "step": 6390 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035685131573193386, + "loss": 1.9791, + "step": 6400 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035545810611787925, + "loss": 1.8865, + "step": 6410 + }, + { + "epoch": 1.19, + "learning_rate": 0.0003540661200110367, + "loss": 1.9409, + "step": 6420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035267536919418395, + "loss": 1.9928, + "step": 6430 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035128586543964243, + "loss": 1.9149, + "step": 6440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00034989762050917784, + "loss": 1.9837, + "step": 6450 + }, + { + "epoch": 1.2, + "learning_rate": 0.0003485106461538999, + "loss": 1.9142, + "step": 6460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034712495411416385, + "loss": 1.9284, + "step": 6470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034574055611946984, + "loss": 1.8848, + "step": 6480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034435746388836457, + "loss": 1.9295, + "step": 6490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034297568912834177, + "loss": 1.9635, + "step": 6500 + }, + { + "epoch": 1.21, + "learning_rate": 0.0003415952435357431, + "loss": 1.9794, + "step": 6510 + }, + { + "epoch": 1.21, + "learning_rate": 0.00034021613879565944, + "loss": 1.9347, + "step": 6520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00033883838658183154, + "loss": 1.9282, + "step": 6530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00033746199855655125, + "loss": 1.9973, + "step": 6540 + }, + { + "epoch": 1.21, + "learning_rate": 0.000336086986370563, + "loss": 1.9718, + "step": 6550 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003347133616629652, + "loss": 1.9157, + "step": 6560 + }, + { + "epoch": 1.22, + "learning_rate": 0.00033334113606111194, + "loss": 1.9528, + "step": 6570 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003319703211805135, + "loss": 1.9369, + "step": 6580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00033060092862473967, + "loss": 1.9552, + "step": 6590 + }, + { + "epoch": 1.22, + "learning_rate": 0.00032923296998532003, + "loss": 1.9581, + "step": 6600 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003278664568416465, + "loss": 1.9406, + "step": 6610 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003265014007608758, + "loss": 1.9672, + "step": 6620 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003251378132978304, + "loss": 1.9166, + "step": 6630 + }, + { + "epoch": 1.23, + "learning_rate": 0.00032377570599490164, + "loss": 1.9356, + "step": 6640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00032241509038195165, + "loss": 1.9092, + "step": 6650 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003210559779762157, + "loss": 1.9343, + "step": 6660 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031969838028220513, + "loss": 1.9796, + "step": 6670 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031834230879160947, + "loss": 1.8932, + "step": 6680 + }, + { + "epoch": 1.24, + "learning_rate": 0.0003169877749831993, + "loss": 1.9279, + "step": 6690 + }, + { + "epoch": 1.24, + "learning_rate": 0.000315634790322729, + "loss": 1.9444, + "step": 6700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031428336626284037, + "loss": 1.9296, + "step": 6710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031293351424296467, + "loss": 1.9341, + "step": 6720 + }, + { + "epoch": 1.25, + "learning_rate": 0.00031158524568922663, + "loss": 1.9589, + "step": 6730 + }, + { + "epoch": 1.25, + "learning_rate": 0.00031023857201434703, + "loss": 1.8997, + "step": 6740 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003088935046175466, + "loss": 1.9417, + "step": 6750 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003075500548844492, + "loss": 1.9058, + "step": 6760 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003062082341869862, + "loss": 1.9511, + "step": 6770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00030486805388329894, + "loss": 1.922, + "step": 6780 + }, + { + "epoch": 1.26, + "learning_rate": 0.00030352952531764363, + "loss": 1.9634, + "step": 6790 + }, + { + "epoch": 1.26, + "learning_rate": 0.0003021926598202949, + "loss": 1.9555, + "step": 6800 + }, + { + "epoch": 1.26, + "learning_rate": 0.0003008574687074498, + "loss": 1.9254, + "step": 6810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00029952396328113265, + "loss": 1.9211, + "step": 6820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029819215482909846, + "loss": 1.9504, + "step": 6830 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029686205462473784, + "loss": 1.9174, + "step": 6840 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029553367392698177, + "loss": 1.9368, + "step": 6850 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029420702398020595, + "loss": 1.8939, + "step": 6860 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029288211601413586, + "loss": 1.9097, + "step": 6870 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029155896124375156, + "loss": 1.9885, + "step": 6880 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002902375708691925, + "loss": 1.9752, + "step": 6890 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002889179560756634, + "loss": 1.9321, + "step": 6900 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002876001280333391, + "loss": 1.9345, + "step": 6910 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002862840978972698, + "loss": 1.9192, + "step": 6920 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002849698768072877, + "loss": 1.9499, + "step": 6930 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002836574758879107, + "loss": 1.9217, + "step": 6940 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002823469062482503, + "loss": 1.9318, + "step": 6950 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002810381789819167, + "loss": 1.9422, + "step": 6960 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002797313051669247, + "loss": 1.9562, + "step": 6970 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002784262958656003, + "loss": 1.9189, + "step": 6980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00027712316212448663, + "loss": 1.9453, + "step": 6990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027582191497425114, + "loss": 1.9335, + "step": 7000 + } + ], + "max_steps": 10798, + "num_train_epochs": 2, + "total_flos": 6.639684974406533e+18, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-7000/training_args.bin b/checkpoint-7000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b097aab2293da043bc99abba38a0ed7c4525140a --- /dev/null +++ b/checkpoint-7000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8813832b030b0a678cb3ad0abd28db5000bdb8bb1708e45ba10cfda908fcc38 +size 3305 diff --git a/checkpoint-8000/README.md b/checkpoint-8000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/checkpoint-8000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/checkpoint-8000/adapter_config.json b/checkpoint-8000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c700a5d161022cf91737dcca4d31f37c02bb25 --- /dev/null +++ b/checkpoint-8000/adapter_config.json @@ -0,0 +1,19 @@ +{ + "base_model_name_or_path": "chatglm2-6b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "query_key_value" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/checkpoint-8000/adapter_model.bin b/checkpoint-8000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..b0e91336e81b1a0119d9909816763f66014a54f7 --- /dev/null +++ b/checkpoint-8000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26cc12af751f07ff8b84d4edceba7fb7a751a5d1ef30167f9acc6a0994d038a1 +size 7819417 diff --git a/checkpoint-8000/finetuning_args.json b/checkpoint-8000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f28e18016479196fd772d484c058dd17ca8c6a --- /dev/null +++ b/checkpoint-8000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "query_key_value" + ], + "name_module_trainable": "mlp", + "num_layer_trainable": 3, + "pre_seq_len": 64, + "prefix_projection": false +} diff --git a/checkpoint-8000/optimizer.pt b/checkpoint-8000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..2062fd8047886e6a09c53c5b73d1632dc2406e13 --- /dev/null +++ b/checkpoint-8000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0edd07de468c1f9603fcc4e7063d83071db3975315372bc831641d45a56dbd8 +size 15644485 diff --git a/checkpoint-8000/rng_state_0.pth b/checkpoint-8000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..46c31753c8ac868ec139ad9b385674de1073f6f8 --- /dev/null +++ b/checkpoint-8000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26cb0683f50631a8ba754215237ee1ead097ed6406a88b2e2f8faac1294951f2 +size 18679 diff --git a/checkpoint-8000/rng_state_1.pth b/checkpoint-8000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..c4454546274b64c9cc4f3d886582c94e576b0f0e --- /dev/null +++ b/checkpoint-8000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ab9c3a4dfbe2559f167e865696cfcb1addf400a7cb328e576639572aba68a13 +size 18679 diff --git a/checkpoint-8000/rng_state_2.pth b/checkpoint-8000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..5459b393c4f00d56a25ba49daba24406ed3f3894 --- /dev/null +++ b/checkpoint-8000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e329103a2857e2f7a2869594ffacce86675d9d24903d36732025e65d7f4348f +size 18679 diff --git a/checkpoint-8000/rng_state_3.pth b/checkpoint-8000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..f0d6ad69b22f915ef5833f2d2b33f18ce0d61d30 --- /dev/null +++ b/checkpoint-8000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aee57679ab5cd990f494d4f975d408a4f4be8307ca380e080503899d788d5b6 +size 18679 diff --git a/checkpoint-8000/scheduler.pt b/checkpoint-8000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3aad7a022e28d8d559c17777a77efa4b732e3e5 --- /dev/null +++ b/checkpoint-8000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b53a0f3c7e5afe2de44dedf208ab9efc1639ae1ba0044b84cd5c11359049f2 +size 627 diff --git a/checkpoint-8000/trainer_state.json b/checkpoint-8000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..720ddab5ff49c20fa0cfd5445c755cf81b3f155e --- /dev/null +++ b/checkpoint-8000/trainer_state.json @@ -0,0 +1,4816 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.4817558807186515, + "global_step": 8000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0009999978838190456, + "loss": 2.9794, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0009999915352940948, + "loss": 2.3885, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999980954478887, + "loss": 2.3057, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999966141462985, + "loss": 2.2692, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999947096371777, + "loss": 2.2576, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009999238193664748, + "loss": 2.2388, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998963106441117, + "loss": 2.2523, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998645704375414, + "loss": 2.218, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999828599015436, + "loss": 2.2457, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997883966822835, + "loss": 2.198, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997439637783859, + "loss": 2.2013, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999695300679855, + "loss": 2.1765, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009996424077986109, + "loss": 2.1741, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999585285582377, + "loss": 2.1898, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009995239345146772, + "loss": 2.1466, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009994583551148314, + "loss": 2.1423, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009993885479379506, + "loss": 2.1451, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999314513574934, + "loss": 2.202, + "step": 180 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009992362526524616, + "loss": 2.1208, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009991537658329906, + "loss": 2.1591, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 0.000999067053814749, + "loss": 2.1788, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009989761173317304, + "loss": 2.147, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998880957153687, + "loss": 2.1249, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998781574086123, + "loss": 2.165, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 0.000998677968970289, + "loss": 2.1428, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009985701426831735, + "loss": 2.1384, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009984580961374964, + "loss": 2.1585, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009983418302817008, + "loss": 2.1156, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009982213460999448, + "loss": 2.0811, + "step": 290 + }, + { + "epoch": 0.06, + "learning_rate": 0.000998096644612094, + "loss": 2.1081, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009979677268737118, + "loss": 2.1246, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009978345939760515, + "loss": 2.1229, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997697247046046, + "loss": 2.1033, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009975556872462994, + "loss": 2.0931, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997409915775076, + "loss": 2.1206, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009972599338662915, + "loss": 2.0537, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009971057427895012, + "loss": 2.0762, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009969473438498897, + "loss": 2.0883, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009967847383882604, + "loss": 2.1174, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009966179277810239, + "loss": 2.1111, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009964469134401855, + "loss": 2.1288, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009962716968133346, + "loss": 2.0967, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009960922793836318, + "loss": 2.1216, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009959086626697955, + "loss": 2.0924, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009957208482260908, + "loss": 2.0809, + "step": 450 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009955288376423152, + "loss": 2.1082, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009953326325437852, + "loss": 2.0885, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009951322345913224, + "loss": 2.1133, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009949276454812408, + "loss": 2.0844, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00099471886694533, + "loss": 2.0796, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009945059007508434, + "loss": 2.1255, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009942887487004804, + "loss": 2.0913, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009940674126323733, + "loss": 2.1003, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009938418944200709, + "loss": 2.0541, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009936121959725223, + "loss": 2.0523, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009933783192340618, + "loss": 2.1225, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009931402661843911, + "loss": 2.0446, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 0.000992898038838564, + "loss": 2.0921, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009926516392469674, + "loss": 2.1081, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009924010694953064, + "loss": 2.0734, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009921463317045843, + "loss": 2.0652, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009918874280310862, + "loss": 2.0818, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009916243606663605, + "loss": 2.0776, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009913571318371994, + "loss": 2.1025, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009910857438056215, + "loss": 2.066, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009908101988688512, + "loss": 2.0575, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009905304993593008, + "loss": 2.1269, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009902466476445486, + "loss": 2.0518, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009899586461273218, + "loss": 2.0698, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 0.000989666497245473, + "loss": 2.0988, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009893702034719624, + "loss": 2.0986, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009890697673148345, + "loss": 2.0237, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009887651913171986, + "loss": 2.0027, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009884564780572064, + "loss": 2.0563, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009881436301480305, + "loss": 2.0624, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987826650237842, + "loss": 2.0926, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987505541009788, + "loss": 2.0585, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009871803051819696, + "loss": 2.0494, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009868509455074183, + "loss": 2.0106, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009865174647740729, + "loss": 2.0861, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009861798658047556, + "loss": 2.0478, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009858381514571484, + "loss": 2.0469, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 0.000985492324623769, + "loss": 2.0671, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009851423882319458, + "loss": 2.0808, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009847883452437937, + "loss": 2.0331, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009844301986561893, + "loss": 2.0295, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 0.000984067951500744, + "loss": 2.0873, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 0.00098370160684378, + "loss": 2.1038, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009833311677863042, + "loss": 2.0337, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009829566374639801, + "loss": 2.0407, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009825780190471042, + "loss": 2.1049, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 0.000982195315740576, + "loss": 2.0475, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009818085307838741, + "loss": 2.0624, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 0.000981417667451026, + "loss": 2.0714, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009810227290505816, + "loss": 2.0947, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009806237189255859, + "loss": 2.0591, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009802206404535489, + "loss": 2.0301, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 0.000979813497046419, + "loss": 2.0556, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009794022921505523, + "loss": 2.0753, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 0.000978987029246685, + "loss": 2.0898, + "step": 1000 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009785677118499029, + "loss": 2.0464, + "step": 1010 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009781443435096116, + "loss": 2.0828, + "step": 1020 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009777169278095074, + "loss": 2.1137, + "step": 1030 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009772854683675462, + "loss": 2.0167, + "step": 1040 + }, + { + "epoch": 0.19, + "learning_rate": 0.000976849968835913, + "loss": 2.07, + "step": 1050 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009764104329009909, + "loss": 2.0409, + "step": 1060 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009759668642833304, + "loss": 2.015, + "step": 1070 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009755192667376173, + "loss": 2.0175, + "step": 1080 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009750676440526411, + "loss": 2.0773, + "step": 1090 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009746120000512632, + "loss": 2.0245, + "step": 1100 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009741523385903841, + "loss": 2.094, + "step": 1110 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009736886635609112, + "loss": 2.0506, + "step": 1120 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009732209788877258, + "loss": 2.0287, + "step": 1130 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009727492885296489, + "loss": 2.1162, + "step": 1140 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009722735964794099, + "loss": 2.1096, + "step": 1150 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009717939067636099, + "loss": 2.0621, + "step": 1160 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009713102234426903, + "loss": 2.0796, + "step": 1170 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009708225506108965, + "loss": 2.0565, + "step": 1180 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009703308923962447, + "loss": 2.0669, + "step": 1190 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009698352529604857, + "loss": 2.0638, + "step": 1200 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009693356364990705, + "loss": 2.0358, + "step": 1210 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009688320472411143, + "loss": 2.0859, + "step": 1220 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009683244894493613, + "loss": 2.0932, + "step": 1230 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009678129674201479, + "loss": 2.0129, + "step": 1240 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009672974854833669, + "loss": 2.055, + "step": 1250 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009667780480024304, + "loss": 2.0665, + "step": 1260 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009662546593742334, + "loss": 2.0488, + "step": 1270 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009657273240291159, + "loss": 2.0543, + "step": 1280 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009651960464308261, + "loss": 2.0418, + "step": 1290 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009646608310764819, + "loss": 2.033, + "step": 1300 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009641216824965338, + "loss": 2.1034, + "step": 1310 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009635786052547253, + "loss": 2.0866, + "step": 1320 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009630316039480556, + "loss": 2.0607, + "step": 1330 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009624806832067394, + "loss": 2.0457, + "step": 1340 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009619258476941686, + "loss": 2.032, + "step": 1350 + }, + { + "epoch": 0.25, + "learning_rate": 0.000961367102106873, + "loss": 2.0519, + "step": 1360 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009608044511744791, + "loss": 2.0449, + "step": 1370 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009602378996596721, + "loss": 1.9949, + "step": 1380 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009596674523581539, + "loss": 2.0394, + "step": 1390 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009590931140986035, + "loss": 2.0386, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009585148897426354, + "loss": 2.0254, + "step": 1410 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009579327841847593, + "loss": 2.0238, + "step": 1420 + }, + { + "epoch": 0.26, + "learning_rate": 0.000957346802352338, + "loss": 2.0509, + "step": 1430 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009567569492055456, + "loss": 2.0004, + "step": 1440 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009561632297373263, + "loss": 2.0203, + "step": 1450 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009555656489733513, + "loss": 2.0182, + "step": 1460 + }, + { + "epoch": 0.27, + "learning_rate": 0.000954964211971977, + "loss": 1.9754, + "step": 1470 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009543589238242012, + "loss": 2.0374, + "step": 1480 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953749789653621, + "loss": 2.0367, + "step": 1490 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953136814616389, + "loss": 2.0866, + "step": 1500 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009525200039011694, + "loss": 2.0083, + "step": 1510 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009518993627290948, + "loss": 2.0525, + "step": 1520 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009512748963537212, + "loss": 2.0636, + "step": 1530 + }, + { + "epoch": 0.29, + "learning_rate": 0.000950646610060984, + "loss": 2.0522, + "step": 1540 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009500145091691532, + "loss": 2.05, + "step": 1550 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009493785990287882, + "loss": 1.9887, + "step": 1560 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009487388850226926, + "loss": 2.0309, + "step": 1570 + }, + { + "epoch": 0.29, + "learning_rate": 0.000948095372565869, + "loss": 1.9954, + "step": 1580 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009474480671054726, + "loss": 2.0078, + "step": 1590 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009467969741207652, + "loss": 2.0395, + "step": 1600 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009461420991230693, + "loss": 2.0415, + "step": 1610 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009454834476557207, + "loss": 2.0308, + "step": 1620 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009448210252940223, + "loss": 2.0826, + "step": 1630 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009441548376451963, + "loss": 2.0424, + "step": 1640 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009434848903483373, + "loss": 2.0125, + "step": 1650 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009428111890743639, + "loss": 2.0139, + "step": 1660 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009421337395259717, + "loss": 2.0682, + "step": 1670 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009414525474375837, + "loss": 2.0577, + "step": 1680 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009407676185753029, + "loss": 2.0262, + "step": 1690 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009400789587368632, + "loss": 2.0515, + "step": 1700 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009393865737515794, + "loss": 2.0398, + "step": 1710 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009386904694802997, + "loss": 2.0146, + "step": 1720 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009379906518153543, + "loss": 2.0438, + "step": 1730 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009372871266805063, + "loss": 2.0377, + "step": 1740 + }, + { + "epoch": 0.32, + "learning_rate": 0.000936579900030902, + "loss": 2.0789, + "step": 1750 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009358689778530193, + "loss": 2.0201, + "step": 1760 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009351543661646185, + "loss": 2.0114, + "step": 1770 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009344360710146898, + "loss": 2.0242, + "step": 1780 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009337140984834034, + "loss": 2.0436, + "step": 1790 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009329884546820572, + "loss": 2.0452, + "step": 1800 + }, + { + "epoch": 0.34, + "learning_rate": 0.000932259145753026, + "loss": 2.0254, + "step": 1810 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009315261778697083, + "loss": 2.0409, + "step": 1820 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009307895572364746, + "loss": 2.0301, + "step": 1830 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009300492900886154, + "loss": 2.0078, + "step": 1840 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009293053826922873, + "loss": 1.9851, + "step": 1850 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009285578413444613, + "loss": 1.9947, + "step": 1860 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009278066723728682, + "loss": 2.0331, + "step": 1870 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009270518821359461, + "loss": 2.0058, + "step": 1880 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009262934770227858, + "loss": 2.05, + "step": 1890 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009255314634530771, + "loss": 2.0444, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009247658478770543, + "loss": 2.0045, + "step": 1910 + }, + { + "epoch": 0.36, + "learning_rate": 0.000923996636775442, + "loss": 2.0211, + "step": 1920 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009232238366593997, + "loss": 2.0124, + "step": 1930 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009224474540704671, + "loss": 2.0067, + "step": 1940 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009216674955805079, + "loss": 2.0247, + "step": 1950 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009208839677916557, + "loss": 2.0314, + "step": 1960 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009200968773362568, + "loss": 2.067, + "step": 1970 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009193062308768145, + "loss": 2.0168, + "step": 1980 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009185120351059326, + "loss": 2.0649, + "step": 1990 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009177142967462591, + "loss": 2.0208, + "step": 2000 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009169130225504289, + "loss": 2.016, + "step": 2010 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009161082193010066, + "loss": 2.0331, + "step": 2020 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009152998938104296, + "loss": 2.0757, + "step": 2030 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009144880529209498, + "loss": 2.0093, + "step": 2040 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009136727035045765, + "loss": 1.954, + "step": 2050 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009128538524630167, + "loss": 2.0062, + "step": 2060 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009120315067276187, + "loss": 2.0179, + "step": 2070 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009112056732593119, + "loss": 2.0301, + "step": 2080 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009103763590485488, + "loss": 2.0223, + "step": 2090 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009095435711152449, + "loss": 2.0208, + "step": 2100 + }, + { + "epoch": 0.39, + "learning_rate": 0.00090870731650872, + "loss": 2.0492, + "step": 2110 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009078676023076385, + "loss": 1.9917, + "step": 2120 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009070244356199492, + "loss": 2.0235, + "step": 2130 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009061778235828253, + "loss": 2.01, + "step": 2140 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009054129328980229, + "loss": 1.9999, + "step": 2150 + }, + { + "epoch": 0.4, + "learning_rate": 0.000904559794464287, + "loss": 2.0022, + "step": 2160 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009037032315436229, + "loss": 2.0004, + "step": 2170 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009028432513865994, + "loss": 1.9936, + "step": 2180 + }, + { + "epoch": 0.41, + "learning_rate": 0.000901979861272711, + "loss": 2.0098, + "step": 2190 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009011130685103166, + "loss": 1.9829, + "step": 2200 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009002428804365775, + "loss": 2.0135, + "step": 2210 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008993693044173954, + "loss": 2.0526, + "step": 2220 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008984923478473499, + "loss": 2.0145, + "step": 2230 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008976120181496365, + "loss": 2.0364, + "step": 2240 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008967283227760028, + "loss": 2.019, + "step": 2250 + }, + { + "epoch": 0.42, + "learning_rate": 0.000895841269206686, + "loss": 1.9874, + "step": 2260 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008949508649503495, + "loss": 2.0699, + "step": 2270 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008940571175440196, + "loss": 2.0407, + "step": 2280 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008931600345530213, + "loss": 2.0176, + "step": 2290 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008922596235709142, + "loss": 2.0235, + "step": 2300 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008913558922194287, + "loss": 2.0268, + "step": 2310 + }, + { + "epoch": 0.43, + "learning_rate": 0.000890448848148401, + "loss": 2.0279, + "step": 2320 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008895384990357087, + "loss": 2.0073, + "step": 2330 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008886248525872056, + "loss": 2.0262, + "step": 2340 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008877079165366566, + "loss": 2.0112, + "step": 2350 + }, + { + "epoch": 0.44, + "learning_rate": 0.000886787698645672, + "loss": 2.042, + "step": 2360 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008858642067036424, + "loss": 2.0129, + "step": 2370 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008849374485276715, + "loss": 2.0264, + "step": 2380 + }, + { + "epoch": 0.44, + "learning_rate": 0.000884007431962512, + "loss": 2.0211, + "step": 2390 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008830741648804967, + "loss": 2.0175, + "step": 2400 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008821376551814739, + "loss": 2.0423, + "step": 2410 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008811979107927396, + "loss": 2.0112, + "step": 2420 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008802549396689705, + "loss": 2.0422, + "step": 2430 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008793087497921566, + "loss": 2.0075, + "step": 2440 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008784544334882426, + "loss": 1.9958, + "step": 2450 + }, + { + "epoch": 0.46, + "learning_rate": 0.000877502150068553, + "loss": 2.0348, + "step": 2460 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008765466711974225, + "loss": 2.0232, + "step": 2470 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008755880049627157, + "loss": 1.9953, + "step": 2480 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008746261594792776, + "loss": 2.0223, + "step": 2490 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008736611428888644, + "loss": 2.0332, + "step": 2500 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008726929633600753, + "loss": 2.0075, + "step": 2510 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008717216290882824, + "loss": 2.002, + "step": 2520 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008707471482955622, + "loss": 2.0594, + "step": 2530 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008697695292306253, + "loss": 2.0214, + "step": 2540 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008687887801687473, + "loss": 1.994, + "step": 2550 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008678049094116979, + "loss": 2.0338, + "step": 2560 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008668179252876714, + "loss": 2.0176, + "step": 2570 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008658278361512161, + "loss": 2.0013, + "step": 2580 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008648346503831627, + "loss": 2.0141, + "step": 2590 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008638383763905546, + "loss": 1.9655, + "step": 2600 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008628390226065761, + "loss": 2.039, + "step": 2610 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008618365974904808, + "loss": 1.9418, + "step": 2620 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008608311095275205, + "loss": 2.011, + "step": 2630 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008598225672288731, + "loss": 2.0174, + "step": 2640 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008588109791315707, + "loss": 1.984, + "step": 2650 + }, + { + "epoch": 0.49, + "learning_rate": 0.000857796353798427, + "loss": 2.0437, + "step": 2660 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008567786998179654, + "loss": 2.0255, + "step": 2670 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008557580258043459, + "loss": 2.0067, + "step": 2680 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008547343403972918, + "loss": 2.0201, + "step": 2690 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008537076522620175, + "loss": 2.0258, + "step": 2700 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008526779700891545, + "loss": 1.9977, + "step": 2710 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008516453025946781, + "loss": 1.9835, + "step": 2720 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008506096585198333, + "loss": 2.0428, + "step": 2730 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008495710466310613, + "loss": 1.9554, + "step": 2740 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008485294757199248, + "loss": 2.0497, + "step": 2750 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008474849546030339, + "loss": 2.001, + "step": 2760 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008464374921219714, + "loss": 1.9824, + "step": 2770 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008453870971432179, + "loss": 2.0378, + "step": 2780 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008443337785580769, + "loss": 1.9756, + "step": 2790 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008432775452825992, + "loss": 2.0563, + "step": 2800 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008422184062575077, + "loss": 2.0115, + "step": 2810 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008411563704481217, + "loss": 2.0301, + "step": 2820 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008400914468442814, + "loss": 1.9912, + "step": 2830 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008390236444602706, + "loss": 2.0669, + "step": 2840 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008379529723347417, + "loss": 2.0138, + "step": 2850 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008368794395306386, + "loss": 2.0486, + "step": 2860 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008358030551351199, + "loss": 2.0342, + "step": 2870 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008347238282594823, + "loss": 2.0474, + "step": 2880 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008336417680390829, + "loss": 2.006, + "step": 2890 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008325568836332633, + "loss": 1.99, + "step": 2900 + }, + { + "epoch": 0.54, + "learning_rate": 0.00083146918422527, + "loss": 2.0148, + "step": 2910 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008303786790221778, + "loss": 2.0381, + "step": 2920 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008292853772548126, + "loss": 2.0591, + "step": 2930 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008281892881776714, + "loss": 2.0238, + "step": 2940 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008270904210688459, + "loss": 1.9939, + "step": 2950 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008259887852299427, + "loss": 1.9941, + "step": 2960 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008248843899860045, + "loss": 2.0193, + "step": 2970 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008237772446854325, + "loss": 2.0166, + "step": 2980 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008226673586999058, + "loss": 2.0219, + "step": 2990 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008215547414243025, + "loss": 2.0078, + "step": 3000 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008204394022766208, + "loss": 2.0022, + "step": 3010 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008193213506978983, + "loss": 2.0009, + "step": 3020 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008182005961521331, + "loss": 2.0197, + "step": 3030 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008170771481262027, + "loss": 2.0101, + "step": 3040 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008159510161297846, + "loss": 2.0307, + "step": 3050 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008148222096952748, + "loss": 2.0075, + "step": 3060 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008136907383777081, + "loss": 2.0415, + "step": 3070 + }, + { + "epoch": 0.57, + "learning_rate": 0.000812556611754677, + "loss": 2.0031, + "step": 3080 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008114198394262497, + "loss": 2.0025, + "step": 3090 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008102804310148905, + "loss": 1.983, + "step": 3100 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008091383961653765, + "loss": 2.0056, + "step": 3110 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008079937445447175, + "loss": 1.9679, + "step": 3120 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008068464858420732, + "loss": 1.9897, + "step": 3130 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008056966297686717, + "loss": 1.9833, + "step": 3140 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008045441860577273, + "loss": 2.0088, + "step": 3150 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008033891644643576, + "loss": 1.9985, + "step": 3160 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008022315747655011, + "loss": 2.013, + "step": 3170 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008010714267598354, + "loss": 1.9902, + "step": 3180 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007999087302676926, + "loss": 2.0133, + "step": 3190 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007987434951309774, + "loss": 2.0092, + "step": 3200 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007975757312130836, + "loss": 1.9894, + "step": 3210 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007964054483988103, + "loss": 1.9742, + "step": 3220 + }, + { + "epoch": 0.6, + "learning_rate": 0.000795232656594278, + "loss": 2.016, + "step": 3230 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007940573657268458, + "loss": 2.0386, + "step": 3240 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007928795857450259, + "loss": 1.9602, + "step": 3250 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007916993266184007, + "loss": 1.9681, + "step": 3260 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007905165983375379, + "loss": 2.0326, + "step": 3270 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007893314109139058, + "loss": 1.9958, + "step": 3280 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007881437743797882, + "loss": 2.0077, + "step": 3290 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007869536987882008, + "loss": 1.9813, + "step": 3300 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007857611942128044, + "loss": 1.9538, + "step": 3310 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007845662707478214, + "loss": 1.9919, + "step": 3320 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007833689385079485, + "loss": 1.9922, + "step": 3330 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007821692076282725, + "loss": 1.9973, + "step": 3340 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007809670882641842, + "loss": 2.0231, + "step": 3350 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007797625905912915, + "loss": 1.9971, + "step": 3360 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007785557248053351, + "loss": 1.9934, + "step": 3370 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007773465011221002, + "loss": 1.9855, + "step": 3380 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007761349297773315, + "loss": 2.0421, + "step": 3390 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007749210210266457, + "loss": 1.9795, + "step": 3400 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007737047851454451, + "loss": 2.0006, + "step": 3410 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007724862324288309, + "loss": 2.011, + "step": 3420 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007712653731915147, + "loss": 1.9969, + "step": 3430 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007700422177677331, + "loss": 1.9581, + "step": 3440 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007688167765111592, + "loss": 1.9858, + "step": 3450 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007675890597948141, + "loss": 1.9945, + "step": 3460 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007663590780109814, + "loss": 2.0116, + "step": 3470 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007651268415711168, + "loss": 1.9831, + "step": 3480 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007638923609057616, + "loss": 2.0113, + "step": 3490 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007626556464644538, + "loss": 1.9927, + "step": 3500 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007614167087156393, + "loss": 2.0209, + "step": 3510 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007601755581465844, + "loss": 1.9941, + "step": 3520 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007589322052632855, + "loss": 2.0443, + "step": 3530 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007576866605903812, + "loss": 1.975, + "step": 3540 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007564389346710638, + "loss": 1.9655, + "step": 3550 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007551890380669879, + "loss": 2.0034, + "step": 3560 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007539369813581836, + "loss": 1.953, + "step": 3570 + }, + { + "epoch": 0.66, + "learning_rate": 0.000752682775142965, + "loss": 2.0162, + "step": 3580 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007514264300378411, + "loss": 2.0096, + "step": 3590 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007501679566774267, + "loss": 2.0431, + "step": 3600 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007489073657143506, + "loss": 1.961, + "step": 3610 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007476446678191676, + "loss": 2.0179, + "step": 3620 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007463798736802665, + "loss": 1.9885, + "step": 3630 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007451129940037804, + "loss": 1.9955, + "step": 3640 + }, + { + "epoch": 0.68, + "learning_rate": 0.000743844039513496, + "loss": 1.9671, + "step": 3650 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007425730209507622, + "loss": 1.9866, + "step": 3660 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007412999490744008, + "loss": 1.9508, + "step": 3670 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007400248346606129, + "loss": 2.0261, + "step": 3680 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007387476885028902, + "loss": 1.9946, + "step": 3690 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007374685214119221, + "loss": 1.969, + "step": 3700 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007361873442155049, + "loss": 1.9802, + "step": 3710 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007349041677584496, + "loss": 1.9739, + "step": 3720 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007336190029024907, + "loss": 1.964, + "step": 3730 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007323318605261933, + "loss": 2.0009, + "step": 3740 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007310427515248626, + "loss": 1.9825, + "step": 3750 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007297516868104501, + "loss": 1.9744, + "step": 3760 + }, + { + "epoch": 0.7, + "learning_rate": 0.000728458677311462, + "loss": 2.0197, + "step": 3770 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007271637339728667, + "loss": 2.0016, + "step": 3780 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007258668677560019, + "loss": 1.9721, + "step": 3790 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007245680896384818, + "loss": 1.9591, + "step": 3800 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007232674106141048, + "loss": 1.9762, + "step": 3810 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007219648416927592, + "loss": 2.0026, + "step": 3820 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007206603939003314, + "loss": 1.9876, + "step": 3830 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007193540782786117, + "loss": 1.9991, + "step": 3840 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007180459058852011, + "loss": 1.9897, + "step": 3850 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007167358877934176, + "loss": 2.0581, + "step": 3860 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007154240350922025, + "loss": 1.9588, + "step": 3870 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007141103588860265, + "loss": 2.0151, + "step": 3880 + }, + { + "epoch": 0.72, + "learning_rate": 0.000712794870294796, + "loss": 1.9494, + "step": 3890 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007114775804537586, + "loss": 1.9936, + "step": 3900 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007101585005134088, + "loss": 2.0016, + "step": 3910 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007088376416393944, + "loss": 1.9628, + "step": 3920 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007075150150124208, + "loss": 1.9955, + "step": 3930 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007061906318281568, + "loss": 1.9731, + "step": 3940 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007048645032971407, + "loss": 1.9554, + "step": 3950 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007035366406446839, + "loss": 1.985, + "step": 3960 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007022070551107774, + "loss": 1.9961, + "step": 3970 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007008757579499954, + "loss": 2.0112, + "step": 3980 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006995427604314004, + "loss": 2.0086, + "step": 3990 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006982080738384487, + "loss": 2.019, + "step": 4000 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006968717094688933, + "loss": 1.9983, + "step": 4010 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006955336786346898, + "loss": 1.981, + "step": 4020 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006941939926618997, + "loss": 1.9878, + "step": 4030 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006928526628905942, + "loss": 2.0067, + "step": 4040 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006915097006747601, + "loss": 2.035, + "step": 4050 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006901651173822013, + "loss": 1.9614, + "step": 4060 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006888189243944439, + "loss": 1.9655, + "step": 4070 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006874711331066401, + "loss": 1.9692, + "step": 4080 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006861217549274705, + "loss": 1.9791, + "step": 4090 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006847708012790492, + "loss": 1.9804, + "step": 4100 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006834182835968253, + "loss": 1.9973, + "step": 4110 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006820642133294876, + "loss": 2.0153, + "step": 4120 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006807086019388669, + "loss": 1.9639, + "step": 4130 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006793514608998393, + "loss": 2.0162, + "step": 4140 + }, + { + "epoch": 0.77, + "learning_rate": 0.000677992801700229, + "loss": 1.994, + "step": 4150 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006766326358407104, + "loss": 1.9992, + "step": 4160 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006752709748347125, + "loss": 1.976, + "step": 4170 + }, + { + "epoch": 0.77, + "learning_rate": 0.000673907830208319, + "loss": 1.9452, + "step": 4180 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006725432135001732, + "loss": 1.9982, + "step": 4190 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006711771362613785, + "loss": 1.9766, + "step": 4200 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006698096100554014, + "loss": 1.9838, + "step": 4210 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006684406464579735, + "loss": 1.9746, + "step": 4220 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006670702570569937, + "loss": 1.9838, + "step": 4230 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006656984534524296, + "loss": 1.9747, + "step": 4240 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006643252472562201, + "loss": 1.9896, + "step": 4250 + }, + { + "epoch": 0.79, + "learning_rate": 0.000662950650092176, + "loss": 1.9607, + "step": 4260 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006615746735958832, + "loss": 2.0075, + "step": 4270 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006603351250463683, + "loss": 1.9918, + "step": 4280 + }, + { + "epoch": 0.79, + "learning_rate": 0.000658956559916577, + "loss": 1.9669, + "step": 4290 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006575766492634068, + "loss": 1.9645, + "step": 4300 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006561954047674206, + "loss": 1.9511, + "step": 4310 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006548128381204714, + "loss": 1.9934, + "step": 4320 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006534289610256039, + "loss": 1.9973, + "step": 4330 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006520437851969557, + "loss": 1.9983, + "step": 4340 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006506573223596575, + "loss": 1.9906, + "step": 4350 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006492695842497347, + "loss": 1.9392, + "step": 4360 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006478805826140066, + "loss": 2.0015, + "step": 4370 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006464903292099886, + "loss": 2.0168, + "step": 4380 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006450988358057919, + "loss": 1.9676, + "step": 4390 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006437061141800238, + "loss": 1.9798, + "step": 4400 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006423121761216881, + "loss": 1.9753, + "step": 4410 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006409170334300858, + "loss": 1.9965, + "step": 4420 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006395206979147141, + "loss": 1.9532, + "step": 4430 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006381231813951678, + "loss": 1.9962, + "step": 4440 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006367244957010379, + "loss": 1.9758, + "step": 4450 + }, + { + "epoch": 0.83, + "learning_rate": 0.000635324652671813, + "loss": 1.9606, + "step": 4460 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006339236641567774, + "loss": 1.9785, + "step": 4470 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006325215420149119, + "loss": 1.9334, + "step": 4480 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006311182981147935, + "loss": 1.9829, + "step": 4490 + }, + { + "epoch": 0.83, + "learning_rate": 0.000629713944334494, + "loss": 1.9671, + "step": 4500 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006283084925614805, + "loss": 2.0108, + "step": 4510 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006269019546925139, + "loss": 1.9341, + "step": 4520 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006254943426335488, + "loss": 1.9378, + "step": 4530 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006240856682996326, + "loss": 1.9619, + "step": 4540 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006226759436148044, + "loss": 1.9516, + "step": 4550 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006212651805119946, + "loss": 1.9882, + "step": 4560 + }, + { + "epoch": 0.85, + "learning_rate": 0.000619853390932923, + "loss": 1.9636, + "step": 4570 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006184405868279985, + "loss": 1.9894, + "step": 4580 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006170267801562176, + "loss": 1.9365, + "step": 4590 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006156119828850633, + "loss": 2.0264, + "step": 4600 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006141962069904041, + "loss": 1.9659, + "step": 4610 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006127794644563915, + "loss": 1.9368, + "step": 4620 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006113617672753598, + "loss": 1.959, + "step": 4630 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006099431274477245, + "loss": 1.9832, + "step": 4640 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006085235569818795, + "loss": 1.9572, + "step": 4650 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006071030678940969, + "loss": 1.99, + "step": 4660 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006056816722084248, + "loss": 1.9963, + "step": 4670 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006042593819565846, + "loss": 1.9997, + "step": 4680 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006028362091778706, + "loss": 1.9221, + "step": 4690 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006014121659190476, + "loss": 1.9623, + "step": 4700 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005999872642342484, + "loss": 1.9949, + "step": 4710 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005985615161848721, + "loss": 1.9688, + "step": 4720 + }, + { + "epoch": 0.88, + "learning_rate": 0.000597134933839482, + "loss": 1.975, + "step": 4730 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005957075292737042, + "loss": 2.0048, + "step": 4740 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005942793145701235, + "loss": 1.9591, + "step": 4750 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005928503018181833, + "loss": 1.9957, + "step": 4760 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005914205031140819, + "loss": 1.9823, + "step": 4770 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005899899305606703, + "loss": 2.0032, + "step": 4780 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005885585962673501, + "loss": 1.9722, + "step": 4790 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005871265123499708, + "loss": 1.9903, + "step": 4800 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005856936909307273, + "loss": 2.0258, + "step": 4810 + }, + { + "epoch": 0.89, + "learning_rate": 0.000584260144138057, + "loss": 2.0444, + "step": 4820 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005828258841065377, + "loss": 1.968, + "step": 4830 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005813909229767846, + "loss": 1.9598, + "step": 4840 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005799552728953472, + "loss": 2.0047, + "step": 4850 + }, + { + "epoch": 0.9, + "learning_rate": 0.000578518946014607, + "loss": 1.939, + "step": 4860 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005770819544926741, + "loss": 1.9835, + "step": 4870 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005756443104932852, + "loss": 2.028, + "step": 4880 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005742060261856996, + "loss": 1.973, + "step": 4890 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005727671137445967, + "loss": 1.9734, + "step": 4900 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005713275853499729, + "loss": 1.9921, + "step": 4910 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005698874531870386, + "loss": 1.9607, + "step": 4920 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005684467294461146, + "loss": 1.9468, + "step": 4930 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005670054263225297, + "loss": 1.9524, + "step": 4940 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005655635560165166, + "loss": 1.9737, + "step": 4950 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005641211307331093, + "loss": 1.9532, + "step": 4960 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005626781626820395, + "loss": 2.0048, + "step": 4970 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005612346640776331, + "loss": 2.0276, + "step": 4980 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005597906471387074, + "loss": 1.9476, + "step": 4990 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005583461240884666, + "loss": 1.943, + "step": 5000 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005569011071543997, + "loss": 1.9859, + "step": 5010 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005554556085681757, + "loss": 1.9607, + "step": 5020 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005540096405655409, + "loss": 1.9825, + "step": 5030 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005525632153862152, + "loss": 1.9875, + "step": 5040 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005511163452737884, + "loss": 2.0051, + "step": 5050 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005496690424756164, + "loss": 2.0089, + "step": 5060 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005482213192427174, + "loss": 1.9495, + "step": 5070 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005467731878296688, + "loss": 1.9701, + "step": 5080 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005453246604945034, + "loss": 1.9588, + "step": 5090 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005438757494986044, + "loss": 1.9833, + "step": 5100 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005424264671066038, + "loss": 1.9974, + "step": 5110 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005409768255862766, + "loss": 1.9746, + "step": 5120 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005395268372084378, + "loss": 1.9757, + "step": 5130 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005380765142468387, + "loss": 1.9908, + "step": 5140 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005366258689780625, + "loss": 2.006, + "step": 5150 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005351749136814208, + "loss": 1.9957, + "step": 5160 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005337236606388495, + "loss": 1.959, + "step": 5170 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005322721221348047, + "loss": 2.0027, + "step": 5180 + }, + { + "epoch": 0.96, + "learning_rate": 0.000530820310456159, + "loss": 1.9248, + "step": 5190 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005293682378920974, + "loss": 1.9742, + "step": 5200 + }, + { + "epoch": 0.96, + "learning_rate": 0.000527915916734013, + "loss": 1.9844, + "step": 5210 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005264633592754035, + "loss": 1.9985, + "step": 5220 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005250105778117661, + "loss": 2.0074, + "step": 5230 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005235575846404952, + "loss": 1.9901, + "step": 5240 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005221043920607763, + "loss": 1.9861, + "step": 5250 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005206510123734837, + "loss": 1.9576, + "step": 5260 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005191974578810746, + "loss": 1.9741, + "step": 5270 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005177437408874868, + "loss": 1.9794, + "step": 5280 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005162898736980327, + "loss": 1.9883, + "step": 5290 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005148358686192967, + "loss": 1.969, + "step": 5300 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005133817379590302, + "loss": 2.0018, + "step": 5310 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005119274940260476, + "loss": 1.971, + "step": 5320 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005104731491301225, + "loss": 1.9564, + "step": 5330 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005090187155818823, + "loss": 1.9798, + "step": 5340 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005075642056927057, + "loss": 2.0331, + "step": 5350 + }, + { + "epoch": 0.99, + "learning_rate": 0.000506109631774617, + "loss": 1.9505, + "step": 5360 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005046550061401825, + "loss": 1.9348, + "step": 5370 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005032003411024067, + "loss": 2.0099, + "step": 5380 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005017456489746275, + "loss": 1.9756, + "step": 5390 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005002909420704116, + "loss": 1.9444, + "step": 5400 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004988362327034516, + "loss": 1.976, + "step": 5410 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004973815331874603, + "loss": 1.9593, + "step": 5420 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004959268558360675, + "loss": 1.9251, + "step": 5430 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004944722129627151, + "loss": 1.972, + "step": 5440 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004930176168805531, + "loss": 1.9307, + "step": 5450 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004915630799023359, + "loss": 1.9541, + "step": 5460 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004901086143403172, + "loss": 1.9212, + "step": 5470 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004886542325061464, + "loss": 1.965, + "step": 5480 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004871999467107639, + "loss": 2.0083, + "step": 5490 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004857457692642974, + "loss": 1.9676, + "step": 5500 + }, + { + "epoch": 1.02, + "learning_rate": 0.000484291712475957, + "loss": 1.9384, + "step": 5510 + }, + { + "epoch": 1.02, + "learning_rate": 0.00048283778865393243, + "loss": 1.9339, + "step": 5520 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004813840101052869, + "loss": 2.0182, + "step": 5530 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004799303891358545, + "loss": 1.9262, + "step": 5540 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004784769380501352, + "loss": 1.9397, + "step": 5550 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004770236691511908, + "loss": 1.9404, + "step": 5560 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004755705947405417, + "loss": 1.9415, + "step": 5570 + }, + { + "epoch": 1.03, + "learning_rate": 0.00047411772711806105, + "loss": 1.9292, + "step": 5580 + }, + { + "epoch": 1.04, + "learning_rate": 0.000472665078581872, + "loss": 1.9487, + "step": 5590 + }, + { + "epoch": 1.04, + "learning_rate": 0.00047121266142824354, + "loss": 1.9435, + "step": 5600 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004697604879514853, + "loss": 1.9145, + "step": 5610 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004683085704438451, + "loss": 1.9975, + "step": 5620 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046685692119540357, + "loss": 1.9696, + "step": 5630 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046540555249397056, + "loss": 1.9598, + "step": 5640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046395447662498117, + "loss": 1.9366, + "step": 5650 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046250370587139206, + "loss": 1.9748, + "step": 5660 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046105325251357695, + "loss": 1.9125, + "step": 5670 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045960312882922306, + "loss": 1.9595, + "step": 5680 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045815334709322665, + "loss": 1.9369, + "step": 5690 + }, + { + "epoch": 1.06, + "learning_rate": 0.0004567039195775899, + "loss": 1.9564, + "step": 5700 + }, + { + "epoch": 1.06, + "learning_rate": 0.000455254858551316, + "loss": 1.9274, + "step": 5710 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045380617628030693, + "loss": 1.9366, + "step": 5720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045235788502725777, + "loss": 1.9446, + "step": 5730 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045090999705155383, + "loss": 1.9236, + "step": 5740 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004494625246091672, + "loss": 1.9397, + "step": 5750 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044801547995255194, + "loss": 1.9849, + "step": 5760 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044656887533054193, + "loss": 1.9367, + "step": 5770 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004451227229882455, + "loss": 1.9451, + "step": 5780 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004436770351669429, + "loss": 1.9578, + "step": 5790 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004422318241039821, + "loss": 1.9095, + "step": 5800 + }, + { + "epoch": 1.08, + "learning_rate": 0.00044078710203267576, + "loss": 1.9337, + "step": 5810 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004393428811821971, + "loss": 1.9904, + "step": 5820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043789917377747695, + "loss": 1.9569, + "step": 5830 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004364559920390996, + "loss": 1.9423, + "step": 5840 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043501334818320004, + "loss": 2.0013, + "step": 5850 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004335712544213597, + "loss": 1.9585, + "step": 5860 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004321297229605044, + "loss": 1.9148, + "step": 5870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00043068876600279964, + "loss": 1.9558, + "step": 5880 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004292483957455482, + "loss": 1.9899, + "step": 5890 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042780862438108655, + "loss": 1.9597, + "step": 5900 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042636946409668123, + "loss": 1.9603, + "step": 5910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042493092707442717, + "loss": 1.9771, + "step": 5920 + }, + { + "epoch": 1.1, + "learning_rate": 0.0004234930254911427, + "loss": 1.9416, + "step": 5930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042205577151826747, + "loss": 1.9417, + "step": 5940 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042061917732175966, + "loss": 1.9636, + "step": 5950 + }, + { + "epoch": 1.1, + "learning_rate": 0.000419183255061992, + "loss": 1.966, + "step": 5960 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004177480168936504, + "loss": 1.9885, + "step": 5970 + }, + { + "epoch": 1.11, + "learning_rate": 0.00041631347496562913, + "loss": 1.9525, + "step": 5980 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004148796414209297, + "loss": 1.9809, + "step": 5990 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004134465283965568, + "loss": 1.8982, + "step": 6000 + }, + { + "epoch": 1.11, + "learning_rate": 0.00041201414802341643, + "loss": 1.8978, + "step": 6010 + }, + { + "epoch": 1.12, + "learning_rate": 0.00041058251242621295, + "loss": 1.9406, + "step": 6020 + }, + { + "epoch": 1.12, + "learning_rate": 0.0004091516337233464, + "loss": 1.919, + "step": 6030 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040772152402680973, + "loss": 1.9897, + "step": 6040 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040629219544208644, + "loss": 1.9473, + "step": 6050 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040486366006804817, + "loss": 1.9589, + "step": 6060 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040343592999685264, + "loss": 1.8972, + "step": 6070 + }, + { + "epoch": 1.13, + "learning_rate": 0.0004020090173138404, + "loss": 1.9611, + "step": 6080 + }, + { + "epoch": 1.13, + "learning_rate": 0.00040058293409743316, + "loss": 1.9164, + "step": 6090 + }, + { + "epoch": 1.13, + "learning_rate": 0.00039915769241903175, + "loss": 1.939, + "step": 6100 + }, + { + "epoch": 1.13, + "learning_rate": 0.0003977333043429129, + "loss": 1.9233, + "step": 6110 + }, + { + "epoch": 1.13, + "learning_rate": 0.0003963097819261288, + "loss": 1.9742, + "step": 6120 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003948871372184033, + "loss": 1.9719, + "step": 6130 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003934653822620309, + "loss": 1.9861, + "step": 6140 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003920445290917747, + "loss": 1.9514, + "step": 6150 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003906245897347643, + "loss": 2.0047, + "step": 6160 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003892055762103943, + "loss": 1.934, + "step": 6170 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003877875005302223, + "loss": 1.9619, + "step": 6180 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038637037469786727, + "loss": 1.9085, + "step": 6190 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038495421070890796, + "loss": 1.9222, + "step": 6200 + }, + { + "epoch": 1.15, + "learning_rate": 0.0003835390205507812, + "loss": 1.9409, + "step": 6210 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038212481620268125, + "loss": 1.9439, + "step": 6220 + }, + { + "epoch": 1.15, + "learning_rate": 0.000380711609635457, + "loss": 1.974, + "step": 6230 + }, + { + "epoch": 1.16, + "learning_rate": 0.000379299412811512, + "loss": 1.9141, + "step": 6240 + }, + { + "epoch": 1.16, + "learning_rate": 0.00037788823768470227, + "loss": 1.8982, + "step": 6250 + }, + { + "epoch": 1.16, + "learning_rate": 0.0003764780962002352, + "loss": 1.9384, + "step": 6260 + }, + { + "epoch": 1.16, + "learning_rate": 0.0003750690002945695, + "loss": 1.9174, + "step": 6270 + }, + { + "epoch": 1.16, + "learning_rate": 0.00037366096189531253, + "loss": 1.927, + "step": 6280 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003722539929211205, + "loss": 1.9449, + "step": 6290 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003708481052815973, + "loss": 2.008, + "step": 6300 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003694433108771933, + "loss": 1.9345, + "step": 6310 + }, + { + "epoch": 1.17, + "learning_rate": 0.00036803962159910543, + "loss": 1.8619, + "step": 6320 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003666370493291757, + "loss": 1.9612, + "step": 6330 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003652356059397909, + "loss": 1.9371, + "step": 6340 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036383530329378225, + "loss": 1.9193, + "step": 6350 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036243615324432494, + "loss": 1.9509, + "step": 6360 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036103816763483775, + "loss": 1.9517, + "step": 6370 + }, + { + "epoch": 1.18, + "learning_rate": 0.00035964135829888287, + "loss": 1.9141, + "step": 6380 + }, + { + "epoch": 1.18, + "learning_rate": 0.00035824573706006547, + "loss": 1.9985, + "step": 6390 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035685131573193386, + "loss": 1.9791, + "step": 6400 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035545810611787925, + "loss": 1.8865, + "step": 6410 + }, + { + "epoch": 1.19, + "learning_rate": 0.0003540661200110367, + "loss": 1.9409, + "step": 6420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035267536919418395, + "loss": 1.9928, + "step": 6430 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035128586543964243, + "loss": 1.9149, + "step": 6440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00034989762050917784, + "loss": 1.9837, + "step": 6450 + }, + { + "epoch": 1.2, + "learning_rate": 0.0003485106461538999, + "loss": 1.9142, + "step": 6460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034712495411416385, + "loss": 1.9284, + "step": 6470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034574055611946984, + "loss": 1.8848, + "step": 6480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034435746388836457, + "loss": 1.9295, + "step": 6490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034297568912834177, + "loss": 1.9635, + "step": 6500 + }, + { + "epoch": 1.21, + "learning_rate": 0.0003415952435357431, + "loss": 1.9794, + "step": 6510 + }, + { + "epoch": 1.21, + "learning_rate": 0.00034021613879565944, + "loss": 1.9347, + "step": 6520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00033883838658183154, + "loss": 1.9282, + "step": 6530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00033746199855655125, + "loss": 1.9973, + "step": 6540 + }, + { + "epoch": 1.21, + "learning_rate": 0.000336086986370563, + "loss": 1.9718, + "step": 6550 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003347133616629652, + "loss": 1.9157, + "step": 6560 + }, + { + "epoch": 1.22, + "learning_rate": 0.00033334113606111194, + "loss": 1.9528, + "step": 6570 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003319703211805135, + "loss": 1.9369, + "step": 6580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00033060092862473967, + "loss": 1.9552, + "step": 6590 + }, + { + "epoch": 1.22, + "learning_rate": 0.00032923296998532003, + "loss": 1.9581, + "step": 6600 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003278664568416465, + "loss": 1.9406, + "step": 6610 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003265014007608758, + "loss": 1.9672, + "step": 6620 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003251378132978304, + "loss": 1.9166, + "step": 6630 + }, + { + "epoch": 1.23, + "learning_rate": 0.00032377570599490164, + "loss": 1.9356, + "step": 6640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00032241509038195165, + "loss": 1.9092, + "step": 6650 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003210559779762157, + "loss": 1.9343, + "step": 6660 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031969838028220513, + "loss": 1.9796, + "step": 6670 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031834230879160947, + "loss": 1.8932, + "step": 6680 + }, + { + "epoch": 1.24, + "learning_rate": 0.0003169877749831993, + "loss": 1.9279, + "step": 6690 + }, + { + "epoch": 1.24, + "learning_rate": 0.000315634790322729, + "loss": 1.9444, + "step": 6700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031428336626284037, + "loss": 1.9296, + "step": 6710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031293351424296467, + "loss": 1.9341, + "step": 6720 + }, + { + "epoch": 1.25, + "learning_rate": 0.00031158524568922663, + "loss": 1.9589, + "step": 6730 + }, + { + "epoch": 1.25, + "learning_rate": 0.00031023857201434703, + "loss": 1.8997, + "step": 6740 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003088935046175466, + "loss": 1.9417, + "step": 6750 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003075500548844492, + "loss": 1.9058, + "step": 6760 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003062082341869862, + "loss": 1.9511, + "step": 6770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00030486805388329894, + "loss": 1.922, + "step": 6780 + }, + { + "epoch": 1.26, + "learning_rate": 0.00030352952531764363, + "loss": 1.9634, + "step": 6790 + }, + { + "epoch": 1.26, + "learning_rate": 0.0003021926598202949, + "loss": 1.9555, + "step": 6800 + }, + { + "epoch": 1.26, + "learning_rate": 0.0003008574687074498, + "loss": 1.9254, + "step": 6810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00029952396328113265, + "loss": 1.9211, + "step": 6820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029819215482909846, + "loss": 1.9504, + "step": 6830 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029686205462473784, + "loss": 1.9174, + "step": 6840 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029553367392698177, + "loss": 1.9368, + "step": 6850 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029420702398020595, + "loss": 1.8939, + "step": 6860 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029288211601413586, + "loss": 1.9097, + "step": 6870 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029155896124375156, + "loss": 1.9885, + "step": 6880 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002902375708691925, + "loss": 1.9752, + "step": 6890 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002889179560756634, + "loss": 1.9321, + "step": 6900 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002876001280333391, + "loss": 1.9345, + "step": 6910 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002862840978972698, + "loss": 1.9192, + "step": 6920 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002849698768072877, + "loss": 1.9499, + "step": 6930 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002836574758879107, + "loss": 1.9217, + "step": 6940 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002823469062482503, + "loss": 1.9318, + "step": 6950 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002810381789819167, + "loss": 1.9422, + "step": 6960 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002797313051669247, + "loss": 1.9562, + "step": 6970 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002784262958656003, + "loss": 1.9189, + "step": 6980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00027712316212448663, + "loss": 1.9453, + "step": 6990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027582191497425114, + "loss": 1.9335, + "step": 7000 + }, + { + "epoch": 1.3, + "learning_rate": 0.000274522565429591, + "loss": 1.9724, + "step": 7010 + }, + { + "epoch": 1.3, + "learning_rate": 0.0002732251244891421, + "loss": 1.9236, + "step": 7020 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027192960313538307, + "loss": 1.9407, + "step": 7030 + }, + { + "epoch": 1.3, + "learning_rate": 0.0002706360123345445, + "loss": 1.8948, + "step": 7040 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026934436303651554, + "loss": 1.9354, + "step": 7050 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026805466617475007, + "loss": 1.955, + "step": 7060 + }, + { + "epoch": 1.31, + "learning_rate": 0.0002667669326661767, + "loss": 1.9595, + "step": 7070 + }, + { + "epoch": 1.31, + "learning_rate": 0.0002654811734111033, + "loss": 1.9766, + "step": 7080 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026419739929312713, + "loss": 1.9626, + "step": 7090 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002629156211790417, + "loss": 1.9096, + "step": 7100 + }, + { + "epoch": 1.32, + "learning_rate": 0.00026163584991874413, + "loss": 1.9522, + "step": 7110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00026035809634514543, + "loss": 1.9387, + "step": 7120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00025908237127407626, + "loss": 1.8788, + "step": 7130 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002578086855041973, + "loss": 1.9326, + "step": 7140 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002565370498169064, + "loss": 1.92, + "step": 7150 + }, + { + "epoch": 1.33, + "learning_rate": 0.0002552674749762487, + "loss": 1.9131, + "step": 7160 + }, + { + "epoch": 1.33, + "learning_rate": 0.0002539999717288246, + "loss": 1.9263, + "step": 7170 + }, + { + "epoch": 1.33, + "learning_rate": 0.00025286099888629365, + "loss": 1.919, + "step": 7180 + }, + { + "epoch": 1.33, + "learning_rate": 0.000251597461210021, + "loss": 1.9281, + "step": 7190 + }, + { + "epoch": 1.33, + "learning_rate": 0.00025033602619263507, + "loss": 1.9831, + "step": 7200 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024907670451183454, + "loss": 1.9535, + "step": 7210 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024781950682742983, + "loss": 1.8798, + "step": 7220 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024656444378125204, + "loss": 1.9124, + "step": 7230 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024531152599706346, + "loss": 1.9472, + "step": 7240 + }, + { + "epoch": 1.34, + "learning_rate": 0.0002440607640804668, + "loss": 1.9697, + "step": 7250 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024281216861881633, + "loss": 1.938, + "step": 7260 + }, + { + "epoch": 1.35, + "learning_rate": 0.00024156575018112787, + "loss": 1.9035, + "step": 7270 + }, + { + "epoch": 1.35, + "learning_rate": 0.00024032151931798918, + "loss": 1.9379, + "step": 7280 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002390794865614711, + "loss": 1.9176, + "step": 7290 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002378396624250375, + "loss": 1.9392, + "step": 7300 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002366020574034576, + "loss": 1.9235, + "step": 7310 + }, + { + "epoch": 1.36, + "learning_rate": 0.00023536668197271588, + "loss": 1.939, + "step": 7320 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002341335465899243, + "loss": 1.889, + "step": 7330 + }, + { + "epoch": 1.36, + "learning_rate": 0.00023290266169323354, + "loss": 1.9247, + "step": 7340 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002316740377017438, + "loss": 1.935, + "step": 7350 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002304476850154183, + "loss": 1.9198, + "step": 7360 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022922361401499325, + "loss": 1.9068, + "step": 7370 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022800183506189238, + "loss": 1.9505, + "step": 7380 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022678235849813645, + "loss": 1.9459, + "step": 7390 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022556519464625807, + "loss": 1.9302, + "step": 7400 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022435035380921321, + "loss": 1.9345, + "step": 7410 + }, + { + "epoch": 1.37, + "learning_rate": 0.0002231378462702935, + "loss": 1.9304, + "step": 7420 + }, + { + "epoch": 1.38, + "learning_rate": 0.00022192768229304107, + "loss": 1.9457, + "step": 7430 + }, + { + "epoch": 1.38, + "learning_rate": 0.0002207198721211593, + "loss": 1.9395, + "step": 7440 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021951442597842785, + "loss": 1.9867, + "step": 7450 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021831135406861558, + "loss": 1.9217, + "step": 7460 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021711066657539342, + "loss": 1.991, + "step": 7470 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021591237366225008, + "loss": 1.9492, + "step": 7480 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021471648547240365, + "loss": 1.9376, + "step": 7490 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021352301212871762, + "loss": 1.9436, + "step": 7500 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021233196373361397, + "loss": 1.9267, + "step": 7510 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021114335036898852, + "loss": 1.9483, + "step": 7520 + }, + { + "epoch": 1.39, + "learning_rate": 0.0002099571820961252, + "loss": 1.9485, + "step": 7530 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020877346895561082, + "loss": 1.9607, + "step": 7540 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020759222096725034, + "loss": 1.9665, + "step": 7550 + }, + { + "epoch": 1.4, + "learning_rate": 0.0002064134481299814, + "loss": 1.9202, + "step": 7560 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020523716042179075, + "loss": 1.9375, + "step": 7570 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020406336779962888, + "loss": 1.9406, + "step": 7580 + }, + { + "epoch": 1.41, + "learning_rate": 0.00020289208019932635, + "loss": 1.9357, + "step": 7590 + }, + { + "epoch": 1.41, + "learning_rate": 0.0002017233075355089, + "loss": 1.9432, + "step": 7600 + }, + { + "epoch": 1.41, + "learning_rate": 0.0002005570597015145, + "loss": 1.962, + "step": 7610 + }, + { + "epoch": 1.41, + "learning_rate": 0.00019939334656930892, + "loss": 1.9237, + "step": 7620 + }, + { + "epoch": 1.41, + "learning_rate": 0.00019823217798940247, + "loss": 1.9688, + "step": 7630 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019707356379076668, + "loss": 1.9524, + "step": 7640 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019591751378075035, + "loss": 1.981, + "step": 7650 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019476403774499774, + "loss": 1.9405, + "step": 7660 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001936131454473649, + "loss": 1.9, + "step": 7670 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019246484662983733, + "loss": 1.8852, + "step": 7680 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019131915101244752, + "loss": 1.9447, + "step": 7690 + }, + { + "epoch": 1.43, + "learning_rate": 0.00019017606829319205, + "loss": 1.9221, + "step": 7700 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018903560814795086, + "loss": 1.9481, + "step": 7710 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018789778023040355, + "loss": 1.8919, + "step": 7720 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001867625941719499, + "loss": 1.94, + "step": 7730 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018563005958162587, + "loss": 1.9089, + "step": 7740 + }, + { + "epoch": 1.44, + "learning_rate": 0.00018450018604602414, + "loss": 1.9105, + "step": 7750 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001833729831292123, + "loss": 1.9568, + "step": 7760 + }, + { + "epoch": 1.44, + "learning_rate": 0.00018224846037265125, + "loss": 1.9156, + "step": 7770 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001811266272951162, + "loss": 1.9445, + "step": 7780 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001800074933926138, + "loss": 1.8871, + "step": 7790 + }, + { + "epoch": 1.44, + "learning_rate": 0.00017889106813830363, + "loss": 1.9684, + "step": 7800 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001777773609824173, + "loss": 1.9411, + "step": 7810 + }, + { + "epoch": 1.45, + "learning_rate": 0.00017666638135217783, + "loss": 1.9295, + "step": 7820 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001755581386517216, + "loss": 1.9499, + "step": 7830 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001744526422620165, + "loss": 1.9499, + "step": 7840 + }, + { + "epoch": 1.45, + "learning_rate": 0.00017334990154078446, + "loss": 1.9262, + "step": 7850 + }, + { + "epoch": 1.46, + "learning_rate": 0.00017224992582242076, + "loss": 1.9554, + "step": 7860 + }, + { + "epoch": 1.46, + "learning_rate": 0.00017115272441791635, + "loss": 1.9685, + "step": 7870 + }, + { + "epoch": 1.46, + "learning_rate": 0.000170058306614778, + "loss": 1.9021, + "step": 7880 + }, + { + "epoch": 1.46, + "learning_rate": 0.00016896668167695018, + "loss": 1.8804, + "step": 7890 + }, + { + "epoch": 1.46, + "learning_rate": 0.00016787785884473665, + "loss": 1.9164, + "step": 7900 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016679184733472163, + "loss": 1.9409, + "step": 7910 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016570865633969283, + "loss": 1.9329, + "step": 7920 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016462829502856286, + "loss": 1.9518, + "step": 7930 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016355077254629196, + "loss": 1.9494, + "step": 7940 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016247609801381003, + "loss": 1.9376, + "step": 7950 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016140428052794042, + "loss": 1.9312, + "step": 7960 + }, + { + "epoch": 1.48, + "learning_rate": 0.00016033532916132203, + "loss": 1.9528, + "step": 7970 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015926925296233296, + "loss": 1.9698, + "step": 7980 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015820606095501405, + "loss": 1.936, + "step": 7990 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015714576213899167, + "loss": 1.962, + "step": 8000 + } + ], + "max_steps": 10798, + "num_train_epochs": 2, + "total_flos": 7.590046841631146e+18, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-8000/training_args.bin b/checkpoint-8000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b097aab2293da043bc99abba38a0ed7c4525140a --- /dev/null +++ b/checkpoint-8000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8813832b030b0a678cb3ad0abd28db5000bdb8bb1708e45ba10cfda908fcc38 +size 3305 diff --git a/checkpoint-9000/README.md b/checkpoint-9000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/checkpoint-9000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/checkpoint-9000/adapter_config.json b/checkpoint-9000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c700a5d161022cf91737dcca4d31f37c02bb25 --- /dev/null +++ b/checkpoint-9000/adapter_config.json @@ -0,0 +1,19 @@ +{ + "base_model_name_or_path": "chatglm2-6b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "query_key_value" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/checkpoint-9000/adapter_model.bin b/checkpoint-9000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d5286a7b437a9b298b1994fdb8fabc3b17811ab --- /dev/null +++ b/checkpoint-9000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f1175629f314b3e551f1a36df65c880a760fe036b9ac688d7cd773e292a6d1a +size 7819417 diff --git a/checkpoint-9000/finetuning_args.json b/checkpoint-9000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f28e18016479196fd772d484c058dd17ca8c6a --- /dev/null +++ b/checkpoint-9000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "query_key_value" + ], + "name_module_trainable": "mlp", + "num_layer_trainable": 3, + "pre_seq_len": 64, + "prefix_projection": false +} diff --git a/checkpoint-9000/optimizer.pt b/checkpoint-9000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..52e587fd6a6ec85a670df73fb939e9af0dd47014 --- /dev/null +++ b/checkpoint-9000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b72fdea3e5271fec0823b4b25073e58582dc16073c907a3ab72c255768fa564 +size 15644485 diff --git a/checkpoint-9000/rng_state_0.pth b/checkpoint-9000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa690631eff8c4697559adb384a43904aa02cce6 --- /dev/null +++ b/checkpoint-9000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea82e8fa895368a32b5a59085f733ab681de73a704773d16869338460eeb64ed +size 18679 diff --git a/checkpoint-9000/rng_state_1.pth b/checkpoint-9000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..8a7ba2fa46866471851d937d6297e1560ec804af --- /dev/null +++ b/checkpoint-9000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:378a694fa4d3744d64cf07fb8a89d57f6a4220fde48ab789bcf61596764890d3 +size 18679 diff --git a/checkpoint-9000/rng_state_2.pth b/checkpoint-9000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..c8571dbfb99d915e55d855d49f08a64a7b34c287 --- /dev/null +++ b/checkpoint-9000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:890300fe5eaa3dc2aeaba4371cc67c46fac6c8d2627ba0074c98628827dcd548 +size 18679 diff --git a/checkpoint-9000/rng_state_3.pth b/checkpoint-9000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a7e38384e9756ad7b4f00f4e463daf9b35aa22d --- /dev/null +++ b/checkpoint-9000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5c2146dada3c6fb76d940b0d833bd2c3e389b1bb9f499ec6822de00e712d05 +size 18679 diff --git a/checkpoint-9000/scheduler.pt b/checkpoint-9000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdc86df3763318fb7421464ad888aca87dd742dd --- /dev/null +++ b/checkpoint-9000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63e2d6c17dcb6ab9cec36b8c7fd51272351126dad81c0237768472b83071b4ba +size 627 diff --git a/checkpoint-9000/trainer_state.json b/checkpoint-9000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..98bd594e06af7f08d3aff0f008758cd5cdd50141 --- /dev/null +++ b/checkpoint-9000/trainer_state.json @@ -0,0 +1,5416 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.666975365808483, + "global_step": 9000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0009999978838190456, + "loss": 2.9794, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0009999915352940948, + "loss": 2.3885, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999980954478887, + "loss": 2.3057, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999966141462985, + "loss": 2.2692, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999947096371777, + "loss": 2.2576, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009999238193664748, + "loss": 2.2388, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998963106441117, + "loss": 2.2523, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998645704375414, + "loss": 2.218, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999828599015436, + "loss": 2.2457, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997883966822835, + "loss": 2.198, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997439637783859, + "loss": 2.2013, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999695300679855, + "loss": 2.1765, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009996424077986109, + "loss": 2.1741, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999585285582377, + "loss": 2.1898, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009995239345146772, + "loss": 2.1466, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009994583551148314, + "loss": 2.1423, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009993885479379506, + "loss": 2.1451, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999314513574934, + "loss": 2.202, + "step": 180 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009992362526524616, + "loss": 2.1208, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009991537658329906, + "loss": 2.1591, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 0.000999067053814749, + "loss": 2.1788, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009989761173317304, + "loss": 2.147, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998880957153687, + "loss": 2.1249, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998781574086123, + "loss": 2.165, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 0.000998677968970289, + "loss": 2.1428, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009985701426831735, + "loss": 2.1384, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009984580961374964, + "loss": 2.1585, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009983418302817008, + "loss": 2.1156, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009982213460999448, + "loss": 2.0811, + "step": 290 + }, + { + "epoch": 0.06, + "learning_rate": 0.000998096644612094, + "loss": 2.1081, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009979677268737118, + "loss": 2.1246, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009978345939760515, + "loss": 2.1229, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997697247046046, + "loss": 2.1033, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009975556872462994, + "loss": 2.0931, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997409915775076, + "loss": 2.1206, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009972599338662915, + "loss": 2.0537, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009971057427895012, + "loss": 2.0762, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009969473438498897, + "loss": 2.0883, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009967847383882604, + "loss": 2.1174, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009966179277810239, + "loss": 2.1111, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009964469134401855, + "loss": 2.1288, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009962716968133346, + "loss": 2.0967, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009960922793836318, + "loss": 2.1216, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009959086626697955, + "loss": 2.0924, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009957208482260908, + "loss": 2.0809, + "step": 450 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009955288376423152, + "loss": 2.1082, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009953326325437852, + "loss": 2.0885, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009951322345913224, + "loss": 2.1133, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009949276454812408, + "loss": 2.0844, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00099471886694533, + "loss": 2.0796, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009945059007508434, + "loss": 2.1255, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009942887487004804, + "loss": 2.0913, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009940674126323733, + "loss": 2.1003, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009938418944200709, + "loss": 2.0541, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009936121959725223, + "loss": 2.0523, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009933783192340618, + "loss": 2.1225, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009931402661843911, + "loss": 2.0446, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 0.000992898038838564, + "loss": 2.0921, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009926516392469674, + "loss": 2.1081, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009924010694953064, + "loss": 2.0734, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009921463317045843, + "loss": 2.0652, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009918874280310862, + "loss": 2.0818, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009916243606663605, + "loss": 2.0776, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009913571318371994, + "loss": 2.1025, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009910857438056215, + "loss": 2.066, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009908101988688512, + "loss": 2.0575, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009905304993593008, + "loss": 2.1269, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009902466476445486, + "loss": 2.0518, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009899586461273218, + "loss": 2.0698, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 0.000989666497245473, + "loss": 2.0988, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009893702034719624, + "loss": 2.0986, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009890697673148345, + "loss": 2.0237, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009887651913171986, + "loss": 2.0027, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009884564780572064, + "loss": 2.0563, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009881436301480305, + "loss": 2.0624, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987826650237842, + "loss": 2.0926, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987505541009788, + "loss": 2.0585, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009871803051819696, + "loss": 2.0494, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009868509455074183, + "loss": 2.0106, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009865174647740729, + "loss": 2.0861, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009861798658047556, + "loss": 2.0478, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009858381514571484, + "loss": 2.0469, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 0.000985492324623769, + "loss": 2.0671, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009851423882319458, + "loss": 2.0808, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009847883452437937, + "loss": 2.0331, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009844301986561893, + "loss": 2.0295, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 0.000984067951500744, + "loss": 2.0873, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 0.00098370160684378, + "loss": 2.1038, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009833311677863042, + "loss": 2.0337, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009829566374639801, + "loss": 2.0407, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009825780190471042, + "loss": 2.1049, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 0.000982195315740576, + "loss": 2.0475, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009818085307838741, + "loss": 2.0624, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 0.000981417667451026, + "loss": 2.0714, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009810227290505816, + "loss": 2.0947, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009806237189255859, + "loss": 2.0591, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009802206404535489, + "loss": 2.0301, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 0.000979813497046419, + "loss": 2.0556, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009794022921505523, + "loss": 2.0753, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 0.000978987029246685, + "loss": 2.0898, + "step": 1000 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009785677118499029, + "loss": 2.0464, + "step": 1010 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009781443435096116, + "loss": 2.0828, + "step": 1020 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009777169278095074, + "loss": 2.1137, + "step": 1030 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009772854683675462, + "loss": 2.0167, + "step": 1040 + }, + { + "epoch": 0.19, + "learning_rate": 0.000976849968835913, + "loss": 2.07, + "step": 1050 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009764104329009909, + "loss": 2.0409, + "step": 1060 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009759668642833304, + "loss": 2.015, + "step": 1070 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009755192667376173, + "loss": 2.0175, + "step": 1080 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009750676440526411, + "loss": 2.0773, + "step": 1090 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009746120000512632, + "loss": 2.0245, + "step": 1100 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009741523385903841, + "loss": 2.094, + "step": 1110 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009736886635609112, + "loss": 2.0506, + "step": 1120 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009732209788877258, + "loss": 2.0287, + "step": 1130 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009727492885296489, + "loss": 2.1162, + "step": 1140 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009722735964794099, + "loss": 2.1096, + "step": 1150 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009717939067636099, + "loss": 2.0621, + "step": 1160 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009713102234426903, + "loss": 2.0796, + "step": 1170 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009708225506108965, + "loss": 2.0565, + "step": 1180 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009703308923962447, + "loss": 2.0669, + "step": 1190 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009698352529604857, + "loss": 2.0638, + "step": 1200 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009693356364990705, + "loss": 2.0358, + "step": 1210 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009688320472411143, + "loss": 2.0859, + "step": 1220 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009683244894493613, + "loss": 2.0932, + "step": 1230 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009678129674201479, + "loss": 2.0129, + "step": 1240 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009672974854833669, + "loss": 2.055, + "step": 1250 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009667780480024304, + "loss": 2.0665, + "step": 1260 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009662546593742334, + "loss": 2.0488, + "step": 1270 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009657273240291159, + "loss": 2.0543, + "step": 1280 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009651960464308261, + "loss": 2.0418, + "step": 1290 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009646608310764819, + "loss": 2.033, + "step": 1300 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009641216824965338, + "loss": 2.1034, + "step": 1310 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009635786052547253, + "loss": 2.0866, + "step": 1320 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009630316039480556, + "loss": 2.0607, + "step": 1330 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009624806832067394, + "loss": 2.0457, + "step": 1340 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009619258476941686, + "loss": 2.032, + "step": 1350 + }, + { + "epoch": 0.25, + "learning_rate": 0.000961367102106873, + "loss": 2.0519, + "step": 1360 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009608044511744791, + "loss": 2.0449, + "step": 1370 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009602378996596721, + "loss": 1.9949, + "step": 1380 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009596674523581539, + "loss": 2.0394, + "step": 1390 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009590931140986035, + "loss": 2.0386, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009585148897426354, + "loss": 2.0254, + "step": 1410 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009579327841847593, + "loss": 2.0238, + "step": 1420 + }, + { + "epoch": 0.26, + "learning_rate": 0.000957346802352338, + "loss": 2.0509, + "step": 1430 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009567569492055456, + "loss": 2.0004, + "step": 1440 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009561632297373263, + "loss": 2.0203, + "step": 1450 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009555656489733513, + "loss": 2.0182, + "step": 1460 + }, + { + "epoch": 0.27, + "learning_rate": 0.000954964211971977, + "loss": 1.9754, + "step": 1470 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009543589238242012, + "loss": 2.0374, + "step": 1480 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953749789653621, + "loss": 2.0367, + "step": 1490 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953136814616389, + "loss": 2.0866, + "step": 1500 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009525200039011694, + "loss": 2.0083, + "step": 1510 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009518993627290948, + "loss": 2.0525, + "step": 1520 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009512748963537212, + "loss": 2.0636, + "step": 1530 + }, + { + "epoch": 0.29, + "learning_rate": 0.000950646610060984, + "loss": 2.0522, + "step": 1540 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009500145091691532, + "loss": 2.05, + "step": 1550 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009493785990287882, + "loss": 1.9887, + "step": 1560 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009487388850226926, + "loss": 2.0309, + "step": 1570 + }, + { + "epoch": 0.29, + "learning_rate": 0.000948095372565869, + "loss": 1.9954, + "step": 1580 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009474480671054726, + "loss": 2.0078, + "step": 1590 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009467969741207652, + "loss": 2.0395, + "step": 1600 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009461420991230693, + "loss": 2.0415, + "step": 1610 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009454834476557207, + "loss": 2.0308, + "step": 1620 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009448210252940223, + "loss": 2.0826, + "step": 1630 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009441548376451963, + "loss": 2.0424, + "step": 1640 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009434848903483373, + "loss": 2.0125, + "step": 1650 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009428111890743639, + "loss": 2.0139, + "step": 1660 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009421337395259717, + "loss": 2.0682, + "step": 1670 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009414525474375837, + "loss": 2.0577, + "step": 1680 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009407676185753029, + "loss": 2.0262, + "step": 1690 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009400789587368632, + "loss": 2.0515, + "step": 1700 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009393865737515794, + "loss": 2.0398, + "step": 1710 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009386904694802997, + "loss": 2.0146, + "step": 1720 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009379906518153543, + "loss": 2.0438, + "step": 1730 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009372871266805063, + "loss": 2.0377, + "step": 1740 + }, + { + "epoch": 0.32, + "learning_rate": 0.000936579900030902, + "loss": 2.0789, + "step": 1750 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009358689778530193, + "loss": 2.0201, + "step": 1760 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009351543661646185, + "loss": 2.0114, + "step": 1770 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009344360710146898, + "loss": 2.0242, + "step": 1780 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009337140984834034, + "loss": 2.0436, + "step": 1790 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009329884546820572, + "loss": 2.0452, + "step": 1800 + }, + { + "epoch": 0.34, + "learning_rate": 0.000932259145753026, + "loss": 2.0254, + "step": 1810 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009315261778697083, + "loss": 2.0409, + "step": 1820 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009307895572364746, + "loss": 2.0301, + "step": 1830 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009300492900886154, + "loss": 2.0078, + "step": 1840 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009293053826922873, + "loss": 1.9851, + "step": 1850 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009285578413444613, + "loss": 1.9947, + "step": 1860 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009278066723728682, + "loss": 2.0331, + "step": 1870 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009270518821359461, + "loss": 2.0058, + "step": 1880 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009262934770227858, + "loss": 2.05, + "step": 1890 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009255314634530771, + "loss": 2.0444, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009247658478770543, + "loss": 2.0045, + "step": 1910 + }, + { + "epoch": 0.36, + "learning_rate": 0.000923996636775442, + "loss": 2.0211, + "step": 1920 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009232238366593997, + "loss": 2.0124, + "step": 1930 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009224474540704671, + "loss": 2.0067, + "step": 1940 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009216674955805079, + "loss": 2.0247, + "step": 1950 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009208839677916557, + "loss": 2.0314, + "step": 1960 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009200968773362568, + "loss": 2.067, + "step": 1970 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009193062308768145, + "loss": 2.0168, + "step": 1980 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009185120351059326, + "loss": 2.0649, + "step": 1990 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009177142967462591, + "loss": 2.0208, + "step": 2000 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009169130225504289, + "loss": 2.016, + "step": 2010 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009161082193010066, + "loss": 2.0331, + "step": 2020 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009152998938104296, + "loss": 2.0757, + "step": 2030 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009144880529209498, + "loss": 2.0093, + "step": 2040 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009136727035045765, + "loss": 1.954, + "step": 2050 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009128538524630167, + "loss": 2.0062, + "step": 2060 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009120315067276187, + "loss": 2.0179, + "step": 2070 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009112056732593119, + "loss": 2.0301, + "step": 2080 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009103763590485488, + "loss": 2.0223, + "step": 2090 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009095435711152449, + "loss": 2.0208, + "step": 2100 + }, + { + "epoch": 0.39, + "learning_rate": 0.00090870731650872, + "loss": 2.0492, + "step": 2110 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009078676023076385, + "loss": 1.9917, + "step": 2120 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009070244356199492, + "loss": 2.0235, + "step": 2130 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009061778235828253, + "loss": 2.01, + "step": 2140 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009054129328980229, + "loss": 1.9999, + "step": 2150 + }, + { + "epoch": 0.4, + "learning_rate": 0.000904559794464287, + "loss": 2.0022, + "step": 2160 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009037032315436229, + "loss": 2.0004, + "step": 2170 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009028432513865994, + "loss": 1.9936, + "step": 2180 + }, + { + "epoch": 0.41, + "learning_rate": 0.000901979861272711, + "loss": 2.0098, + "step": 2190 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009011130685103166, + "loss": 1.9829, + "step": 2200 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009002428804365775, + "loss": 2.0135, + "step": 2210 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008993693044173954, + "loss": 2.0526, + "step": 2220 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008984923478473499, + "loss": 2.0145, + "step": 2230 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008976120181496365, + "loss": 2.0364, + "step": 2240 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008967283227760028, + "loss": 2.019, + "step": 2250 + }, + { + "epoch": 0.42, + "learning_rate": 0.000895841269206686, + "loss": 1.9874, + "step": 2260 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008949508649503495, + "loss": 2.0699, + "step": 2270 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008940571175440196, + "loss": 2.0407, + "step": 2280 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008931600345530213, + "loss": 2.0176, + "step": 2290 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008922596235709142, + "loss": 2.0235, + "step": 2300 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008913558922194287, + "loss": 2.0268, + "step": 2310 + }, + { + "epoch": 0.43, + "learning_rate": 0.000890448848148401, + "loss": 2.0279, + "step": 2320 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008895384990357087, + "loss": 2.0073, + "step": 2330 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008886248525872056, + "loss": 2.0262, + "step": 2340 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008877079165366566, + "loss": 2.0112, + "step": 2350 + }, + { + "epoch": 0.44, + "learning_rate": 0.000886787698645672, + "loss": 2.042, + "step": 2360 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008858642067036424, + "loss": 2.0129, + "step": 2370 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008849374485276715, + "loss": 2.0264, + "step": 2380 + }, + { + "epoch": 0.44, + "learning_rate": 0.000884007431962512, + "loss": 2.0211, + "step": 2390 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008830741648804967, + "loss": 2.0175, + "step": 2400 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008821376551814739, + "loss": 2.0423, + "step": 2410 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008811979107927396, + "loss": 2.0112, + "step": 2420 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008802549396689705, + "loss": 2.0422, + "step": 2430 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008793087497921566, + "loss": 2.0075, + "step": 2440 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008784544334882426, + "loss": 1.9958, + "step": 2450 + }, + { + "epoch": 0.46, + "learning_rate": 0.000877502150068553, + "loss": 2.0348, + "step": 2460 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008765466711974225, + "loss": 2.0232, + "step": 2470 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008755880049627157, + "loss": 1.9953, + "step": 2480 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008746261594792776, + "loss": 2.0223, + "step": 2490 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008736611428888644, + "loss": 2.0332, + "step": 2500 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008726929633600753, + "loss": 2.0075, + "step": 2510 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008717216290882824, + "loss": 2.002, + "step": 2520 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008707471482955622, + "loss": 2.0594, + "step": 2530 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008697695292306253, + "loss": 2.0214, + "step": 2540 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008687887801687473, + "loss": 1.994, + "step": 2550 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008678049094116979, + "loss": 2.0338, + "step": 2560 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008668179252876714, + "loss": 2.0176, + "step": 2570 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008658278361512161, + "loss": 2.0013, + "step": 2580 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008648346503831627, + "loss": 2.0141, + "step": 2590 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008638383763905546, + "loss": 1.9655, + "step": 2600 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008628390226065761, + "loss": 2.039, + "step": 2610 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008618365974904808, + "loss": 1.9418, + "step": 2620 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008608311095275205, + "loss": 2.011, + "step": 2630 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008598225672288731, + "loss": 2.0174, + "step": 2640 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008588109791315707, + "loss": 1.984, + "step": 2650 + }, + { + "epoch": 0.49, + "learning_rate": 0.000857796353798427, + "loss": 2.0437, + "step": 2660 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008567786998179654, + "loss": 2.0255, + "step": 2670 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008557580258043459, + "loss": 2.0067, + "step": 2680 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008547343403972918, + "loss": 2.0201, + "step": 2690 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008537076522620175, + "loss": 2.0258, + "step": 2700 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008526779700891545, + "loss": 1.9977, + "step": 2710 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008516453025946781, + "loss": 1.9835, + "step": 2720 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008506096585198333, + "loss": 2.0428, + "step": 2730 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008495710466310613, + "loss": 1.9554, + "step": 2740 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008485294757199248, + "loss": 2.0497, + "step": 2750 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008474849546030339, + "loss": 2.001, + "step": 2760 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008464374921219714, + "loss": 1.9824, + "step": 2770 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008453870971432179, + "loss": 2.0378, + "step": 2780 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008443337785580769, + "loss": 1.9756, + "step": 2790 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008432775452825992, + "loss": 2.0563, + "step": 2800 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008422184062575077, + "loss": 2.0115, + "step": 2810 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008411563704481217, + "loss": 2.0301, + "step": 2820 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008400914468442814, + "loss": 1.9912, + "step": 2830 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008390236444602706, + "loss": 2.0669, + "step": 2840 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008379529723347417, + "loss": 2.0138, + "step": 2850 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008368794395306386, + "loss": 2.0486, + "step": 2860 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008358030551351199, + "loss": 2.0342, + "step": 2870 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008347238282594823, + "loss": 2.0474, + "step": 2880 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008336417680390829, + "loss": 2.006, + "step": 2890 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008325568836332633, + "loss": 1.99, + "step": 2900 + }, + { + "epoch": 0.54, + "learning_rate": 0.00083146918422527, + "loss": 2.0148, + "step": 2910 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008303786790221778, + "loss": 2.0381, + "step": 2920 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008292853772548126, + "loss": 2.0591, + "step": 2930 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008281892881776714, + "loss": 2.0238, + "step": 2940 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008270904210688459, + "loss": 1.9939, + "step": 2950 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008259887852299427, + "loss": 1.9941, + "step": 2960 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008248843899860045, + "loss": 2.0193, + "step": 2970 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008237772446854325, + "loss": 2.0166, + "step": 2980 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008226673586999058, + "loss": 2.0219, + "step": 2990 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008215547414243025, + "loss": 2.0078, + "step": 3000 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008204394022766208, + "loss": 2.0022, + "step": 3010 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008193213506978983, + "loss": 2.0009, + "step": 3020 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008182005961521331, + "loss": 2.0197, + "step": 3030 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008170771481262027, + "loss": 2.0101, + "step": 3040 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008159510161297846, + "loss": 2.0307, + "step": 3050 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008148222096952748, + "loss": 2.0075, + "step": 3060 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008136907383777081, + "loss": 2.0415, + "step": 3070 + }, + { + "epoch": 0.57, + "learning_rate": 0.000812556611754677, + "loss": 2.0031, + "step": 3080 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008114198394262497, + "loss": 2.0025, + "step": 3090 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008102804310148905, + "loss": 1.983, + "step": 3100 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008091383961653765, + "loss": 2.0056, + "step": 3110 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008079937445447175, + "loss": 1.9679, + "step": 3120 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008068464858420732, + "loss": 1.9897, + "step": 3130 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008056966297686717, + "loss": 1.9833, + "step": 3140 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008045441860577273, + "loss": 2.0088, + "step": 3150 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008033891644643576, + "loss": 1.9985, + "step": 3160 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008022315747655011, + "loss": 2.013, + "step": 3170 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008010714267598354, + "loss": 1.9902, + "step": 3180 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007999087302676926, + "loss": 2.0133, + "step": 3190 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007987434951309774, + "loss": 2.0092, + "step": 3200 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007975757312130836, + "loss": 1.9894, + "step": 3210 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007964054483988103, + "loss": 1.9742, + "step": 3220 + }, + { + "epoch": 0.6, + "learning_rate": 0.000795232656594278, + "loss": 2.016, + "step": 3230 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007940573657268458, + "loss": 2.0386, + "step": 3240 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007928795857450259, + "loss": 1.9602, + "step": 3250 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007916993266184007, + "loss": 1.9681, + "step": 3260 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007905165983375379, + "loss": 2.0326, + "step": 3270 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007893314109139058, + "loss": 1.9958, + "step": 3280 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007881437743797882, + "loss": 2.0077, + "step": 3290 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007869536987882008, + "loss": 1.9813, + "step": 3300 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007857611942128044, + "loss": 1.9538, + "step": 3310 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007845662707478214, + "loss": 1.9919, + "step": 3320 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007833689385079485, + "loss": 1.9922, + "step": 3330 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007821692076282725, + "loss": 1.9973, + "step": 3340 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007809670882641842, + "loss": 2.0231, + "step": 3350 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007797625905912915, + "loss": 1.9971, + "step": 3360 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007785557248053351, + "loss": 1.9934, + "step": 3370 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007773465011221002, + "loss": 1.9855, + "step": 3380 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007761349297773315, + "loss": 2.0421, + "step": 3390 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007749210210266457, + "loss": 1.9795, + "step": 3400 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007737047851454451, + "loss": 2.0006, + "step": 3410 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007724862324288309, + "loss": 2.011, + "step": 3420 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007712653731915147, + "loss": 1.9969, + "step": 3430 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007700422177677331, + "loss": 1.9581, + "step": 3440 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007688167765111592, + "loss": 1.9858, + "step": 3450 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007675890597948141, + "loss": 1.9945, + "step": 3460 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007663590780109814, + "loss": 2.0116, + "step": 3470 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007651268415711168, + "loss": 1.9831, + "step": 3480 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007638923609057616, + "loss": 2.0113, + "step": 3490 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007626556464644538, + "loss": 1.9927, + "step": 3500 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007614167087156393, + "loss": 2.0209, + "step": 3510 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007601755581465844, + "loss": 1.9941, + "step": 3520 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007589322052632855, + "loss": 2.0443, + "step": 3530 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007576866605903812, + "loss": 1.975, + "step": 3540 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007564389346710638, + "loss": 1.9655, + "step": 3550 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007551890380669879, + "loss": 2.0034, + "step": 3560 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007539369813581836, + "loss": 1.953, + "step": 3570 + }, + { + "epoch": 0.66, + "learning_rate": 0.000752682775142965, + "loss": 2.0162, + "step": 3580 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007514264300378411, + "loss": 2.0096, + "step": 3590 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007501679566774267, + "loss": 2.0431, + "step": 3600 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007489073657143506, + "loss": 1.961, + "step": 3610 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007476446678191676, + "loss": 2.0179, + "step": 3620 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007463798736802665, + "loss": 1.9885, + "step": 3630 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007451129940037804, + "loss": 1.9955, + "step": 3640 + }, + { + "epoch": 0.68, + "learning_rate": 0.000743844039513496, + "loss": 1.9671, + "step": 3650 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007425730209507622, + "loss": 1.9866, + "step": 3660 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007412999490744008, + "loss": 1.9508, + "step": 3670 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007400248346606129, + "loss": 2.0261, + "step": 3680 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007387476885028902, + "loss": 1.9946, + "step": 3690 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007374685214119221, + "loss": 1.969, + "step": 3700 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007361873442155049, + "loss": 1.9802, + "step": 3710 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007349041677584496, + "loss": 1.9739, + "step": 3720 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007336190029024907, + "loss": 1.964, + "step": 3730 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007323318605261933, + "loss": 2.0009, + "step": 3740 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007310427515248626, + "loss": 1.9825, + "step": 3750 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007297516868104501, + "loss": 1.9744, + "step": 3760 + }, + { + "epoch": 0.7, + "learning_rate": 0.000728458677311462, + "loss": 2.0197, + "step": 3770 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007271637339728667, + "loss": 2.0016, + "step": 3780 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007258668677560019, + "loss": 1.9721, + "step": 3790 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007245680896384818, + "loss": 1.9591, + "step": 3800 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007232674106141048, + "loss": 1.9762, + "step": 3810 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007219648416927592, + "loss": 2.0026, + "step": 3820 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007206603939003314, + "loss": 1.9876, + "step": 3830 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007193540782786117, + "loss": 1.9991, + "step": 3840 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007180459058852011, + "loss": 1.9897, + "step": 3850 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007167358877934176, + "loss": 2.0581, + "step": 3860 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007154240350922025, + "loss": 1.9588, + "step": 3870 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007141103588860265, + "loss": 2.0151, + "step": 3880 + }, + { + "epoch": 0.72, + "learning_rate": 0.000712794870294796, + "loss": 1.9494, + "step": 3890 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007114775804537586, + "loss": 1.9936, + "step": 3900 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007101585005134088, + "loss": 2.0016, + "step": 3910 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007088376416393944, + "loss": 1.9628, + "step": 3920 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007075150150124208, + "loss": 1.9955, + "step": 3930 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007061906318281568, + "loss": 1.9731, + "step": 3940 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007048645032971407, + "loss": 1.9554, + "step": 3950 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007035366406446839, + "loss": 1.985, + "step": 3960 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007022070551107774, + "loss": 1.9961, + "step": 3970 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007008757579499954, + "loss": 2.0112, + "step": 3980 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006995427604314004, + "loss": 2.0086, + "step": 3990 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006982080738384487, + "loss": 2.019, + "step": 4000 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006968717094688933, + "loss": 1.9983, + "step": 4010 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006955336786346898, + "loss": 1.981, + "step": 4020 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006941939926618997, + "loss": 1.9878, + "step": 4030 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006928526628905942, + "loss": 2.0067, + "step": 4040 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006915097006747601, + "loss": 2.035, + "step": 4050 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006901651173822013, + "loss": 1.9614, + "step": 4060 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006888189243944439, + "loss": 1.9655, + "step": 4070 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006874711331066401, + "loss": 1.9692, + "step": 4080 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006861217549274705, + "loss": 1.9791, + "step": 4090 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006847708012790492, + "loss": 1.9804, + "step": 4100 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006834182835968253, + "loss": 1.9973, + "step": 4110 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006820642133294876, + "loss": 2.0153, + "step": 4120 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006807086019388669, + "loss": 1.9639, + "step": 4130 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006793514608998393, + "loss": 2.0162, + "step": 4140 + }, + { + "epoch": 0.77, + "learning_rate": 0.000677992801700229, + "loss": 1.994, + "step": 4150 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006766326358407104, + "loss": 1.9992, + "step": 4160 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006752709748347125, + "loss": 1.976, + "step": 4170 + }, + { + "epoch": 0.77, + "learning_rate": 0.000673907830208319, + "loss": 1.9452, + "step": 4180 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006725432135001732, + "loss": 1.9982, + "step": 4190 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006711771362613785, + "loss": 1.9766, + "step": 4200 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006698096100554014, + "loss": 1.9838, + "step": 4210 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006684406464579735, + "loss": 1.9746, + "step": 4220 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006670702570569937, + "loss": 1.9838, + "step": 4230 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006656984534524296, + "loss": 1.9747, + "step": 4240 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006643252472562201, + "loss": 1.9896, + "step": 4250 + }, + { + "epoch": 0.79, + "learning_rate": 0.000662950650092176, + "loss": 1.9607, + "step": 4260 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006615746735958832, + "loss": 2.0075, + "step": 4270 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006603351250463683, + "loss": 1.9918, + "step": 4280 + }, + { + "epoch": 0.79, + "learning_rate": 0.000658956559916577, + "loss": 1.9669, + "step": 4290 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006575766492634068, + "loss": 1.9645, + "step": 4300 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006561954047674206, + "loss": 1.9511, + "step": 4310 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006548128381204714, + "loss": 1.9934, + "step": 4320 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006534289610256039, + "loss": 1.9973, + "step": 4330 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006520437851969557, + "loss": 1.9983, + "step": 4340 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006506573223596575, + "loss": 1.9906, + "step": 4350 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006492695842497347, + "loss": 1.9392, + "step": 4360 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006478805826140066, + "loss": 2.0015, + "step": 4370 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006464903292099886, + "loss": 2.0168, + "step": 4380 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006450988358057919, + "loss": 1.9676, + "step": 4390 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006437061141800238, + "loss": 1.9798, + "step": 4400 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006423121761216881, + "loss": 1.9753, + "step": 4410 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006409170334300858, + "loss": 1.9965, + "step": 4420 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006395206979147141, + "loss": 1.9532, + "step": 4430 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006381231813951678, + "loss": 1.9962, + "step": 4440 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006367244957010379, + "loss": 1.9758, + "step": 4450 + }, + { + "epoch": 0.83, + "learning_rate": 0.000635324652671813, + "loss": 1.9606, + "step": 4460 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006339236641567774, + "loss": 1.9785, + "step": 4470 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006325215420149119, + "loss": 1.9334, + "step": 4480 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006311182981147935, + "loss": 1.9829, + "step": 4490 + }, + { + "epoch": 0.83, + "learning_rate": 0.000629713944334494, + "loss": 1.9671, + "step": 4500 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006283084925614805, + "loss": 2.0108, + "step": 4510 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006269019546925139, + "loss": 1.9341, + "step": 4520 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006254943426335488, + "loss": 1.9378, + "step": 4530 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006240856682996326, + "loss": 1.9619, + "step": 4540 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006226759436148044, + "loss": 1.9516, + "step": 4550 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006212651805119946, + "loss": 1.9882, + "step": 4560 + }, + { + "epoch": 0.85, + "learning_rate": 0.000619853390932923, + "loss": 1.9636, + "step": 4570 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006184405868279985, + "loss": 1.9894, + "step": 4580 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006170267801562176, + "loss": 1.9365, + "step": 4590 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006156119828850633, + "loss": 2.0264, + "step": 4600 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006141962069904041, + "loss": 1.9659, + "step": 4610 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006127794644563915, + "loss": 1.9368, + "step": 4620 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006113617672753598, + "loss": 1.959, + "step": 4630 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006099431274477245, + "loss": 1.9832, + "step": 4640 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006085235569818795, + "loss": 1.9572, + "step": 4650 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006071030678940969, + "loss": 1.99, + "step": 4660 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006056816722084248, + "loss": 1.9963, + "step": 4670 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006042593819565846, + "loss": 1.9997, + "step": 4680 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006028362091778706, + "loss": 1.9221, + "step": 4690 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006014121659190476, + "loss": 1.9623, + "step": 4700 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005999872642342484, + "loss": 1.9949, + "step": 4710 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005985615161848721, + "loss": 1.9688, + "step": 4720 + }, + { + "epoch": 0.88, + "learning_rate": 0.000597134933839482, + "loss": 1.975, + "step": 4730 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005957075292737042, + "loss": 2.0048, + "step": 4740 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005942793145701235, + "loss": 1.9591, + "step": 4750 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005928503018181833, + "loss": 1.9957, + "step": 4760 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005914205031140819, + "loss": 1.9823, + "step": 4770 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005899899305606703, + "loss": 2.0032, + "step": 4780 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005885585962673501, + "loss": 1.9722, + "step": 4790 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005871265123499708, + "loss": 1.9903, + "step": 4800 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005856936909307273, + "loss": 2.0258, + "step": 4810 + }, + { + "epoch": 0.89, + "learning_rate": 0.000584260144138057, + "loss": 2.0444, + "step": 4820 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005828258841065377, + "loss": 1.968, + "step": 4830 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005813909229767846, + "loss": 1.9598, + "step": 4840 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005799552728953472, + "loss": 2.0047, + "step": 4850 + }, + { + "epoch": 0.9, + "learning_rate": 0.000578518946014607, + "loss": 1.939, + "step": 4860 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005770819544926741, + "loss": 1.9835, + "step": 4870 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005756443104932852, + "loss": 2.028, + "step": 4880 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005742060261856996, + "loss": 1.973, + "step": 4890 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005727671137445967, + "loss": 1.9734, + "step": 4900 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005713275853499729, + "loss": 1.9921, + "step": 4910 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005698874531870386, + "loss": 1.9607, + "step": 4920 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005684467294461146, + "loss": 1.9468, + "step": 4930 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005670054263225297, + "loss": 1.9524, + "step": 4940 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005655635560165166, + "loss": 1.9737, + "step": 4950 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005641211307331093, + "loss": 1.9532, + "step": 4960 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005626781626820395, + "loss": 2.0048, + "step": 4970 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005612346640776331, + "loss": 2.0276, + "step": 4980 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005597906471387074, + "loss": 1.9476, + "step": 4990 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005583461240884666, + "loss": 1.943, + "step": 5000 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005569011071543997, + "loss": 1.9859, + "step": 5010 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005554556085681757, + "loss": 1.9607, + "step": 5020 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005540096405655409, + "loss": 1.9825, + "step": 5030 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005525632153862152, + "loss": 1.9875, + "step": 5040 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005511163452737884, + "loss": 2.0051, + "step": 5050 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005496690424756164, + "loss": 2.0089, + "step": 5060 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005482213192427174, + "loss": 1.9495, + "step": 5070 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005467731878296688, + "loss": 1.9701, + "step": 5080 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005453246604945034, + "loss": 1.9588, + "step": 5090 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005438757494986044, + "loss": 1.9833, + "step": 5100 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005424264671066038, + "loss": 1.9974, + "step": 5110 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005409768255862766, + "loss": 1.9746, + "step": 5120 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005395268372084378, + "loss": 1.9757, + "step": 5130 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005380765142468387, + "loss": 1.9908, + "step": 5140 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005366258689780625, + "loss": 2.006, + "step": 5150 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005351749136814208, + "loss": 1.9957, + "step": 5160 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005337236606388495, + "loss": 1.959, + "step": 5170 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005322721221348047, + "loss": 2.0027, + "step": 5180 + }, + { + "epoch": 0.96, + "learning_rate": 0.000530820310456159, + "loss": 1.9248, + "step": 5190 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005293682378920974, + "loss": 1.9742, + "step": 5200 + }, + { + "epoch": 0.96, + "learning_rate": 0.000527915916734013, + "loss": 1.9844, + "step": 5210 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005264633592754035, + "loss": 1.9985, + "step": 5220 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005250105778117661, + "loss": 2.0074, + "step": 5230 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005235575846404952, + "loss": 1.9901, + "step": 5240 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005221043920607763, + "loss": 1.9861, + "step": 5250 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005206510123734837, + "loss": 1.9576, + "step": 5260 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005191974578810746, + "loss": 1.9741, + "step": 5270 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005177437408874868, + "loss": 1.9794, + "step": 5280 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005162898736980327, + "loss": 1.9883, + "step": 5290 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005148358686192967, + "loss": 1.969, + "step": 5300 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005133817379590302, + "loss": 2.0018, + "step": 5310 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005119274940260476, + "loss": 1.971, + "step": 5320 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005104731491301225, + "loss": 1.9564, + "step": 5330 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005090187155818823, + "loss": 1.9798, + "step": 5340 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005075642056927057, + "loss": 2.0331, + "step": 5350 + }, + { + "epoch": 0.99, + "learning_rate": 0.000506109631774617, + "loss": 1.9505, + "step": 5360 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005046550061401825, + "loss": 1.9348, + "step": 5370 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005032003411024067, + "loss": 2.0099, + "step": 5380 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005017456489746275, + "loss": 1.9756, + "step": 5390 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005002909420704116, + "loss": 1.9444, + "step": 5400 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004988362327034516, + "loss": 1.976, + "step": 5410 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004973815331874603, + "loss": 1.9593, + "step": 5420 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004959268558360675, + "loss": 1.9251, + "step": 5430 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004944722129627151, + "loss": 1.972, + "step": 5440 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004930176168805531, + "loss": 1.9307, + "step": 5450 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004915630799023359, + "loss": 1.9541, + "step": 5460 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004901086143403172, + "loss": 1.9212, + "step": 5470 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004886542325061464, + "loss": 1.965, + "step": 5480 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004871999467107639, + "loss": 2.0083, + "step": 5490 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004857457692642974, + "loss": 1.9676, + "step": 5500 + }, + { + "epoch": 1.02, + "learning_rate": 0.000484291712475957, + "loss": 1.9384, + "step": 5510 + }, + { + "epoch": 1.02, + "learning_rate": 0.00048283778865393243, + "loss": 1.9339, + "step": 5520 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004813840101052869, + "loss": 2.0182, + "step": 5530 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004799303891358545, + "loss": 1.9262, + "step": 5540 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004784769380501352, + "loss": 1.9397, + "step": 5550 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004770236691511908, + "loss": 1.9404, + "step": 5560 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004755705947405417, + "loss": 1.9415, + "step": 5570 + }, + { + "epoch": 1.03, + "learning_rate": 0.00047411772711806105, + "loss": 1.9292, + "step": 5580 + }, + { + "epoch": 1.04, + "learning_rate": 0.000472665078581872, + "loss": 1.9487, + "step": 5590 + }, + { + "epoch": 1.04, + "learning_rate": 0.00047121266142824354, + "loss": 1.9435, + "step": 5600 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004697604879514853, + "loss": 1.9145, + "step": 5610 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004683085704438451, + "loss": 1.9975, + "step": 5620 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046685692119540357, + "loss": 1.9696, + "step": 5630 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046540555249397056, + "loss": 1.9598, + "step": 5640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046395447662498117, + "loss": 1.9366, + "step": 5650 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046250370587139206, + "loss": 1.9748, + "step": 5660 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046105325251357695, + "loss": 1.9125, + "step": 5670 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045960312882922306, + "loss": 1.9595, + "step": 5680 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045815334709322665, + "loss": 1.9369, + "step": 5690 + }, + { + "epoch": 1.06, + "learning_rate": 0.0004567039195775899, + "loss": 1.9564, + "step": 5700 + }, + { + "epoch": 1.06, + "learning_rate": 0.000455254858551316, + "loss": 1.9274, + "step": 5710 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045380617628030693, + "loss": 1.9366, + "step": 5720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045235788502725777, + "loss": 1.9446, + "step": 5730 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045090999705155383, + "loss": 1.9236, + "step": 5740 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004494625246091672, + "loss": 1.9397, + "step": 5750 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044801547995255194, + "loss": 1.9849, + "step": 5760 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044656887533054193, + "loss": 1.9367, + "step": 5770 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004451227229882455, + "loss": 1.9451, + "step": 5780 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004436770351669429, + "loss": 1.9578, + "step": 5790 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004422318241039821, + "loss": 1.9095, + "step": 5800 + }, + { + "epoch": 1.08, + "learning_rate": 0.00044078710203267576, + "loss": 1.9337, + "step": 5810 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004393428811821971, + "loss": 1.9904, + "step": 5820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043789917377747695, + "loss": 1.9569, + "step": 5830 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004364559920390996, + "loss": 1.9423, + "step": 5840 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043501334818320004, + "loss": 2.0013, + "step": 5850 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004335712544213597, + "loss": 1.9585, + "step": 5860 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004321297229605044, + "loss": 1.9148, + "step": 5870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00043068876600279964, + "loss": 1.9558, + "step": 5880 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004292483957455482, + "loss": 1.9899, + "step": 5890 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042780862438108655, + "loss": 1.9597, + "step": 5900 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042636946409668123, + "loss": 1.9603, + "step": 5910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042493092707442717, + "loss": 1.9771, + "step": 5920 + }, + { + "epoch": 1.1, + "learning_rate": 0.0004234930254911427, + "loss": 1.9416, + "step": 5930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042205577151826747, + "loss": 1.9417, + "step": 5940 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042061917732175966, + "loss": 1.9636, + "step": 5950 + }, + { + "epoch": 1.1, + "learning_rate": 0.000419183255061992, + "loss": 1.966, + "step": 5960 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004177480168936504, + "loss": 1.9885, + "step": 5970 + }, + { + "epoch": 1.11, + "learning_rate": 0.00041631347496562913, + "loss": 1.9525, + "step": 5980 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004148796414209297, + "loss": 1.9809, + "step": 5990 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004134465283965568, + "loss": 1.8982, + "step": 6000 + }, + { + "epoch": 1.11, + "learning_rate": 0.00041201414802341643, + "loss": 1.8978, + "step": 6010 + }, + { + "epoch": 1.12, + "learning_rate": 0.00041058251242621295, + "loss": 1.9406, + "step": 6020 + }, + { + "epoch": 1.12, + "learning_rate": 0.0004091516337233464, + "loss": 1.919, + "step": 6030 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040772152402680973, + "loss": 1.9897, + "step": 6040 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040629219544208644, + "loss": 1.9473, + "step": 6050 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040486366006804817, + "loss": 1.9589, + "step": 6060 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040343592999685264, + "loss": 1.8972, + "step": 6070 + }, + { + "epoch": 1.13, + "learning_rate": 0.0004020090173138404, + "loss": 1.9611, + "step": 6080 + }, + { + "epoch": 1.13, + "learning_rate": 0.00040058293409743316, + "loss": 1.9164, + "step": 6090 + }, + { + "epoch": 1.13, + "learning_rate": 0.00039915769241903175, + "loss": 1.939, + "step": 6100 + }, + { + "epoch": 1.13, + "learning_rate": 0.0003977333043429129, + "loss": 1.9233, + "step": 6110 + }, + { + "epoch": 1.13, + "learning_rate": 0.0003963097819261288, + "loss": 1.9742, + "step": 6120 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003948871372184033, + "loss": 1.9719, + "step": 6130 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003934653822620309, + "loss": 1.9861, + "step": 6140 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003920445290917747, + "loss": 1.9514, + "step": 6150 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003906245897347643, + "loss": 2.0047, + "step": 6160 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003892055762103943, + "loss": 1.934, + "step": 6170 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003877875005302223, + "loss": 1.9619, + "step": 6180 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038637037469786727, + "loss": 1.9085, + "step": 6190 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038495421070890796, + "loss": 1.9222, + "step": 6200 + }, + { + "epoch": 1.15, + "learning_rate": 0.0003835390205507812, + "loss": 1.9409, + "step": 6210 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038212481620268125, + "loss": 1.9439, + "step": 6220 + }, + { + "epoch": 1.15, + "learning_rate": 0.000380711609635457, + "loss": 1.974, + "step": 6230 + }, + { + "epoch": 1.16, + "learning_rate": 0.000379299412811512, + "loss": 1.9141, + "step": 6240 + }, + { + "epoch": 1.16, + "learning_rate": 0.00037788823768470227, + "loss": 1.8982, + "step": 6250 + }, + { + "epoch": 1.16, + "learning_rate": 0.0003764780962002352, + "loss": 1.9384, + "step": 6260 + }, + { + "epoch": 1.16, + "learning_rate": 0.0003750690002945695, + "loss": 1.9174, + "step": 6270 + }, + { + "epoch": 1.16, + "learning_rate": 0.00037366096189531253, + "loss": 1.927, + "step": 6280 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003722539929211205, + "loss": 1.9449, + "step": 6290 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003708481052815973, + "loss": 2.008, + "step": 6300 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003694433108771933, + "loss": 1.9345, + "step": 6310 + }, + { + "epoch": 1.17, + "learning_rate": 0.00036803962159910543, + "loss": 1.8619, + "step": 6320 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003666370493291757, + "loss": 1.9612, + "step": 6330 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003652356059397909, + "loss": 1.9371, + "step": 6340 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036383530329378225, + "loss": 1.9193, + "step": 6350 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036243615324432494, + "loss": 1.9509, + "step": 6360 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036103816763483775, + "loss": 1.9517, + "step": 6370 + }, + { + "epoch": 1.18, + "learning_rate": 0.00035964135829888287, + "loss": 1.9141, + "step": 6380 + }, + { + "epoch": 1.18, + "learning_rate": 0.00035824573706006547, + "loss": 1.9985, + "step": 6390 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035685131573193386, + "loss": 1.9791, + "step": 6400 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035545810611787925, + "loss": 1.8865, + "step": 6410 + }, + { + "epoch": 1.19, + "learning_rate": 0.0003540661200110367, + "loss": 1.9409, + "step": 6420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035267536919418395, + "loss": 1.9928, + "step": 6430 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035128586543964243, + "loss": 1.9149, + "step": 6440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00034989762050917784, + "loss": 1.9837, + "step": 6450 + }, + { + "epoch": 1.2, + "learning_rate": 0.0003485106461538999, + "loss": 1.9142, + "step": 6460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034712495411416385, + "loss": 1.9284, + "step": 6470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034574055611946984, + "loss": 1.8848, + "step": 6480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034435746388836457, + "loss": 1.9295, + "step": 6490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034297568912834177, + "loss": 1.9635, + "step": 6500 + }, + { + "epoch": 1.21, + "learning_rate": 0.0003415952435357431, + "loss": 1.9794, + "step": 6510 + }, + { + "epoch": 1.21, + "learning_rate": 0.00034021613879565944, + "loss": 1.9347, + "step": 6520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00033883838658183154, + "loss": 1.9282, + "step": 6530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00033746199855655125, + "loss": 1.9973, + "step": 6540 + }, + { + "epoch": 1.21, + "learning_rate": 0.000336086986370563, + "loss": 1.9718, + "step": 6550 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003347133616629652, + "loss": 1.9157, + "step": 6560 + }, + { + "epoch": 1.22, + "learning_rate": 0.00033334113606111194, + "loss": 1.9528, + "step": 6570 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003319703211805135, + "loss": 1.9369, + "step": 6580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00033060092862473967, + "loss": 1.9552, + "step": 6590 + }, + { + "epoch": 1.22, + "learning_rate": 0.00032923296998532003, + "loss": 1.9581, + "step": 6600 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003278664568416465, + "loss": 1.9406, + "step": 6610 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003265014007608758, + "loss": 1.9672, + "step": 6620 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003251378132978304, + "loss": 1.9166, + "step": 6630 + }, + { + "epoch": 1.23, + "learning_rate": 0.00032377570599490164, + "loss": 1.9356, + "step": 6640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00032241509038195165, + "loss": 1.9092, + "step": 6650 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003210559779762157, + "loss": 1.9343, + "step": 6660 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031969838028220513, + "loss": 1.9796, + "step": 6670 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031834230879160947, + "loss": 1.8932, + "step": 6680 + }, + { + "epoch": 1.24, + "learning_rate": 0.0003169877749831993, + "loss": 1.9279, + "step": 6690 + }, + { + "epoch": 1.24, + "learning_rate": 0.000315634790322729, + "loss": 1.9444, + "step": 6700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031428336626284037, + "loss": 1.9296, + "step": 6710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031293351424296467, + "loss": 1.9341, + "step": 6720 + }, + { + "epoch": 1.25, + "learning_rate": 0.00031158524568922663, + "loss": 1.9589, + "step": 6730 + }, + { + "epoch": 1.25, + "learning_rate": 0.00031023857201434703, + "loss": 1.8997, + "step": 6740 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003088935046175466, + "loss": 1.9417, + "step": 6750 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003075500548844492, + "loss": 1.9058, + "step": 6760 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003062082341869862, + "loss": 1.9511, + "step": 6770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00030486805388329894, + "loss": 1.922, + "step": 6780 + }, + { + "epoch": 1.26, + "learning_rate": 0.00030352952531764363, + "loss": 1.9634, + "step": 6790 + }, + { + "epoch": 1.26, + "learning_rate": 0.0003021926598202949, + "loss": 1.9555, + "step": 6800 + }, + { + "epoch": 1.26, + "learning_rate": 0.0003008574687074498, + "loss": 1.9254, + "step": 6810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00029952396328113265, + "loss": 1.9211, + "step": 6820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029819215482909846, + "loss": 1.9504, + "step": 6830 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029686205462473784, + "loss": 1.9174, + "step": 6840 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029553367392698177, + "loss": 1.9368, + "step": 6850 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029420702398020595, + "loss": 1.8939, + "step": 6860 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029288211601413586, + "loss": 1.9097, + "step": 6870 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029155896124375156, + "loss": 1.9885, + "step": 6880 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002902375708691925, + "loss": 1.9752, + "step": 6890 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002889179560756634, + "loss": 1.9321, + "step": 6900 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002876001280333391, + "loss": 1.9345, + "step": 6910 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002862840978972698, + "loss": 1.9192, + "step": 6920 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002849698768072877, + "loss": 1.9499, + "step": 6930 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002836574758879107, + "loss": 1.9217, + "step": 6940 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002823469062482503, + "loss": 1.9318, + "step": 6950 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002810381789819167, + "loss": 1.9422, + "step": 6960 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002797313051669247, + "loss": 1.9562, + "step": 6970 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002784262958656003, + "loss": 1.9189, + "step": 6980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00027712316212448663, + "loss": 1.9453, + "step": 6990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027582191497425114, + "loss": 1.9335, + "step": 7000 + }, + { + "epoch": 1.3, + "learning_rate": 0.000274522565429591, + "loss": 1.9724, + "step": 7010 + }, + { + "epoch": 1.3, + "learning_rate": 0.0002732251244891421, + "loss": 1.9236, + "step": 7020 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027192960313538307, + "loss": 1.9407, + "step": 7030 + }, + { + "epoch": 1.3, + "learning_rate": 0.0002706360123345445, + "loss": 1.8948, + "step": 7040 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026934436303651554, + "loss": 1.9354, + "step": 7050 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026805466617475007, + "loss": 1.955, + "step": 7060 + }, + { + "epoch": 1.31, + "learning_rate": 0.0002667669326661767, + "loss": 1.9595, + "step": 7070 + }, + { + "epoch": 1.31, + "learning_rate": 0.0002654811734111033, + "loss": 1.9766, + "step": 7080 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026419739929312713, + "loss": 1.9626, + "step": 7090 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002629156211790417, + "loss": 1.9096, + "step": 7100 + }, + { + "epoch": 1.32, + "learning_rate": 0.00026163584991874413, + "loss": 1.9522, + "step": 7110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00026035809634514543, + "loss": 1.9387, + "step": 7120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00025908237127407626, + "loss": 1.8788, + "step": 7130 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002578086855041973, + "loss": 1.9326, + "step": 7140 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002565370498169064, + "loss": 1.92, + "step": 7150 + }, + { + "epoch": 1.33, + "learning_rate": 0.0002552674749762487, + "loss": 1.9131, + "step": 7160 + }, + { + "epoch": 1.33, + "learning_rate": 0.0002539999717288246, + "loss": 1.9263, + "step": 7170 + }, + { + "epoch": 1.33, + "learning_rate": 0.00025286099888629365, + "loss": 1.919, + "step": 7180 + }, + { + "epoch": 1.33, + "learning_rate": 0.000251597461210021, + "loss": 1.9281, + "step": 7190 + }, + { + "epoch": 1.33, + "learning_rate": 0.00025033602619263507, + "loss": 1.9831, + "step": 7200 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024907670451183454, + "loss": 1.9535, + "step": 7210 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024781950682742983, + "loss": 1.8798, + "step": 7220 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024656444378125204, + "loss": 1.9124, + "step": 7230 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024531152599706346, + "loss": 1.9472, + "step": 7240 + }, + { + "epoch": 1.34, + "learning_rate": 0.0002440607640804668, + "loss": 1.9697, + "step": 7250 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024281216861881633, + "loss": 1.938, + "step": 7260 + }, + { + "epoch": 1.35, + "learning_rate": 0.00024156575018112787, + "loss": 1.9035, + "step": 7270 + }, + { + "epoch": 1.35, + "learning_rate": 0.00024032151931798918, + "loss": 1.9379, + "step": 7280 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002390794865614711, + "loss": 1.9176, + "step": 7290 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002378396624250375, + "loss": 1.9392, + "step": 7300 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002366020574034576, + "loss": 1.9235, + "step": 7310 + }, + { + "epoch": 1.36, + "learning_rate": 0.00023536668197271588, + "loss": 1.939, + "step": 7320 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002341335465899243, + "loss": 1.889, + "step": 7330 + }, + { + "epoch": 1.36, + "learning_rate": 0.00023290266169323354, + "loss": 1.9247, + "step": 7340 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002316740377017438, + "loss": 1.935, + "step": 7350 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002304476850154183, + "loss": 1.9198, + "step": 7360 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022922361401499325, + "loss": 1.9068, + "step": 7370 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022800183506189238, + "loss": 1.9505, + "step": 7380 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022678235849813645, + "loss": 1.9459, + "step": 7390 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022556519464625807, + "loss": 1.9302, + "step": 7400 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022435035380921321, + "loss": 1.9345, + "step": 7410 + }, + { + "epoch": 1.37, + "learning_rate": 0.0002231378462702935, + "loss": 1.9304, + "step": 7420 + }, + { + "epoch": 1.38, + "learning_rate": 0.00022192768229304107, + "loss": 1.9457, + "step": 7430 + }, + { + "epoch": 1.38, + "learning_rate": 0.0002207198721211593, + "loss": 1.9395, + "step": 7440 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021951442597842785, + "loss": 1.9867, + "step": 7450 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021831135406861558, + "loss": 1.9217, + "step": 7460 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021711066657539342, + "loss": 1.991, + "step": 7470 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021591237366225008, + "loss": 1.9492, + "step": 7480 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021471648547240365, + "loss": 1.9376, + "step": 7490 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021352301212871762, + "loss": 1.9436, + "step": 7500 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021233196373361397, + "loss": 1.9267, + "step": 7510 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021114335036898852, + "loss": 1.9483, + "step": 7520 + }, + { + "epoch": 1.39, + "learning_rate": 0.0002099571820961252, + "loss": 1.9485, + "step": 7530 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020877346895561082, + "loss": 1.9607, + "step": 7540 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020759222096725034, + "loss": 1.9665, + "step": 7550 + }, + { + "epoch": 1.4, + "learning_rate": 0.0002064134481299814, + "loss": 1.9202, + "step": 7560 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020523716042179075, + "loss": 1.9375, + "step": 7570 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020406336779962888, + "loss": 1.9406, + "step": 7580 + }, + { + "epoch": 1.41, + "learning_rate": 0.00020289208019932635, + "loss": 1.9357, + "step": 7590 + }, + { + "epoch": 1.41, + "learning_rate": 0.0002017233075355089, + "loss": 1.9432, + "step": 7600 + }, + { + "epoch": 1.41, + "learning_rate": 0.0002005570597015145, + "loss": 1.962, + "step": 7610 + }, + { + "epoch": 1.41, + "learning_rate": 0.00019939334656930892, + "loss": 1.9237, + "step": 7620 + }, + { + "epoch": 1.41, + "learning_rate": 0.00019823217798940247, + "loss": 1.9688, + "step": 7630 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019707356379076668, + "loss": 1.9524, + "step": 7640 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019591751378075035, + "loss": 1.981, + "step": 7650 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019476403774499774, + "loss": 1.9405, + "step": 7660 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001936131454473649, + "loss": 1.9, + "step": 7670 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019246484662983733, + "loss": 1.8852, + "step": 7680 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019131915101244752, + "loss": 1.9447, + "step": 7690 + }, + { + "epoch": 1.43, + "learning_rate": 0.00019017606829319205, + "loss": 1.9221, + "step": 7700 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018903560814795086, + "loss": 1.9481, + "step": 7710 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018789778023040355, + "loss": 1.8919, + "step": 7720 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001867625941719499, + "loss": 1.94, + "step": 7730 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018563005958162587, + "loss": 1.9089, + "step": 7740 + }, + { + "epoch": 1.44, + "learning_rate": 0.00018450018604602414, + "loss": 1.9105, + "step": 7750 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001833729831292123, + "loss": 1.9568, + "step": 7760 + }, + { + "epoch": 1.44, + "learning_rate": 0.00018224846037265125, + "loss": 1.9156, + "step": 7770 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001811266272951162, + "loss": 1.9445, + "step": 7780 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001800074933926138, + "loss": 1.8871, + "step": 7790 + }, + { + "epoch": 1.44, + "learning_rate": 0.00017889106813830363, + "loss": 1.9684, + "step": 7800 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001777773609824173, + "loss": 1.9411, + "step": 7810 + }, + { + "epoch": 1.45, + "learning_rate": 0.00017666638135217783, + "loss": 1.9295, + "step": 7820 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001755581386517216, + "loss": 1.9499, + "step": 7830 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001744526422620165, + "loss": 1.9499, + "step": 7840 + }, + { + "epoch": 1.45, + "learning_rate": 0.00017334990154078446, + "loss": 1.9262, + "step": 7850 + }, + { + "epoch": 1.46, + "learning_rate": 0.00017224992582242076, + "loss": 1.9554, + "step": 7860 + }, + { + "epoch": 1.46, + "learning_rate": 0.00017115272441791635, + "loss": 1.9685, + "step": 7870 + }, + { + "epoch": 1.46, + "learning_rate": 0.000170058306614778, + "loss": 1.9021, + "step": 7880 + }, + { + "epoch": 1.46, + "learning_rate": 0.00016896668167695018, + "loss": 1.8804, + "step": 7890 + }, + { + "epoch": 1.46, + "learning_rate": 0.00016787785884473665, + "loss": 1.9164, + "step": 7900 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016679184733472163, + "loss": 1.9409, + "step": 7910 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016570865633969283, + "loss": 1.9329, + "step": 7920 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016462829502856286, + "loss": 1.9518, + "step": 7930 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016355077254629196, + "loss": 1.9494, + "step": 7940 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016247609801381003, + "loss": 1.9376, + "step": 7950 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016140428052794042, + "loss": 1.9312, + "step": 7960 + }, + { + "epoch": 1.48, + "learning_rate": 0.00016033532916132203, + "loss": 1.9528, + "step": 7970 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015926925296233296, + "loss": 1.9698, + "step": 7980 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015820606095501405, + "loss": 1.936, + "step": 7990 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015714576213899167, + "loss": 1.962, + "step": 8000 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015608836548940252, + "loss": 1.9439, + "step": 8010 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015503387995681732, + "loss": 1.9274, + "step": 8020 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001539823144671648, + "loss": 1.9029, + "step": 8030 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015293367792165664, + "loss": 1.928, + "step": 8040 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015188797919671115, + "loss": 1.9405, + "step": 8050 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015084522714387967, + "loss": 1.909, + "step": 8060 + }, + { + "epoch": 1.49, + "learning_rate": 0.00014980543058976977, + "loss": 1.9286, + "step": 8070 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014876859833597278, + "loss": 1.9358, + "step": 8080 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014773473915898695, + "loss": 1.9073, + "step": 8090 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014670386181014477, + "loss": 1.9044, + "step": 8100 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014567597501553847, + "loss": 1.9133, + "step": 8110 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001446510874759454, + "loss": 1.9583, + "step": 8120 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014362920786675616, + "loss": 1.9381, + "step": 8130 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014261034483789892, + "loss": 1.951, + "step": 8140 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014159450701376803, + "loss": 1.9806, + "step": 8150 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014058170299315027, + "loss": 1.9101, + "step": 8160 + }, + { + "epoch": 1.51, + "learning_rate": 0.00013957194134915147, + "loss": 1.9122, + "step": 8170 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013856523062912569, + "loss": 1.91, + "step": 8180 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001375615793546006, + "loss": 1.9182, + "step": 8190 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013656099602120752, + "loss": 1.9312, + "step": 8200 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013556348909860762, + "loss": 1.9327, + "step": 8210 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013456906703042165, + "loss": 1.9184, + "step": 8220 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013357773823415782, + "loss": 1.8876, + "step": 8230 + }, + { + "epoch": 1.53, + "learning_rate": 0.00013258951110114054, + "loss": 1.927, + "step": 8240 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001316043939964398, + "loss": 1.9525, + "step": 8250 + }, + { + "epoch": 1.53, + "learning_rate": 0.00013062239525879943, + "loss": 1.8933, + "step": 8260 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001296435232005677, + "loss": 1.9433, + "step": 8270 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001286677861076263, + "loss": 1.9306, + "step": 8280 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012769519223932034, + "loss": 1.8962, + "step": 8290 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012672574982838802, + "loss": 1.9322, + "step": 8300 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012575946708089176, + "loss": 1.9191, + "step": 8310 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001247963521761481, + "loss": 1.9308, + "step": 8320 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012383641326665874, + "loss": 1.8876, + "step": 8330 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012287965847804162, + "loss": 1.9103, + "step": 8340 + }, + { + "epoch": 1.55, + "learning_rate": 0.00012192609590896142, + "loss": 1.8804, + "step": 8350 + }, + { + "epoch": 1.55, + "learning_rate": 0.00012097573363106218, + "loss": 1.944, + "step": 8360 + }, + { + "epoch": 1.55, + "learning_rate": 0.00012002857968889797, + "loss": 1.9259, + "step": 8370 + }, + { + "epoch": 1.55, + "learning_rate": 0.00011908464209986541, + "loss": 1.9421, + "step": 8380 + }, + { + "epoch": 1.55, + "learning_rate": 0.00011814392885413567, + "loss": 1.9251, + "step": 8390 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011720644791458623, + "loss": 1.9106, + "step": 8400 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011627220721673459, + "loss": 1.8928, + "step": 8410 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011534121466866986, + "loss": 1.9323, + "step": 8420 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011441347815098735, + "loss": 1.9238, + "step": 8430 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001134890055167201, + "loss": 1.9831, + "step": 8440 + }, + { + "epoch": 1.57, + "learning_rate": 0.00011256780459127374, + "loss": 1.85, + "step": 8450 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001116498831723598, + "loss": 1.9391, + "step": 8460 + }, + { + "epoch": 1.57, + "learning_rate": 0.00011073524902992921, + "loss": 1.9071, + "step": 8470 + }, + { + "epoch": 1.57, + "learning_rate": 0.00010982390990610791, + "loss": 1.9538, + "step": 8480 + }, + { + "epoch": 1.57, + "learning_rate": 0.00010891587351512949, + "loss": 1.8972, + "step": 8490 + }, + { + "epoch": 1.57, + "learning_rate": 0.00010801114754327135, + "loss": 1.9184, + "step": 8500 + }, + { + "epoch": 1.58, + "learning_rate": 0.00010710973964878906, + "loss": 1.9567, + "step": 8510 + }, + { + "epoch": 1.58, + "learning_rate": 0.00010621165746185113, + "loss": 1.9755, + "step": 8520 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001053169085844758, + "loss": 1.9256, + "step": 8530 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001044255005904648, + "loss": 1.9742, + "step": 8540 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001035374410253408, + "loss": 1.9562, + "step": 8550 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001026527374062825, + "loss": 1.9432, + "step": 8560 + }, + { + "epoch": 1.59, + "learning_rate": 0.00010177139722206191, + "loss": 1.9007, + "step": 8570 + }, + { + "epoch": 1.59, + "learning_rate": 0.00010089342793298028, + "loss": 1.9834, + "step": 8580 + }, + { + "epoch": 1.59, + "learning_rate": 0.00010001883697080504, + "loss": 1.9063, + "step": 8590 + }, + { + "epoch": 1.59, + "learning_rate": 9.914763173870738e-05, + "loss": 1.9063, + "step": 8600 + }, + { + "epoch": 1.59, + "learning_rate": 9.827981961119869e-05, + "loss": 1.9149, + "step": 8610 + }, + { + "epoch": 1.6, + "learning_rate": 9.741540793406911e-05, + "loss": 1.9096, + "step": 8620 + }, + { + "epoch": 1.6, + "learning_rate": 9.655440402432464e-05, + "loss": 1.8657, + "step": 8630 + }, + { + "epoch": 1.6, + "learning_rate": 9.569681517012585e-05, + "loss": 1.9237, + "step": 8640 + }, + { + "epoch": 1.6, + "learning_rate": 9.484264863072523e-05, + "loss": 1.9739, + "step": 8650 + }, + { + "epoch": 1.6, + "learning_rate": 9.399191163640675e-05, + "loss": 1.9199, + "step": 8660 + }, + { + "epoch": 1.61, + "learning_rate": 9.314461138842406e-05, + "loss": 1.9639, + "step": 8670 + }, + { + "epoch": 1.61, + "learning_rate": 9.230075505893987e-05, + "loss": 1.9391, + "step": 8680 + }, + { + "epoch": 1.61, + "learning_rate": 9.146034979096496e-05, + "loss": 1.9326, + "step": 8690 + }, + { + "epoch": 1.61, + "learning_rate": 9.06234026982976e-05, + "loss": 1.9501, + "step": 8700 + }, + { + "epoch": 1.61, + "learning_rate": 8.9789920865464e-05, + "loss": 1.9041, + "step": 8710 + }, + { + "epoch": 1.62, + "learning_rate": 8.895991134765758e-05, + "loss": 1.931, + "step": 8720 + }, + { + "epoch": 1.62, + "learning_rate": 8.813338117067965e-05, + "loss": 1.9589, + "step": 8730 + }, + { + "epoch": 1.62, + "learning_rate": 8.731033733088012e-05, + "loss": 1.9226, + "step": 8740 + }, + { + "epoch": 1.62, + "learning_rate": 8.649078679509742e-05, + "loss": 1.911, + "step": 8750 + }, + { + "epoch": 1.62, + "learning_rate": 8.567473650060082e-05, + "loss": 1.9641, + "step": 8760 + }, + { + "epoch": 1.62, + "learning_rate": 8.486219335503026e-05, + "loss": 1.8924, + "step": 8770 + }, + { + "epoch": 1.63, + "learning_rate": 8.405316423633958e-05, + "loss": 1.9583, + "step": 8780 + }, + { + "epoch": 1.63, + "learning_rate": 8.324765599273649e-05, + "loss": 1.9399, + "step": 8790 + }, + { + "epoch": 1.63, + "learning_rate": 8.244567544262588e-05, + "loss": 1.9362, + "step": 8800 + }, + { + "epoch": 1.63, + "learning_rate": 8.164722937455177e-05, + "loss": 1.9283, + "step": 8810 + }, + { + "epoch": 1.63, + "learning_rate": 8.08523245471392e-05, + "loss": 1.9588, + "step": 8820 + }, + { + "epoch": 1.64, + "learning_rate": 8.006096768903848e-05, + "loss": 1.9126, + "step": 8830 + }, + { + "epoch": 1.64, + "learning_rate": 7.927316549886659e-05, + "loss": 1.9331, + "step": 8840 + }, + { + "epoch": 1.64, + "learning_rate": 7.84889246451515e-05, + "loss": 1.8967, + "step": 8850 + }, + { + "epoch": 1.64, + "learning_rate": 7.77082517662756e-05, + "loss": 1.927, + "step": 8860 + }, + { + "epoch": 1.64, + "learning_rate": 7.693115347041884e-05, + "loss": 1.8978, + "step": 8870 + }, + { + "epoch": 1.64, + "learning_rate": 7.615763633550421e-05, + "loss": 1.9142, + "step": 8880 + }, + { + "epoch": 1.65, + "learning_rate": 7.538770690914015e-05, + "loss": 1.9001, + "step": 8890 + }, + { + "epoch": 1.65, + "learning_rate": 7.462137170856698e-05, + "loss": 1.8979, + "step": 8900 + }, + { + "epoch": 1.65, + "learning_rate": 7.385863722060022e-05, + "loss": 1.892, + "step": 8910 + }, + { + "epoch": 1.65, + "learning_rate": 7.309950990157677e-05, + "loss": 1.9496, + "step": 8920 + }, + { + "epoch": 1.65, + "learning_rate": 7.234399617729976e-05, + "loss": 1.8879, + "step": 8930 + }, + { + "epoch": 1.66, + "learning_rate": 7.159210244298414e-05, + "loss": 1.921, + "step": 8940 + }, + { + "epoch": 1.66, + "learning_rate": 7.084383506320291e-05, + "loss": 1.9408, + "step": 8950 + }, + { + "epoch": 1.66, + "learning_rate": 7.009920037183248e-05, + "loss": 1.9258, + "step": 8960 + }, + { + "epoch": 1.66, + "learning_rate": 6.935820467200005e-05, + "loss": 1.9182, + "step": 8970 + }, + { + "epoch": 1.66, + "learning_rate": 6.862085423602955e-05, + "loss": 1.9668, + "step": 8980 + }, + { + "epoch": 1.67, + "learning_rate": 6.78871553053888e-05, + "loss": 1.898, + "step": 8990 + }, + { + "epoch": 1.67, + "learning_rate": 6.715711409063652e-05, + "loss": 1.9261, + "step": 9000 + } + ], + "max_steps": 10798, + "num_train_epochs": 2, + "total_flos": 8.540413167031812e+18, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-9000/training_args.bin b/checkpoint-9000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b097aab2293da043bc99abba38a0ed7c4525140a --- /dev/null +++ b/checkpoint-9000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8813832b030b0a678cb3ad0abd28db5000bdb8bb1708e45ba10cfda908fcc38 +size 3305 diff --git a/finetuning_args.json b/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f28e18016479196fd772d484c058dd17ca8c6a --- /dev/null +++ b/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "query_key_value" + ], + "name_module_trainable": "mlp", + "num_layer_trainable": 3, + "pre_seq_len": 64, + "prefix_projection": false +} diff --git a/train_results.json b/train_results.json new file mode 100644 index 0000000000000000000000000000000000000000..3b709b03c3ec85d406b36c7012506ade625a1842 --- /dev/null +++ b/train_results.json @@ -0,0 +1,7 @@ +{ + "epoch": 2.0, + "train_loss": 1.978195481530868, + "train_runtime": 26343.521, + "train_samples_per_second": 26.232, + "train_steps_per_second": 0.41 +} \ No newline at end of file diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5b97afaca6ef8fb626d3849d22c8122bdfc869bb --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,4316 @@ +{"current_steps": 10, "total_steps": 10798, "loss": 2.9794, "reward": null, "learning_rate": 0.0009999978838190456, "epoch": 0.0, "percentage": 0.09, "elapsed_time": "0:00:29", "remaining_time": "8:50:13"} +{"current_steps": 10, "total_steps": 10798, "loss": 2.9794, "reward": null, "learning_rate": 0.0009999978838190456, "epoch": 0.0, "percentage": 0.09, "elapsed_time": "0:06:32", "remaining_time": "4 days, 21:40:56"} +{"current_steps": 10, "total_steps": 10798, "loss": 2.9794, "reward": null, "learning_rate": 0.0009999978838190456, "epoch": 0.0, "percentage": 0.09, "elapsed_time": "0:00:27", "remaining_time": "8:21:27"} +{"current_steps": 10, "total_steps": 10798, "loss": 2.9794, "reward": null, "learning_rate": 0.0009999978838190456, "epoch": 0.0, "percentage": 0.09, "elapsed_time": "0:00:31", "remaining_time": "9:21:41"} +{"current_steps": 20, "total_steps": 10798, "loss": 2.3885, "reward": null, "learning_rate": 0.0009999915352940948, "epoch": 0.0, "percentage": 0.19, "elapsed_time": "0:00:54", "remaining_time": "8:06:36"} +{"current_steps": 20, "total_steps": 10798, "loss": 2.3885, "reward": null, "learning_rate": 0.0009999915352940948, "epoch": 0.0, "percentage": 0.19, "elapsed_time": "0:00:52", "remaining_time": "7:50:53"} +{"current_steps": 20, "total_steps": 10798, "loss": 2.3885, "reward": null, "learning_rate": 0.0009999915352940948, "epoch": 0.0, "percentage": 0.19, "elapsed_time": "0:00:50", "remaining_time": "7:36:31"} +{"current_steps": 20, "total_steps": 10798, "loss": 2.3885, "reward": null, "learning_rate": 0.0009999915352940948, "epoch": 0.0, "percentage": 0.19, "elapsed_time": "0:06:55", "remaining_time": "2 days, 14:13:13"} +{"current_steps": 30, "total_steps": 10798, "loss": 2.3057, "reward": null, "learning_rate": 0.000999980954478887, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:07:18", "remaining_time": "1 day, 19:40:30"} +{"current_steps": 30, "total_steps": 10798, "loss": 2.3057, "reward": null, "learning_rate": 0.000999980954478887, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:01:14", "remaining_time": "7:27:38"} +{"current_steps": 30, "total_steps": 10798, "loss": 2.3057, "reward": null, "learning_rate": 0.000999980954478887, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:01:16", "remaining_time": "7:38:06"} +{"current_steps": 30, "total_steps": 10798, "loss": 2.3057, "reward": null, "learning_rate": 0.000999980954478887, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:01:13", "remaining_time": "7:18:03"} +{"current_steps": 40, "total_steps": 10798, "loss": 2.2692, "reward": null, "learning_rate": 0.000999966141462985, "epoch": 0.01, "percentage": 0.37, "elapsed_time": "0:07:41", "remaining_time": "1 day, 10:29:18"} +{"current_steps": 40, "total_steps": 10798, "loss": 2.2692, "reward": null, "learning_rate": 0.000999966141462985, "epoch": 0.01, "percentage": 0.37, "elapsed_time": "0:01:40", "remaining_time": "7:29:01"} +{"current_steps": 40, "total_steps": 10798, "loss": 2.2692, "reward": null, "learning_rate": 0.000999966141462985, "epoch": 0.01, "percentage": 0.37, "elapsed_time": "0:01:38", "remaining_time": "7:21:10"} +{"current_steps": 40, "total_steps": 10798, "loss": 2.2692, "reward": null, "learning_rate": 0.000999966141462985, "epoch": 0.01, "percentage": 0.37, "elapsed_time": "0:01:36", "remaining_time": "7:14:00"} +{"current_steps": 50, "total_steps": 10798, "loss": 2.2576, "reward": null, "learning_rate": 0.000999947096371777, "epoch": 0.01, "percentage": 0.46, "elapsed_time": "0:08:03", "remaining_time": "1 day, 4:51:58"} +{"current_steps": 50, "total_steps": 10798, "loss": 2.2576, "reward": null, "learning_rate": 0.000999947096371777, "epoch": 0.01, "percentage": 0.46, "elapsed_time": "0:02:01", "remaining_time": "7:16:57"} +{"current_steps": 50, "total_steps": 10798, "loss": 2.2576, "reward": null, "learning_rate": 0.000999947096371777, "epoch": 0.01, "percentage": 0.46, "elapsed_time": "0:02:00", "remaining_time": "7:10:40"} +{"current_steps": 50, "total_steps": 10798, "loss": 2.2576, "reward": null, "learning_rate": 0.000999947096371777, "epoch": 0.01, "percentage": 0.46, "elapsed_time": "0:01:58", "remaining_time": "7:04:57"} +{"current_steps": 60, "total_steps": 10798, "loss": 2.2388, "reward": null, "learning_rate": 0.0009999238193664748, "epoch": 0.01, "percentage": 0.56, "elapsed_time": "0:02:23", "remaining_time": "7:08:40"} +{"current_steps": 60, "total_steps": 10798, "loss": 2.2388, "reward": null, "learning_rate": 0.0009999238193664748, "epoch": 0.01, "percentage": 0.56, "elapsed_time": "0:08:26", "remaining_time": "1 day, 1:12:04"} +{"current_steps": 60, "total_steps": 10798, "loss": 2.2388, "reward": null, "learning_rate": 0.0009999238193664748, "epoch": 0.01, "percentage": 0.56, "elapsed_time": "0:02:22", "remaining_time": "7:03:54"} +{"current_steps": 60, "total_steps": 10798, "loss": 2.2388, "reward": null, "learning_rate": 0.0009999238193664748, "epoch": 0.01, "percentage": 0.56, "elapsed_time": "0:02:25", "remaining_time": "7:13:53"} +{"current_steps": 70, "total_steps": 10798, "loss": 2.2523, "reward": null, "learning_rate": 0.0009998963106441117, "epoch": 0.01, "percentage": 0.65, "elapsed_time": "0:02:46", "remaining_time": "7:06:33"} +{"current_steps": 70, "total_steps": 10798, "loss": 2.2523, "reward": null, "learning_rate": 0.0009998963106441117, "epoch": 0.01, "percentage": 0.65, "elapsed_time": "0:08:50", "remaining_time": "22:34:19"} +{"current_steps": 70, "total_steps": 10798, "loss": 2.2523, "reward": null, "learning_rate": 0.0009998963106441117, "epoch": 0.01, "percentage": 0.65, "elapsed_time": "0:02:48", "remaining_time": "7:11:01"} +{"current_steps": 70, "total_steps": 10798, "loss": 2.2523, "reward": null, "learning_rate": 0.0009998963106441117, "epoch": 0.01, "percentage": 0.65, "elapsed_time": "0:02:45", "remaining_time": "7:02:28"} +{"current_steps": 80, "total_steps": 10798, "loss": 2.218, "reward": null, "learning_rate": 0.0009998645704375414, "epoch": 0.01, "percentage": 0.74, "elapsed_time": "0:09:14", "remaining_time": "20:38:36"} +{"current_steps": 80, "total_steps": 10798, "loss": 2.218, "reward": null, "learning_rate": 0.0009998645704375414, "epoch": 0.01, "percentage": 0.74, "elapsed_time": "0:03:11", "remaining_time": "7:07:34"} +{"current_steps": 80, "total_steps": 10798, "loss": 2.218, "reward": null, "learning_rate": 0.0009998645704375414, "epoch": 0.01, "percentage": 0.74, "elapsed_time": "0:03:09", "remaining_time": "7:03:59"} +{"current_steps": 80, "total_steps": 10798, "loss": 2.218, "reward": null, "learning_rate": 0.0009998645704375414, "epoch": 0.01, "percentage": 0.74, "elapsed_time": "0:03:13", "remaining_time": "7:11:28"} +{"current_steps": 90, "total_steps": 10798, "loss": 2.2457, "reward": null, "learning_rate": 0.000999828599015436, "epoch": 0.02, "percentage": 0.83, "elapsed_time": "0:09:39", "remaining_time": "19:08:37"} +{"current_steps": 90, "total_steps": 10798, "loss": 2.2457, "reward": null, "learning_rate": 0.000999828599015436, "epoch": 0.02, "percentage": 0.83, "elapsed_time": "0:03:37", "remaining_time": "7:11:50"} +{"current_steps": 90, "total_steps": 10798, "loss": 2.2457, "reward": null, "learning_rate": 0.000999828599015436, "epoch": 0.02, "percentage": 0.83, "elapsed_time": "0:03:34", "remaining_time": "7:05:11"} +{"current_steps": 90, "total_steps": 10798, "loss": 2.2457, "reward": null, "learning_rate": 0.000999828599015436, "epoch": 0.02, "percentage": 0.83, "elapsed_time": "0:03:36", "remaining_time": "7:08:21"} +{"current_steps": 100, "total_steps": 10798, "loss": 2.198, "reward": null, "learning_rate": 0.0009997883966822835, "epoch": 0.02, "percentage": 0.93, "elapsed_time": "0:03:59", "remaining_time": "7:07:13"} +{"current_steps": 100, "total_steps": 10798, "loss": 2.198, "reward": null, "learning_rate": 0.0009997883966822835, "epoch": 0.02, "percentage": 0.93, "elapsed_time": "0:03:58", "remaining_time": "7:04:22"} +{"current_steps": 100, "total_steps": 10798, "loss": 2.198, "reward": null, "learning_rate": 0.0009997883966822835, "epoch": 0.02, "percentage": 0.93, "elapsed_time": "0:04:01", "remaining_time": "7:10:21"} +{"current_steps": 100, "total_steps": 10798, "loss": 2.198, "reward": null, "learning_rate": 0.0009997883966822835, "epoch": 0.02, "percentage": 0.93, "elapsed_time": "0:10:02", "remaining_time": "17:54:51"} +{"current_steps": 110, "total_steps": 10798, "loss": 2.2013, "reward": null, "learning_rate": 0.0009997439637783859, "epoch": 0.02, "percentage": 1.02, "elapsed_time": "0:10:26", "remaining_time": "16:54:03"} +{"current_steps": 110, "total_steps": 10798, "loss": 2.2013, "reward": null, "learning_rate": 0.0009997439637783859, "epoch": 0.02, "percentage": 1.02, "elapsed_time": "0:04:24", "remaining_time": "7:08:41"} +{"current_steps": 110, "total_steps": 10798, "loss": 2.2013, "reward": null, "learning_rate": 0.0009997439637783859, "epoch": 0.02, "percentage": 1.02, "elapsed_time": "0:04:21", "remaining_time": "7:03:16"} +{"current_steps": 110, "total_steps": 10798, "loss": 2.2013, "reward": null, "learning_rate": 0.0009997439637783859, "epoch": 0.02, "percentage": 1.02, "elapsed_time": "0:04:22", "remaining_time": "7:05:51"} +{"current_steps": 120, "total_steps": 10798, "loss": 2.1765, "reward": null, "learning_rate": 0.000999695300679855, "epoch": 0.02, "percentage": 1.11, "elapsed_time": "0:04:50", "remaining_time": "7:10:21"} +{"current_steps": 120, "total_steps": 10798, "loss": 2.1765, "reward": null, "learning_rate": 0.000999695300679855, "epoch": 0.02, "percentage": 1.11, "elapsed_time": "0:04:46", "remaining_time": "7:05:23"} +{"current_steps": 120, "total_steps": 10798, "loss": 2.1765, "reward": null, "learning_rate": 0.000999695300679855, "epoch": 0.02, "percentage": 1.11, "elapsed_time": "0:04:48", "remaining_time": "7:07:45"} +{"current_steps": 120, "total_steps": 10798, "loss": 2.1765, "reward": null, "learning_rate": 0.000999695300679855, "epoch": 0.02, "percentage": 1.11, "elapsed_time": "0:10:51", "remaining_time": "16:06:26"} +{"current_steps": 130, "total_steps": 10798, "loss": 2.1741, "reward": null, "learning_rate": 0.0009996424077986109, "epoch": 0.02, "percentage": 1.2, "elapsed_time": "0:05:11", "remaining_time": "7:06:42"} +{"current_steps": 130, "total_steps": 10798, "loss": 2.1741, "reward": null, "learning_rate": 0.0009996424077986109, "epoch": 0.02, "percentage": 1.2, "elapsed_time": "0:11:15", "remaining_time": "15:23:28"} +{"current_steps": 130, "total_steps": 10798, "loss": 2.1741, "reward": null, "learning_rate": 0.0009996424077986109, "epoch": 0.02, "percentage": 1.2, "elapsed_time": "0:05:13", "remaining_time": "7:09:05"} +{"current_steps": 130, "total_steps": 10798, "loss": 2.1741, "reward": null, "learning_rate": 0.0009996424077986109, "epoch": 0.02, "percentage": 1.2, "elapsed_time": "0:05:10", "remaining_time": "7:04:31"} +{"current_steps": 140, "total_steps": 10798, "loss": 2.1898, "reward": null, "learning_rate": 0.000999585285582377, "epoch": 0.03, "percentage": 1.3, "elapsed_time": "0:05:38", "remaining_time": "7:09:04"} +{"current_steps": 140, "total_steps": 10798, "loss": 2.1898, "reward": null, "learning_rate": 0.000999585285582377, "epoch": 0.03, "percentage": 1.3, "elapsed_time": "0:05:36", "remaining_time": "7:06:51"} +{"current_steps": 140, "total_steps": 10798, "loss": 2.1898, "reward": null, "learning_rate": 0.000999585285582377, "epoch": 0.03, "percentage": 1.3, "elapsed_time": "0:05:34", "remaining_time": "7:04:49"} +{"current_steps": 140, "total_steps": 10798, "loss": 2.1898, "reward": null, "learning_rate": 0.000999585285582377, "epoch": 0.03, "percentage": 1.3, "elapsed_time": "0:11:39", "remaining_time": "14:47:42"} +{"current_steps": 150, "total_steps": 10798, "loss": 2.1466, "reward": null, "learning_rate": 0.0009995239345146772, "epoch": 0.03, "percentage": 1.39, "elapsed_time": "0:05:59", "remaining_time": "7:04:58"} +{"current_steps": 150, "total_steps": 10798, "loss": 2.1466, "reward": null, "learning_rate": 0.0009995239345146772, "epoch": 0.03, "percentage": 1.39, "elapsed_time": "0:06:02", "remaining_time": "7:08:55"} +{"current_steps": 150, "total_steps": 10798, "loss": 2.1466, "reward": null, "learning_rate": 0.0009995239345146772, "epoch": 0.03, "percentage": 1.39, "elapsed_time": "0:12:04", "remaining_time": "14:16:35"} +{"current_steps": 150, "total_steps": 10798, "loss": 2.1466, "reward": null, "learning_rate": 0.0009995239345146772, "epoch": 0.03, "percentage": 1.39, "elapsed_time": "0:06:00", "remaining_time": "7:06:51"} +{"current_steps": 160, "total_steps": 10798, "loss": 2.1423, "reward": null, "learning_rate": 0.0009994583551148314, "epoch": 0.03, "percentage": 1.48, "elapsed_time": "0:12:27", "remaining_time": "13:47:58"} +{"current_steps": 160, "total_steps": 10798, "loss": 2.1423, "reward": null, "learning_rate": 0.0009994583551148314, "epoch": 0.03, "percentage": 1.48, "elapsed_time": "0:06:22", "remaining_time": "7:03:41"} +{"current_steps": 160, "total_steps": 10798, "loss": 2.1423, "reward": null, "learning_rate": 0.0009994583551148314, "epoch": 0.03, "percentage": 1.48, "elapsed_time": "0:06:25", "remaining_time": "7:07:24"} +{"current_steps": 160, "total_steps": 10798, "loss": 2.1423, "reward": null, "learning_rate": 0.0009994583551148314, "epoch": 0.03, "percentage": 1.48, "elapsed_time": "0:06:23", "remaining_time": "7:05:28"} +{"current_steps": 170, "total_steps": 10798, "loss": 2.1451, "reward": null, "learning_rate": 0.0009993885479379506, "epoch": 0.03, "percentage": 1.57, "elapsed_time": "0:12:51", "remaining_time": "13:23:31"} +{"current_steps": 170, "total_steps": 10798, "loss": 2.1451, "reward": null, "learning_rate": 0.0009993885479379506, "epoch": 0.03, "percentage": 1.57, "elapsed_time": "0:06:49", "remaining_time": "7:06:53"} +{"current_steps": 170, "total_steps": 10798, "loss": 2.1451, "reward": null, "learning_rate": 0.0009993885479379506, "epoch": 0.03, "percentage": 1.57, "elapsed_time": "0:06:46", "remaining_time": "7:03:23"} +{"current_steps": 170, "total_steps": 10798, "loss": 2.1451, "reward": null, "learning_rate": 0.0009993885479379506, "epoch": 0.03, "percentage": 1.57, "elapsed_time": "0:06:47", "remaining_time": "7:05:04"} +{"current_steps": 180, "total_steps": 10798, "loss": 2.202, "reward": null, "learning_rate": 0.000999314513574934, "epoch": 0.03, "percentage": 1.67, "elapsed_time": "0:13:14", "remaining_time": "13:01:18"} +{"current_steps": 180, "total_steps": 10798, "loss": 2.202, "reward": null, "learning_rate": 0.000999314513574934, "epoch": 0.03, "percentage": 1.67, "elapsed_time": "0:07:09", "remaining_time": "7:02:38"} +{"current_steps": 180, "total_steps": 10798, "loss": 2.202, "reward": null, "learning_rate": 0.000999314513574934, "epoch": 0.03, "percentage": 1.67, "elapsed_time": "0:07:13", "remaining_time": "7:05:56"} +{"current_steps": 180, "total_steps": 10798, "loss": 2.202, "reward": null, "learning_rate": 0.000999314513574934, "epoch": 0.03, "percentage": 1.67, "elapsed_time": "0:07:11", "remaining_time": "7:04:12"} +{"current_steps": 190, "total_steps": 10798, "loss": 2.1208, "reward": null, "learning_rate": 0.0009992362526524616, "epoch": 0.04, "percentage": 1.76, "elapsed_time": "0:13:38", "remaining_time": "12:41:43"} +{"current_steps": 190, "total_steps": 10798, "loss": 2.1208, "reward": null, "learning_rate": 0.0009992362526524616, "epoch": 0.04, "percentage": 1.76, "elapsed_time": "0:07:35", "remaining_time": "7:03:43"} +{"current_steps": 190, "total_steps": 10798, "loss": 2.1208, "reward": null, "learning_rate": 0.0009992362526524616, "epoch": 0.04, "percentage": 1.76, "elapsed_time": "0:07:37", "remaining_time": "7:05:21"} +{"current_steps": 190, "total_steps": 10798, "loss": 2.1208, "reward": null, "learning_rate": 0.0009992362526524616, "epoch": 0.04, "percentage": 1.76, "elapsed_time": "0:07:33", "remaining_time": "7:02:14"} +{"current_steps": 200, "total_steps": 10798, "loss": 2.1591, "reward": null, "learning_rate": 0.0009991537658329906, "epoch": 0.04, "percentage": 1.85, "elapsed_time": "0:07:58", "remaining_time": "7:03:00"} +{"current_steps": 200, "total_steps": 10798, "loss": 2.1591, "reward": null, "learning_rate": 0.0009991537658329906, "epoch": 0.04, "percentage": 1.85, "elapsed_time": "0:07:57", "remaining_time": "7:01:35"} +{"current_steps": 200, "total_steps": 10798, "loss": 2.1591, "reward": null, "learning_rate": 0.0009991537658329906, "epoch": 0.04, "percentage": 1.85, "elapsed_time": "0:08:00", "remaining_time": "7:04:32"} +{"current_steps": 200, "total_steps": 10798, "loss": 2.1591, "reward": null, "learning_rate": 0.0009991537658329906, "epoch": 0.04, "percentage": 1.85, "elapsed_time": "0:14:02", "remaining_time": "12:23:47"} +{"current_steps": 210, "total_steps": 10798, "loss": 2.1788, "reward": null, "learning_rate": 0.000999067053814749, "epoch": 0.04, "percentage": 1.94, "elapsed_time": "0:08:23", "remaining_time": "7:03:17"} +{"current_steps": 210, "total_steps": 10798, "loss": 2.1788, "reward": null, "learning_rate": 0.000999067053814749, "epoch": 0.04, "percentage": 1.94, "elapsed_time": "0:08:20", "remaining_time": "7:00:28"} +{"current_steps": 210, "total_steps": 10798, "loss": 2.1788, "reward": null, "learning_rate": 0.000999067053814749, "epoch": 0.04, "percentage": 1.94, "elapsed_time": "0:08:21", "remaining_time": "7:01:49"} +{"current_steps": 210, "total_steps": 10798, "loss": 2.1788, "reward": null, "learning_rate": 0.000999067053814749, "epoch": 0.04, "percentage": 1.94, "elapsed_time": "0:14:25", "remaining_time": "12:07:02"} +{"current_steps": 220, "total_steps": 10798, "loss": 2.147, "reward": null, "learning_rate": 0.0009989761173317304, "epoch": 0.04, "percentage": 2.04, "elapsed_time": "0:14:48", "remaining_time": "11:52:05"} +{"current_steps": 220, "total_steps": 10798, "loss": 2.147, "reward": null, "learning_rate": 0.0009989761173317304, "epoch": 0.04, "percentage": 2.04, "elapsed_time": "0:08:45", "remaining_time": "7:01:01"} +{"current_steps": 220, "total_steps": 10798, "loss": 2.147, "reward": null, "learning_rate": 0.0009989761173317304, "epoch": 0.04, "percentage": 2.04, "elapsed_time": "0:08:43", "remaining_time": "6:59:44"} +{"current_steps": 220, "total_steps": 10798, "loss": 2.147, "reward": null, "learning_rate": 0.0009989761173317304, "epoch": 0.04, "percentage": 2.04, "elapsed_time": "0:08:47", "remaining_time": "7:02:25"} +{"current_steps": 230, "total_steps": 10798, "loss": 2.1249, "reward": null, "learning_rate": 0.000998880957153687, "epoch": 0.04, "percentage": 2.13, "elapsed_time": "0:15:12", "remaining_time": "11:39:02"} +{"current_steps": 230, "total_steps": 10798, "loss": 2.1249, "reward": null, "learning_rate": 0.000998880957153687, "epoch": 0.04, "percentage": 2.13, "elapsed_time": "0:09:09", "remaining_time": "7:00:53"} +{"current_steps": 230, "total_steps": 10798, "loss": 2.1249, "reward": null, "learning_rate": 0.000998880957153687, "epoch": 0.04, "percentage": 2.13, "elapsed_time": "0:09:11", "remaining_time": "7:02:13"} +{"current_steps": 230, "total_steps": 10798, "loss": 2.1249, "reward": null, "learning_rate": 0.000998880957153687, "epoch": 0.04, "percentage": 2.13, "elapsed_time": "0:09:08", "remaining_time": "6:59:39"} +{"current_steps": 240, "total_steps": 10798, "loss": 2.165, "reward": null, "learning_rate": 0.000998781574086123, "epoch": 0.04, "percentage": 2.22, "elapsed_time": "0:09:32", "remaining_time": "6:59:49"} +{"current_steps": 240, "total_steps": 10798, "loss": 2.165, "reward": null, "learning_rate": 0.000998781574086123, "epoch": 0.04, "percentage": 2.22, "elapsed_time": "0:09:34", "remaining_time": "7:00:59"} +{"current_steps": 240, "total_steps": 10798, "loss": 2.165, "reward": null, "learning_rate": 0.000998781574086123, "epoch": 0.04, "percentage": 2.22, "elapsed_time": "0:09:35", "remaining_time": "7:02:16"} +{"current_steps": 240, "total_steps": 10798, "loss": 2.165, "reward": null, "learning_rate": 0.000998781574086123, "epoch": 0.04, "percentage": 2.22, "elapsed_time": "0:15:37", "remaining_time": "11:27:18"} +{"current_steps": 250, "total_steps": 10798, "loss": 2.1428, "reward": null, "learning_rate": 0.000998677968970289, "epoch": 0.05, "percentage": 2.32, "elapsed_time": "0:10:00", "remaining_time": "7:02:18"} +{"current_steps": 250, "total_steps": 10798, "loss": 2.1428, "reward": null, "learning_rate": 0.000998677968970289, "epoch": 0.05, "percentage": 2.32, "elapsed_time": "0:09:57", "remaining_time": "6:59:57"} +{"current_steps": 250, "total_steps": 10798, "loss": 2.1428, "reward": null, "learning_rate": 0.000998677968970289, "epoch": 0.05, "percentage": 2.32, "elapsed_time": "0:09:58", "remaining_time": "7:01:04"} +{"current_steps": 250, "total_steps": 10798, "loss": 2.1428, "reward": null, "learning_rate": 0.000998677968970289, "epoch": 0.05, "percentage": 2.32, "elapsed_time": "0:16:02", "remaining_time": "11:16:29"} +{"current_steps": 260, "total_steps": 10798, "loss": 2.1384, "reward": null, "learning_rate": 0.0009985701426831735, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:16:25", "remaining_time": "11:05:51"} +{"current_steps": 260, "total_steps": 10798, "loss": 2.1384, "reward": null, "learning_rate": 0.0009985701426831735, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:10:20", "remaining_time": "6:59:25"} +{"current_steps": 260, "total_steps": 10798, "loss": 2.1384, "reward": null, "learning_rate": 0.0009985701426831735, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:10:22", "remaining_time": "7:00:29"} +{"current_steps": 260, "total_steps": 10798, "loss": 2.1384, "reward": null, "learning_rate": 0.0009985701426831735, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:10:24", "remaining_time": "7:01:40"} +{"current_steps": 270, "total_steps": 10798, "loss": 2.1585, "reward": null, "learning_rate": 0.0009984580961374964, "epoch": 0.05, "percentage": 2.5, "elapsed_time": "0:10:46", "remaining_time": "7:00:15"} +{"current_steps": 270, "total_steps": 10798, "loss": 2.1585, "reward": null, "learning_rate": 0.0009984580961374964, "epoch": 0.05, "percentage": 2.5, "elapsed_time": "0:16:49", "remaining_time": "10:56:18"} +{"current_steps": 270, "total_steps": 10798, "loss": 2.1585, "reward": null, "learning_rate": 0.0009984580961374964, "epoch": 0.05, "percentage": 2.5, "elapsed_time": "0:10:45", "remaining_time": "6:59:13"} +{"current_steps": 270, "total_steps": 10798, "loss": 2.1585, "reward": null, "learning_rate": 0.0009984580961374964, "epoch": 0.05, "percentage": 2.5, "elapsed_time": "0:10:48", "remaining_time": "7:01:24"} +{"current_steps": 280, "total_steps": 10798, "loss": 2.1156, "reward": null, "learning_rate": 0.0009983418302817008, "epoch": 0.05, "percentage": 2.59, "elapsed_time": "0:17:14", "remaining_time": "10:47:29"} +{"current_steps": 280, "total_steps": 10798, "loss": 2.1156, "reward": null, "learning_rate": 0.0009983418302817008, "epoch": 0.05, "percentage": 2.59, "elapsed_time": "0:11:09", "remaining_time": "6:59:05"} +{"current_steps": 280, "total_steps": 10798, "loss": 2.1156, "reward": null, "learning_rate": 0.0009983418302817008, "epoch": 0.05, "percentage": 2.59, "elapsed_time": "0:11:11", "remaining_time": "7:00:05"} +{"current_steps": 280, "total_steps": 10798, "loss": 2.1156, "reward": null, "learning_rate": 0.0009983418302817008, "epoch": 0.05, "percentage": 2.59, "elapsed_time": "0:11:12", "remaining_time": "7:01:11"} +{"current_steps": 290, "total_steps": 10798, "loss": 2.0811, "reward": null, "learning_rate": 0.0009982213460999448, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:17:37", "remaining_time": "10:38:32"} +{"current_steps": 290, "total_steps": 10798, "loss": 2.0811, "reward": null, "learning_rate": 0.0009982213460999448, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:11:34", "remaining_time": "6:59:11"} +{"current_steps": 290, "total_steps": 10798, "loss": 2.0811, "reward": null, "learning_rate": 0.0009982213460999448, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:11:35", "remaining_time": "7:00:14"} +{"current_steps": 290, "total_steps": 10798, "loss": 2.0811, "reward": null, "learning_rate": 0.0009982213460999448, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:11:32", "remaining_time": "6:58:13"} +{"current_steps": 300, "total_steps": 10798, "loss": 2.1081, "reward": null, "learning_rate": 0.000998096644612094, "epoch": 0.06, "percentage": 2.78, "elapsed_time": "0:11:59", "remaining_time": "6:59:25"} +{"current_steps": 300, "total_steps": 10798, "loss": 2.1081, "reward": null, "learning_rate": 0.000998096644612094, "epoch": 0.06, "percentage": 2.78, "elapsed_time": "0:11:57", "remaining_time": "6:58:24"} +{"current_steps": 300, "total_steps": 10798, "loss": 2.1081, "reward": null, "learning_rate": 0.000998096644612094, "epoch": 0.06, "percentage": 2.78, "elapsed_time": "0:11:55", "remaining_time": "6:57:28"} +{"current_steps": 300, "total_steps": 10798, "loss": 2.1081, "reward": null, "learning_rate": 0.000998096644612094, "epoch": 0.06, "percentage": 2.78, "elapsed_time": "0:18:00", "remaining_time": "10:30:14"} +{"current_steps": 310, "total_steps": 10798, "loss": 2.1246, "reward": null, "learning_rate": 0.0009979677268737118, "epoch": 0.06, "percentage": 2.87, "elapsed_time": "0:18:24", "remaining_time": "10:23:02"} +{"current_steps": 310, "total_steps": 10798, "loss": 2.1246, "reward": null, "learning_rate": 0.0009979677268737118, "epoch": 0.06, "percentage": 2.87, "elapsed_time": "0:12:20", "remaining_time": "6:57:19"} +{"current_steps": 310, "total_steps": 10798, "loss": 2.1246, "reward": null, "learning_rate": 0.0009979677268737118, "epoch": 0.06, "percentage": 2.87, "elapsed_time": "0:12:21", "remaining_time": "6:58:13"} +{"current_steps": 310, "total_steps": 10798, "loss": 2.1246, "reward": null, "learning_rate": 0.0009979677268737118, "epoch": 0.06, "percentage": 2.87, "elapsed_time": "0:12:23", "remaining_time": "6:59:13"} +{"current_steps": 320, "total_steps": 10798, "loss": 2.1229, "reward": null, "learning_rate": 0.0009978345939760515, "epoch": 0.06, "percentage": 2.96, "elapsed_time": "0:18:50", "remaining_time": "10:16:51"} +{"current_steps": 320, "total_steps": 10798, "loss": 2.1229, "reward": null, "learning_rate": 0.0009978345939760515, "epoch": 0.06, "percentage": 2.96, "elapsed_time": "0:12:45", "remaining_time": "6:57:45"} +{"current_steps": 320, "total_steps": 10798, "loss": 2.1229, "reward": null, "learning_rate": 0.0009978345939760515, "epoch": 0.06, "percentage": 2.96, "elapsed_time": "0:12:48", "remaining_time": "6:59:35"} +{"current_steps": 320, "total_steps": 10798, "loss": 2.1229, "reward": null, "learning_rate": 0.0009978345939760515, "epoch": 0.06, "percentage": 2.96, "elapsed_time": "0:12:47", "remaining_time": "6:58:38"} +{"current_steps": 330, "total_steps": 10798, "loss": 2.1033, "reward": null, "learning_rate": 0.000997697247046046, "epoch": 0.06, "percentage": 3.06, "elapsed_time": "0:19:14", "remaining_time": "10:10:24"} +{"current_steps": 330, "total_steps": 10798, "loss": 2.1033, "reward": null, "learning_rate": 0.000997697247046046, "epoch": 0.06, "percentage": 3.06, "elapsed_time": "0:13:11", "remaining_time": "6:58:22"} +{"current_steps": 330, "total_steps": 10798, "loss": 2.1033, "reward": null, "learning_rate": 0.000997697247046046, "epoch": 0.06, "percentage": 3.06, "elapsed_time": "0:13:13", "remaining_time": "6:59:17"} +{"current_steps": 330, "total_steps": 10798, "loss": 2.1033, "reward": null, "learning_rate": 0.000997697247046046, "epoch": 0.06, "percentage": 3.06, "elapsed_time": "0:13:09", "remaining_time": "6:57:31"} +{"current_steps": 340, "total_steps": 10798, "loss": 2.0931, "reward": null, "learning_rate": 0.0009975556872462994, "epoch": 0.06, "percentage": 3.15, "elapsed_time": "0:13:34", "remaining_time": "6:57:25"} +{"current_steps": 340, "total_steps": 10798, "loss": 2.0931, "reward": null, "learning_rate": 0.0009975556872462994, "epoch": 0.06, "percentage": 3.15, "elapsed_time": "0:13:35", "remaining_time": "6:58:14"} +{"current_steps": 340, "total_steps": 10798, "loss": 2.0931, "reward": null, "learning_rate": 0.0009975556872462994, "epoch": 0.06, "percentage": 3.15, "elapsed_time": "0:19:39", "remaining_time": "10:04:26"} +{"current_steps": 340, "total_steps": 10798, "loss": 2.0931, "reward": null, "learning_rate": 0.0009975556872462994, "epoch": 0.06, "percentage": 3.15, "elapsed_time": "0:13:37", "remaining_time": "6:59:08"} +{"current_steps": 350, "total_steps": 10798, "loss": 2.1206, "reward": null, "learning_rate": 0.000997409915775076, "epoch": 0.06, "percentage": 3.24, "elapsed_time": "0:20:02", "remaining_time": "9:58:22"} +{"current_steps": 350, "total_steps": 10798, "loss": 2.1206, "reward": null, "learning_rate": 0.000997409915775076, "epoch": 0.06, "percentage": 3.24, "elapsed_time": "0:13:59", "remaining_time": "6:57:39"} +{"current_steps": 350, "total_steps": 10798, "loss": 2.1206, "reward": null, "learning_rate": 0.000997409915775076, "epoch": 0.06, "percentage": 3.24, "elapsed_time": "0:14:01", "remaining_time": "6:58:31"} +{"current_steps": 350, "total_steps": 10798, "loss": 2.1206, "reward": null, "learning_rate": 0.000997409915775076, "epoch": 0.06, "percentage": 3.24, "elapsed_time": "0:13:57", "remaining_time": "6:56:51"} +{"current_steps": 360, "total_steps": 10798, "loss": 2.0537, "reward": null, "learning_rate": 0.0009972599338662915, "epoch": 0.07, "percentage": 3.33, "elapsed_time": "0:20:26", "remaining_time": "9:52:40"} +{"current_steps": 360, "total_steps": 10798, "loss": 2.0537, "reward": null, "learning_rate": 0.0009972599338662915, "epoch": 0.07, "percentage": 3.33, "elapsed_time": "0:14:21", "remaining_time": "6:56:22"} +{"current_steps": 360, "total_steps": 10798, "loss": 2.0537, "reward": null, "learning_rate": 0.0009972599338662915, "epoch": 0.07, "percentage": 3.33, "elapsed_time": "0:14:24", "remaining_time": "6:57:59"} +{"current_steps": 360, "total_steps": 10798, "loss": 2.0537, "reward": null, "learning_rate": 0.0009972599338662915, "epoch": 0.07, "percentage": 3.33, "elapsed_time": "0:14:23", "remaining_time": "6:57:08"} +{"current_steps": 370, "total_steps": 10798, "loss": 2.0762, "reward": null, "learning_rate": 0.0009971057427895012, "epoch": 0.07, "percentage": 3.43, "elapsed_time": "0:14:45", "remaining_time": "6:56:05"} +{"current_steps": 370, "total_steps": 10798, "loss": 2.0762, "reward": null, "learning_rate": 0.0009971057427895012, "epoch": 0.07, "percentage": 3.43, "elapsed_time": "0:14:49", "remaining_time": "6:57:40"} +{"current_steps": 370, "total_steps": 10798, "loss": 2.0762, "reward": null, "learning_rate": 0.0009971057427895012, "epoch": 0.07, "percentage": 3.43, "elapsed_time": "0:14:47", "remaining_time": "6:56:51"} +{"current_steps": 370, "total_steps": 10798, "loss": 2.0762, "reward": null, "learning_rate": 0.0009971057427895012, "epoch": 0.07, "percentage": 3.43, "elapsed_time": "0:20:50", "remaining_time": "9:47:28"} +{"current_steps": 380, "total_steps": 10798, "loss": 2.0883, "reward": null, "learning_rate": 0.0009969473438498897, "epoch": 0.07, "percentage": 3.52, "elapsed_time": "0:21:14", "remaining_time": "9:42:15"} +{"current_steps": 380, "total_steps": 10798, "loss": 2.0883, "reward": null, "learning_rate": 0.0009969473438498897, "epoch": 0.07, "percentage": 3.52, "elapsed_time": "0:15:11", "remaining_time": "6:56:17"} +{"current_steps": 380, "total_steps": 10798, "loss": 2.0883, "reward": null, "learning_rate": 0.0009969473438498897, "epoch": 0.07, "percentage": 3.52, "elapsed_time": "0:15:09", "remaining_time": "6:55:33"} +{"current_steps": 380, "total_steps": 10798, "loss": 2.0883, "reward": null, "learning_rate": 0.0009969473438498897, "epoch": 0.07, "percentage": 3.52, "elapsed_time": "0:15:12", "remaining_time": "6:57:05"} +{"current_steps": 390, "total_steps": 10798, "loss": 2.1174, "reward": null, "learning_rate": 0.0009967847383882604, "epoch": 0.07, "percentage": 3.61, "elapsed_time": "0:15:35", "remaining_time": "6:56:01"} +{"current_steps": 390, "total_steps": 10798, "loss": 2.1174, "reward": null, "learning_rate": 0.0009967847383882604, "epoch": 0.07, "percentage": 3.61, "elapsed_time": "0:15:37", "remaining_time": "6:56:47"} +{"current_steps": 390, "total_steps": 10798, "loss": 2.1174, "reward": null, "learning_rate": 0.0009967847383882604, "epoch": 0.07, "percentage": 3.61, "elapsed_time": "0:15:33", "remaining_time": "6:55:18"} +{"current_steps": 390, "total_steps": 10798, "loss": 2.1174, "reward": null, "learning_rate": 0.0009967847383882604, "epoch": 0.07, "percentage": 3.61, "elapsed_time": "0:21:38", "remaining_time": "9:37:34"} +{"current_steps": 400, "total_steps": 10798, "loss": 2.1111, "reward": null, "learning_rate": 0.0009966179277810239, "epoch": 0.07, "percentage": 3.7, "elapsed_time": "0:22:02", "remaining_time": "9:33:02"} +{"current_steps": 400, "total_steps": 10798, "loss": 2.1111, "reward": null, "learning_rate": 0.0009966179277810239, "epoch": 0.07, "percentage": 3.7, "elapsed_time": "0:15:59", "remaining_time": "6:55:40"} +{"current_steps": 400, "total_steps": 10798, "loss": 2.1111, "reward": null, "learning_rate": 0.0009966179277810239, "epoch": 0.07, "percentage": 3.7, "elapsed_time": "0:15:57", "remaining_time": "6:54:58"} +{"current_steps": 400, "total_steps": 10798, "loss": 2.1111, "reward": null, "learning_rate": 0.0009966179277810239, "epoch": 0.07, "percentage": 3.7, "elapsed_time": "0:16:01", "remaining_time": "6:56:26"} +{"current_steps": 410, "total_steps": 10798, "loss": 2.1288, "reward": null, "learning_rate": 0.0009964469134401855, "epoch": 0.08, "percentage": 3.8, "elapsed_time": "0:22:26", "remaining_time": "9:28:43"} +{"current_steps": 410, "total_steps": 10798, "loss": 2.1288, "reward": null, "learning_rate": 0.0009964469134401855, "epoch": 0.08, "percentage": 3.8, "elapsed_time": "0:16:23", "remaining_time": "6:55:21"} +{"current_steps": 410, "total_steps": 10798, "loss": 2.1288, "reward": null, "learning_rate": 0.0009964469134401855, "epoch": 0.08, "percentage": 3.8, "elapsed_time": "0:16:25", "remaining_time": "6:56:05"} +{"current_steps": 410, "total_steps": 10798, "loss": 2.1288, "reward": null, "learning_rate": 0.0009964469134401855, "epoch": 0.08, "percentage": 3.8, "elapsed_time": "0:16:22", "remaining_time": "6:54:40"} +{"current_steps": 420, "total_steps": 10798, "loss": 2.0967, "reward": null, "learning_rate": 0.0009962716968133346, "epoch": 0.08, "percentage": 3.89, "elapsed_time": "0:16:48", "remaining_time": "6:55:20"} +{"current_steps": 420, "total_steps": 10798, "loss": 2.0967, "reward": null, "learning_rate": 0.0009962716968133346, "epoch": 0.08, "percentage": 3.89, "elapsed_time": "0:16:50", "remaining_time": "6:56:04"} +{"current_steps": 420, "total_steps": 10798, "loss": 2.0967, "reward": null, "learning_rate": 0.0009962716968133346, "epoch": 0.08, "percentage": 3.89, "elapsed_time": "0:16:46", "remaining_time": "6:54:41"} +{"current_steps": 420, "total_steps": 10798, "loss": 2.0967, "reward": null, "learning_rate": 0.0009962716968133346, "epoch": 0.08, "percentage": 3.89, "elapsed_time": "0:22:51", "remaining_time": "9:24:55"} +{"current_steps": 430, "total_steps": 10798, "loss": 2.1216, "reward": null, "learning_rate": 0.0009960922793836318, "epoch": 0.08, "percentage": 3.98, "elapsed_time": "0:17:14", "remaining_time": "6:55:42"} +{"current_steps": 430, "total_steps": 10798, "loss": 2.1216, "reward": null, "learning_rate": 0.0009960922793836318, "epoch": 0.08, "percentage": 3.98, "elapsed_time": "0:17:11", "remaining_time": "6:54:21"} +{"current_steps": 430, "total_steps": 10798, "loss": 2.1216, "reward": null, "learning_rate": 0.0009960922793836318, "epoch": 0.08, "percentage": 3.98, "elapsed_time": "0:17:12", "remaining_time": "6:55:00"} +{"current_steps": 430, "total_steps": 10798, "loss": 2.1216, "reward": null, "learning_rate": 0.0009960922793836318, "epoch": 0.08, "percentage": 3.98, "elapsed_time": "0:23:15", "remaining_time": "9:20:58"} +{"current_steps": 440, "total_steps": 10798, "loss": 2.0924, "reward": null, "learning_rate": 0.0009959086626697955, "epoch": 0.08, "percentage": 4.07, "elapsed_time": "0:23:41", "remaining_time": "9:17:37"} +{"current_steps": 440, "total_steps": 10798, "loss": 2.0924, "reward": null, "learning_rate": 0.0009959086626697955, "epoch": 0.08, "percentage": 4.07, "elapsed_time": "0:17:36", "remaining_time": "6:54:29"} +{"current_steps": 440, "total_steps": 10798, "loss": 2.0924, "reward": null, "learning_rate": 0.0009959086626697955, "epoch": 0.08, "percentage": 4.07, "elapsed_time": "0:17:39", "remaining_time": "6:55:48"} +{"current_steps": 440, "total_steps": 10798, "loss": 2.0924, "reward": null, "learning_rate": 0.0009959086626697955, "epoch": 0.08, "percentage": 4.07, "elapsed_time": "0:17:38", "remaining_time": "6:55:07"} +{"current_steps": 450, "total_steps": 10798, "loss": 2.0809, "reward": null, "learning_rate": 0.0009957208482260908, "epoch": 0.08, "percentage": 4.17, "elapsed_time": "0:24:05", "remaining_time": "9:13:58"} +{"current_steps": 450, "total_steps": 10798, "loss": 2.0809, "reward": null, "learning_rate": 0.0009957208482260908, "epoch": 0.08, "percentage": 4.17, "elapsed_time": "0:18:03", "remaining_time": "6:55:25"} +{"current_steps": 450, "total_steps": 10798, "loss": 2.0809, "reward": null, "learning_rate": 0.0009957208482260908, "epoch": 0.08, "percentage": 4.17, "elapsed_time": "0:18:02", "remaining_time": "6:54:45"} +{"current_steps": 450, "total_steps": 10798, "loss": 2.0809, "reward": null, "learning_rate": 0.0009957208482260908, "epoch": 0.08, "percentage": 4.17, "elapsed_time": "0:18:00", "remaining_time": "6:54:08"} +{"current_steps": 460, "total_steps": 10798, "loss": 2.1082, "reward": null, "learning_rate": 0.0009955288376423152, "epoch": 0.09, "percentage": 4.26, "elapsed_time": "0:24:30", "remaining_time": "9:10:46"} +{"current_steps": 460, "total_steps": 10798, "loss": 2.1082, "reward": null, "learning_rate": 0.0009955288376423152, "epoch": 0.09, "percentage": 4.26, "elapsed_time": "0:18:28", "remaining_time": "6:55:23"} +{"current_steps": 460, "total_steps": 10798, "loss": 2.1082, "reward": null, "learning_rate": 0.0009955288376423152, "epoch": 0.09, "percentage": 4.26, "elapsed_time": "0:18:27", "remaining_time": "6:54:43"} +{"current_steps": 460, "total_steps": 10798, "loss": 2.1082, "reward": null, "learning_rate": 0.0009955288376423152, "epoch": 0.09, "percentage": 4.26, "elapsed_time": "0:18:25", "remaining_time": "6:54:07"} +{"current_steps": 470, "total_steps": 10798, "loss": 2.0885, "reward": null, "learning_rate": 0.0009953326325437852, "epoch": 0.09, "percentage": 4.35, "elapsed_time": "0:24:54", "remaining_time": "9:07:10"} +{"current_steps": 470, "total_steps": 10798, "loss": 2.0885, "reward": null, "learning_rate": 0.0009953326325437852, "epoch": 0.09, "percentage": 4.35, "elapsed_time": "0:18:50", "remaining_time": "6:54:09"} +{"current_steps": 470, "total_steps": 10798, "loss": 2.0885, "reward": null, "learning_rate": 0.0009953326325437852, "epoch": 0.09, "percentage": 4.35, "elapsed_time": "0:18:52", "remaining_time": "6:54:47"} +{"current_steps": 470, "total_steps": 10798, "loss": 2.0885, "reward": null, "learning_rate": 0.0009953326325437852, "epoch": 0.09, "percentage": 4.35, "elapsed_time": "0:18:49", "remaining_time": "6:53:34"} +{"current_steps": 480, "total_steps": 10798, "loss": 2.1133, "reward": null, "learning_rate": 0.0009951322345913224, "epoch": 0.09, "percentage": 4.45, "elapsed_time": "0:25:18", "remaining_time": "9:04:04"} +{"current_steps": 480, "total_steps": 10798, "loss": 2.1133, "reward": null, "learning_rate": 0.0009951322345913224, "epoch": 0.09, "percentage": 4.45, "elapsed_time": "0:19:13", "remaining_time": "6:53:22"} +{"current_steps": 480, "total_steps": 10798, "loss": 2.1133, "reward": null, "learning_rate": 0.0009951322345913224, "epoch": 0.09, "percentage": 4.45, "elapsed_time": "0:19:15", "remaining_time": "6:53:56"} +{"current_steps": 480, "total_steps": 10798, "loss": 2.1133, "reward": null, "learning_rate": 0.0009951322345913224, "epoch": 0.09, "percentage": 4.45, "elapsed_time": "0:19:17", "remaining_time": "6:54:34"} +{"current_steps": 490, "total_steps": 10798, "loss": 2.0844, "reward": null, "learning_rate": 0.0009949276454812408, "epoch": 0.09, "percentage": 4.54, "elapsed_time": "0:19:37", "remaining_time": "6:52:45"} +{"current_steps": 490, "total_steps": 10798, "loss": 2.0844, "reward": null, "learning_rate": 0.0009949276454812408, "epoch": 0.09, "percentage": 4.54, "elapsed_time": "0:19:40", "remaining_time": "6:53:56"} +{"current_steps": 490, "total_steps": 10798, "loss": 2.0844, "reward": null, "learning_rate": 0.0009949276454812408, "epoch": 0.09, "percentage": 4.54, "elapsed_time": "0:19:38", "remaining_time": "6:53:19"} +{"current_steps": 490, "total_steps": 10798, "loss": 2.0844, "reward": null, "learning_rate": 0.0009949276454812408, "epoch": 0.09, "percentage": 4.54, "elapsed_time": "0:25:42", "remaining_time": "9:00:40"} +{"current_steps": 500, "total_steps": 10798, "loss": 2.0796, "reward": null, "learning_rate": 0.00099471886694533, "epoch": 0.09, "percentage": 4.63, "elapsed_time": "0:20:02", "remaining_time": "6:52:55"} +{"current_steps": 500, "total_steps": 10798, "loss": 2.0796, "reward": null, "learning_rate": 0.00099471886694533, "epoch": 0.09, "percentage": 4.63, "elapsed_time": "0:20:04", "remaining_time": "6:53:31"} +{"current_steps": 500, "total_steps": 10798, "loss": 2.0796, "reward": null, "learning_rate": 0.00099471886694533, "epoch": 0.09, "percentage": 4.63, "elapsed_time": "0:26:06", "remaining_time": "8:57:36"} +{"current_steps": 500, "total_steps": 10798, "loss": 2.0796, "reward": null, "learning_rate": 0.00099471886694533, "epoch": 0.09, "percentage": 4.63, "elapsed_time": "0:20:01", "remaining_time": "6:52:22"} +{"current_steps": 510, "total_steps": 10798, "loss": 2.1255, "reward": null, "learning_rate": 0.0009945059007508434, "epoch": 0.09, "percentage": 4.72, "elapsed_time": "0:26:31", "remaining_time": "8:55:06"} +{"current_steps": 510, "total_steps": 10798, "loss": 2.1255, "reward": null, "learning_rate": 0.0009945059007508434, "epoch": 0.09, "percentage": 4.72, "elapsed_time": "0:20:28", "remaining_time": "6:52:59"} +{"current_steps": 510, "total_steps": 10798, "loss": 2.1255, "reward": null, "learning_rate": 0.0009945059007508434, "epoch": 0.09, "percentage": 4.72, "elapsed_time": "0:20:26", "remaining_time": "6:52:26"} +{"current_steps": 510, "total_steps": 10798, "loss": 2.1255, "reward": null, "learning_rate": 0.0009945059007508434, "epoch": 0.09, "percentage": 4.72, "elapsed_time": "0:20:30", "remaining_time": "6:53:34"} +{"current_steps": 520, "total_steps": 10798, "loss": 2.0913, "reward": null, "learning_rate": 0.0009942887487004804, "epoch": 0.1, "percentage": 4.82, "elapsed_time": "0:20:51", "remaining_time": "6:52:18"} +{"current_steps": 520, "total_steps": 10798, "loss": 2.0913, "reward": null, "learning_rate": 0.0009942887487004804, "epoch": 0.1, "percentage": 4.82, "elapsed_time": "0:20:53", "remaining_time": "6:52:49"} +{"current_steps": 520, "total_steps": 10798, "loss": 2.0913, "reward": null, "learning_rate": 0.0009942887487004804, "epoch": 0.1, "percentage": 4.82, "elapsed_time": "0:20:54", "remaining_time": "6:53:24"} +{"current_steps": 520, "total_steps": 10798, "loss": 2.0913, "reward": null, "learning_rate": 0.0009942887487004804, "epoch": 0.1, "percentage": 4.82, "elapsed_time": "0:26:56", "remaining_time": "8:52:28"} +{"current_steps": 530, "total_steps": 10798, "loss": 2.1003, "reward": null, "learning_rate": 0.0009940674126323733, "epoch": 0.1, "percentage": 4.91, "elapsed_time": "0:27:20", "remaining_time": "8:49:40"} +{"current_steps": 530, "total_steps": 10798, "loss": 2.1003, "reward": null, "learning_rate": 0.0009940674126323733, "epoch": 0.1, "percentage": 4.91, "elapsed_time": "0:21:15", "remaining_time": "6:51:52"} +{"current_steps": 530, "total_steps": 10798, "loss": 2.1003, "reward": null, "learning_rate": 0.0009940674126323733, "epoch": 0.1, "percentage": 4.91, "elapsed_time": "0:21:18", "remaining_time": "6:52:57"} +{"current_steps": 530, "total_steps": 10798, "loss": 2.1003, "reward": null, "learning_rate": 0.0009940674126323733, "epoch": 0.1, "percentage": 4.91, "elapsed_time": "0:21:17", "remaining_time": "6:52:23"} +{"current_steps": 540, "total_steps": 10798, "loss": 2.0541, "reward": null, "learning_rate": 0.0009938418944200709, "epoch": 0.1, "percentage": 5.0, "elapsed_time": "0:27:46", "remaining_time": "8:47:34"} +{"current_steps": 540, "total_steps": 10798, "loss": 2.0541, "reward": null, "learning_rate": 0.0009938418944200709, "epoch": 0.1, "percentage": 5.0, "elapsed_time": "0:21:41", "remaining_time": "6:52:04"} +{"current_steps": 540, "total_steps": 10798, "loss": 2.0541, "reward": null, "learning_rate": 0.0009938418944200709, "epoch": 0.1, "percentage": 5.0, "elapsed_time": "0:21:43", "remaining_time": "6:52:34"} +{"current_steps": 540, "total_steps": 10798, "loss": 2.0541, "reward": null, "learning_rate": 0.0009938418944200709, "epoch": 0.1, "percentage": 5.0, "elapsed_time": "0:21:44", "remaining_time": "6:53:08"} +{"current_steps": 550, "total_steps": 10798, "loss": 2.0523, "reward": null, "learning_rate": 0.0009936121959725223, "epoch": 0.1, "percentage": 5.09, "elapsed_time": "0:22:06", "remaining_time": "6:51:57"} +{"current_steps": 550, "total_steps": 10798, "loss": 2.0523, "reward": null, "learning_rate": 0.0009936121959725223, "epoch": 0.1, "percentage": 5.09, "elapsed_time": "0:28:09", "remaining_time": "8:44:45"} +{"current_steps": 550, "total_steps": 10798, "loss": 2.0523, "reward": null, "learning_rate": 0.0009936121959725223, "epoch": 0.1, "percentage": 5.09, "elapsed_time": "0:22:08", "remaining_time": "6:52:30"} +{"current_steps": 550, "total_steps": 10798, "loss": 2.0523, "reward": null, "learning_rate": 0.0009936121959725223, "epoch": 0.1, "percentage": 5.09, "elapsed_time": "0:22:04", "remaining_time": "6:51:27"} +{"current_steps": 560, "total_steps": 10798, "loss": 2.1225, "reward": null, "learning_rate": 0.0009933783192340618, "epoch": 0.1, "percentage": 5.19, "elapsed_time": "0:28:35", "remaining_time": "8:42:36"} +{"current_steps": 560, "total_steps": 10798, "loss": 2.1225, "reward": null, "learning_rate": 0.0009933783192340618, "epoch": 0.1, "percentage": 5.19, "elapsed_time": "0:22:33", "remaining_time": "6:52:28"} +{"current_steps": 560, "total_steps": 10798, "loss": 2.1225, "reward": null, "learning_rate": 0.0009933783192340618, "epoch": 0.1, "percentage": 5.19, "elapsed_time": "0:22:30", "remaining_time": "6:51:27"} +{"current_steps": 560, "total_steps": 10798, "loss": 2.1225, "reward": null, "learning_rate": 0.0009933783192340618, "epoch": 0.1, "percentage": 5.19, "elapsed_time": "0:22:31", "remaining_time": "6:51:56"} +{"current_steps": 570, "total_steps": 10798, "loss": 2.0446, "reward": null, "learning_rate": 0.0009931402661843911, "epoch": 0.11, "percentage": 5.28, "elapsed_time": "0:28:59", "remaining_time": "8:40:15"} +{"current_steps": 570, "total_steps": 10798, "loss": 2.0446, "reward": null, "learning_rate": 0.0009931402661843911, "epoch": 0.11, "percentage": 5.28, "elapsed_time": "0:22:58", "remaining_time": "6:52:09"} +{"current_steps": 570, "total_steps": 10798, "loss": 2.0446, "reward": null, "learning_rate": 0.0009931402661843911, "epoch": 0.11, "percentage": 5.28, "elapsed_time": "0:22:56", "remaining_time": "6:51:38"} +{"current_steps": 570, "total_steps": 10798, "loss": 2.0446, "reward": null, "learning_rate": 0.0009931402661843911, "epoch": 0.11, "percentage": 5.28, "elapsed_time": "0:22:54", "remaining_time": "6:51:09"} +{"current_steps": 580, "total_steps": 10798, "loss": 2.0921, "reward": null, "learning_rate": 0.000992898038838564, "epoch": 0.11, "percentage": 5.37, "elapsed_time": "0:29:22", "remaining_time": "8:37:26"} +{"current_steps": 580, "total_steps": 10798, "loss": 2.0921, "reward": null, "learning_rate": 0.000992898038838564, "epoch": 0.11, "percentage": 5.37, "elapsed_time": "0:23:20", "remaining_time": "6:51:18"} +{"current_steps": 580, "total_steps": 10798, "loss": 2.0921, "reward": null, "learning_rate": 0.000992898038838564, "epoch": 0.11, "percentage": 5.37, "elapsed_time": "0:23:19", "remaining_time": "6:50:47"} +{"current_steps": 580, "total_steps": 10798, "loss": 2.0921, "reward": null, "learning_rate": 0.000992898038838564, "epoch": 0.11, "percentage": 5.37, "elapsed_time": "0:23:17", "remaining_time": "6:50:19"} +{"current_steps": 590, "total_steps": 10798, "loss": 2.1081, "reward": null, "learning_rate": 0.0009926516392469674, "epoch": 0.11, "percentage": 5.46, "elapsed_time": "0:29:46", "remaining_time": "8:35:01"} +{"current_steps": 590, "total_steps": 10798, "loss": 2.1081, "reward": null, "learning_rate": 0.0009926516392469674, "epoch": 0.11, "percentage": 5.46, "elapsed_time": "0:23:41", "remaining_time": "6:49:49"} +{"current_steps": 590, "total_steps": 10798, "loss": 2.1081, "reward": null, "learning_rate": 0.0009926516392469674, "epoch": 0.11, "percentage": 5.46, "elapsed_time": "0:23:42", "remaining_time": "6:50:16"} +{"current_steps": 590, "total_steps": 10798, "loss": 2.1081, "reward": null, "learning_rate": 0.0009926516392469674, "epoch": 0.11, "percentage": 5.46, "elapsed_time": "0:23:44", "remaining_time": "6:50:47"} +{"current_steps": 600, "total_steps": 10798, "loss": 2.0734, "reward": null, "learning_rate": 0.0009924010694953064, "epoch": 0.11, "percentage": 5.56, "elapsed_time": "0:30:10", "remaining_time": "8:32:46"} +{"current_steps": 600, "total_steps": 10798, "loss": 2.0734, "reward": null, "learning_rate": 0.0009924010694953064, "epoch": 0.11, "percentage": 5.56, "elapsed_time": "0:24:06", "remaining_time": "6:49:53"} +{"current_steps": 600, "total_steps": 10798, "loss": 2.0734, "reward": null, "learning_rate": 0.0009924010694953064, "epoch": 0.11, "percentage": 5.56, "elapsed_time": "0:24:08", "remaining_time": "6:50:22"} +{"current_steps": 600, "total_steps": 10798, "loss": 2.0734, "reward": null, "learning_rate": 0.0009924010694953064, "epoch": 0.11, "percentage": 5.56, "elapsed_time": "0:24:05", "remaining_time": "6:49:26"} +{"current_steps": 610, "total_steps": 10798, "loss": 2.0652, "reward": null, "learning_rate": 0.0009921463317045843, "epoch": 0.11, "percentage": 5.65, "elapsed_time": "0:24:31", "remaining_time": "6:49:37"} +{"current_steps": 610, "total_steps": 10798, "loss": 2.0652, "reward": null, "learning_rate": 0.0009921463317045843, "epoch": 0.11, "percentage": 5.65, "elapsed_time": "0:24:33", "remaining_time": "6:50:07"} +{"current_steps": 610, "total_steps": 10798, "loss": 2.0652, "reward": null, "learning_rate": 0.0009921463317045843, "epoch": 0.11, "percentage": 5.65, "elapsed_time": "0:24:29", "remaining_time": "6:49:11"} +{"current_steps": 610, "total_steps": 10798, "loss": 2.0652, "reward": null, "learning_rate": 0.0009921463317045843, "epoch": 0.11, "percentage": 5.65, "elapsed_time": "0:30:34", "remaining_time": "8:30:44"} +{"current_steps": 620, "total_steps": 10798, "loss": 2.0818, "reward": null, "learning_rate": 0.0009918874280310862, "epoch": 0.11, "percentage": 5.74, "elapsed_time": "0:24:53", "remaining_time": "6:48:45"} +{"current_steps": 620, "total_steps": 10798, "loss": 2.0818, "reward": null, "learning_rate": 0.0009918874280310862, "epoch": 0.11, "percentage": 5.74, "elapsed_time": "0:24:57", "remaining_time": "6:49:40"} +{"current_steps": 620, "total_steps": 10798, "loss": 2.0818, "reward": null, "learning_rate": 0.0009918874280310862, "epoch": 0.11, "percentage": 5.74, "elapsed_time": "0:24:55", "remaining_time": "6:49:11"} +{"current_steps": 620, "total_steps": 10798, "loss": 2.0818, "reward": null, "learning_rate": 0.0009918874280310862, "epoch": 0.11, "percentage": 5.74, "elapsed_time": "0:30:58", "remaining_time": "8:28:34"} +{"current_steps": 630, "total_steps": 10798, "loss": 2.0776, "reward": null, "learning_rate": 0.0009916243606663605, "epoch": 0.12, "percentage": 5.83, "elapsed_time": "0:25:21", "remaining_time": "6:49:22"} +{"current_steps": 630, "total_steps": 10798, "loss": 2.0776, "reward": null, "learning_rate": 0.0009916243606663605, "epoch": 0.12, "percentage": 5.83, "elapsed_time": "0:31:23", "remaining_time": "8:26:36"} +{"current_steps": 630, "total_steps": 10798, "loss": 2.0776, "reward": null, "learning_rate": 0.0009916243606663605, "epoch": 0.12, "percentage": 5.83, "elapsed_time": "0:25:20", "remaining_time": "6:48:53"} +{"current_steps": 630, "total_steps": 10798, "loss": 2.0776, "reward": null, "learning_rate": 0.0009916243606663605, "epoch": 0.12, "percentage": 5.83, "elapsed_time": "0:25:18", "remaining_time": "6:48:28"} +{"current_steps": 640, "total_steps": 10798, "loss": 2.1025, "reward": null, "learning_rate": 0.0009913571318371994, "epoch": 0.12, "percentage": 5.93, "elapsed_time": "0:31:46", "remaining_time": "8:24:23"} +{"current_steps": 640, "total_steps": 10798, "loss": 2.1025, "reward": null, "learning_rate": 0.0009913571318371994, "epoch": 0.12, "percentage": 5.93, "elapsed_time": "0:25:41", "remaining_time": "6:47:52"} +{"current_steps": 640, "total_steps": 10798, "loss": 2.1025, "reward": null, "learning_rate": 0.0009913571318371994, "epoch": 0.12, "percentage": 5.93, "elapsed_time": "0:25:45", "remaining_time": "6:48:46"} +{"current_steps": 640, "total_steps": 10798, "loss": 2.1025, "reward": null, "learning_rate": 0.0009913571318371994, "epoch": 0.12, "percentage": 5.93, "elapsed_time": "0:25:43", "remaining_time": "6:48:18"} +{"current_steps": 650, "total_steps": 10798, "loss": 2.066, "reward": null, "learning_rate": 0.0009910857438056215, "epoch": 0.12, "percentage": 6.02, "elapsed_time": "0:32:11", "remaining_time": "8:22:36"} +{"current_steps": 650, "total_steps": 10798, "loss": 2.066, "reward": null, "learning_rate": 0.0009910857438056215, "epoch": 0.12, "percentage": 6.02, "elapsed_time": "0:26:08", "remaining_time": "6:48:05"} +{"current_steps": 650, "total_steps": 10798, "loss": 2.066, "reward": null, "learning_rate": 0.0009910857438056215, "epoch": 0.12, "percentage": 6.02, "elapsed_time": "0:26:06", "remaining_time": "6:47:40"} +{"current_steps": 650, "total_steps": 10798, "loss": 2.066, "reward": null, "learning_rate": 0.0009910857438056215, "epoch": 0.12, "percentage": 6.02, "elapsed_time": "0:26:10", "remaining_time": "6:48:32"} +{"current_steps": 660, "total_steps": 10798, "loss": 2.0575, "reward": null, "learning_rate": 0.0009908101988688512, "epoch": 0.12, "percentage": 6.11, "elapsed_time": "0:32:35", "remaining_time": "8:20:31"} +{"current_steps": 660, "total_steps": 10798, "loss": 2.0575, "reward": null, "learning_rate": 0.0009908101988688512, "epoch": 0.12, "percentage": 6.11, "elapsed_time": "0:26:31", "remaining_time": "6:47:32"} +{"current_steps": 660, "total_steps": 10798, "loss": 2.0575, "reward": null, "learning_rate": 0.0009908101988688512, "epoch": 0.12, "percentage": 6.11, "elapsed_time": "0:26:30", "remaining_time": "6:47:07"} +{"current_steps": 660, "total_steps": 10798, "loss": 2.0575, "reward": null, "learning_rate": 0.0009908101988688512, "epoch": 0.12, "percentage": 6.11, "elapsed_time": "0:26:33", "remaining_time": "6:47:59"} +{"current_steps": 670, "total_steps": 10798, "loss": 2.1269, "reward": null, "learning_rate": 0.0009905304993593008, "epoch": 0.12, "percentage": 6.2, "elapsed_time": "0:26:56", "remaining_time": "6:47:20"} +{"current_steps": 670, "total_steps": 10798, "loss": 2.1269, "reward": null, "learning_rate": 0.0009905304993593008, "epoch": 0.12, "percentage": 6.2, "elapsed_time": "0:26:55", "remaining_time": "6:46:54"} +{"current_steps": 670, "total_steps": 10798, "loss": 2.1269, "reward": null, "learning_rate": 0.0009905304993593008, "epoch": 0.12, "percentage": 6.2, "elapsed_time": "0:32:58", "remaining_time": "8:18:24"} +{"current_steps": 670, "total_steps": 10798, "loss": 2.1269, "reward": null, "learning_rate": 0.0009905304993593008, "epoch": 0.12, "percentage": 6.2, "elapsed_time": "0:26:53", "remaining_time": "6:46:30"} +{"current_steps": 680, "total_steps": 10798, "loss": 2.0518, "reward": null, "learning_rate": 0.0009902466476445486, "epoch": 0.13, "percentage": 6.3, "elapsed_time": "0:27:21", "remaining_time": "6:47:03"} +{"current_steps": 680, "total_steps": 10798, "loss": 2.0518, "reward": null, "learning_rate": 0.0009902466476445486, "epoch": 0.13, "percentage": 6.3, "elapsed_time": "0:33:22", "remaining_time": "8:16:41"} +{"current_steps": 680, "total_steps": 10798, "loss": 2.0518, "reward": null, "learning_rate": 0.0009902466476445486, "epoch": 0.13, "percentage": 6.3, "elapsed_time": "0:27:19", "remaining_time": "6:46:36"} +{"current_steps": 680, "total_steps": 10798, "loss": 2.0518, "reward": null, "learning_rate": 0.0009902466476445486, "epoch": 0.13, "percentage": 6.3, "elapsed_time": "0:27:18", "remaining_time": "6:46:13"} +{"current_steps": 690, "total_steps": 10798, "loss": 2.0698, "reward": null, "learning_rate": 0.0009899586461273218, "epoch": 0.13, "percentage": 6.39, "elapsed_time": "0:33:47", "remaining_time": "8:14:59"} +{"current_steps": 690, "total_steps": 10798, "loss": 2.0698, "reward": null, "learning_rate": 0.0009899586461273218, "epoch": 0.13, "percentage": 6.39, "elapsed_time": "0:27:45", "remaining_time": "6:46:43"} +{"current_steps": 690, "total_steps": 10798, "loss": 2.0698, "reward": null, "learning_rate": 0.0009899586461273218, "epoch": 0.13, "percentage": 6.39, "elapsed_time": "0:27:44", "remaining_time": "6:46:18"} +{"current_steps": 690, "total_steps": 10798, "loss": 2.0698, "reward": null, "learning_rate": 0.0009899586461273218, "epoch": 0.13, "percentage": 6.39, "elapsed_time": "0:27:42", "remaining_time": "6:45:54"} +{"current_steps": 700, "total_steps": 10798, "loss": 2.0988, "reward": null, "learning_rate": 0.000989666497245473, "epoch": 0.13, "percentage": 6.48, "elapsed_time": "0:34:11", "remaining_time": "8:13:09"} +{"current_steps": 700, "total_steps": 10798, "loss": 2.0988, "reward": null, "learning_rate": 0.000989666497245473, "epoch": 0.13, "percentage": 6.48, "elapsed_time": "0:28:07", "remaining_time": "6:45:49"} +{"current_steps": 700, "total_steps": 10798, "loss": 2.0988, "reward": null, "learning_rate": 0.000989666497245473, "epoch": 0.13, "percentage": 6.48, "elapsed_time": "0:28:09", "remaining_time": "6:46:15"} +{"current_steps": 700, "total_steps": 10798, "loss": 2.0988, "reward": null, "learning_rate": 0.000989666497245473, "epoch": 0.13, "percentage": 6.48, "elapsed_time": "0:28:06", "remaining_time": "6:45:26"} +{"current_steps": 710, "total_steps": 10798, "loss": 2.0986, "reward": null, "learning_rate": 0.0009893702034719624, "epoch": 0.13, "percentage": 6.58, "elapsed_time": "0:34:35", "remaining_time": "8:11:32"} +{"current_steps": 710, "total_steps": 10798, "loss": 2.0986, "reward": null, "learning_rate": 0.0009893702034719624, "epoch": 0.13, "percentage": 6.58, "elapsed_time": "0:28:34", "remaining_time": "6:45:56"} +{"current_steps": 710, "total_steps": 10798, "loss": 2.0986, "reward": null, "learning_rate": 0.0009893702034719624, "epoch": 0.13, "percentage": 6.58, "elapsed_time": "0:28:30", "remaining_time": "6:45:08"} +{"current_steps": 710, "total_steps": 10798, "loss": 2.0986, "reward": null, "learning_rate": 0.0009893702034719624, "epoch": 0.13, "percentage": 6.58, "elapsed_time": "0:28:32", "remaining_time": "6:45:31"} +{"current_steps": 720, "total_steps": 10798, "loss": 2.0237, "reward": null, "learning_rate": 0.0009890697673148345, "epoch": 0.13, "percentage": 6.67, "elapsed_time": "0:35:00", "remaining_time": "8:10:00"} +{"current_steps": 720, "total_steps": 10798, "loss": 2.0237, "reward": null, "learning_rate": 0.0009890697673148345, "epoch": 0.13, "percentage": 6.67, "elapsed_time": "0:28:57", "remaining_time": "6:45:16"} +{"current_steps": 720, "total_steps": 10798, "loss": 2.0237, "reward": null, "learning_rate": 0.0009890697673148345, "epoch": 0.13, "percentage": 6.67, "elapsed_time": "0:28:55", "remaining_time": "6:44:54"} +{"current_steps": 720, "total_steps": 10798, "loss": 2.0237, "reward": null, "learning_rate": 0.0009890697673148345, "epoch": 0.13, "percentage": 6.67, "elapsed_time": "0:28:58", "remaining_time": "6:45:41"} +{"current_steps": 730, "total_steps": 10798, "loss": 2.0027, "reward": null, "learning_rate": 0.0009887651913171986, "epoch": 0.14, "percentage": 6.76, "elapsed_time": "0:29:22", "remaining_time": "6:45:07"} +{"current_steps": 730, "total_steps": 10798, "loss": 2.0027, "reward": null, "learning_rate": 0.0009887651913171986, "epoch": 0.14, "percentage": 6.76, "elapsed_time": "0:29:20", "remaining_time": "6:44:43"} +{"current_steps": 730, "total_steps": 10798, "loss": 2.0027, "reward": null, "learning_rate": 0.0009887651913171986, "epoch": 0.14, "percentage": 6.76, "elapsed_time": "0:29:19", "remaining_time": "6:44:21"} +{"current_steps": 730, "total_steps": 10798, "loss": 2.0027, "reward": null, "learning_rate": 0.0009887651913171986, "epoch": 0.14, "percentage": 6.76, "elapsed_time": "0:35:23", "remaining_time": "8:08:12"} +{"current_steps": 740, "total_steps": 10798, "loss": 2.0563, "reward": null, "learning_rate": 0.0009884564780572064, "epoch": 0.14, "percentage": 6.85, "elapsed_time": "0:29:46", "remaining_time": "6:44:48"} +{"current_steps": 740, "total_steps": 10798, "loss": 2.0563, "reward": null, "learning_rate": 0.0009884564780572064, "epoch": 0.14, "percentage": 6.85, "elapsed_time": "0:35:48", "remaining_time": "8:06:41"} +{"current_steps": 740, "total_steps": 10798, "loss": 2.0563, "reward": null, "learning_rate": 0.0009884564780572064, "epoch": 0.14, "percentage": 6.85, "elapsed_time": "0:29:45", "remaining_time": "6:44:24"} +{"current_steps": 740, "total_steps": 10798, "loss": 2.0563, "reward": null, "learning_rate": 0.0009884564780572064, "epoch": 0.14, "percentage": 6.85, "elapsed_time": "0:29:43", "remaining_time": "6:44:02"} +{"current_steps": 750, "total_steps": 10798, "loss": 2.0624, "reward": null, "learning_rate": 0.0009881436301480305, "epoch": 0.14, "percentage": 6.95, "elapsed_time": "0:36:13", "remaining_time": "8:05:18"} +{"current_steps": 750, "total_steps": 10798, "loss": 2.0624, "reward": null, "learning_rate": 0.0009881436301480305, "epoch": 0.14, "percentage": 6.95, "elapsed_time": "0:30:10", "remaining_time": "6:44:12"} +{"current_steps": 750, "total_steps": 10798, "loss": 2.0624, "reward": null, "learning_rate": 0.0009881436301480305, "epoch": 0.14, "percentage": 6.95, "elapsed_time": "0:30:08", "remaining_time": "6:43:50"} +{"current_steps": 750, "total_steps": 10798, "loss": 2.0624, "reward": null, "learning_rate": 0.0009881436301480305, "epoch": 0.14, "percentage": 6.95, "elapsed_time": "0:30:11", "remaining_time": "6:44:35"} +{"current_steps": 760, "total_steps": 10798, "loss": 2.0926, "reward": null, "learning_rate": 0.000987826650237842, "epoch": 0.14, "percentage": 7.04, "elapsed_time": "0:30:35", "remaining_time": "6:43:57"} +{"current_steps": 760, "total_steps": 10798, "loss": 2.0926, "reward": null, "learning_rate": 0.000987826650237842, "epoch": 0.14, "percentage": 7.04, "elapsed_time": "0:30:33", "remaining_time": "6:43:36"} +{"current_steps": 760, "total_steps": 10798, "loss": 2.0926, "reward": null, "learning_rate": 0.000987826650237842, "epoch": 0.14, "percentage": 7.04, "elapsed_time": "0:36:38", "remaining_time": "8:03:55"} +{"current_steps": 760, "total_steps": 10798, "loss": 2.0926, "reward": null, "learning_rate": 0.000987826650237842, "epoch": 0.14, "percentage": 7.04, "elapsed_time": "0:30:36", "remaining_time": "6:44:21"} +{"current_steps": 770, "total_steps": 10798, "loss": 2.0585, "reward": null, "learning_rate": 0.000987505541009788, "epoch": 0.14, "percentage": 7.13, "elapsed_time": "0:30:59", "remaining_time": "6:43:39"} +{"current_steps": 770, "total_steps": 10798, "loss": 2.0585, "reward": null, "learning_rate": 0.000987505541009788, "epoch": 0.14, "percentage": 7.13, "elapsed_time": "0:31:01", "remaining_time": "6:44:02"} +{"current_steps": 770, "total_steps": 10798, "loss": 2.0585, "reward": null, "learning_rate": 0.000987505541009788, "epoch": 0.14, "percentage": 7.13, "elapsed_time": "0:37:02", "remaining_time": "8:02:30"} +{"current_steps": 770, "total_steps": 10798, "loss": 2.0585, "reward": null, "learning_rate": 0.000987505541009788, "epoch": 0.14, "percentage": 7.13, "elapsed_time": "0:30:58", "remaining_time": "6:43:19"} +{"current_steps": 780, "total_steps": 10798, "loss": 2.0494, "reward": null, "learning_rate": 0.0009871803051819696, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "0:31:23", "remaining_time": "6:43:08"} +{"current_steps": 780, "total_steps": 10798, "loss": 2.0494, "reward": null, "learning_rate": 0.0009871803051819696, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "0:31:25", "remaining_time": "6:43:31"} +{"current_steps": 780, "total_steps": 10798, "loss": 2.0494, "reward": null, "learning_rate": 0.0009871803051819696, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "0:31:21", "remaining_time": "6:42:48"} +{"current_steps": 780, "total_steps": 10798, "loss": 2.0494, "reward": null, "learning_rate": 0.0009871803051819696, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "0:37:26", "remaining_time": "8:00:54"} +{"current_steps": 790, "total_steps": 10798, "loss": 2.0106, "reward": null, "learning_rate": 0.0009868509455074183, "epoch": 0.15, "percentage": 7.32, "elapsed_time": "0:31:46", "remaining_time": "6:42:29"} +{"current_steps": 790, "total_steps": 10798, "loss": 2.0106, "reward": null, "learning_rate": 0.0009868509455074183, "epoch": 0.15, "percentage": 7.32, "elapsed_time": "0:31:49", "remaining_time": "6:43:12"} +{"current_steps": 790, "total_steps": 10798, "loss": 2.0106, "reward": null, "learning_rate": 0.0009868509455074183, "epoch": 0.15, "percentage": 7.32, "elapsed_time": "0:31:47", "remaining_time": "6:42:50"} +{"current_steps": 790, "total_steps": 10798, "loss": 2.0106, "reward": null, "learning_rate": 0.0009868509455074183, "epoch": 0.15, "percentage": 7.32, "elapsed_time": "0:37:51", "remaining_time": "7:59:31"} +{"current_steps": 800, "total_steps": 10798, "loss": 2.0861, "reward": null, "learning_rate": 0.0009865174647740729, "epoch": 0.15, "percentage": 7.41, "elapsed_time": "0:38:15", "remaining_time": "7:58:12"} +{"current_steps": 800, "total_steps": 10798, "loss": 2.0861, "reward": null, "learning_rate": 0.0009865174647740729, "epoch": 0.15, "percentage": 7.41, "elapsed_time": "0:32:11", "remaining_time": "6:42:13"} +{"current_steps": 800, "total_steps": 10798, "loss": 2.0861, "reward": null, "learning_rate": 0.0009865174647740729, "epoch": 0.15, "percentage": 7.41, "elapsed_time": "0:32:12", "remaining_time": "6:42:33"} +{"current_steps": 800, "total_steps": 10798, "loss": 2.0861, "reward": null, "learning_rate": 0.0009865174647740729, "epoch": 0.15, "percentage": 7.41, "elapsed_time": "0:32:14", "remaining_time": "6:42:55"} +{"current_steps": 810, "total_steps": 10798, "loss": 2.0478, "reward": null, "learning_rate": 0.0009861798658047556, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "0:32:36", "remaining_time": "6:42:03"} +{"current_steps": 810, "total_steps": 10798, "loss": 2.0478, "reward": null, "learning_rate": 0.0009861798658047556, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "0:38:39", "remaining_time": "7:56:42"} +{"current_steps": 810, "total_steps": 10798, "loss": 2.0478, "reward": null, "learning_rate": 0.0009861798658047556, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "0:32:34", "remaining_time": "6:41:44"} +{"current_steps": 810, "total_steps": 10798, "loss": 2.0478, "reward": null, "learning_rate": 0.0009861798658047556, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "0:32:38", "remaining_time": "6:42:25"} +{"current_steps": 820, "total_steps": 10798, "loss": 2.0469, "reward": null, "learning_rate": 0.0009858381514571484, "epoch": 0.15, "percentage": 7.59, "elapsed_time": "0:39:03", "remaining_time": "7:55:18"} +{"current_steps": 820, "total_steps": 10798, "loss": 2.0469, "reward": null, "learning_rate": 0.0009858381514571484, "epoch": 0.15, "percentage": 7.59, "elapsed_time": "0:33:02", "remaining_time": "6:42:00"} +{"current_steps": 820, "total_steps": 10798, "loss": 2.0469, "reward": null, "learning_rate": 0.0009858381514571484, "epoch": 0.15, "percentage": 7.59, "elapsed_time": "0:32:58", "remaining_time": "6:41:19"} +{"current_steps": 820, "total_steps": 10798, "loss": 2.0469, "reward": null, "learning_rate": 0.0009858381514571484, "epoch": 0.15, "percentage": 7.59, "elapsed_time": "0:33:00", "remaining_time": "6:41:38"} +{"current_steps": 830, "total_steps": 10798, "loss": 2.0671, "reward": null, "learning_rate": 0.000985492324623769, "epoch": 0.15, "percentage": 7.69, "elapsed_time": "0:33:24", "remaining_time": "6:41:07"} +{"current_steps": 830, "total_steps": 10798, "loss": 2.0671, "reward": null, "learning_rate": 0.000985492324623769, "epoch": 0.15, "percentage": 7.69, "elapsed_time": "0:33:25", "remaining_time": "6:41:28"} +{"current_steps": 830, "total_steps": 10798, "loss": 2.0671, "reward": null, "learning_rate": 0.000985492324623769, "epoch": 0.15, "percentage": 7.69, "elapsed_time": "0:39:27", "remaining_time": "7:53:50"} +{"current_steps": 830, "total_steps": 10798, "loss": 2.0671, "reward": null, "learning_rate": 0.000985492324623769, "epoch": 0.15, "percentage": 7.69, "elapsed_time": "0:33:22", "remaining_time": "6:40:48"} +{"current_steps": 840, "total_steps": 10798, "loss": 2.0808, "reward": null, "learning_rate": 0.0009851423882319458, "epoch": 0.16, "percentage": 7.78, "elapsed_time": "0:39:50", "remaining_time": "7:52:20"} +{"current_steps": 840, "total_steps": 10798, "loss": 2.0808, "reward": null, "learning_rate": 0.0009851423882319458, "epoch": 0.16, "percentage": 7.78, "elapsed_time": "0:33:49", "remaining_time": "6:40:55"} +{"current_steps": 840, "total_steps": 10798, "loss": 2.0808, "reward": null, "learning_rate": 0.0009851423882319458, "epoch": 0.16, "percentage": 7.78, "elapsed_time": "0:33:47", "remaining_time": "6:40:35"} +{"current_steps": 840, "total_steps": 10798, "loss": 2.0808, "reward": null, "learning_rate": 0.0009851423882319458, "epoch": 0.16, "percentage": 7.78, "elapsed_time": "0:33:45", "remaining_time": "6:40:16"} +{"current_steps": 850, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009847883452437937, "epoch": 0.16, "percentage": 7.87, "elapsed_time": "0:34:10", "remaining_time": "6:39:54"} +{"current_steps": 850, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009847883452437937, "epoch": 0.16, "percentage": 7.87, "elapsed_time": "0:34:11", "remaining_time": "6:40:12"} +{"current_steps": 850, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009847883452437937, "epoch": 0.16, "percentage": 7.87, "elapsed_time": "0:34:13", "remaining_time": "6:40:33"} +{"current_steps": 850, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009847883452437937, "epoch": 0.16, "percentage": 7.87, "elapsed_time": "0:40:14", "remaining_time": "7:51:03"} +{"current_steps": 860, "total_steps": 10798, "loss": 2.0295, "reward": null, "learning_rate": 0.0009844301986561893, "epoch": 0.16, "percentage": 7.96, "elapsed_time": "0:40:38", "remaining_time": "7:49:43"} +{"current_steps": 860, "total_steps": 10798, "loss": 2.0295, "reward": null, "learning_rate": 0.0009844301986561893, "epoch": 0.16, "percentage": 7.96, "elapsed_time": "0:34:37", "remaining_time": "6:40:06"} +{"current_steps": 860, "total_steps": 10798, "loss": 2.0295, "reward": null, "learning_rate": 0.0009844301986561893, "epoch": 0.16, "percentage": 7.96, "elapsed_time": "0:34:34", "remaining_time": "6:39:28"} +{"current_steps": 860, "total_steps": 10798, "loss": 2.0295, "reward": null, "learning_rate": 0.0009844301986561893, "epoch": 0.16, "percentage": 7.96, "elapsed_time": "0:34:35", "remaining_time": "6:39:46"} +{"current_steps": 870, "total_steps": 10798, "loss": 2.0873, "reward": null, "learning_rate": 0.000984067951500744, "epoch": 0.16, "percentage": 8.06, "elapsed_time": "0:41:03", "remaining_time": "7:48:31"} +{"current_steps": 870, "total_steps": 10798, "loss": 2.0873, "reward": null, "learning_rate": 0.000984067951500744, "epoch": 0.16, "percentage": 8.06, "elapsed_time": "0:35:00", "remaining_time": "6:39:26"} +{"current_steps": 870, "total_steps": 10798, "loss": 2.0873, "reward": null, "learning_rate": 0.000984067951500744, "epoch": 0.16, "percentage": 8.06, "elapsed_time": "0:34:58", "remaining_time": "6:39:08"} +{"current_steps": 870, "total_steps": 10798, "loss": 2.0873, "reward": null, "learning_rate": 0.000984067951500744, "epoch": 0.16, "percentage": 8.06, "elapsed_time": "0:35:01", "remaining_time": "6:39:46"} +{"current_steps": 880, "total_steps": 10798, "loss": 2.1038, "reward": null, "learning_rate": 0.00098370160684378, "epoch": 0.16, "percentage": 8.15, "elapsed_time": "0:35:26", "remaining_time": "6:39:26"} +{"current_steps": 880, "total_steps": 10798, "loss": 2.1038, "reward": null, "learning_rate": 0.00098370160684378, "epoch": 0.16, "percentage": 8.15, "elapsed_time": "0:35:23", "remaining_time": "6:38:49"} +{"current_steps": 880, "total_steps": 10798, "loss": 2.1038, "reward": null, "learning_rate": 0.00098370160684378, "epoch": 0.16, "percentage": 8.15, "elapsed_time": "0:35:24", "remaining_time": "6:39:07"} +{"current_steps": 880, "total_steps": 10798, "loss": 2.1038, "reward": null, "learning_rate": 0.00098370160684378, "epoch": 0.16, "percentage": 8.15, "elapsed_time": "0:41:27", "remaining_time": "7:47:20"} +{"current_steps": 890, "total_steps": 10798, "loss": 2.0337, "reward": null, "learning_rate": 0.0009833311677863042, "epoch": 0.16, "percentage": 8.24, "elapsed_time": "0:35:47", "remaining_time": "6:38:29"} +{"current_steps": 890, "total_steps": 10798, "loss": 2.0337, "reward": null, "learning_rate": 0.0009833311677863042, "epoch": 0.16, "percentage": 8.24, "elapsed_time": "0:35:49", "remaining_time": "6:38:46"} +{"current_steps": 890, "total_steps": 10798, "loss": 2.0337, "reward": null, "learning_rate": 0.0009833311677863042, "epoch": 0.16, "percentage": 8.24, "elapsed_time": "0:35:51", "remaining_time": "6:39:06"} +{"current_steps": 890, "total_steps": 10798, "loss": 2.0337, "reward": null, "learning_rate": 0.0009833311677863042, "epoch": 0.16, "percentage": 8.24, "elapsed_time": "0:41:52", "remaining_time": "7:46:10"} +{"current_steps": 900, "total_steps": 10798, "loss": 2.0407, "reward": null, "learning_rate": 0.0009829566374639801, "epoch": 0.17, "percentage": 8.33, "elapsed_time": "0:42:16", "remaining_time": "7:45:00"} +{"current_steps": 900, "total_steps": 10798, "loss": 2.0407, "reward": null, "learning_rate": 0.0009829566374639801, "epoch": 0.17, "percentage": 8.33, "elapsed_time": "0:36:12", "remaining_time": "6:38:08"} +{"current_steps": 900, "total_steps": 10798, "loss": 2.0407, "reward": null, "learning_rate": 0.0009829566374639801, "epoch": 0.17, "percentage": 8.33, "elapsed_time": "0:36:15", "remaining_time": "6:38:45"} +{"current_steps": 900, "total_steps": 10798, "loss": 2.0407, "reward": null, "learning_rate": 0.0009829566374639801, "epoch": 0.17, "percentage": 8.33, "elapsed_time": "0:36:13", "remaining_time": "6:38:25"} +{"current_steps": 910, "total_steps": 10798, "loss": 2.1049, "reward": null, "learning_rate": 0.0009825780190471042, "epoch": 0.17, "percentage": 8.43, "elapsed_time": "0:42:41", "remaining_time": "7:43:49"} +{"current_steps": 910, "total_steps": 10798, "loss": 2.1049, "reward": null, "learning_rate": 0.0009825780190471042, "epoch": 0.17, "percentage": 8.43, "elapsed_time": "0:36:37", "remaining_time": "6:38:02"} +{"current_steps": 910, "total_steps": 10798, "loss": 2.1049, "reward": null, "learning_rate": 0.0009825780190471042, "epoch": 0.17, "percentage": 8.43, "elapsed_time": "0:36:36", "remaining_time": "6:37:44"} +{"current_steps": 910, "total_steps": 10798, "loss": 2.1049, "reward": null, "learning_rate": 0.0009825780190471042, "epoch": 0.17, "percentage": 8.43, "elapsed_time": "0:36:39", "remaining_time": "6:38:21"} +{"current_steps": 920, "total_steps": 10798, "loss": 2.0475, "reward": null, "learning_rate": 0.000982195315740576, "epoch": 0.17, "percentage": 8.52, "elapsed_time": "0:37:04", "remaining_time": "6:37:59"} +{"current_steps": 920, "total_steps": 10798, "loss": 2.0475, "reward": null, "learning_rate": 0.000982195315740576, "epoch": 0.17, "percentage": 8.52, "elapsed_time": "0:37:00", "remaining_time": "6:37:23"} +{"current_steps": 920, "total_steps": 10798, "loss": 2.0475, "reward": null, "learning_rate": 0.000982195315740576, "epoch": 0.17, "percentage": 8.52, "elapsed_time": "0:43:05", "remaining_time": "7:42:40"} +{"current_steps": 920, "total_steps": 10798, "loss": 2.0475, "reward": null, "learning_rate": 0.000982195315740576, "epoch": 0.17, "percentage": 8.52, "elapsed_time": "0:37:02", "remaining_time": "6:37:40"} +{"current_steps": 930, "total_steps": 10798, "loss": 2.0624, "reward": null, "learning_rate": 0.0009818085307838741, "epoch": 0.17, "percentage": 8.61, "elapsed_time": "0:43:30", "remaining_time": "7:41:38"} +{"current_steps": 930, "total_steps": 10798, "loss": 2.0624, "reward": null, "learning_rate": 0.0009818085307838741, "epoch": 0.17, "percentage": 8.61, "elapsed_time": "0:37:27", "remaining_time": "6:37:24"} +{"current_steps": 930, "total_steps": 10798, "loss": 2.0624, "reward": null, "learning_rate": 0.0009818085307838741, "epoch": 0.17, "percentage": 8.61, "elapsed_time": "0:37:28", "remaining_time": "6:37:43"} +{"current_steps": 930, "total_steps": 10798, "loss": 2.0624, "reward": null, "learning_rate": 0.0009818085307838741, "epoch": 0.17, "percentage": 8.61, "elapsed_time": "0:37:25", "remaining_time": "6:37:07"} +{"current_steps": 940, "total_steps": 10798, "loss": 2.0714, "reward": null, "learning_rate": 0.000981417667451026, "epoch": 0.17, "percentage": 8.71, "elapsed_time": "0:43:54", "remaining_time": "7:40:24"} +{"current_steps": 940, "total_steps": 10798, "loss": 2.0714, "reward": null, "learning_rate": 0.000981417667451026, "epoch": 0.17, "percentage": 8.71, "elapsed_time": "0:37:52", "remaining_time": "6:37:14"} +{"current_steps": 940, "total_steps": 10798, "loss": 2.0714, "reward": null, "learning_rate": 0.000981417667451026, "epoch": 0.17, "percentage": 8.71, "elapsed_time": "0:37:49", "remaining_time": "6:36:38"} +{"current_steps": 940, "total_steps": 10798, "loss": 2.0714, "reward": null, "learning_rate": 0.000981417667451026, "epoch": 0.17, "percentage": 8.71, "elapsed_time": "0:37:50", "remaining_time": "6:36:55"} +{"current_steps": 950, "total_steps": 10798, "loss": 2.0947, "reward": null, "learning_rate": 0.0009810227290505816, "epoch": 0.18, "percentage": 8.8, "elapsed_time": "0:44:18", "remaining_time": "7:39:15"} +{"current_steps": 950, "total_steps": 10798, "loss": 2.0947, "reward": null, "learning_rate": 0.0009810227290505816, "epoch": 0.18, "percentage": 8.8, "elapsed_time": "0:38:13", "remaining_time": "6:36:13"} +{"current_steps": 950, "total_steps": 10798, "loss": 2.0947, "reward": null, "learning_rate": 0.0009810227290505816, "epoch": 0.18, "percentage": 8.8, "elapsed_time": "0:38:16", "remaining_time": "6:36:48"} +{"current_steps": 950, "total_steps": 10798, "loss": 2.0947, "reward": null, "learning_rate": 0.0009810227290505816, "epoch": 0.18, "percentage": 8.8, "elapsed_time": "0:38:14", "remaining_time": "6:36:30"} +{"current_steps": 960, "total_steps": 10798, "loss": 2.0591, "reward": null, "learning_rate": 0.0009806237189255859, "epoch": 0.18, "percentage": 8.89, "elapsed_time": "0:38:39", "remaining_time": "6:36:06"} +{"current_steps": 960, "total_steps": 10798, "loss": 2.0591, "reward": null, "learning_rate": 0.0009806237189255859, "epoch": 0.18, "percentage": 8.89, "elapsed_time": "0:38:40", "remaining_time": "6:36:24"} +{"current_steps": 960, "total_steps": 10798, "loss": 2.0591, "reward": null, "learning_rate": 0.0009806237189255859, "epoch": 0.18, "percentage": 8.89, "elapsed_time": "0:44:42", "remaining_time": "7:38:08"} +{"current_steps": 960, "total_steps": 10798, "loss": 2.0591, "reward": null, "learning_rate": 0.0009806237189255859, "epoch": 0.18, "percentage": 8.89, "elapsed_time": "0:38:37", "remaining_time": "6:35:50"} +{"current_steps": 970, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009802206404535489, "epoch": 0.18, "percentage": 8.98, "elapsed_time": "0:45:05", "remaining_time": "7:36:55"} +{"current_steps": 970, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009802206404535489, "epoch": 0.18, "percentage": 8.98, "elapsed_time": "0:39:04", "remaining_time": "6:35:52"} +{"current_steps": 970, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009802206404535489, "epoch": 0.18, "percentage": 8.98, "elapsed_time": "0:39:00", "remaining_time": "6:35:18"} +{"current_steps": 970, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009802206404535489, "epoch": 0.18, "percentage": 8.98, "elapsed_time": "0:39:02", "remaining_time": "6:35:35"} +{"current_steps": 980, "total_steps": 10798, "loss": 2.0556, "reward": null, "learning_rate": 0.000979813497046419, "epoch": 0.18, "percentage": 9.08, "elapsed_time": "0:45:29", "remaining_time": "7:35:48"} +{"current_steps": 980, "total_steps": 10798, "loss": 2.0556, "reward": null, "learning_rate": 0.000979813497046419, "epoch": 0.18, "percentage": 9.08, "elapsed_time": "0:39:28", "remaining_time": "6:35:27"} +{"current_steps": 980, "total_steps": 10798, "loss": 2.0556, "reward": null, "learning_rate": 0.000979813497046419, "epoch": 0.18, "percentage": 9.08, "elapsed_time": "0:39:26", "remaining_time": "6:35:10"} +{"current_steps": 980, "total_steps": 10798, "loss": 2.0556, "reward": null, "learning_rate": 0.000979813497046419, "epoch": 0.18, "percentage": 9.08, "elapsed_time": "0:39:25", "remaining_time": "6:34:54"} +{"current_steps": 990, "total_steps": 10798, "loss": 2.0753, "reward": null, "learning_rate": 0.0009794022921505523, "epoch": 0.18, "percentage": 9.17, "elapsed_time": "0:45:54", "remaining_time": "7:34:44"} +{"current_steps": 990, "total_steps": 10798, "loss": 2.0753, "reward": null, "learning_rate": 0.0009794022921505523, "epoch": 0.18, "percentage": 9.17, "elapsed_time": "0:39:52", "remaining_time": "6:35:03"} +{"current_steps": 990, "total_steps": 10798, "loss": 2.0753, "reward": null, "learning_rate": 0.0009794022921505523, "epoch": 0.18, "percentage": 9.17, "elapsed_time": "0:39:50", "remaining_time": "6:34:45"} +{"current_steps": 990, "total_steps": 10798, "loss": 2.0753, "reward": null, "learning_rate": 0.0009794022921505523, "epoch": 0.18, "percentage": 9.17, "elapsed_time": "0:39:49", "remaining_time": "6:34:30"} +{"current_steps": 1000, "total_steps": 10798, "loss": 2.0898, "reward": null, "learning_rate": 0.000978987029246685, "epoch": 0.19, "percentage": 9.26, "elapsed_time": "0:46:18", "remaining_time": "7:33:44"} +{"current_steps": 1000, "total_steps": 10798, "loss": 2.0898, "reward": null, "learning_rate": 0.000978987029246685, "epoch": 0.19, "percentage": 9.26, "elapsed_time": "0:40:15", "remaining_time": "6:34:25"} +{"current_steps": 1000, "total_steps": 10798, "loss": 2.0898, "reward": null, "learning_rate": 0.000978987029246685, "epoch": 0.19, "percentage": 9.26, "elapsed_time": "0:40:17", "remaining_time": "6:34:42"} +{"current_steps": 1000, "total_steps": 10798, "loss": 2.0898, "reward": null, "learning_rate": 0.000978987029246685, "epoch": 0.19, "percentage": 9.26, "elapsed_time": "0:40:13", "remaining_time": "6:34:09"} +{"current_steps": 1010, "total_steps": 10798, "loss": 2.0464, "reward": null, "learning_rate": 0.0009785677118499029, "epoch": 0.19, "percentage": 9.35, "elapsed_time": "0:40:39", "remaining_time": "6:34:00"} +{"current_steps": 1010, "total_steps": 10798, "loss": 2.0464, "reward": null, "learning_rate": 0.0009785677118499029, "epoch": 0.19, "percentage": 9.35, "elapsed_time": "0:40:41", "remaining_time": "6:34:17"} +{"current_steps": 1010, "total_steps": 10798, "loss": 2.0464, "reward": null, "learning_rate": 0.0009785677118499029, "epoch": 0.19, "percentage": 9.35, "elapsed_time": "0:46:42", "remaining_time": "7:32:40"} +{"current_steps": 1010, "total_steps": 10798, "loss": 2.0464, "reward": null, "learning_rate": 0.0009785677118499029, "epoch": 0.19, "percentage": 9.35, "elapsed_time": "0:40:37", "remaining_time": "6:33:44"} +{"current_steps": 1020, "total_steps": 10798, "loss": 2.0828, "reward": null, "learning_rate": 0.0009781443435096116, "epoch": 0.19, "percentage": 9.45, "elapsed_time": "0:41:03", "remaining_time": "6:33:31"} +{"current_steps": 1020, "total_steps": 10798, "loss": 2.0828, "reward": null, "learning_rate": 0.0009781443435096116, "epoch": 0.19, "percentage": 9.45, "elapsed_time": "0:47:07", "remaining_time": "7:31:48"} +{"current_steps": 1020, "total_steps": 10798, "loss": 2.0828, "reward": null, "learning_rate": 0.0009781443435096116, "epoch": 0.19, "percentage": 9.45, "elapsed_time": "0:41:04", "remaining_time": "6:33:46"} +{"current_steps": 1020, "total_steps": 10798, "loss": 2.0828, "reward": null, "learning_rate": 0.0009781443435096116, "epoch": 0.19, "percentage": 9.45, "elapsed_time": "0:41:06", "remaining_time": "6:34:03"} +{"current_steps": 1030, "total_steps": 10798, "loss": 2.1137, "reward": null, "learning_rate": 0.0009777169278095074, "epoch": 0.19, "percentage": 9.54, "elapsed_time": "0:47:32", "remaining_time": "7:30:50"} +{"current_steps": 1030, "total_steps": 10798, "loss": 2.1137, "reward": null, "learning_rate": 0.0009777169278095074, "epoch": 0.19, "percentage": 9.54, "elapsed_time": "0:41:30", "remaining_time": "6:33:42"} +{"current_steps": 1030, "total_steps": 10798, "loss": 2.1137, "reward": null, "learning_rate": 0.0009777169278095074, "epoch": 0.19, "percentage": 9.54, "elapsed_time": "0:41:27", "remaining_time": "6:33:10"} +{"current_steps": 1030, "total_steps": 10798, "loss": 2.1137, "reward": null, "learning_rate": 0.0009777169278095074, "epoch": 0.19, "percentage": 9.54, "elapsed_time": "0:41:29", "remaining_time": "6:33:25"} +{"current_steps": 1040, "total_steps": 10798, "loss": 2.0167, "reward": null, "learning_rate": 0.0009772854683675462, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "0:41:54", "remaining_time": "6:33:15"} +{"current_steps": 1040, "total_steps": 10798, "loss": 2.0167, "reward": null, "learning_rate": 0.0009772854683675462, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "0:41:51", "remaining_time": "6:32:44"} +{"current_steps": 1040, "total_steps": 10798, "loss": 2.0167, "reward": null, "learning_rate": 0.0009772854683675462, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "0:41:53", "remaining_time": "6:32:59"} +{"current_steps": 1040, "total_steps": 10798, "loss": 2.0167, "reward": null, "learning_rate": 0.0009772854683675462, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "0:47:56", "remaining_time": "7:29:47"} +{"current_steps": 1050, "total_steps": 10798, "loss": 2.07, "reward": null, "learning_rate": 0.000976849968835913, "epoch": 0.19, "percentage": 9.72, "elapsed_time": "0:42:18", "remaining_time": "6:32:45"} +{"current_steps": 1050, "total_steps": 10798, "loss": 2.07, "reward": null, "learning_rate": 0.000976849968835913, "epoch": 0.19, "percentage": 9.72, "elapsed_time": "0:42:16", "remaining_time": "6:32:29"} +{"current_steps": 1050, "total_steps": 10798, "loss": 2.07, "reward": null, "learning_rate": 0.000976849968835913, "epoch": 0.19, "percentage": 9.72, "elapsed_time": "0:48:19", "remaining_time": "7:28:41"} +{"current_steps": 1050, "total_steps": 10798, "loss": 2.07, "reward": null, "learning_rate": 0.000976849968835913, "epoch": 0.19, "percentage": 9.72, "elapsed_time": "0:42:15", "remaining_time": "6:32:14"} +{"current_steps": 1060, "total_steps": 10798, "loss": 2.0409, "reward": null, "learning_rate": 0.0009764104329009909, "epoch": 0.2, "percentage": 9.82, "elapsed_time": "0:48:43", "remaining_time": "7:27:39"} +{"current_steps": 1060, "total_steps": 10798, "loss": 2.0409, "reward": null, "learning_rate": 0.0009764104329009909, "epoch": 0.2, "percentage": 9.82, "elapsed_time": "0:42:40", "remaining_time": "6:32:02"} +{"current_steps": 1060, "total_steps": 10798, "loss": 2.0409, "reward": null, "learning_rate": 0.0009764104329009909, "epoch": 0.2, "percentage": 9.82, "elapsed_time": "0:42:42", "remaining_time": "6:32:18"} +{"current_steps": 1060, "total_steps": 10798, "loss": 2.0409, "reward": null, "learning_rate": 0.0009764104329009909, "epoch": 0.2, "percentage": 9.82, "elapsed_time": "0:42:38", "remaining_time": "6:31:47"} +{"current_steps": 1070, "total_steps": 10798, "loss": 2.015, "reward": null, "learning_rate": 0.0009759668642833304, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "0:43:04", "remaining_time": "6:31:38"} +{"current_steps": 1070, "total_steps": 10798, "loss": 2.015, "reward": null, "learning_rate": 0.0009759668642833304, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "0:43:06", "remaining_time": "6:31:54"} +{"current_steps": 1070, "total_steps": 10798, "loss": 2.015, "reward": null, "learning_rate": 0.0009759668642833304, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "0:43:03", "remaining_time": "6:31:23"} +{"current_steps": 1070, "total_steps": 10798, "loss": 2.015, "reward": null, "learning_rate": 0.0009759668642833304, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "0:49:07", "remaining_time": "7:26:40"} +{"current_steps": 1080, "total_steps": 10798, "loss": 2.0175, "reward": null, "learning_rate": 0.0009755192667376173, "epoch": 0.2, "percentage": 10.0, "elapsed_time": "0:43:30", "remaining_time": "6:31:30"} +{"current_steps": 1080, "total_steps": 10798, "loss": 2.0175, "reward": null, "learning_rate": 0.0009755192667376173, "epoch": 0.2, "percentage": 10.0, "elapsed_time": "0:43:27", "remaining_time": "6:31:00"} +{"current_steps": 1080, "total_steps": 10798, "loss": 2.0175, "reward": null, "learning_rate": 0.0009755192667376173, "epoch": 0.2, "percentage": 10.0, "elapsed_time": "0:43:28", "remaining_time": "6:31:14"} +{"current_steps": 1080, "total_steps": 10798, "loss": 2.0175, "reward": null, "learning_rate": 0.0009755192667376173, "epoch": 0.2, "percentage": 10.0, "elapsed_time": "0:49:32", "remaining_time": "7:25:42"} +{"current_steps": 1090, "total_steps": 10798, "loss": 2.0773, "reward": null, "learning_rate": 0.0009750676440526411, "epoch": 0.2, "percentage": 10.09, "elapsed_time": "0:49:55", "remaining_time": "7:24:41"} +{"current_steps": 1090, "total_steps": 10798, "loss": 2.0773, "reward": null, "learning_rate": 0.0009750676440526411, "epoch": 0.2, "percentage": 10.09, "elapsed_time": "0:43:50", "remaining_time": "6:30:32"} +{"current_steps": 1090, "total_steps": 10798, "loss": 2.0773, "reward": null, "learning_rate": 0.0009750676440526411, "epoch": 0.2, "percentage": 10.09, "elapsed_time": "0:43:52", "remaining_time": "6:30:46"} +{"current_steps": 1090, "total_steps": 10798, "loss": 2.0773, "reward": null, "learning_rate": 0.0009750676440526411, "epoch": 0.2, "percentage": 10.09, "elapsed_time": "0:43:54", "remaining_time": "6:31:02"} +{"current_steps": 1100, "total_steps": 10798, "loss": 2.0245, "reward": null, "learning_rate": 0.0009746120000512632, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "0:50:20", "remaining_time": "7:23:50"} +{"current_steps": 1100, "total_steps": 10798, "loss": 2.0245, "reward": null, "learning_rate": 0.0009746120000512632, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "0:44:15", "remaining_time": "6:30:14"} +{"current_steps": 1100, "total_steps": 10798, "loss": 2.0245, "reward": null, "learning_rate": 0.0009746120000512632, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "0:44:19", "remaining_time": "6:30:43"} +{"current_steps": 1100, "total_steps": 10798, "loss": 2.0245, "reward": null, "learning_rate": 0.0009746120000512632, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "0:44:17", "remaining_time": "6:30:28"} +{"current_steps": 1110, "total_steps": 10798, "loss": 2.094, "reward": null, "learning_rate": 0.0009741523385903841, "epoch": 0.21, "percentage": 10.28, "elapsed_time": "0:50:43", "remaining_time": "7:22:47"} +{"current_steps": 1110, "total_steps": 10798, "loss": 2.094, "reward": null, "learning_rate": 0.0009741523385903841, "epoch": 0.21, "percentage": 10.28, "elapsed_time": "0:44:42", "remaining_time": "6:30:12"} +{"current_steps": 1110, "total_steps": 10798, "loss": 2.094, "reward": null, "learning_rate": 0.0009741523385903841, "epoch": 0.21, "percentage": 10.28, "elapsed_time": "0:44:40", "remaining_time": "6:29:57"} +{"current_steps": 1110, "total_steps": 10798, "loss": 2.094, "reward": null, "learning_rate": 0.0009741523385903841, "epoch": 0.21, "percentage": 10.28, "elapsed_time": "0:44:39", "remaining_time": "6:29:43"} +{"current_steps": 1120, "total_steps": 10798, "loss": 2.0506, "reward": null, "learning_rate": 0.0009736886635609112, "epoch": 0.21, "percentage": 10.37, "elapsed_time": "0:51:07", "remaining_time": "7:21:50"} +{"current_steps": 1120, "total_steps": 10798, "loss": 2.0506, "reward": null, "learning_rate": 0.0009736886635609112, "epoch": 0.21, "percentage": 10.37, "elapsed_time": "0:45:06", "remaining_time": "6:29:47"} +{"current_steps": 1120, "total_steps": 10798, "loss": 2.0506, "reward": null, "learning_rate": 0.0009736886635609112, "epoch": 0.21, "percentage": 10.37, "elapsed_time": "0:45:04", "remaining_time": "6:29:32"} +{"current_steps": 1120, "total_steps": 10798, "loss": 2.0506, "reward": null, "learning_rate": 0.0009736886635609112, "epoch": 0.21, "percentage": 10.37, "elapsed_time": "0:45:03", "remaining_time": "6:29:18"} +{"current_steps": 1130, "total_steps": 10798, "loss": 2.0287, "reward": null, "learning_rate": 0.0009732209788877258, "epoch": 0.21, "percentage": 10.46, "elapsed_time": "0:51:32", "remaining_time": "7:20:59"} +{"current_steps": 1130, "total_steps": 10798, "loss": 2.0287, "reward": null, "learning_rate": 0.0009732209788877258, "epoch": 0.21, "percentage": 10.46, "elapsed_time": "0:45:29", "remaining_time": "6:29:11"} +{"current_steps": 1130, "total_steps": 10798, "loss": 2.0287, "reward": null, "learning_rate": 0.0009732209788877258, "epoch": 0.21, "percentage": 10.46, "elapsed_time": "0:45:27", "remaining_time": "6:28:58"} +{"current_steps": 1130, "total_steps": 10798, "loss": 2.0287, "reward": null, "learning_rate": 0.0009732209788877258, "epoch": 0.21, "percentage": 10.46, "elapsed_time": "0:45:31", "remaining_time": "6:29:26"} +{"current_steps": 1140, "total_steps": 10798, "loss": 2.1162, "reward": null, "learning_rate": 0.0009727492885296489, "epoch": 0.21, "percentage": 10.56, "elapsed_time": "0:45:53", "remaining_time": "6:28:46"} +{"current_steps": 1140, "total_steps": 10798, "loss": 2.1162, "reward": null, "learning_rate": 0.0009727492885296489, "epoch": 0.21, "percentage": 10.56, "elapsed_time": "0:51:58", "remaining_time": "7:20:17"} +{"current_steps": 1140, "total_steps": 10798, "loss": 2.1162, "reward": null, "learning_rate": 0.0009727492885296489, "epoch": 0.21, "percentage": 10.56, "elapsed_time": "0:45:56", "remaining_time": "6:29:14"} +{"current_steps": 1140, "total_steps": 10798, "loss": 2.1162, "reward": null, "learning_rate": 0.0009727492885296489, "epoch": 0.21, "percentage": 10.56, "elapsed_time": "0:45:54", "remaining_time": "6:28:59"} +{"current_steps": 1150, "total_steps": 10798, "loss": 2.1096, "reward": null, "learning_rate": 0.0009722735964794099, "epoch": 0.21, "percentage": 10.65, "elapsed_time": "0:52:23", "remaining_time": "7:19:31"} +{"current_steps": 1150, "total_steps": 10798, "loss": 2.1096, "reward": null, "learning_rate": 0.0009722735964794099, "epoch": 0.21, "percentage": 10.65, "elapsed_time": "0:46:20", "remaining_time": "6:28:44"} +{"current_steps": 1150, "total_steps": 10798, "loss": 2.1096, "reward": null, "learning_rate": 0.0009722735964794099, "epoch": 0.21, "percentage": 10.65, "elapsed_time": "0:46:21", "remaining_time": "6:28:59"} +{"current_steps": 1150, "total_steps": 10798, "loss": 2.1096, "reward": null, "learning_rate": 0.0009722735964794099, "epoch": 0.21, "percentage": 10.65, "elapsed_time": "0:46:18", "remaining_time": "6:28:31"} +{"current_steps": 1160, "total_steps": 10798, "loss": 2.0621, "reward": null, "learning_rate": 0.0009717939067636099, "epoch": 0.21, "percentage": 10.74, "elapsed_time": "0:52:48", "remaining_time": "7:18:44"} +{"current_steps": 1160, "total_steps": 10798, "loss": 2.0621, "reward": null, "learning_rate": 0.0009717939067636099, "epoch": 0.21, "percentage": 10.74, "elapsed_time": "0:46:46", "remaining_time": "6:28:41"} +{"current_steps": 1160, "total_steps": 10798, "loss": 2.0621, "reward": null, "learning_rate": 0.0009717939067636099, "epoch": 0.21, "percentage": 10.74, "elapsed_time": "0:46:43", "remaining_time": "6:28:13"} +{"current_steps": 1160, "total_steps": 10798, "loss": 2.0621, "reward": null, "learning_rate": 0.0009717939067636099, "epoch": 0.21, "percentage": 10.74, "elapsed_time": "0:46:45", "remaining_time": "6:28:26"} +{"current_steps": 1170, "total_steps": 10798, "loss": 2.0796, "reward": null, "learning_rate": 0.0009713102234426903, "epoch": 0.22, "percentage": 10.84, "elapsed_time": "0:47:10", "remaining_time": "6:28:08"} +{"current_steps": 1170, "total_steps": 10798, "loss": 2.0796, "reward": null, "learning_rate": 0.0009713102234426903, "epoch": 0.22, "percentage": 10.84, "elapsed_time": "0:47:06", "remaining_time": "6:27:41"} +{"current_steps": 1170, "total_steps": 10798, "loss": 2.0796, "reward": null, "learning_rate": 0.0009713102234426903, "epoch": 0.22, "percentage": 10.84, "elapsed_time": "0:53:11", "remaining_time": "7:17:43"} +{"current_steps": 1170, "total_steps": 10798, "loss": 2.0796, "reward": null, "learning_rate": 0.0009713102234426903, "epoch": 0.22, "percentage": 10.84, "elapsed_time": "0:47:08", "remaining_time": "6:27:54"} +{"current_steps": 1180, "total_steps": 10798, "loss": 2.0565, "reward": null, "learning_rate": 0.0009708225506108965, "epoch": 0.22, "percentage": 10.93, "elapsed_time": "0:47:32", "remaining_time": "6:27:27"} +{"current_steps": 1180, "total_steps": 10798, "loss": 2.0565, "reward": null, "learning_rate": 0.0009708225506108965, "epoch": 0.22, "percentage": 10.93, "elapsed_time": "0:47:30", "remaining_time": "6:27:14"} +{"current_steps": 1180, "total_steps": 10798, "loss": 2.0565, "reward": null, "learning_rate": 0.0009708225506108965, "epoch": 0.22, "percentage": 10.93, "elapsed_time": "0:47:33", "remaining_time": "6:27:41"} +{"current_steps": 1180, "total_steps": 10798, "loss": 2.0565, "reward": null, "learning_rate": 0.0009708225506108965, "epoch": 0.22, "percentage": 10.93, "elapsed_time": "0:53:35", "remaining_time": "7:16:48"} +{"current_steps": 1190, "total_steps": 10798, "loss": 2.0669, "reward": null, "learning_rate": 0.0009703308923962447, "epoch": 0.22, "percentage": 11.02, "elapsed_time": "0:47:57", "remaining_time": "6:27:13"} +{"current_steps": 1190, "total_steps": 10798, "loss": 2.0669, "reward": null, "learning_rate": 0.0009703308923962447, "epoch": 0.22, "percentage": 11.02, "elapsed_time": "0:47:59", "remaining_time": "6:27:27"} +{"current_steps": 1190, "total_steps": 10798, "loss": 2.0669, "reward": null, "learning_rate": 0.0009703308923962447, "epoch": 0.22, "percentage": 11.02, "elapsed_time": "0:47:55", "remaining_time": "6:27:00"} +{"current_steps": 1190, "total_steps": 10798, "loss": 2.0669, "reward": null, "learning_rate": 0.0009703308923962447, "epoch": 0.22, "percentage": 11.02, "elapsed_time": "0:54:00", "remaining_time": "7:16:05"} +{"current_steps": 1200, "total_steps": 10798, "loss": 2.0638, "reward": null, "learning_rate": 0.0009698352529604857, "epoch": 0.22, "percentage": 11.11, "elapsed_time": "0:48:24", "remaining_time": "6:27:11"} +{"current_steps": 1200, "total_steps": 10798, "loss": 2.0638, "reward": null, "learning_rate": 0.0009698352529604857, "epoch": 0.22, "percentage": 11.11, "elapsed_time": "0:48:21", "remaining_time": "6:26:44"} +{"current_steps": 1200, "total_steps": 10798, "loss": 2.0638, "reward": null, "learning_rate": 0.0009698352529604857, "epoch": 0.22, "percentage": 11.11, "elapsed_time": "0:48:22", "remaining_time": "6:26:57"} +{"current_steps": 1200, "total_steps": 10798, "loss": 2.0638, "reward": null, "learning_rate": 0.0009698352529604857, "epoch": 0.22, "percentage": 11.11, "elapsed_time": "0:54:25", "remaining_time": "7:15:22"} +{"current_steps": 1210, "total_steps": 10798, "loss": 2.0358, "reward": null, "learning_rate": 0.0009693356364990705, "epoch": 0.22, "percentage": 11.21, "elapsed_time": "0:48:47", "remaining_time": "6:26:40"} +{"current_steps": 1210, "total_steps": 10798, "loss": 2.0358, "reward": null, "learning_rate": 0.0009693356364990705, "epoch": 0.22, "percentage": 11.21, "elapsed_time": "0:48:44", "remaining_time": "6:26:13"} +{"current_steps": 1210, "total_steps": 10798, "loss": 2.0358, "reward": null, "learning_rate": 0.0009693356364990705, "epoch": 0.22, "percentage": 11.21, "elapsed_time": "0:48:46", "remaining_time": "6:26:26"} +{"current_steps": 1210, "total_steps": 10798, "loss": 2.0358, "reward": null, "learning_rate": 0.0009693356364990705, "epoch": 0.22, "percentage": 11.21, "elapsed_time": "0:54:49", "remaining_time": "7:14:24"} +{"current_steps": 1220, "total_steps": 10798, "loss": 2.0859, "reward": null, "learning_rate": 0.0009688320472411143, "epoch": 0.23, "percentage": 11.3, "elapsed_time": "0:49:10", "remaining_time": "6:26:04"} +{"current_steps": 1220, "total_steps": 10798, "loss": 2.0859, "reward": null, "learning_rate": 0.0009688320472411143, "epoch": 0.23, "percentage": 11.3, "elapsed_time": "0:49:08", "remaining_time": "6:25:51"} +{"current_steps": 1220, "total_steps": 10798, "loss": 2.0859, "reward": null, "learning_rate": 0.0009688320472411143, "epoch": 0.23, "percentage": 11.3, "elapsed_time": "0:49:12", "remaining_time": "6:26:17"} +{"current_steps": 1220, "total_steps": 10798, "loss": 2.0859, "reward": null, "learning_rate": 0.0009688320472411143, "epoch": 0.23, "percentage": 11.3, "elapsed_time": "0:55:13", "remaining_time": "7:13:35"} +{"current_steps": 1230, "total_steps": 10798, "loss": 2.0932, "reward": null, "learning_rate": 0.0009683244894493613, "epoch": 0.23, "percentage": 11.39, "elapsed_time": "0:55:38", "remaining_time": "7:12:52"} +{"current_steps": 1230, "total_steps": 10798, "loss": 2.0932, "reward": null, "learning_rate": 0.0009683244894493613, "epoch": 0.23, "percentage": 11.39, "elapsed_time": "0:49:33", "remaining_time": "6:25:34"} +{"current_steps": 1230, "total_steps": 10798, "loss": 2.0932, "reward": null, "learning_rate": 0.0009683244894493613, "epoch": 0.23, "percentage": 11.39, "elapsed_time": "0:49:37", "remaining_time": "6:26:00"} +{"current_steps": 1230, "total_steps": 10798, "loss": 2.0932, "reward": null, "learning_rate": 0.0009683244894493613, "epoch": 0.23, "percentage": 11.39, "elapsed_time": "0:49:35", "remaining_time": "6:25:46"} +{"current_steps": 1240, "total_steps": 10798, "loss": 2.0129, "reward": null, "learning_rate": 0.0009678129674201479, "epoch": 0.23, "percentage": 11.48, "elapsed_time": "0:49:57", "remaining_time": "6:25:07"} +{"current_steps": 1240, "total_steps": 10798, "loss": 2.0129, "reward": null, "learning_rate": 0.0009678129674201479, "epoch": 0.23, "percentage": 11.48, "elapsed_time": "0:49:59", "remaining_time": "6:25:19"} +{"current_steps": 1240, "total_steps": 10798, "loss": 2.0129, "reward": null, "learning_rate": 0.0009678129674201479, "epoch": 0.23, "percentage": 11.48, "elapsed_time": "0:50:01", "remaining_time": "6:25:32"} +{"current_steps": 1240, "total_steps": 10798, "loss": 2.0129, "reward": null, "learning_rate": 0.0009678129674201479, "epoch": 0.23, "percentage": 11.48, "elapsed_time": "0:56:02", "remaining_time": "7:11:59"} +{"current_steps": 1250, "total_steps": 10798, "loss": 2.055, "reward": null, "learning_rate": 0.0009672974854833669, "epoch": 0.23, "percentage": 11.58, "elapsed_time": "0:50:24", "remaining_time": "6:25:01"} +{"current_steps": 1250, "total_steps": 10798, "loss": 2.055, "reward": null, "learning_rate": 0.0009672974854833669, "epoch": 0.23, "percentage": 11.58, "elapsed_time": "0:56:25", "remaining_time": "7:11:02"} +{"current_steps": 1250, "total_steps": 10798, "loss": 2.055, "reward": null, "learning_rate": 0.0009672974854833669, "epoch": 0.23, "percentage": 11.58, "elapsed_time": "0:50:22", "remaining_time": "6:24:48"} +{"current_steps": 1250, "total_steps": 10798, "loss": 2.055, "reward": null, "learning_rate": 0.0009672974854833669, "epoch": 0.23, "percentage": 11.58, "elapsed_time": "0:50:21", "remaining_time": "6:24:35"} +{"current_steps": 1260, "total_steps": 10798, "loss": 2.0665, "reward": null, "learning_rate": 0.0009667780480024304, "epoch": 0.23, "percentage": 11.67, "elapsed_time": "0:56:48", "remaining_time": "7:10:03"} +{"current_steps": 1260, "total_steps": 10798, "loss": 2.0665, "reward": null, "learning_rate": 0.0009667780480024304, "epoch": 0.23, "percentage": 11.67, "elapsed_time": "0:50:47", "remaining_time": "6:24:27"} +{"current_steps": 1260, "total_steps": 10798, "loss": 2.0665, "reward": null, "learning_rate": 0.0009667780480024304, "epoch": 0.23, "percentage": 11.67, "elapsed_time": "0:50:43", "remaining_time": "6:24:02"} +{"current_steps": 1260, "total_steps": 10798, "loss": 2.0665, "reward": null, "learning_rate": 0.0009667780480024304, "epoch": 0.23, "percentage": 11.67, "elapsed_time": "0:50:45", "remaining_time": "6:24:14"} +{"current_steps": 1270, "total_steps": 10798, "loss": 2.0488, "reward": null, "learning_rate": 0.0009662546593742334, "epoch": 0.24, "percentage": 11.76, "elapsed_time": "0:51:11", "remaining_time": "6:24:00"} +{"current_steps": 1270, "total_steps": 10798, "loss": 2.0488, "reward": null, "learning_rate": 0.0009662546593742334, "epoch": 0.24, "percentage": 11.76, "elapsed_time": "0:51:09", "remaining_time": "6:23:47"} +{"current_steps": 1270, "total_steps": 10798, "loss": 2.0488, "reward": null, "learning_rate": 0.0009662546593742334, "epoch": 0.24, "percentage": 11.76, "elapsed_time": "0:57:12", "remaining_time": "7:09:12"} +{"current_steps": 1270, "total_steps": 10798, "loss": 2.0488, "reward": null, "learning_rate": 0.0009662546593742334, "epoch": 0.24, "percentage": 11.76, "elapsed_time": "0:51:07", "remaining_time": "6:23:35"} +{"current_steps": 1280, "total_steps": 10798, "loss": 2.0543, "reward": null, "learning_rate": 0.0009657273240291159, "epoch": 0.24, "percentage": 11.85, "elapsed_time": "0:57:37", "remaining_time": "7:08:27"} +{"current_steps": 1280, "total_steps": 10798, "loss": 2.0543, "reward": null, "learning_rate": 0.0009657273240291159, "epoch": 0.24, "percentage": 11.85, "elapsed_time": "0:51:34", "remaining_time": "6:23:27"} +{"current_steps": 1280, "total_steps": 10798, "loss": 2.0543, "reward": null, "learning_rate": 0.0009657273240291159, "epoch": 0.24, "percentage": 11.85, "elapsed_time": "0:51:35", "remaining_time": "6:23:40"} +{"current_steps": 1280, "total_steps": 10798, "loss": 2.0543, "reward": null, "learning_rate": 0.0009657273240291159, "epoch": 0.24, "percentage": 11.85, "elapsed_time": "0:51:32", "remaining_time": "6:23:15"} +{"current_steps": 1290, "total_steps": 10798, "loss": 2.0418, "reward": null, "learning_rate": 0.0009651960464308261, "epoch": 0.24, "percentage": 11.95, "elapsed_time": "0:58:01", "remaining_time": "7:07:41"} +{"current_steps": 1290, "total_steps": 10798, "loss": 2.0418, "reward": null, "learning_rate": 0.0009651960464308261, "epoch": 0.24, "percentage": 11.95, "elapsed_time": "0:51:58", "remaining_time": "6:23:03"} +{"current_steps": 1290, "total_steps": 10798, "loss": 2.0418, "reward": null, "learning_rate": 0.0009651960464308261, "epoch": 0.24, "percentage": 11.95, "elapsed_time": "0:52:00", "remaining_time": "6:23:16"} +{"current_steps": 1290, "total_steps": 10798, "loss": 2.0418, "reward": null, "learning_rate": 0.0009651960464308261, "epoch": 0.24, "percentage": 11.95, "elapsed_time": "0:51:56", "remaining_time": "6:22:52"} +{"current_steps": 1300, "total_steps": 10798, "loss": 2.033, "reward": null, "learning_rate": 0.0009646608310764819, "epoch": 0.24, "percentage": 12.04, "elapsed_time": "0:58:25", "remaining_time": "7:06:48"} +{"current_steps": 1300, "total_steps": 10798, "loss": 2.033, "reward": null, "learning_rate": 0.0009646608310764819, "epoch": 0.24, "percentage": 12.04, "elapsed_time": "0:52:20", "remaining_time": "6:22:23"} +{"current_steps": 1300, "total_steps": 10798, "loss": 2.033, "reward": null, "learning_rate": 0.0009646608310764819, "epoch": 0.24, "percentage": 12.04, "elapsed_time": "0:52:21", "remaining_time": "6:22:34"} +{"current_steps": 1300, "total_steps": 10798, "loss": 2.033, "reward": null, "learning_rate": 0.0009646608310764819, "epoch": 0.24, "percentage": 12.04, "elapsed_time": "0:52:23", "remaining_time": "6:22:47"} +{"current_steps": 1310, "total_steps": 10798, "loss": 2.1034, "reward": null, "learning_rate": 0.0009641216824965338, "epoch": 0.24, "percentage": 12.13, "elapsed_time": "0:52:46", "remaining_time": "6:22:11"} +{"current_steps": 1310, "total_steps": 10798, "loss": 2.1034, "reward": null, "learning_rate": 0.0009641216824965338, "epoch": 0.24, "percentage": 12.13, "elapsed_time": "0:58:49", "remaining_time": "7:06:02"} +{"current_steps": 1310, "total_steps": 10798, "loss": 2.1034, "reward": null, "learning_rate": 0.0009641216824965338, "epoch": 0.24, "percentage": 12.13, "elapsed_time": "0:52:44", "remaining_time": "6:22:00"} +{"current_steps": 1310, "total_steps": 10798, "loss": 2.1034, "reward": null, "learning_rate": 0.0009641216824965338, "epoch": 0.24, "percentage": 12.13, "elapsed_time": "0:52:47", "remaining_time": "6:22:24"} +{"current_steps": 1320, "total_steps": 10798, "loss": 2.0866, "reward": null, "learning_rate": 0.0009635786052547253, "epoch": 0.24, "percentage": 12.22, "elapsed_time": "0:59:14", "remaining_time": "7:05:19"} +{"current_steps": 1320, "total_steps": 10798, "loss": 2.0866, "reward": null, "learning_rate": 0.0009635786052547253, "epoch": 0.24, "percentage": 12.22, "elapsed_time": "0:53:12", "remaining_time": "6:22:04"} +{"current_steps": 1320, "total_steps": 10798, "loss": 2.0866, "reward": null, "learning_rate": 0.0009635786052547253, "epoch": 0.24, "percentage": 12.22, "elapsed_time": "0:53:10", "remaining_time": "6:21:51"} +{"current_steps": 1320, "total_steps": 10798, "loss": 2.0866, "reward": null, "learning_rate": 0.0009635786052547253, "epoch": 0.24, "percentage": 12.22, "elapsed_time": "0:53:09", "remaining_time": "6:21:40"} +{"current_steps": 1330, "total_steps": 10798, "loss": 2.0607, "reward": null, "learning_rate": 0.0009630316039480556, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "0:53:37", "remaining_time": "6:21:42"} +{"current_steps": 1330, "total_steps": 10798, "loss": 2.0607, "reward": null, "learning_rate": 0.0009630316039480556, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "0:53:33", "remaining_time": "6:21:18"} +{"current_steps": 1330, "total_steps": 10798, "loss": 2.0607, "reward": null, "learning_rate": 0.0009630316039480556, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "0:59:38", "remaining_time": "7:04:35"} +{"current_steps": 1330, "total_steps": 10798, "loss": 2.0607, "reward": null, "learning_rate": 0.0009630316039480556, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "0:53:35", "remaining_time": "6:21:29"} +{"current_steps": 1340, "total_steps": 10798, "loss": 2.0457, "reward": null, "learning_rate": 0.0009624806832067394, "epoch": 0.25, "percentage": 12.41, "elapsed_time": "0:53:56", "remaining_time": "6:20:44"} +{"current_steps": 1340, "total_steps": 10798, "loss": 2.0457, "reward": null, "learning_rate": 0.0009624806832067394, "epoch": 0.25, "percentage": 12.41, "elapsed_time": "0:53:59", "remaining_time": "6:21:08"} +{"current_steps": 1340, "total_steps": 10798, "loss": 2.0457, "reward": null, "learning_rate": 0.0009624806832067394, "epoch": 0.25, "percentage": 12.41, "elapsed_time": "0:53:58", "remaining_time": "6:20:55"} +{"current_steps": 1340, "total_steps": 10798, "loss": 2.0457, "reward": null, "learning_rate": 0.0009624806832067394, "epoch": 0.25, "percentage": 12.41, "elapsed_time": "1:00:01", "remaining_time": "7:03:39"} +{"current_steps": 1350, "total_steps": 10798, "loss": 2.032, "reward": null, "learning_rate": 0.0009619258476941686, "epoch": 0.25, "percentage": 12.5, "elapsed_time": "1:00:26", "remaining_time": "7:02:58"} +{"current_steps": 1350, "total_steps": 10798, "loss": 2.032, "reward": null, "learning_rate": 0.0009619258476941686, "epoch": 0.25, "percentage": 12.5, "elapsed_time": "0:54:24", "remaining_time": "6:20:49"} +{"current_steps": 1350, "total_steps": 10798, "loss": 2.032, "reward": null, "learning_rate": 0.0009619258476941686, "epoch": 0.25, "percentage": 12.5, "elapsed_time": "0:54:21", "remaining_time": "6:20:25"} +{"current_steps": 1350, "total_steps": 10798, "loss": 2.032, "reward": null, "learning_rate": 0.0009619258476941686, "epoch": 0.25, "percentage": 12.5, "elapsed_time": "0:54:23", "remaining_time": "6:20:36"} +{"current_steps": 1360, "total_steps": 10798, "loss": 2.0519, "reward": null, "learning_rate": 0.000961367102106873, "epoch": 0.25, "percentage": 12.59, "elapsed_time": "1:00:50", "remaining_time": "7:02:14"} +{"current_steps": 1360, "total_steps": 10798, "loss": 2.0519, "reward": null, "learning_rate": 0.000961367102106873, "epoch": 0.25, "percentage": 12.59, "elapsed_time": "0:54:49", "remaining_time": "6:20:26"} +{"current_steps": 1360, "total_steps": 10798, "loss": 2.0519, "reward": null, "learning_rate": 0.000961367102106873, "epoch": 0.25, "percentage": 12.59, "elapsed_time": "0:54:45", "remaining_time": "6:20:03"} +{"current_steps": 1360, "total_steps": 10798, "loss": 2.0519, "reward": null, "learning_rate": 0.000961367102106873, "epoch": 0.25, "percentage": 12.59, "elapsed_time": "0:54:47", "remaining_time": "6:20:14"} +{"current_steps": 1370, "total_steps": 10798, "loss": 2.0449, "reward": null, "learning_rate": 0.0009608044511744791, "epoch": 0.25, "percentage": 12.69, "elapsed_time": "0:55:12", "remaining_time": "6:19:58"} +{"current_steps": 1370, "total_steps": 10798, "loss": 2.0449, "reward": null, "learning_rate": 0.0009608044511744791, "epoch": 0.25, "percentage": 12.69, "elapsed_time": "0:55:09", "remaining_time": "6:19:35"} +{"current_steps": 1370, "total_steps": 10798, "loss": 2.0449, "reward": null, "learning_rate": 0.0009608044511744791, "epoch": 0.25, "percentage": 12.69, "elapsed_time": "1:01:14", "remaining_time": "7:01:25"} +{"current_steps": 1370, "total_steps": 10798, "loss": 2.0449, "reward": null, "learning_rate": 0.0009608044511744791, "epoch": 0.25, "percentage": 12.69, "elapsed_time": "0:55:11", "remaining_time": "6:19:46"} +{"current_steps": 1380, "total_steps": 10798, "loss": 1.9949, "reward": null, "learning_rate": 0.0009602378996596721, "epoch": 0.26, "percentage": 12.78, "elapsed_time": "1:01:38", "remaining_time": "7:00:38"} +{"current_steps": 1380, "total_steps": 10798, "loss": 1.9949, "reward": null, "learning_rate": 0.0009602378996596721, "epoch": 0.26, "percentage": 12.78, "elapsed_time": "0:55:33", "remaining_time": "6:19:08"} +{"current_steps": 1380, "total_steps": 10798, "loss": 1.9949, "reward": null, "learning_rate": 0.0009602378996596721, "epoch": 0.26, "percentage": 12.78, "elapsed_time": "0:55:34", "remaining_time": "6:19:19"} +{"current_steps": 1380, "total_steps": 10798, "loss": 1.9949, "reward": null, "learning_rate": 0.0009602378996596721, "epoch": 0.26, "percentage": 12.78, "elapsed_time": "0:55:36", "remaining_time": "6:19:31"} +{"current_steps": 1390, "total_steps": 10798, "loss": 2.0394, "reward": null, "learning_rate": 0.0009596674523581539, "epoch": 0.26, "percentage": 12.87, "elapsed_time": "1:02:02", "remaining_time": "6:59:52"} +{"current_steps": 1390, "total_steps": 10798, "loss": 2.0394, "reward": null, "learning_rate": 0.0009596674523581539, "epoch": 0.26, "percentage": 12.87, "elapsed_time": "0:55:57", "remaining_time": "6:18:43"} +{"current_steps": 1390, "total_steps": 10798, "loss": 2.0394, "reward": null, "learning_rate": 0.0009596674523581539, "epoch": 0.26, "percentage": 12.87, "elapsed_time": "0:55:58", "remaining_time": "6:18:53"} +{"current_steps": 1390, "total_steps": 10798, "loss": 2.0394, "reward": null, "learning_rate": 0.0009596674523581539, "epoch": 0.26, "percentage": 12.87, "elapsed_time": "0:56:00", "remaining_time": "6:19:05"} +{"current_steps": 1400, "total_steps": 10798, "loss": 2.0386, "reward": null, "learning_rate": 0.0009590931140986035, "epoch": 0.26, "percentage": 12.97, "elapsed_time": "1:02:26", "remaining_time": "6:59:12"} +{"current_steps": 1400, "total_steps": 10798, "loss": 2.0386, "reward": null, "learning_rate": 0.0009590931140986035, "epoch": 0.26, "percentage": 12.97, "elapsed_time": "0:56:25", "remaining_time": "6:18:45"} +{"current_steps": 1400, "total_steps": 10798, "loss": 2.0386, "reward": null, "learning_rate": 0.0009590931140986035, "epoch": 0.26, "percentage": 12.97, "elapsed_time": "0:56:22", "remaining_time": "6:18:23"} +{"current_steps": 1400, "total_steps": 10798, "loss": 2.0386, "reward": null, "learning_rate": 0.0009590931140986035, "epoch": 0.26, "percentage": 12.97, "elapsed_time": "0:56:23", "remaining_time": "6:18:33"} +{"current_steps": 1410, "total_steps": 10798, "loss": 2.0254, "reward": null, "learning_rate": 0.0009585148897426354, "epoch": 0.26, "percentage": 13.06, "elapsed_time": "1:02:50", "remaining_time": "6:58:23"} +{"current_steps": 1410, "total_steps": 10798, "loss": 2.0254, "reward": null, "learning_rate": 0.0009585148897426354, "epoch": 0.26, "percentage": 13.06, "elapsed_time": "0:56:48", "remaining_time": "6:18:16"} +{"current_steps": 1410, "total_steps": 10798, "loss": 2.0254, "reward": null, "learning_rate": 0.0009585148897426354, "epoch": 0.26, "percentage": 13.06, "elapsed_time": "0:56:45", "remaining_time": "6:17:54"} +{"current_steps": 1410, "total_steps": 10798, "loss": 2.0254, "reward": null, "learning_rate": 0.0009585148897426354, "epoch": 0.26, "percentage": 13.06, "elapsed_time": "0:56:47", "remaining_time": "6:18:04"} +{"current_steps": 1420, "total_steps": 10798, "loss": 2.0238, "reward": null, "learning_rate": 0.0009579327841847593, "epoch": 0.26, "percentage": 13.15, "elapsed_time": "0:57:13", "remaining_time": "6:17:54"} +{"current_steps": 1420, "total_steps": 10798, "loss": 2.0238, "reward": null, "learning_rate": 0.0009579327841847593, "epoch": 0.26, "percentage": 13.15, "elapsed_time": "0:57:09", "remaining_time": "6:17:32"} +{"current_steps": 1420, "total_steps": 10798, "loss": 2.0238, "reward": null, "learning_rate": 0.0009579327841847593, "epoch": 0.26, "percentage": 13.15, "elapsed_time": "0:57:11", "remaining_time": "6:17:42"} +{"current_steps": 1420, "total_steps": 10798, "loss": 2.0238, "reward": null, "learning_rate": 0.0009579327841847593, "epoch": 0.26, "percentage": 13.15, "elapsed_time": "1:03:14", "remaining_time": "6:57:41"} +{"current_steps": 1430, "total_steps": 10798, "loss": 2.0509, "reward": null, "learning_rate": 0.000957346802352338, "epoch": 0.26, "percentage": 13.24, "elapsed_time": "1:03:39", "remaining_time": "6:57:01"} +{"current_steps": 1430, "total_steps": 10798, "loss": 2.0509, "reward": null, "learning_rate": 0.000957346802352338, "epoch": 0.26, "percentage": 13.24, "elapsed_time": "0:57:36", "remaining_time": "6:17:22"} +{"current_steps": 1430, "total_steps": 10798, "loss": 2.0509, "reward": null, "learning_rate": 0.000957346802352338, "epoch": 0.26, "percentage": 13.24, "elapsed_time": "0:57:38", "remaining_time": "6:17:33"} +{"current_steps": 1430, "total_steps": 10798, "loss": 2.0509, "reward": null, "learning_rate": 0.000957346802352338, "epoch": 0.26, "percentage": 13.24, "elapsed_time": "0:57:34", "remaining_time": "6:17:11"} +{"current_steps": 1440, "total_steps": 10798, "loss": 2.0004, "reward": null, "learning_rate": 0.0009567569492055456, "epoch": 0.27, "percentage": 13.34, "elapsed_time": "0:57:59", "remaining_time": "6:16:48"} +{"current_steps": 1440, "total_steps": 10798, "loss": 2.0004, "reward": null, "learning_rate": 0.0009567569492055456, "epoch": 0.27, "percentage": 13.34, "elapsed_time": "1:04:03", "remaining_time": "6:56:19"} +{"current_steps": 1440, "total_steps": 10798, "loss": 2.0004, "reward": null, "learning_rate": 0.0009567569492055456, "epoch": 0.27, "percentage": 13.34, "elapsed_time": "0:58:02", "remaining_time": "6:17:10"} +{"current_steps": 1440, "total_steps": 10798, "loss": 2.0004, "reward": null, "learning_rate": 0.0009567569492055456, "epoch": 0.27, "percentage": 13.34, "elapsed_time": "0:58:00", "remaining_time": "6:16:59"} +{"current_steps": 1450, "total_steps": 10798, "loss": 2.0203, "reward": null, "learning_rate": 0.0009561632297373263, "epoch": 0.27, "percentage": 13.43, "elapsed_time": "1:04:27", "remaining_time": "6:55:32"} +{"current_steps": 1450, "total_steps": 10798, "loss": 2.0203, "reward": null, "learning_rate": 0.0009561632297373263, "epoch": 0.27, "percentage": 13.43, "elapsed_time": "0:58:25", "remaining_time": "6:16:42"} +{"current_steps": 1450, "total_steps": 10798, "loss": 2.0203, "reward": null, "learning_rate": 0.0009561632297373263, "epoch": 0.27, "percentage": 13.43, "elapsed_time": "0:58:24", "remaining_time": "6:16:30"} +{"current_steps": 1450, "total_steps": 10798, "loss": 2.0203, "reward": null, "learning_rate": 0.0009561632297373263, "epoch": 0.27, "percentage": 13.43, "elapsed_time": "0:58:22", "remaining_time": "6:16:20"} +{"current_steps": 1460, "total_steps": 10798, "loss": 2.0182, "reward": null, "learning_rate": 0.0009555656489733513, "epoch": 0.27, "percentage": 13.52, "elapsed_time": "1:04:51", "remaining_time": "6:54:52"} +{"current_steps": 1460, "total_steps": 10798, "loss": 2.0182, "reward": null, "learning_rate": 0.0009555656489733513, "epoch": 0.27, "percentage": 13.52, "elapsed_time": "0:58:48", "remaining_time": "6:16:08"} +{"current_steps": 1460, "total_steps": 10798, "loss": 2.0182, "reward": null, "learning_rate": 0.0009555656489733513, "epoch": 0.27, "percentage": 13.52, "elapsed_time": "0:58:47", "remaining_time": "6:15:58"} +{"current_steps": 1460, "total_steps": 10798, "loss": 2.0182, "reward": null, "learning_rate": 0.0009555656489733513, "epoch": 0.27, "percentage": 13.52, "elapsed_time": "0:58:50", "remaining_time": "6:16:20"} +{"current_steps": 1470, "total_steps": 10798, "loss": 1.9754, "reward": null, "learning_rate": 0.000954964211971977, "epoch": 0.27, "percentage": 13.61, "elapsed_time": "0:59:12", "remaining_time": "6:15:44"} +{"current_steps": 1470, "total_steps": 10798, "loss": 1.9754, "reward": null, "learning_rate": 0.000954964211971977, "epoch": 0.27, "percentage": 13.61, "elapsed_time": "0:59:11", "remaining_time": "6:15:34"} +{"current_steps": 1470, "total_steps": 10798, "loss": 1.9754, "reward": null, "learning_rate": 0.000954964211971977, "epoch": 0.27, "percentage": 13.61, "elapsed_time": "0:59:14", "remaining_time": "6:15:55"} +{"current_steps": 1470, "total_steps": 10798, "loss": 1.9754, "reward": null, "learning_rate": 0.000954964211971977, "epoch": 0.27, "percentage": 13.61, "elapsed_time": "1:05:15", "remaining_time": "6:54:09"} +{"current_steps": 1480, "total_steps": 10798, "loss": 2.0374, "reward": null, "learning_rate": 0.0009543589238242012, "epoch": 0.27, "percentage": 13.71, "elapsed_time": "0:59:36", "remaining_time": "6:15:15"} +{"current_steps": 1480, "total_steps": 10798, "loss": 2.0374, "reward": null, "learning_rate": 0.0009543589238242012, "epoch": 0.27, "percentage": 13.71, "elapsed_time": "0:59:34", "remaining_time": "6:15:04"} +{"current_steps": 1480, "total_steps": 10798, "loss": 2.0374, "reward": null, "learning_rate": 0.0009543589238242012, "epoch": 0.27, "percentage": 13.71, "elapsed_time": "0:59:37", "remaining_time": "6:15:26"} +{"current_steps": 1480, "total_steps": 10798, "loss": 2.0374, "reward": null, "learning_rate": 0.0009543589238242012, "epoch": 0.27, "percentage": 13.71, "elapsed_time": "1:05:39", "remaining_time": "6:53:21"} +{"current_steps": 1490, "total_steps": 10798, "loss": 2.0367, "reward": null, "learning_rate": 0.000953749789653621, "epoch": 0.28, "percentage": 13.8, "elapsed_time": "1:06:04", "remaining_time": "6:52:48"} +{"current_steps": 1490, "total_steps": 10798, "loss": 2.0367, "reward": null, "learning_rate": 0.000953749789653621, "epoch": 0.28, "percentage": 13.8, "elapsed_time": "1:00:03", "remaining_time": "6:15:10"} +{"current_steps": 1490, "total_steps": 10798, "loss": 2.0367, "reward": null, "learning_rate": 0.000953749789653621, "epoch": 0.28, "percentage": 13.8, "elapsed_time": "1:00:00", "remaining_time": "6:14:49"} +{"current_steps": 1490, "total_steps": 10798, "loss": 2.0367, "reward": null, "learning_rate": 0.000953749789653621, "epoch": 0.28, "percentage": 13.8, "elapsed_time": "1:00:01", "remaining_time": "6:14:59"} +{"current_steps": 1500, "total_steps": 10798, "loss": 2.0866, "reward": null, "learning_rate": 0.000953136814616389, "epoch": 0.28, "percentage": 13.89, "elapsed_time": "1:06:29", "remaining_time": "6:52:10"} +{"current_steps": 1500, "total_steps": 10798, "loss": 2.0866, "reward": null, "learning_rate": 0.000953136814616389, "epoch": 0.28, "percentage": 13.89, "elapsed_time": "1:00:26", "remaining_time": "6:14:38"} +{"current_steps": 1500, "total_steps": 10798, "loss": 2.0866, "reward": null, "learning_rate": 0.000953136814616389, "epoch": 0.28, "percentage": 13.89, "elapsed_time": "1:00:24", "remaining_time": "6:14:28"} +{"current_steps": 1500, "total_steps": 10798, "loss": 2.0866, "reward": null, "learning_rate": 0.000953136814616389, "epoch": 0.28, "percentage": 13.89, "elapsed_time": "1:00:28", "remaining_time": "6:14:49"} +{"current_steps": 1510, "total_steps": 10798, "loss": 2.0083, "reward": null, "learning_rate": 0.0009525200039011694, "epoch": 0.28, "percentage": 13.98, "elapsed_time": "1:00:48", "remaining_time": "6:14:02"} +{"current_steps": 1510, "total_steps": 10798, "loss": 2.0083, "reward": null, "learning_rate": 0.0009525200039011694, "epoch": 0.28, "percentage": 13.98, "elapsed_time": "1:00:50", "remaining_time": "6:14:12"} +{"current_steps": 1510, "total_steps": 10798, "loss": 2.0083, "reward": null, "learning_rate": 0.0009525200039011694, "epoch": 0.28, "percentage": 13.98, "elapsed_time": "1:06:53", "remaining_time": "6:51:26"} +{"current_steps": 1510, "total_steps": 10798, "loss": 2.0083, "reward": null, "learning_rate": 0.0009525200039011694, "epoch": 0.28, "percentage": 13.98, "elapsed_time": "1:00:51", "remaining_time": "6:14:23"} +{"current_steps": 1520, "total_steps": 10798, "loss": 2.0525, "reward": null, "learning_rate": 0.0009518993627290948, "epoch": 0.28, "percentage": 14.08, "elapsed_time": "1:07:18", "remaining_time": "6:50:47"} +{"current_steps": 1520, "total_steps": 10798, "loss": 2.0525, "reward": null, "learning_rate": 0.0009518993627290948, "epoch": 0.28, "percentage": 14.08, "elapsed_time": "1:01:13", "remaining_time": "6:13:40"} +{"current_steps": 1520, "total_steps": 10798, "loss": 2.0525, "reward": null, "learning_rate": 0.0009518993627290948, "epoch": 0.28, "percentage": 14.08, "elapsed_time": "1:01:16", "remaining_time": "6:14:01"} +{"current_steps": 1520, "total_steps": 10798, "loss": 2.0525, "reward": null, "learning_rate": 0.0009518993627290948, "epoch": 0.28, "percentage": 14.08, "elapsed_time": "1:01:14", "remaining_time": "6:13:50"} +{"current_steps": 1530, "total_steps": 10798, "loss": 2.0636, "reward": null, "learning_rate": 0.0009512748963537212, "epoch": 0.28, "percentage": 14.17, "elapsed_time": "1:07:41", "remaining_time": "6:50:00"} +{"current_steps": 1530, "total_steps": 10798, "loss": 2.0636, "reward": null, "learning_rate": 0.0009512748963537212, "epoch": 0.28, "percentage": 14.17, "elapsed_time": "1:01:37", "remaining_time": "6:13:19"} +{"current_steps": 1530, "total_steps": 10798, "loss": 2.0636, "reward": null, "learning_rate": 0.0009512748963537212, "epoch": 0.28, "percentage": 14.17, "elapsed_time": "1:01:39", "remaining_time": "6:13:30"} +{"current_steps": 1530, "total_steps": 10798, "loss": 2.0636, "reward": null, "learning_rate": 0.0009512748963537212, "epoch": 0.28, "percentage": 14.17, "elapsed_time": "1:01:36", "remaining_time": "6:13:10"} +{"current_steps": 1540, "total_steps": 10798, "loss": 2.0522, "reward": null, "learning_rate": 0.000950646610060984, "epoch": 0.29, "percentage": 14.26, "elapsed_time": "1:08:05", "remaining_time": "6:49:23"} +{"current_steps": 1540, "total_steps": 10798, "loss": 2.0522, "reward": null, "learning_rate": 0.000950646610060984, "epoch": 0.29, "percentage": 14.26, "elapsed_time": "1:02:02", "remaining_time": "6:12:59"} +{"current_steps": 1540, "total_steps": 10798, "loss": 2.0522, "reward": null, "learning_rate": 0.000950646610060984, "epoch": 0.29, "percentage": 14.26, "elapsed_time": "1:02:04", "remaining_time": "6:13:10"} +{"current_steps": 1540, "total_steps": 10798, "loss": 2.0522, "reward": null, "learning_rate": 0.000950646610060984, "epoch": 0.29, "percentage": 14.26, "elapsed_time": "1:02:01", "remaining_time": "6:12:49"} +{"current_steps": 1550, "total_steps": 10798, "loss": 2.05, "reward": null, "learning_rate": 0.0009500145091691532, "epoch": 0.29, "percentage": 14.35, "elapsed_time": "1:08:29", "remaining_time": "6:48:38"} +{"current_steps": 1550, "total_steps": 10798, "loss": 2.05, "reward": null, "learning_rate": 0.0009500145091691532, "epoch": 0.29, "percentage": 14.35, "elapsed_time": "1:02:24", "remaining_time": "6:12:21"} +{"current_steps": 1550, "total_steps": 10798, "loss": 2.05, "reward": null, "learning_rate": 0.0009500145091691532, "epoch": 0.29, "percentage": 14.35, "elapsed_time": "1:02:26", "remaining_time": "6:12:31"} +{"current_steps": 1550, "total_steps": 10798, "loss": 2.05, "reward": null, "learning_rate": 0.0009500145091691532, "epoch": 0.29, "percentage": 14.35, "elapsed_time": "1:02:27", "remaining_time": "6:12:41"} +{"current_steps": 1560, "total_steps": 10798, "loss": 1.9887, "reward": null, "learning_rate": 0.0009493785990287882, "epoch": 0.29, "percentage": 14.45, "elapsed_time": "1:02:51", "remaining_time": "6:12:11"} +{"current_steps": 1560, "total_steps": 10798, "loss": 1.9887, "reward": null, "learning_rate": 0.0009493785990287882, "epoch": 0.29, "percentage": 14.45, "elapsed_time": "1:02:49", "remaining_time": "6:12:01"} +{"current_steps": 1560, "total_steps": 10798, "loss": 1.9887, "reward": null, "learning_rate": 0.0009493785990287882, "epoch": 0.29, "percentage": 14.45, "elapsed_time": "1:02:52", "remaining_time": "6:12:21"} +{"current_steps": 1560, "total_steps": 10798, "loss": 1.9887, "reward": null, "learning_rate": 0.0009493785990287882, "epoch": 0.29, "percentage": 14.45, "elapsed_time": "1:08:54", "remaining_time": "6:48:02"} +{"current_steps": 1570, "total_steps": 10798, "loss": 2.0309, "reward": null, "learning_rate": 0.0009487388850226926, "epoch": 0.29, "percentage": 14.54, "elapsed_time": "1:09:17", "remaining_time": "6:47:19"} +{"current_steps": 1570, "total_steps": 10798, "loss": 2.0309, "reward": null, "learning_rate": 0.0009487388850226926, "epoch": 0.29, "percentage": 14.54, "elapsed_time": "1:03:14", "remaining_time": "6:11:44"} +{"current_steps": 1570, "total_steps": 10798, "loss": 2.0309, "reward": null, "learning_rate": 0.0009487388850226926, "epoch": 0.29, "percentage": 14.54, "elapsed_time": "1:03:13", "remaining_time": "6:11:34"} +{"current_steps": 1570, "total_steps": 10798, "loss": 2.0309, "reward": null, "learning_rate": 0.0009487388850226926, "epoch": 0.29, "percentage": 14.54, "elapsed_time": "1:03:16", "remaining_time": "6:11:54"} +{"current_steps": 1580, "total_steps": 10798, "loss": 1.9954, "reward": null, "learning_rate": 0.000948095372565869, "epoch": 0.29, "percentage": 14.63, "elapsed_time": "1:03:37", "remaining_time": "6:11:14"} +{"current_steps": 1580, "total_steps": 10798, "loss": 1.9954, "reward": null, "learning_rate": 0.000948095372565869, "epoch": 0.29, "percentage": 14.63, "elapsed_time": "1:03:36", "remaining_time": "6:11:05"} +{"current_steps": 1580, "total_steps": 10798, "loss": 1.9954, "reward": null, "learning_rate": 0.000948095372565869, "epoch": 0.29, "percentage": 14.63, "elapsed_time": "1:03:39", "remaining_time": "6:11:24"} +{"current_steps": 1580, "total_steps": 10798, "loss": 1.9954, "reward": null, "learning_rate": 0.000948095372565869, "epoch": 0.29, "percentage": 14.63, "elapsed_time": "1:09:41", "remaining_time": "6:46:33"} +{"current_steps": 1590, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0009474480671054726, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "1:04:02", "remaining_time": "6:10:55"} +{"current_steps": 1590, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0009474480671054726, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "1:04:01", "remaining_time": "6:10:45"} +{"current_steps": 1590, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0009474480671054726, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "1:03:59", "remaining_time": "6:10:36"} +{"current_steps": 1590, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0009474480671054726, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "1:10:04", "remaining_time": "6:45:48"} +{"current_steps": 1600, "total_steps": 10798, "loss": 2.0395, "reward": null, "learning_rate": 0.0009467969741207652, "epoch": 0.3, "percentage": 14.82, "elapsed_time": "1:10:28", "remaining_time": "6:45:08"} +{"current_steps": 1600, "total_steps": 10798, "loss": 2.0395, "reward": null, "learning_rate": 0.0009467969741207652, "epoch": 0.3, "percentage": 14.82, "elapsed_time": "1:04:27", "remaining_time": "6:10:30"} +{"current_steps": 1600, "total_steps": 10798, "loss": 2.0395, "reward": null, "learning_rate": 0.0009467969741207652, "epoch": 0.3, "percentage": 14.82, "elapsed_time": "1:04:25", "remaining_time": "6:10:20"} +{"current_steps": 1600, "total_steps": 10798, "loss": 2.0395, "reward": null, "learning_rate": 0.0009467969741207652, "epoch": 0.3, "percentage": 14.82, "elapsed_time": "1:04:23", "remaining_time": "6:10:11"} +{"current_steps": 1610, "total_steps": 10798, "loss": 2.0415, "reward": null, "learning_rate": 0.0009461420991230693, "epoch": 0.3, "percentage": 14.91, "elapsed_time": "1:04:49", "remaining_time": "6:09:54"} +{"current_steps": 1610, "total_steps": 10798, "loss": 2.0415, "reward": null, "learning_rate": 0.0009461420991230693, "epoch": 0.3, "percentage": 14.91, "elapsed_time": "1:10:52", "remaining_time": "6:44:27"} +{"current_steps": 1610, "total_steps": 10798, "loss": 2.0415, "reward": null, "learning_rate": 0.0009461420991230693, "epoch": 0.3, "percentage": 14.91, "elapsed_time": "1:04:50", "remaining_time": "6:10:04"} +{"current_steps": 1610, "total_steps": 10798, "loss": 2.0415, "reward": null, "learning_rate": 0.0009461420991230693, "epoch": 0.3, "percentage": 14.91, "elapsed_time": "1:04:47", "remaining_time": "6:09:45"} +{"current_steps": 1620, "total_steps": 10798, "loss": 2.0308, "reward": null, "learning_rate": 0.0009454834476557207, "epoch": 0.3, "percentage": 15.0, "elapsed_time": "1:05:14", "remaining_time": "6:09:38"} +{"current_steps": 1620, "total_steps": 10798, "loss": 2.0308, "reward": null, "learning_rate": 0.0009454834476557207, "epoch": 0.3, "percentage": 15.0, "elapsed_time": "1:05:16", "remaining_time": "6:09:48"} +{"current_steps": 1620, "total_steps": 10798, "loss": 2.0308, "reward": null, "learning_rate": 0.0009454834476557207, "epoch": 0.3, "percentage": 15.0, "elapsed_time": "1:05:13", "remaining_time": "6:09:29"} +{"current_steps": 1620, "total_steps": 10798, "loss": 2.0308, "reward": null, "learning_rate": 0.0009454834476557207, "epoch": 0.3, "percentage": 15.0, "elapsed_time": "1:11:17", "remaining_time": "6:43:56"} +{"current_steps": 1630, "total_steps": 10798, "loss": 2.0826, "reward": null, "learning_rate": 0.0009448210252940223, "epoch": 0.3, "percentage": 15.1, "elapsed_time": "1:11:41", "remaining_time": "6:43:14"} +{"current_steps": 1630, "total_steps": 10798, "loss": 2.0826, "reward": null, "learning_rate": 0.0009448210252940223, "epoch": 0.3, "percentage": 15.1, "elapsed_time": "1:05:38", "remaining_time": "6:09:11"} +{"current_steps": 1630, "total_steps": 10798, "loss": 2.0826, "reward": null, "learning_rate": 0.0009448210252940223, "epoch": 0.3, "percentage": 15.1, "elapsed_time": "1:05:36", "remaining_time": "6:09:02"} +{"current_steps": 1630, "total_steps": 10798, "loss": 2.0826, "reward": null, "learning_rate": 0.0009448210252940223, "epoch": 0.3, "percentage": 15.1, "elapsed_time": "1:05:40", "remaining_time": "6:09:21"} +{"current_steps": 1640, "total_steps": 10798, "loss": 2.0424, "reward": null, "learning_rate": 0.0009441548376451963, "epoch": 0.3, "percentage": 15.19, "elapsed_time": "1:12:05", "remaining_time": "6:42:35"} +{"current_steps": 1640, "total_steps": 10798, "loss": 2.0424, "reward": null, "learning_rate": 0.0009441548376451963, "epoch": 0.3, "percentage": 15.19, "elapsed_time": "1:06:02", "remaining_time": "6:08:47"} +{"current_steps": 1640, "total_steps": 10798, "loss": 2.0424, "reward": null, "learning_rate": 0.0009441548376451963, "epoch": 0.3, "percentage": 15.19, "elapsed_time": "1:06:00", "remaining_time": "6:08:38"} +{"current_steps": 1640, "total_steps": 10798, "loss": 2.0424, "reward": null, "learning_rate": 0.0009441548376451963, "epoch": 0.3, "percentage": 15.19, "elapsed_time": "1:06:04", "remaining_time": "6:08:57"} +{"current_steps": 1650, "total_steps": 10798, "loss": 2.0125, "reward": null, "learning_rate": 0.0009434848903483373, "epoch": 0.31, "percentage": 15.28, "elapsed_time": "1:06:25", "remaining_time": "6:08:19"} +{"current_steps": 1650, "total_steps": 10798, "loss": 2.0125, "reward": null, "learning_rate": 0.0009434848903483373, "epoch": 0.31, "percentage": 15.28, "elapsed_time": "1:12:29", "remaining_time": "6:41:53"} +{"current_steps": 1650, "total_steps": 10798, "loss": 2.0125, "reward": null, "learning_rate": 0.0009434848903483373, "epoch": 0.31, "percentage": 15.28, "elapsed_time": "1:06:24", "remaining_time": "6:08:10"} +{"current_steps": 1650, "total_steps": 10798, "loss": 2.0125, "reward": null, "learning_rate": 0.0009434848903483373, "epoch": 0.31, "percentage": 15.28, "elapsed_time": "1:06:27", "remaining_time": "6:08:28"} +{"current_steps": 1660, "total_steps": 10798, "loss": 2.0139, "reward": null, "learning_rate": 0.0009428111890743639, "epoch": 0.31, "percentage": 15.37, "elapsed_time": "1:12:53", "remaining_time": "6:41:15"} +{"current_steps": 1660, "total_steps": 10798, "loss": 2.0139, "reward": null, "learning_rate": 0.0009428111890743639, "epoch": 0.31, "percentage": 15.37, "elapsed_time": "1:06:52", "remaining_time": "6:08:05"} +{"current_steps": 1660, "total_steps": 10798, "loss": 2.0139, "reward": null, "learning_rate": 0.0009428111890743639, "epoch": 0.31, "percentage": 15.37, "elapsed_time": "1:06:50", "remaining_time": "6:07:56"} +{"current_steps": 1660, "total_steps": 10798, "loss": 2.0139, "reward": null, "learning_rate": 0.0009428111890743639, "epoch": 0.31, "percentage": 15.37, "elapsed_time": "1:06:48", "remaining_time": "6:07:47"} +{"current_steps": 1670, "total_steps": 10798, "loss": 2.0682, "reward": null, "learning_rate": 0.0009421337395259717, "epoch": 0.31, "percentage": 15.47, "elapsed_time": "1:13:18", "remaining_time": "6:40:40"} +{"current_steps": 1670, "total_steps": 10798, "loss": 2.0682, "reward": null, "learning_rate": 0.0009421337395259717, "epoch": 0.31, "percentage": 15.47, "elapsed_time": "1:07:13", "remaining_time": "6:07:26"} +{"current_steps": 1670, "total_steps": 10798, "loss": 2.0682, "reward": null, "learning_rate": 0.0009421337395259717, "epoch": 0.31, "percentage": 15.47, "elapsed_time": "1:07:15", "remaining_time": "6:07:35"} +{"current_steps": 1670, "total_steps": 10798, "loss": 2.0682, "reward": null, "learning_rate": 0.0009421337395259717, "epoch": 0.31, "percentage": 15.47, "elapsed_time": "1:07:16", "remaining_time": "6:07:44"} +{"current_steps": 1680, "total_steps": 10798, "loss": 2.0577, "reward": null, "learning_rate": 0.0009414525474375837, "epoch": 0.31, "percentage": 15.56, "elapsed_time": "1:07:40", "remaining_time": "6:07:18"} +{"current_steps": 1680, "total_steps": 10798, "loss": 2.0577, "reward": null, "learning_rate": 0.0009414525474375837, "epoch": 0.31, "percentage": 15.56, "elapsed_time": "1:07:38", "remaining_time": "6:07:09"} +{"current_steps": 1680, "total_steps": 10798, "loss": 2.0577, "reward": null, "learning_rate": 0.0009414525474375837, "epoch": 0.31, "percentage": 15.56, "elapsed_time": "1:13:42", "remaining_time": "6:40:00"} +{"current_steps": 1680, "total_steps": 10798, "loss": 2.0577, "reward": null, "learning_rate": 0.0009414525474375837, "epoch": 0.31, "percentage": 15.56, "elapsed_time": "1:07:37", "remaining_time": "6:07:00"} +{"current_steps": 1690, "total_steps": 10798, "loss": 2.0262, "reward": null, "learning_rate": 0.0009407676185753029, "epoch": 0.31, "percentage": 15.65, "elapsed_time": "1:08:03", "remaining_time": "6:06:50"} +{"current_steps": 1690, "total_steps": 10798, "loss": 2.0262, "reward": null, "learning_rate": 0.0009407676185753029, "epoch": 0.31, "percentage": 15.65, "elapsed_time": "1:08:02", "remaining_time": "6:06:40"} +{"current_steps": 1690, "total_steps": 10798, "loss": 2.0262, "reward": null, "learning_rate": 0.0009407676185753029, "epoch": 0.31, "percentage": 15.65, "elapsed_time": "1:08:00", "remaining_time": "6:06:32"} +{"current_steps": 1690, "total_steps": 10798, "loss": 2.0262, "reward": null, "learning_rate": 0.0009407676185753029, "epoch": 0.31, "percentage": 15.65, "elapsed_time": "1:14:05", "remaining_time": "6:39:18"} +{"current_steps": 1700, "total_steps": 10798, "loss": 2.0515, "reward": null, "learning_rate": 0.0009400789587368632, "epoch": 0.31, "percentage": 15.74, "elapsed_time": "1:14:31", "remaining_time": "6:38:47"} +{"current_steps": 1700, "total_steps": 10798, "loss": 2.0515, "reward": null, "learning_rate": 0.0009400789587368632, "epoch": 0.31, "percentage": 15.74, "elapsed_time": "1:08:26", "remaining_time": "6:06:15"} +{"current_steps": 1700, "total_steps": 10798, "loss": 2.0515, "reward": null, "learning_rate": 0.0009400789587368632, "epoch": 0.31, "percentage": 15.74, "elapsed_time": "1:08:27", "remaining_time": "6:06:24"} +{"current_steps": 1700, "total_steps": 10798, "loss": 2.0515, "reward": null, "learning_rate": 0.0009400789587368632, "epoch": 0.31, "percentage": 15.74, "elapsed_time": "1:08:29", "remaining_time": "6:06:33"} +{"current_steps": 1710, "total_steps": 10798, "loss": 2.0398, "reward": null, "learning_rate": 0.0009393865737515794, "epoch": 0.32, "percentage": 15.84, "elapsed_time": "1:14:55", "remaining_time": "6:38:12"} +{"current_steps": 1710, "total_steps": 10798, "loss": 2.0398, "reward": null, "learning_rate": 0.0009393865737515794, "epoch": 0.32, "percentage": 15.84, "elapsed_time": "1:08:54", "remaining_time": "6:06:11"} +{"current_steps": 1710, "total_steps": 10798, "loss": 2.0398, "reward": null, "learning_rate": 0.0009393865737515794, "epoch": 0.32, "percentage": 15.84, "elapsed_time": "1:08:50", "remaining_time": "6:05:53"} +{"current_steps": 1710, "total_steps": 10798, "loss": 2.0398, "reward": null, "learning_rate": 0.0009393865737515794, "epoch": 0.32, "percentage": 15.84, "elapsed_time": "1:08:52", "remaining_time": "6:06:02"} +{"current_steps": 1720, "total_steps": 10798, "loss": 2.0146, "reward": null, "learning_rate": 0.0009386904694802997, "epoch": 0.32, "percentage": 15.93, "elapsed_time": "1:15:20", "remaining_time": "6:37:36"} +{"current_steps": 1720, "total_steps": 10798, "loss": 2.0146, "reward": null, "learning_rate": 0.0009386904694802997, "epoch": 0.32, "percentage": 15.93, "elapsed_time": "1:09:18", "remaining_time": "6:05:48"} +{"current_steps": 1720, "total_steps": 10798, "loss": 2.0146, "reward": null, "learning_rate": 0.0009386904694802997, "epoch": 0.32, "percentage": 15.93, "elapsed_time": "1:09:16", "remaining_time": "6:05:39"} +{"current_steps": 1720, "total_steps": 10798, "loss": 2.0146, "reward": null, "learning_rate": 0.0009386904694802997, "epoch": 0.32, "percentage": 15.93, "elapsed_time": "1:09:15", "remaining_time": "6:05:30"} +{"current_steps": 1730, "total_steps": 10798, "loss": 2.0438, "reward": null, "learning_rate": 0.0009379906518153543, "epoch": 0.32, "percentage": 16.02, "elapsed_time": "1:15:44", "remaining_time": "6:37:01"} +{"current_steps": 1730, "total_steps": 10798, "loss": 2.0438, "reward": null, "learning_rate": 0.0009379906518153543, "epoch": 0.32, "percentage": 16.02, "elapsed_time": "1:09:41", "remaining_time": "6:05:17"} +{"current_steps": 1730, "total_steps": 10798, "loss": 2.0438, "reward": null, "learning_rate": 0.0009379906518153543, "epoch": 0.32, "percentage": 16.02, "elapsed_time": "1:09:43", "remaining_time": "6:05:26"} +{"current_steps": 1730, "total_steps": 10798, "loss": 2.0438, "reward": null, "learning_rate": 0.0009379906518153543, "epoch": 0.32, "percentage": 16.02, "elapsed_time": "1:09:39", "remaining_time": "6:05:08"} +{"current_steps": 1740, "total_steps": 10798, "loss": 2.0377, "reward": null, "learning_rate": 0.0009372871266805063, "epoch": 0.32, "percentage": 16.11, "elapsed_time": "1:16:09", "remaining_time": "6:36:26"} +{"current_steps": 1740, "total_steps": 10798, "loss": 2.0377, "reward": null, "learning_rate": 0.0009372871266805063, "epoch": 0.32, "percentage": 16.11, "elapsed_time": "1:10:07", "remaining_time": "6:05:04"} +{"current_steps": 1740, "total_steps": 10798, "loss": 2.0377, "reward": null, "learning_rate": 0.0009372871266805063, "epoch": 0.32, "percentage": 16.11, "elapsed_time": "1:10:06", "remaining_time": "6:04:55"} +{"current_steps": 1740, "total_steps": 10798, "loss": 2.0377, "reward": null, "learning_rate": 0.0009372871266805063, "epoch": 0.32, "percentage": 16.11, "elapsed_time": "1:10:04", "remaining_time": "6:04:47"} +{"current_steps": 1750, "total_steps": 10798, "loss": 2.0789, "reward": null, "learning_rate": 0.000936579900030902, "epoch": 0.32, "percentage": 16.21, "elapsed_time": "1:16:34", "remaining_time": "6:35:52"} +{"current_steps": 1750, "total_steps": 10798, "loss": 2.0789, "reward": null, "learning_rate": 0.000936579900030902, "epoch": 0.32, "percentage": 16.21, "elapsed_time": "1:10:32", "remaining_time": "6:04:43"} +{"current_steps": 1750, "total_steps": 10798, "loss": 2.0789, "reward": null, "learning_rate": 0.000936579900030902, "epoch": 0.32, "percentage": 16.21, "elapsed_time": "1:10:29", "remaining_time": "6:04:26"} +{"current_steps": 1750, "total_steps": 10798, "loss": 2.0789, "reward": null, "learning_rate": 0.000936579900030902, "epoch": 0.32, "percentage": 16.21, "elapsed_time": "1:10:30", "remaining_time": "6:04:34"} +{"current_steps": 1760, "total_steps": 10798, "loss": 2.0201, "reward": null, "learning_rate": 0.0009358689778530193, "epoch": 0.33, "percentage": 16.3, "elapsed_time": "1:10:53", "remaining_time": "6:04:01"} +{"current_steps": 1760, "total_steps": 10798, "loss": 2.0201, "reward": null, "learning_rate": 0.0009358689778530193, "epoch": 0.33, "percentage": 16.3, "elapsed_time": "1:10:56", "remaining_time": "6:04:18"} +{"current_steps": 1760, "total_steps": 10798, "loss": 2.0201, "reward": null, "learning_rate": 0.0009358689778530193, "epoch": 0.33, "percentage": 16.3, "elapsed_time": "1:10:54", "remaining_time": "6:04:09"} +{"current_steps": 1760, "total_steps": 10798, "loss": 2.0201, "reward": null, "learning_rate": 0.0009358689778530193, "epoch": 0.33, "percentage": 16.3, "elapsed_time": "1:16:58", "remaining_time": "6:35:15"} +{"current_steps": 1770, "total_steps": 10798, "loss": 2.0114, "reward": null, "learning_rate": 0.0009351543661646185, "epoch": 0.33, "percentage": 16.39, "elapsed_time": "1:11:18", "remaining_time": "6:03:43"} +{"current_steps": 1770, "total_steps": 10798, "loss": 2.0114, "reward": null, "learning_rate": 0.0009351543661646185, "epoch": 0.33, "percentage": 16.39, "elapsed_time": "1:17:21", "remaining_time": "6:34:35"} +{"current_steps": 1770, "total_steps": 10798, "loss": 2.0114, "reward": null, "learning_rate": 0.0009351543661646185, "epoch": 0.33, "percentage": 16.39, "elapsed_time": "1:11:17", "remaining_time": "6:03:35"} +{"current_steps": 1770, "total_steps": 10798, "loss": 2.0114, "reward": null, "learning_rate": 0.0009351543661646185, "epoch": 0.33, "percentage": 16.39, "elapsed_time": "1:11:20", "remaining_time": "6:03:52"} +{"current_steps": 1780, "total_steps": 10798, "loss": 2.0242, "reward": null, "learning_rate": 0.0009344360710146898, "epoch": 0.33, "percentage": 16.48, "elapsed_time": "1:17:45", "remaining_time": "6:33:56"} +{"current_steps": 1780, "total_steps": 10798, "loss": 2.0242, "reward": null, "learning_rate": 0.0009344360710146898, "epoch": 0.33, "percentage": 16.48, "elapsed_time": "1:11:42", "remaining_time": "6:03:16"} +{"current_steps": 1780, "total_steps": 10798, "loss": 2.0242, "reward": null, "learning_rate": 0.0009344360710146898, "epoch": 0.33, "percentage": 16.48, "elapsed_time": "1:11:40", "remaining_time": "6:03:08"} +{"current_steps": 1780, "total_steps": 10798, "loss": 2.0242, "reward": null, "learning_rate": 0.0009344360710146898, "epoch": 0.33, "percentage": 16.48, "elapsed_time": "1:11:43", "remaining_time": "6:03:25"} +{"current_steps": 1790, "total_steps": 10798, "loss": 2.0436, "reward": null, "learning_rate": 0.0009337140984834034, "epoch": 0.33, "percentage": 16.58, "elapsed_time": "1:12:05", "remaining_time": "6:02:46"} +{"current_steps": 1790, "total_steps": 10798, "loss": 2.0436, "reward": null, "learning_rate": 0.0009337140984834034, "epoch": 0.33, "percentage": 16.58, "elapsed_time": "1:12:06", "remaining_time": "6:02:54"} +{"current_steps": 1790, "total_steps": 10798, "loss": 2.0436, "reward": null, "learning_rate": 0.0009337140984834034, "epoch": 0.33, "percentage": 16.58, "elapsed_time": "1:12:08", "remaining_time": "6:03:02"} +{"current_steps": 1790, "total_steps": 10798, "loss": 2.0436, "reward": null, "learning_rate": 0.0009337140984834034, "epoch": 0.33, "percentage": 16.58, "elapsed_time": "1:18:10", "remaining_time": "6:33:21"} +{"current_steps": 1800, "total_steps": 10798, "loss": 2.0452, "reward": null, "learning_rate": 0.0009329884546820572, "epoch": 0.33, "percentage": 16.67, "elapsed_time": "1:18:34", "remaining_time": "6:32:46"} +{"current_steps": 1800, "total_steps": 10798, "loss": 2.0452, "reward": null, "learning_rate": 0.0009329884546820572, "epoch": 0.33, "percentage": 16.67, "elapsed_time": "1:12:31", "remaining_time": "6:02:30"} +{"current_steps": 1800, "total_steps": 10798, "loss": 2.0452, "reward": null, "learning_rate": 0.0009329884546820572, "epoch": 0.33, "percentage": 16.67, "elapsed_time": "1:12:29", "remaining_time": "6:02:22"} +{"current_steps": 1800, "total_steps": 10798, "loss": 2.0452, "reward": null, "learning_rate": 0.0009329884546820572, "epoch": 0.33, "percentage": 16.67, "elapsed_time": "1:12:32", "remaining_time": "6:02:39"} +{"current_steps": 1810, "total_steps": 10798, "loss": 2.0254, "reward": null, "learning_rate": 0.000932259145753026, "epoch": 0.34, "percentage": 16.76, "elapsed_time": "1:12:57", "remaining_time": "6:02:19"} +{"current_steps": 1810, "total_steps": 10798, "loss": 2.0254, "reward": null, "learning_rate": 0.000932259145753026, "epoch": 0.34, "percentage": 16.76, "elapsed_time": "1:12:54", "remaining_time": "6:02:02"} +{"current_steps": 1810, "total_steps": 10798, "loss": 2.0254, "reward": null, "learning_rate": 0.000932259145753026, "epoch": 0.34, "percentage": 16.76, "elapsed_time": "1:12:56", "remaining_time": "6:02:10"} +{"current_steps": 1810, "total_steps": 10798, "loss": 2.0254, "reward": null, "learning_rate": 0.000932259145753026, "epoch": 0.34, "percentage": 16.76, "elapsed_time": "1:18:59", "remaining_time": "6:32:13"} +{"current_steps": 1820, "total_steps": 10798, "loss": 2.0409, "reward": null, "learning_rate": 0.0009315261778697083, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "1:13:20", "remaining_time": "6:01:45"} +{"current_steps": 1820, "total_steps": 10798, "loss": 2.0409, "reward": null, "learning_rate": 0.0009315261778697083, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "1:19:23", "remaining_time": "6:31:36"} +{"current_steps": 1820, "total_steps": 10798, "loss": 2.0409, "reward": null, "learning_rate": 0.0009315261778697083, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "1:13:18", "remaining_time": "6:01:37"} +{"current_steps": 1820, "total_steps": 10798, "loss": 2.0409, "reward": null, "learning_rate": 0.0009315261778697083, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "1:13:21", "remaining_time": "6:01:53"} +{"current_steps": 1830, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009307895572364746, "epoch": 0.34, "percentage": 16.95, "elapsed_time": "1:13:44", "remaining_time": "6:01:23"} +{"current_steps": 1830, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009307895572364746, "epoch": 0.34, "percentage": 16.95, "elapsed_time": "1:19:47", "remaining_time": "6:31:03"} +{"current_steps": 1830, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009307895572364746, "epoch": 0.34, "percentage": 16.95, "elapsed_time": "1:13:46", "remaining_time": "6:01:32"} +{"current_steps": 1830, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009307895572364746, "epoch": 0.34, "percentage": 16.95, "elapsed_time": "1:13:43", "remaining_time": "6:01:15"} +{"current_steps": 1840, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0009300492900886154, "epoch": 0.34, "percentage": 17.04, "elapsed_time": "1:14:10", "remaining_time": "6:01:05"} +{"current_steps": 1840, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0009300492900886154, "epoch": 0.34, "percentage": 17.04, "elapsed_time": "1:14:08", "remaining_time": "6:00:57"} +{"current_steps": 1840, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0009300492900886154, "epoch": 0.34, "percentage": 17.04, "elapsed_time": "1:14:06", "remaining_time": "6:00:49"} +{"current_steps": 1840, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0009300492900886154, "epoch": 0.34, "percentage": 17.04, "elapsed_time": "1:20:11", "remaining_time": "6:30:25"} +{"current_steps": 1850, "total_steps": 10798, "loss": 1.9851, "reward": null, "learning_rate": 0.0009293053826922873, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "1:14:31", "remaining_time": "6:00:27"} +{"current_steps": 1850, "total_steps": 10798, "loss": 1.9851, "reward": null, "learning_rate": 0.0009293053826922873, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "1:20:36", "remaining_time": "6:29:52"} +{"current_steps": 1850, "total_steps": 10798, "loss": 1.9851, "reward": null, "learning_rate": 0.0009293053826922873, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "1:14:33", "remaining_time": "6:00:35"} +{"current_steps": 1850, "total_steps": 10798, "loss": 1.9851, "reward": null, "learning_rate": 0.0009293053826922873, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "1:14:34", "remaining_time": "6:00:44"} +{"current_steps": 1860, "total_steps": 10798, "loss": 1.9947, "reward": null, "learning_rate": 0.0009285578413444613, "epoch": 0.34, "percentage": 17.23, "elapsed_time": "1:14:59", "remaining_time": "6:00:22"} +{"current_steps": 1860, "total_steps": 10798, "loss": 1.9947, "reward": null, "learning_rate": 0.0009285578413444613, "epoch": 0.34, "percentage": 17.23, "elapsed_time": "1:21:01", "remaining_time": "6:29:19"} +{"current_steps": 1860, "total_steps": 10798, "loss": 1.9947, "reward": null, "learning_rate": 0.0009285578413444613, "epoch": 0.34, "percentage": 17.23, "elapsed_time": "1:14:56", "remaining_time": "6:00:06"} +{"current_steps": 1860, "total_steps": 10798, "loss": 1.9947, "reward": null, "learning_rate": 0.0009285578413444613, "epoch": 0.34, "percentage": 17.23, "elapsed_time": "1:14:57", "remaining_time": "6:00:14"} +{"current_steps": 1870, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009278066723728682, "epoch": 0.35, "percentage": 17.32, "elapsed_time": "1:21:25", "remaining_time": "6:28:46"} +{"current_steps": 1870, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009278066723728682, "epoch": 0.35, "percentage": 17.32, "elapsed_time": "1:15:22", "remaining_time": "5:59:52"} +{"current_steps": 1870, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009278066723728682, "epoch": 0.35, "percentage": 17.32, "elapsed_time": "1:15:21", "remaining_time": "5:59:44"} +{"current_steps": 1870, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009278066723728682, "epoch": 0.35, "percentage": 17.32, "elapsed_time": "1:15:24", "remaining_time": "6:00:00"} +{"current_steps": 1880, "total_steps": 10798, "loss": 2.0058, "reward": null, "learning_rate": 0.0009270518821359461, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "1:15:44", "remaining_time": "5:59:15"} +{"current_steps": 1880, "total_steps": 10798, "loss": 2.0058, "reward": null, "learning_rate": 0.0009270518821359461, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "1:15:45", "remaining_time": "5:59:23"} +{"current_steps": 1880, "total_steps": 10798, "loss": 2.0058, "reward": null, "learning_rate": 0.0009270518821359461, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "1:21:48", "remaining_time": "6:28:06"} +{"current_steps": 1880, "total_steps": 10798, "loss": 2.0058, "reward": null, "learning_rate": 0.0009270518821359461, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "1:15:47", "remaining_time": "5:59:31"} +{"current_steps": 1890, "total_steps": 10798, "loss": 2.05, "reward": null, "learning_rate": 0.0009262934770227858, "epoch": 0.35, "percentage": 17.5, "elapsed_time": "1:16:11", "remaining_time": "5:59:06"} +{"current_steps": 1890, "total_steps": 10798, "loss": 2.05, "reward": null, "learning_rate": 0.0009262934770227858, "epoch": 0.35, "percentage": 17.5, "elapsed_time": "1:22:12", "remaining_time": "6:27:30"} +{"current_steps": 1890, "total_steps": 10798, "loss": 2.05, "reward": null, "learning_rate": 0.0009262934770227858, "epoch": 0.35, "percentage": 17.5, "elapsed_time": "1:16:08", "remaining_time": "5:58:50"} +{"current_steps": 1890, "total_steps": 10798, "loss": 2.05, "reward": null, "learning_rate": 0.0009262934770227858, "epoch": 0.35, "percentage": 17.5, "elapsed_time": "1:16:09", "remaining_time": "5:58:58"} +{"current_steps": 1900, "total_steps": 10798, "loss": 2.0444, "reward": null, "learning_rate": 0.0009255314634530771, "epoch": 0.35, "percentage": 17.6, "elapsed_time": "1:16:35", "remaining_time": "5:58:40"} +{"current_steps": 1900, "total_steps": 10798, "loss": 2.0444, "reward": null, "learning_rate": 0.0009255314634530771, "epoch": 0.35, "percentage": 17.6, "elapsed_time": "1:22:36", "remaining_time": "6:26:53"} +{"current_steps": 1900, "total_steps": 10798, "loss": 2.0444, "reward": null, "learning_rate": 0.0009255314634530771, "epoch": 0.35, "percentage": 17.6, "elapsed_time": "1:16:33", "remaining_time": "5:58:32"} +{"current_steps": 1900, "total_steps": 10798, "loss": 2.0444, "reward": null, "learning_rate": 0.0009255314634530771, "epoch": 0.35, "percentage": 17.6, "elapsed_time": "1:16:32", "remaining_time": "5:58:25"} +{"current_steps": 1910, "total_steps": 10798, "loss": 2.0045, "reward": null, "learning_rate": 0.0009247658478770543, "epoch": 0.35, "percentage": 17.69, "elapsed_time": "1:23:01", "remaining_time": "6:26:21"} +{"current_steps": 1910, "total_steps": 10798, "loss": 2.0045, "reward": null, "learning_rate": 0.0009247658478770543, "epoch": 0.35, "percentage": 17.69, "elapsed_time": "1:16:58", "remaining_time": "5:58:10"} +{"current_steps": 1910, "total_steps": 10798, "loss": 2.0045, "reward": null, "learning_rate": 0.0009247658478770543, "epoch": 0.35, "percentage": 17.69, "elapsed_time": "1:17:00", "remaining_time": "5:58:19"} +{"current_steps": 1910, "total_steps": 10798, "loss": 2.0045, "reward": null, "learning_rate": 0.0009247658478770543, "epoch": 0.35, "percentage": 17.69, "elapsed_time": "1:16:56", "remaining_time": "5:58:03"} +{"current_steps": 1920, "total_steps": 10798, "loss": 2.0211, "reward": null, "learning_rate": 0.000923996636775442, "epoch": 0.36, "percentage": 17.78, "elapsed_time": "1:17:23", "remaining_time": "5:57:49"} +{"current_steps": 1920, "total_steps": 10798, "loss": 2.0211, "reward": null, "learning_rate": 0.000923996636775442, "epoch": 0.36, "percentage": 17.78, "elapsed_time": "1:23:26", "remaining_time": "6:25:48"} +{"current_steps": 1920, "total_steps": 10798, "loss": 2.0211, "reward": null, "learning_rate": 0.000923996636775442, "epoch": 0.36, "percentage": 17.78, "elapsed_time": "1:17:24", "remaining_time": "5:57:57"} +{"current_steps": 1920, "total_steps": 10798, "loss": 2.0211, "reward": null, "learning_rate": 0.000923996636775442, "epoch": 0.36, "percentage": 17.78, "elapsed_time": "1:17:21", "remaining_time": "5:57:41"} +{"current_steps": 1930, "total_steps": 10798, "loss": 2.0124, "reward": null, "learning_rate": 0.0009232238366593997, "epoch": 0.36, "percentage": 17.87, "elapsed_time": "1:17:44", "remaining_time": "5:57:13"} +{"current_steps": 1930, "total_steps": 10798, "loss": 2.0124, "reward": null, "learning_rate": 0.0009232238366593997, "epoch": 0.36, "percentage": 17.87, "elapsed_time": "1:17:46", "remaining_time": "5:57:20"} +{"current_steps": 1930, "total_steps": 10798, "loss": 2.0124, "reward": null, "learning_rate": 0.0009232238366593997, "epoch": 0.36, "percentage": 17.87, "elapsed_time": "1:23:49", "remaining_time": "6:25:09"} +{"current_steps": 1930, "total_steps": 10798, "loss": 2.0124, "reward": null, "learning_rate": 0.0009232238366593997, "epoch": 0.36, "percentage": 17.87, "elapsed_time": "1:17:48", "remaining_time": "5:57:28"} +{"current_steps": 1940, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0009224474540704671, "epoch": 0.36, "percentage": 17.97, "elapsed_time": "1:18:08", "remaining_time": "5:56:46"} +{"current_steps": 1940, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0009224474540704671, "epoch": 0.36, "percentage": 17.97, "elapsed_time": "1:18:11", "remaining_time": "5:57:02"} +{"current_steps": 1940, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0009224474540704671, "epoch": 0.36, "percentage": 17.97, "elapsed_time": "1:18:09", "remaining_time": "5:56:54"} +{"current_steps": 1940, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0009224474540704671, "epoch": 0.36, "percentage": 17.97, "elapsed_time": "1:24:13", "remaining_time": "6:24:32"} +{"current_steps": 1950, "total_steps": 10798, "loss": 2.0247, "reward": null, "learning_rate": 0.0009216674955805079, "epoch": 0.36, "percentage": 18.06, "elapsed_time": "1:24:37", "remaining_time": "6:24:00"} +{"current_steps": 1950, "total_steps": 10798, "loss": 2.0247, "reward": null, "learning_rate": 0.0009216674955805079, "epoch": 0.36, "percentage": 18.06, "elapsed_time": "1:18:33", "remaining_time": "5:56:25"} +{"current_steps": 1950, "total_steps": 10798, "loss": 2.0247, "reward": null, "learning_rate": 0.0009216674955805079, "epoch": 0.36, "percentage": 18.06, "elapsed_time": "1:18:34", "remaining_time": "5:56:32"} +{"current_steps": 1950, "total_steps": 10798, "loss": 2.0247, "reward": null, "learning_rate": 0.0009216674955805079, "epoch": 0.36, "percentage": 18.06, "elapsed_time": "1:18:36", "remaining_time": "5:56:40"} +{"current_steps": 1960, "total_steps": 10798, "loss": 2.0314, "reward": null, "learning_rate": 0.0009208839677916557, "epoch": 0.36, "percentage": 18.15, "elapsed_time": "1:18:59", "remaining_time": "5:56:11"} +{"current_steps": 1960, "total_steps": 10798, "loss": 2.0314, "reward": null, "learning_rate": 0.0009208839677916557, "epoch": 0.36, "percentage": 18.15, "elapsed_time": "1:25:02", "remaining_time": "6:23:29"} +{"current_steps": 1960, "total_steps": 10798, "loss": 2.0314, "reward": null, "learning_rate": 0.0009208839677916557, "epoch": 0.36, "percentage": 18.15, "elapsed_time": "1:18:58", "remaining_time": "5:56:04"} +{"current_steps": 1960, "total_steps": 10798, "loss": 2.0314, "reward": null, "learning_rate": 0.0009208839677916557, "epoch": 0.36, "percentage": 18.15, "elapsed_time": "1:19:01", "remaining_time": "5:56:19"} +{"current_steps": 1970, "total_steps": 10798, "loss": 2.067, "reward": null, "learning_rate": 0.0009200968773362568, "epoch": 0.36, "percentage": 18.24, "elapsed_time": "1:19:24", "remaining_time": "5:55:48"} +{"current_steps": 1970, "total_steps": 10798, "loss": 2.067, "reward": null, "learning_rate": 0.0009200968773362568, "epoch": 0.36, "percentage": 18.24, "elapsed_time": "1:25:27", "remaining_time": "6:22:56"} +{"current_steps": 1970, "total_steps": 10798, "loss": 2.067, "reward": null, "learning_rate": 0.0009200968773362568, "epoch": 0.36, "percentage": 18.24, "elapsed_time": "1:19:22", "remaining_time": "5:55:41"} +{"current_steps": 1970, "total_steps": 10798, "loss": 2.067, "reward": null, "learning_rate": 0.0009200968773362568, "epoch": 0.36, "percentage": 18.24, "elapsed_time": "1:19:25", "remaining_time": "5:55:56"} +{"current_steps": 1980, "total_steps": 10798, "loss": 2.0168, "reward": null, "learning_rate": 0.0009193062308768145, "epoch": 0.37, "percentage": 18.34, "elapsed_time": "1:25:53", "remaining_time": "6:22:30"} +{"current_steps": 1980, "total_steps": 10798, "loss": 2.0168, "reward": null, "learning_rate": 0.0009193062308768145, "epoch": 0.37, "percentage": 18.34, "elapsed_time": "1:19:48", "remaining_time": "5:55:25"} +{"current_steps": 1980, "total_steps": 10798, "loss": 2.0168, "reward": null, "learning_rate": 0.0009193062308768145, "epoch": 0.37, "percentage": 18.34, "elapsed_time": "1:19:51", "remaining_time": "5:55:40"} +{"current_steps": 1980, "total_steps": 10798, "loss": 2.0168, "reward": null, "learning_rate": 0.0009193062308768145, "epoch": 0.37, "percentage": 18.34, "elapsed_time": "1:19:50", "remaining_time": "5:55:32"} +{"current_steps": 1990, "total_steps": 10798, "loss": 2.0649, "reward": null, "learning_rate": 0.0009185120351059326, "epoch": 0.37, "percentage": 18.43, "elapsed_time": "1:20:16", "remaining_time": "5:55:16"} +{"current_steps": 1990, "total_steps": 10798, "loss": 2.0649, "reward": null, "learning_rate": 0.0009185120351059326, "epoch": 0.37, "percentage": 18.43, "elapsed_time": "1:26:17", "remaining_time": "6:21:56"} +{"current_steps": 1990, "total_steps": 10798, "loss": 2.0649, "reward": null, "learning_rate": 0.0009185120351059326, "epoch": 0.37, "percentage": 18.43, "elapsed_time": "1:20:12", "remaining_time": "5:55:02"} +{"current_steps": 1990, "total_steps": 10798, "loss": 2.0649, "reward": null, "learning_rate": 0.0009185120351059326, "epoch": 0.37, "percentage": 18.43, "elapsed_time": "1:20:14", "remaining_time": "5:55:09"} +{"current_steps": 2000, "total_steps": 10798, "loss": 2.0208, "reward": null, "learning_rate": 0.0009177142967462591, "epoch": 0.37, "percentage": 18.52, "elapsed_time": "1:20:36", "remaining_time": "5:54:36"} +{"current_steps": 2000, "total_steps": 10798, "loss": 2.0208, "reward": null, "learning_rate": 0.0009177142967462591, "epoch": 0.37, "percentage": 18.52, "elapsed_time": "1:20:40", "remaining_time": "5:54:51"} +{"current_steps": 2000, "total_steps": 10798, "loss": 2.0208, "reward": null, "learning_rate": 0.0009177142967462591, "epoch": 0.37, "percentage": 18.52, "elapsed_time": "1:20:38", "remaining_time": "5:54:43"} +{"current_steps": 2000, "total_steps": 10798, "loss": 2.0208, "reward": null, "learning_rate": 0.0009177142967462591, "epoch": 0.37, "percentage": 18.52, "elapsed_time": "1:26:41", "remaining_time": "6:21:21"} +{"current_steps": 2010, "total_steps": 10798, "loss": 2.016, "reward": null, "learning_rate": 0.0009169130225504289, "epoch": 0.37, "percentage": 18.61, "elapsed_time": "1:27:04", "remaining_time": "6:20:44"} +{"current_steps": 2010, "total_steps": 10798, "loss": 2.016, "reward": null, "learning_rate": 0.0009169130225504289, "epoch": 0.37, "percentage": 18.61, "elapsed_time": "1:21:03", "remaining_time": "5:54:23"} +{"current_steps": 2010, "total_steps": 10798, "loss": 2.016, "reward": null, "learning_rate": 0.0009169130225504289, "epoch": 0.37, "percentage": 18.61, "elapsed_time": "1:21:01", "remaining_time": "5:54:16"} +{"current_steps": 2010, "total_steps": 10798, "loss": 2.016, "reward": null, "learning_rate": 0.0009169130225504289, "epoch": 0.37, "percentage": 18.61, "elapsed_time": "1:21:00", "remaining_time": "5:54:09"} +{"current_steps": 2020, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009161082193010066, "epoch": 0.37, "percentage": 18.71, "elapsed_time": "1:21:26", "remaining_time": "5:53:54"} +{"current_steps": 2020, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009161082193010066, "epoch": 0.37, "percentage": 18.71, "elapsed_time": "1:21:24", "remaining_time": "5:53:47"} +{"current_steps": 2020, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009161082193010066, "epoch": 0.37, "percentage": 18.71, "elapsed_time": "1:21:28", "remaining_time": "5:54:02"} +{"current_steps": 2020, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0009161082193010066, "epoch": 0.37, "percentage": 18.71, "elapsed_time": "1:27:29", "remaining_time": "6:20:13"} +{"current_steps": 2030, "total_steps": 10798, "loss": 2.0757, "reward": null, "learning_rate": 0.0009152998938104296, "epoch": 0.38, "percentage": 18.8, "elapsed_time": "1:21:50", "remaining_time": "5:53:30"} +{"current_steps": 2030, "total_steps": 10798, "loss": 2.0757, "reward": null, "learning_rate": 0.0009152998938104296, "epoch": 0.38, "percentage": 18.8, "elapsed_time": "1:21:52", "remaining_time": "5:53:38"} +{"current_steps": 2030, "total_steps": 10798, "loss": 2.0757, "reward": null, "learning_rate": 0.0009152998938104296, "epoch": 0.38, "percentage": 18.8, "elapsed_time": "1:21:49", "remaining_time": "5:53:23"} +{"current_steps": 2030, "total_steps": 10798, "loss": 2.0757, "reward": null, "learning_rate": 0.0009152998938104296, "epoch": 0.38, "percentage": 18.8, "elapsed_time": "1:27:54", "remaining_time": "6:19:39"} +{"current_steps": 2040, "total_steps": 10798, "loss": 2.0093, "reward": null, "learning_rate": 0.0009144880529209498, "epoch": 0.38, "percentage": 18.89, "elapsed_time": "1:28:18", "remaining_time": "6:19:06"} +{"current_steps": 2040, "total_steps": 10798, "loss": 2.0093, "reward": null, "learning_rate": 0.0009144880529209498, "epoch": 0.38, "percentage": 18.89, "elapsed_time": "1:22:13", "remaining_time": "5:52:59"} +{"current_steps": 2040, "total_steps": 10798, "loss": 2.0093, "reward": null, "learning_rate": 0.0009144880529209498, "epoch": 0.38, "percentage": 18.89, "elapsed_time": "1:22:15", "remaining_time": "5:53:06"} +{"current_steps": 2040, "total_steps": 10798, "loss": 2.0093, "reward": null, "learning_rate": 0.0009144880529209498, "epoch": 0.38, "percentage": 18.89, "elapsed_time": "1:22:16", "remaining_time": "5:53:14"} +{"current_steps": 2050, "total_steps": 10798, "loss": 1.954, "reward": null, "learning_rate": 0.0009136727035045765, "epoch": 0.38, "percentage": 18.98, "elapsed_time": "1:28:41", "remaining_time": "6:18:29"} +{"current_steps": 2050, "total_steps": 10798, "loss": 1.954, "reward": null, "learning_rate": 0.0009136727035045765, "epoch": 0.38, "percentage": 18.98, "elapsed_time": "1:22:38", "remaining_time": "5:52:39"} +{"current_steps": 2050, "total_steps": 10798, "loss": 1.954, "reward": null, "learning_rate": 0.0009136727035045765, "epoch": 0.38, "percentage": 18.98, "elapsed_time": "1:22:40", "remaining_time": "5:52:47"} +{"current_steps": 2050, "total_steps": 10798, "loss": 1.954, "reward": null, "learning_rate": 0.0009136727035045765, "epoch": 0.38, "percentage": 18.98, "elapsed_time": "1:22:37", "remaining_time": "5:52:33"} +{"current_steps": 2060, "total_steps": 10798, "loss": 2.0062, "reward": null, "learning_rate": 0.0009128538524630167, "epoch": 0.38, "percentage": 19.08, "elapsed_time": "1:29:05", "remaining_time": "6:17:53"} +{"current_steps": 2060, "total_steps": 10798, "loss": 2.0062, "reward": null, "learning_rate": 0.0009128538524630167, "epoch": 0.38, "percentage": 19.08, "elapsed_time": "1:23:02", "remaining_time": "5:52:12"} +{"current_steps": 2060, "total_steps": 10798, "loss": 2.0062, "reward": null, "learning_rate": 0.0009128538524630167, "epoch": 0.38, "percentage": 19.08, "elapsed_time": "1:23:00", "remaining_time": "5:52:06"} +{"current_steps": 2060, "total_steps": 10798, "loss": 2.0062, "reward": null, "learning_rate": 0.0009128538524630167, "epoch": 0.38, "percentage": 19.08, "elapsed_time": "1:23:03", "remaining_time": "5:52:20"} +{"current_steps": 2070, "total_steps": 10798, "loss": 2.0179, "reward": null, "learning_rate": 0.0009120315067276187, "epoch": 0.38, "percentage": 19.17, "elapsed_time": "1:23:25", "remaining_time": "5:51:44"} +{"current_steps": 2070, "total_steps": 10798, "loss": 2.0179, "reward": null, "learning_rate": 0.0009120315067276187, "epoch": 0.38, "percentage": 19.17, "elapsed_time": "1:23:23", "remaining_time": "5:51:37"} +{"current_steps": 2070, "total_steps": 10798, "loss": 2.0179, "reward": null, "learning_rate": 0.0009120315067276187, "epoch": 0.38, "percentage": 19.17, "elapsed_time": "1:29:28", "remaining_time": "6:17:16"} +{"current_steps": 2070, "total_steps": 10798, "loss": 2.0179, "reward": null, "learning_rate": 0.0009120315067276187, "epoch": 0.38, "percentage": 19.17, "elapsed_time": "1:23:27", "remaining_time": "5:51:51"} +{"current_steps": 2080, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009112056732593119, "epoch": 0.39, "percentage": 19.26, "elapsed_time": "1:23:49", "remaining_time": "5:51:19"} +{"current_steps": 2080, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009112056732593119, "epoch": 0.39, "percentage": 19.26, "elapsed_time": "1:23:47", "remaining_time": "5:51:13"} +{"current_steps": 2080, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009112056732593119, "epoch": 0.39, "percentage": 19.26, "elapsed_time": "1:29:52", "remaining_time": "6:16:42"} +{"current_steps": 2080, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0009112056732593119, "epoch": 0.39, "percentage": 19.26, "elapsed_time": "1:23:51", "remaining_time": "5:51:27"} +{"current_steps": 2090, "total_steps": 10798, "loss": 2.0223, "reward": null, "learning_rate": 0.0009103763590485488, "epoch": 0.39, "percentage": 19.36, "elapsed_time": "1:24:11", "remaining_time": "5:50:47"} +{"current_steps": 2090, "total_steps": 10798, "loss": 2.0223, "reward": null, "learning_rate": 0.0009103763590485488, "epoch": 0.39, "percentage": 19.36, "elapsed_time": "1:30:16", "remaining_time": "6:16:07"} +{"current_steps": 2090, "total_steps": 10798, "loss": 2.0223, "reward": null, "learning_rate": 0.0009103763590485488, "epoch": 0.39, "percentage": 19.36, "elapsed_time": "1:24:15", "remaining_time": "5:51:01"} +{"current_steps": 2090, "total_steps": 10798, "loss": 2.0223, "reward": null, "learning_rate": 0.0009103763590485488, "epoch": 0.39, "percentage": 19.36, "elapsed_time": "1:24:13", "remaining_time": "5:50:54"} +{"current_steps": 2100, "total_steps": 10798, "loss": 2.0208, "reward": null, "learning_rate": 0.0009095435711152449, "epoch": 0.39, "percentage": 19.45, "elapsed_time": "1:24:38", "remaining_time": "5:50:34"} +{"current_steps": 2100, "total_steps": 10798, "loss": 2.0208, "reward": null, "learning_rate": 0.0009095435711152449, "epoch": 0.39, "percentage": 19.45, "elapsed_time": "1:24:35", "remaining_time": "5:50:21"} +{"current_steps": 2100, "total_steps": 10798, "loss": 2.0208, "reward": null, "learning_rate": 0.0009095435711152449, "epoch": 0.39, "percentage": 19.45, "elapsed_time": "1:24:36", "remaining_time": "5:50:27"} +{"current_steps": 2100, "total_steps": 10798, "loss": 2.0208, "reward": null, "learning_rate": 0.0009095435711152449, "epoch": 0.39, "percentage": 19.45, "elapsed_time": "1:30:40", "remaining_time": "6:15:32"} +{"current_steps": 2110, "total_steps": 10798, "loss": 2.0492, "reward": null, "learning_rate": 0.00090870731650872, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "1:25:00", "remaining_time": "5:50:00"} +{"current_steps": 2110, "total_steps": 10798, "loss": 2.0492, "reward": null, "learning_rate": 0.00090870731650872, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "1:31:03", "remaining_time": "6:14:56"} +{"current_steps": 2110, "total_steps": 10798, "loss": 2.0492, "reward": null, "learning_rate": 0.00090870731650872, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "1:25:02", "remaining_time": "5:50:08"} +{"current_steps": 2110, "total_steps": 10798, "loss": 2.0492, "reward": null, "learning_rate": 0.00090870731650872, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "1:24:58", "remaining_time": "5:49:54"} +{"current_steps": 2120, "total_steps": 10798, "loss": 1.9917, "reward": null, "learning_rate": 0.0009078676023076385, "epoch": 0.39, "percentage": 19.63, "elapsed_time": "1:25:24", "remaining_time": "5:49:35"} +{"current_steps": 2120, "total_steps": 10798, "loss": 1.9917, "reward": null, "learning_rate": 0.0009078676023076385, "epoch": 0.39, "percentage": 19.63, "elapsed_time": "1:31:27", "remaining_time": "6:14:22"} +{"current_steps": 2120, "total_steps": 10798, "loss": 1.9917, "reward": null, "learning_rate": 0.0009078676023076385, "epoch": 0.39, "percentage": 19.63, "elapsed_time": "1:25:25", "remaining_time": "5:49:42"} +{"current_steps": 2120, "total_steps": 10798, "loss": 1.9917, "reward": null, "learning_rate": 0.0009078676023076385, "epoch": 0.39, "percentage": 19.63, "elapsed_time": "1:25:22", "remaining_time": "5:49:28"} +{"current_steps": 2130, "total_steps": 10798, "loss": 2.0235, "reward": null, "learning_rate": 0.0009070244356199492, "epoch": 0.39, "percentage": 19.73, "elapsed_time": "1:31:51", "remaining_time": "6:13:47"} +{"current_steps": 2130, "total_steps": 10798, "loss": 2.0235, "reward": null, "learning_rate": 0.0009070244356199492, "epoch": 0.39, "percentage": 19.73, "elapsed_time": "1:25:47", "remaining_time": "5:49:09"} +{"current_steps": 2130, "total_steps": 10798, "loss": 2.0235, "reward": null, "learning_rate": 0.0009070244356199492, "epoch": 0.39, "percentage": 19.73, "elapsed_time": "1:25:49", "remaining_time": "5:49:16"} +{"current_steps": 2130, "total_steps": 10798, "loss": 2.0235, "reward": null, "learning_rate": 0.0009070244356199492, "epoch": 0.39, "percentage": 19.73, "elapsed_time": "1:25:46", "remaining_time": "5:49:03"} +{"current_steps": 2140, "total_steps": 10798, "loss": 2.01, "reward": null, "learning_rate": 0.0009061778235828253, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "1:26:13", "remaining_time": "5:48:49"} +{"current_steps": 2140, "total_steps": 10798, "loss": 2.01, "reward": null, "learning_rate": 0.0009061778235828253, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "1:32:14", "remaining_time": "6:13:12"} +{"current_steps": 2140, "total_steps": 10798, "loss": 2.01, "reward": null, "learning_rate": 0.0009061778235828253, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "1:26:09", "remaining_time": "5:48:36"} +{"current_steps": 2140, "total_steps": 10798, "loss": 2.01, "reward": null, "learning_rate": 0.0009061778235828253, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "1:26:11", "remaining_time": "5:48:42"} +{"current_steps": 2150, "total_steps": 10798, "loss": 1.9999, "reward": null, "learning_rate": 0.0009054129328980229, "epoch": 0.4, "percentage": 19.91, "elapsed_time": "1:32:37", "remaining_time": "6:12:35"} +{"current_steps": 2150, "total_steps": 10798, "loss": 1.9999, "reward": null, "learning_rate": 0.0009054129328980229, "epoch": 0.4, "percentage": 19.91, "elapsed_time": "1:26:34", "remaining_time": "5:48:14"} +{"current_steps": 2150, "total_steps": 10798, "loss": 1.9999, "reward": null, "learning_rate": 0.0009054129328980229, "epoch": 0.4, "percentage": 19.91, "elapsed_time": "1:26:32", "remaining_time": "5:48:07"} +{"current_steps": 2150, "total_steps": 10798, "loss": 1.9999, "reward": null, "learning_rate": 0.0009054129328980229, "epoch": 0.4, "percentage": 19.91, "elapsed_time": "1:26:36", "remaining_time": "5:48:21"} +{"current_steps": 2160, "total_steps": 10798, "loss": 2.0022, "reward": null, "learning_rate": 0.000904559794464287, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "1:26:59", "remaining_time": "5:47:55"} +{"current_steps": 2160, "total_steps": 10798, "loss": 2.0022, "reward": null, "learning_rate": 0.000904559794464287, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "1:33:01", "remaining_time": "6:12:00"} +{"current_steps": 2160, "total_steps": 10798, "loss": 2.0022, "reward": null, "learning_rate": 0.000904559794464287, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "1:26:58", "remaining_time": "5:47:48"} +{"current_steps": 2160, "total_steps": 10798, "loss": 2.0022, "reward": null, "learning_rate": 0.000904559794464287, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "1:26:56", "remaining_time": "5:47:41"} +{"current_steps": 2170, "total_steps": 10798, "loss": 2.0004, "reward": null, "learning_rate": 0.0009037032315436229, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "1:33:24", "remaining_time": "6:11:24"} +{"current_steps": 2170, "total_steps": 10798, "loss": 2.0004, "reward": null, "learning_rate": 0.0009037032315436229, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "1:27:21", "remaining_time": "5:47:19"} +{"current_steps": 2170, "total_steps": 10798, "loss": 2.0004, "reward": null, "learning_rate": 0.0009037032315436229, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "1:27:19", "remaining_time": "5:47:13"} +{"current_steps": 2170, "total_steps": 10798, "loss": 2.0004, "reward": null, "learning_rate": 0.0009037032315436229, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "1:27:23", "remaining_time": "5:47:26"} +{"current_steps": 2180, "total_steps": 10798, "loss": 1.9936, "reward": null, "learning_rate": 0.0009028432513865994, "epoch": 0.4, "percentage": 20.19, "elapsed_time": "1:27:45", "remaining_time": "5:46:56"} +{"current_steps": 2180, "total_steps": 10798, "loss": 1.9936, "reward": null, "learning_rate": 0.0009028432513865994, "epoch": 0.4, "percentage": 20.19, "elapsed_time": "1:33:48", "remaining_time": "6:10:52"} +{"current_steps": 2180, "total_steps": 10798, "loss": 1.9936, "reward": null, "learning_rate": 0.0009028432513865994, "epoch": 0.4, "percentage": 20.19, "elapsed_time": "1:27:47", "remaining_time": "5:47:03"} +{"current_steps": 2180, "total_steps": 10798, "loss": 1.9936, "reward": null, "learning_rate": 0.0009028432513865994, "epoch": 0.4, "percentage": 20.19, "elapsed_time": "1:27:44", "remaining_time": "5:46:49"} +{"current_steps": 2190, "total_steps": 10798, "loss": 2.0098, "reward": null, "learning_rate": 0.000901979861272711, "epoch": 0.41, "percentage": 20.28, "elapsed_time": "1:34:12", "remaining_time": "6:10:18"} +{"current_steps": 2190, "total_steps": 10798, "loss": 2.0098, "reward": null, "learning_rate": 0.000901979861272711, "epoch": 0.41, "percentage": 20.28, "elapsed_time": "1:28:11", "remaining_time": "5:46:37"} +{"current_steps": 2190, "total_steps": 10798, "loss": 2.0098, "reward": null, "learning_rate": 0.000901979861272711, "epoch": 0.41, "percentage": 20.28, "elapsed_time": "1:28:07", "remaining_time": "5:46:24"} +{"current_steps": 2190, "total_steps": 10798, "loss": 2.0098, "reward": null, "learning_rate": 0.000901979861272711, "epoch": 0.41, "percentage": 20.28, "elapsed_time": "1:28:09", "remaining_time": "5:46:30"} +{"current_steps": 2200, "total_steps": 10798, "loss": 1.9829, "reward": null, "learning_rate": 0.0009011130685103166, "epoch": 0.41, "percentage": 20.37, "elapsed_time": "1:34:37", "remaining_time": "6:09:49"} +{"current_steps": 2200, "total_steps": 10798, "loss": 1.9829, "reward": null, "learning_rate": 0.0009011130685103166, "epoch": 0.41, "percentage": 20.37, "elapsed_time": "1:28:32", "remaining_time": "5:46:03"} +{"current_steps": 2200, "total_steps": 10798, "loss": 1.9829, "reward": null, "learning_rate": 0.0009011130685103166, "epoch": 0.41, "percentage": 20.37, "elapsed_time": "1:28:34", "remaining_time": "5:46:09"} +{"current_steps": 2200, "total_steps": 10798, "loss": 1.9829, "reward": null, "learning_rate": 0.0009011130685103166, "epoch": 0.41, "percentage": 20.37, "elapsed_time": "1:28:36", "remaining_time": "5:46:16"} +{"current_steps": 2210, "total_steps": 10798, "loss": 2.0135, "reward": null, "learning_rate": 0.0009002428804365775, "epoch": 0.41, "percentage": 20.47, "elapsed_time": "1:29:00", "remaining_time": "5:45:53"} +{"current_steps": 2210, "total_steps": 10798, "loss": 2.0135, "reward": null, "learning_rate": 0.0009002428804365775, "epoch": 0.41, "percentage": 20.47, "elapsed_time": "1:35:02", "remaining_time": "6:09:18"} +{"current_steps": 2210, "total_steps": 10798, "loss": 2.0135, "reward": null, "learning_rate": 0.0009002428804365775, "epoch": 0.41, "percentage": 20.47, "elapsed_time": "1:28:58", "remaining_time": "5:45:46"} +{"current_steps": 2210, "total_steps": 10798, "loss": 2.0135, "reward": null, "learning_rate": 0.0009002428804365775, "epoch": 0.41, "percentage": 20.47, "elapsed_time": "1:28:57", "remaining_time": "5:45:40"} +{"current_steps": 2220, "total_steps": 10798, "loss": 2.0526, "reward": null, "learning_rate": 0.0008993693044173954, "epoch": 0.41, "percentage": 20.56, "elapsed_time": "1:29:25", "remaining_time": "5:45:31"} +{"current_steps": 2220, "total_steps": 10798, "loss": 2.0526, "reward": null, "learning_rate": 0.0008993693044173954, "epoch": 0.41, "percentage": 20.56, "elapsed_time": "1:29:23", "remaining_time": "5:45:24"} +{"current_steps": 2220, "total_steps": 10798, "loss": 2.0526, "reward": null, "learning_rate": 0.0008993693044173954, "epoch": 0.41, "percentage": 20.56, "elapsed_time": "1:35:28", "remaining_time": "6:08:54"} +{"current_steps": 2220, "total_steps": 10798, "loss": 2.0526, "reward": null, "learning_rate": 0.0008993693044173954, "epoch": 0.41, "percentage": 20.56, "elapsed_time": "1:29:26", "remaining_time": "5:45:37"} +{"current_steps": 2230, "total_steps": 10798, "loss": 2.0145, "reward": null, "learning_rate": 0.0008984923478473499, "epoch": 0.41, "percentage": 20.65, "elapsed_time": "1:35:52", "remaining_time": "6:08:22"} +{"current_steps": 2230, "total_steps": 10798, "loss": 2.0145, "reward": null, "learning_rate": 0.0008984923478473499, "epoch": 0.41, "percentage": 20.65, "elapsed_time": "1:29:49", "remaining_time": "5:45:07"} +{"current_steps": 2230, "total_steps": 10798, "loss": 2.0145, "reward": null, "learning_rate": 0.0008984923478473499, "epoch": 0.41, "percentage": 20.65, "elapsed_time": "1:29:51", "remaining_time": "5:45:13"} +{"current_steps": 2230, "total_steps": 10798, "loss": 2.0145, "reward": null, "learning_rate": 0.0008984923478473499, "epoch": 0.41, "percentage": 20.65, "elapsed_time": "1:29:47", "remaining_time": "5:45:00"} +{"current_steps": 2240, "total_steps": 10798, "loss": 2.0364, "reward": null, "learning_rate": 0.0008976120181496365, "epoch": 0.41, "percentage": 20.74, "elapsed_time": "1:36:17", "remaining_time": "6:07:51"} +{"current_steps": 2240, "total_steps": 10798, "loss": 2.0364, "reward": null, "learning_rate": 0.0008976120181496365, "epoch": 0.41, "percentage": 20.74, "elapsed_time": "1:30:15", "remaining_time": "5:44:50"} +{"current_steps": 2240, "total_steps": 10798, "loss": 2.0364, "reward": null, "learning_rate": 0.0008976120181496365, "epoch": 0.41, "percentage": 20.74, "elapsed_time": "1:30:12", "remaining_time": "5:44:38"} +{"current_steps": 2240, "total_steps": 10798, "loss": 2.0364, "reward": null, "learning_rate": 0.0008976120181496365, "epoch": 0.41, "percentage": 20.74, "elapsed_time": "1:30:13", "remaining_time": "5:44:44"} +{"current_steps": 2250, "total_steps": 10798, "loss": 2.019, "reward": null, "learning_rate": 0.0008967283227760028, "epoch": 0.42, "percentage": 20.84, "elapsed_time": "1:30:38", "remaining_time": "5:44:22"} +{"current_steps": 2250, "total_steps": 10798, "loss": 2.019, "reward": null, "learning_rate": 0.0008967283227760028, "epoch": 0.42, "percentage": 20.84, "elapsed_time": "1:30:36", "remaining_time": "5:44:15"} +{"current_steps": 2250, "total_steps": 10798, "loss": 2.019, "reward": null, "learning_rate": 0.0008967283227760028, "epoch": 0.42, "percentage": 20.84, "elapsed_time": "1:30:35", "remaining_time": "5:44:09"} +{"current_steps": 2250, "total_steps": 10798, "loss": 2.019, "reward": null, "learning_rate": 0.0008967283227760028, "epoch": 0.42, "percentage": 20.84, "elapsed_time": "1:36:40", "remaining_time": "6:07:15"} +{"current_steps": 2260, "total_steps": 10798, "loss": 1.9874, "reward": null, "learning_rate": 0.000895841269206686, "epoch": 0.42, "percentage": 20.93, "elapsed_time": "1:30:59", "remaining_time": "5:43:43"} +{"current_steps": 2260, "total_steps": 10798, "loss": 1.9874, "reward": null, "learning_rate": 0.000895841269206686, "epoch": 0.42, "percentage": 20.93, "elapsed_time": "1:37:03", "remaining_time": "6:06:42"} +{"current_steps": 2260, "total_steps": 10798, "loss": 1.9874, "reward": null, "learning_rate": 0.000895841269206686, "epoch": 0.42, "percentage": 20.93, "elapsed_time": "1:31:00", "remaining_time": "5:43:49"} +{"current_steps": 2260, "total_steps": 10798, "loss": 1.9874, "reward": null, "learning_rate": 0.000895841269206686, "epoch": 0.42, "percentage": 20.93, "elapsed_time": "1:31:02", "remaining_time": "5:43:56"} +{"current_steps": 2270, "total_steps": 10798, "loss": 2.0699, "reward": null, "learning_rate": 0.0008949508649503495, "epoch": 0.42, "percentage": 21.02, "elapsed_time": "1:31:25", "remaining_time": "5:43:27"} +{"current_steps": 2270, "total_steps": 10798, "loss": 2.0699, "reward": null, "learning_rate": 0.0008949508649503495, "epoch": 0.42, "percentage": 21.02, "elapsed_time": "1:37:28", "remaining_time": "6:06:12"} +{"current_steps": 2270, "total_steps": 10798, "loss": 2.0699, "reward": null, "learning_rate": 0.0008949508649503495, "epoch": 0.42, "percentage": 21.02, "elapsed_time": "1:31:27", "remaining_time": "5:43:34"} +{"current_steps": 2270, "total_steps": 10798, "loss": 2.0699, "reward": null, "learning_rate": 0.0008949508649503495, "epoch": 0.42, "percentage": 21.02, "elapsed_time": "1:31:23", "remaining_time": "5:43:21"} +{"current_steps": 2280, "total_steps": 10798, "loss": 2.0407, "reward": null, "learning_rate": 0.0008940571175440196, "epoch": 0.42, "percentage": 21.12, "elapsed_time": "1:37:52", "remaining_time": "6:05:40"} +{"current_steps": 2280, "total_steps": 10798, "loss": 2.0407, "reward": null, "learning_rate": 0.0008940571175440196, "epoch": 0.42, "percentage": 21.12, "elapsed_time": "1:31:51", "remaining_time": "5:43:10"} +{"current_steps": 2280, "total_steps": 10798, "loss": 2.0407, "reward": null, "learning_rate": 0.0008940571175440196, "epoch": 0.42, "percentage": 21.12, "elapsed_time": "1:31:48", "remaining_time": "5:42:57"} +{"current_steps": 2280, "total_steps": 10798, "loss": 2.0407, "reward": null, "learning_rate": 0.0008940571175440196, "epoch": 0.42, "percentage": 21.12, "elapsed_time": "1:31:49", "remaining_time": "5:43:03"} +{"current_steps": 2290, "total_steps": 10798, "loss": 2.0176, "reward": null, "learning_rate": 0.0008931600345530213, "epoch": 0.42, "percentage": 21.21, "elapsed_time": "1:32:14", "remaining_time": "5:42:43"} +{"current_steps": 2290, "total_steps": 10798, "loss": 2.0176, "reward": null, "learning_rate": 0.0008931600345530213, "epoch": 0.42, "percentage": 21.21, "elapsed_time": "1:38:16", "remaining_time": "6:05:06"} +{"current_steps": 2290, "total_steps": 10798, "loss": 2.0176, "reward": null, "learning_rate": 0.0008931600345530213, "epoch": 0.42, "percentage": 21.21, "elapsed_time": "1:32:11", "remaining_time": "5:42:30"} +{"current_steps": 2290, "total_steps": 10798, "loss": 2.0176, "reward": null, "learning_rate": 0.0008931600345530213, "epoch": 0.42, "percentage": 21.21, "elapsed_time": "1:32:13", "remaining_time": "5:42:36"} +{"current_steps": 2300, "total_steps": 10798, "loss": 2.0235, "reward": null, "learning_rate": 0.0008922596235709142, "epoch": 0.43, "percentage": 21.3, "elapsed_time": "1:32:39", "remaining_time": "5:42:20"} +{"current_steps": 2300, "total_steps": 10798, "loss": 2.0235, "reward": null, "learning_rate": 0.0008922596235709142, "epoch": 0.43, "percentage": 21.3, "elapsed_time": "1:32:35", "remaining_time": "5:42:08"} +{"current_steps": 2300, "total_steps": 10798, "loss": 2.0235, "reward": null, "learning_rate": 0.0008922596235709142, "epoch": 0.43, "percentage": 21.3, "elapsed_time": "1:32:37", "remaining_time": "5:42:13"} +{"current_steps": 2300, "total_steps": 10798, "loss": 2.0235, "reward": null, "learning_rate": 0.0008922596235709142, "epoch": 0.43, "percentage": 21.3, "elapsed_time": "1:38:40", "remaining_time": "6:04:35"} +{"current_steps": 2310, "total_steps": 10798, "loss": 2.0268, "reward": null, "learning_rate": 0.0008913558922194287, "epoch": 0.43, "percentage": 21.39, "elapsed_time": "1:32:59", "remaining_time": "5:41:42"} +{"current_steps": 2310, "total_steps": 10798, "loss": 2.0268, "reward": null, "learning_rate": 0.0008913558922194287, "epoch": 0.43, "percentage": 21.39, "elapsed_time": "1:33:03", "remaining_time": "5:41:55"} +{"current_steps": 2310, "total_steps": 10798, "loss": 2.0268, "reward": null, "learning_rate": 0.0008913558922194287, "epoch": 0.43, "percentage": 21.39, "elapsed_time": "1:33:01", "remaining_time": "5:41:48"} +{"current_steps": 2310, "total_steps": 10798, "loss": 2.0268, "reward": null, "learning_rate": 0.0008913558922194287, "epoch": 0.43, "percentage": 21.39, "elapsed_time": "1:39:04", "remaining_time": "6:04:03"} +{"current_steps": 2320, "total_steps": 10798, "loss": 2.0279, "reward": null, "learning_rate": 0.000890448848148401, "epoch": 0.43, "percentage": 21.49, "elapsed_time": "1:33:25", "remaining_time": "5:41:24"} +{"current_steps": 2320, "total_steps": 10798, "loss": 2.0279, "reward": null, "learning_rate": 0.000890448848148401, "epoch": 0.43, "percentage": 21.49, "elapsed_time": "1:33:24", "remaining_time": "5:41:18"} +{"current_steps": 2320, "total_steps": 10798, "loss": 2.0279, "reward": null, "learning_rate": 0.000890448848148401, "epoch": 0.43, "percentage": 21.49, "elapsed_time": "1:33:27", "remaining_time": "5:41:31"} +{"current_steps": 2320, "total_steps": 10798, "loss": 2.0279, "reward": null, "learning_rate": 0.000890448848148401, "epoch": 0.43, "percentage": 21.49, "elapsed_time": "1:39:28", "remaining_time": "6:03:31"} +{"current_steps": 2330, "total_steps": 10798, "loss": 2.0073, "reward": null, "learning_rate": 0.0008895384990357087, "epoch": 0.43, "percentage": 21.58, "elapsed_time": "1:39:52", "remaining_time": "6:02:59"} +{"current_steps": 2330, "total_steps": 10798, "loss": 2.0073, "reward": null, "learning_rate": 0.0008895384990357087, "epoch": 0.43, "percentage": 21.58, "elapsed_time": "1:33:51", "remaining_time": "5:41:06"} +{"current_steps": 2330, "total_steps": 10798, "loss": 2.0073, "reward": null, "learning_rate": 0.0008895384990357087, "epoch": 0.43, "percentage": 21.58, "elapsed_time": "1:33:47", "remaining_time": "5:40:53"} +{"current_steps": 2330, "total_steps": 10798, "loss": 2.0073, "reward": null, "learning_rate": 0.0008895384990357087, "epoch": 0.43, "percentage": 21.58, "elapsed_time": "1:33:49", "remaining_time": "5:40:59"} +{"current_steps": 2340, "total_steps": 10798, "loss": 2.0262, "reward": null, "learning_rate": 0.0008886248525872056, "epoch": 0.43, "percentage": 21.67, "elapsed_time": "1:40:15", "remaining_time": "6:02:24"} +{"current_steps": 2340, "total_steps": 10798, "loss": 2.0262, "reward": null, "learning_rate": 0.0008886248525872056, "epoch": 0.43, "percentage": 21.67, "elapsed_time": "1:34:14", "remaining_time": "5:40:38"} +{"current_steps": 2340, "total_steps": 10798, "loss": 2.0262, "reward": null, "learning_rate": 0.0008886248525872056, "epoch": 0.43, "percentage": 21.67, "elapsed_time": "1:34:11", "remaining_time": "5:40:25"} +{"current_steps": 2340, "total_steps": 10798, "loss": 2.0262, "reward": null, "learning_rate": 0.0008886248525872056, "epoch": 0.43, "percentage": 21.67, "elapsed_time": "1:34:12", "remaining_time": "5:40:31"} +{"current_steps": 2350, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0008877079165366566, "epoch": 0.44, "percentage": 21.76, "elapsed_time": "1:40:39", "remaining_time": "6:01:52"} +{"current_steps": 2350, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0008877079165366566, "epoch": 0.44, "percentage": 21.76, "elapsed_time": "1:34:34", "remaining_time": "5:40:00"} +{"current_steps": 2350, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0008877079165366566, "epoch": 0.44, "percentage": 21.76, "elapsed_time": "1:34:38", "remaining_time": "5:40:12"} +{"current_steps": 2350, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0008877079165366566, "epoch": 0.44, "percentage": 21.76, "elapsed_time": "1:34:36", "remaining_time": "5:40:06"} +{"current_steps": 2360, "total_steps": 10798, "loss": 2.042, "reward": null, "learning_rate": 0.000886787698645672, "epoch": 0.44, "percentage": 21.86, "elapsed_time": "1:34:59", "remaining_time": "5:39:38"} +{"current_steps": 2360, "total_steps": 10798, "loss": 2.042, "reward": null, "learning_rate": 0.000886787698645672, "epoch": 0.44, "percentage": 21.86, "elapsed_time": "1:35:01", "remaining_time": "5:39:44"} +{"current_steps": 2360, "total_steps": 10798, "loss": 2.042, "reward": null, "learning_rate": 0.000886787698645672, "epoch": 0.44, "percentage": 21.86, "elapsed_time": "1:35:03", "remaining_time": "5:39:50"} +{"current_steps": 2360, "total_steps": 10798, "loss": 2.042, "reward": null, "learning_rate": 0.000886787698645672, "epoch": 0.44, "percentage": 21.86, "elapsed_time": "1:41:04", "remaining_time": "6:01:23"} +{"current_steps": 2370, "total_steps": 10798, "loss": 2.0129, "reward": null, "learning_rate": 0.0008858642067036424, "epoch": 0.44, "percentage": 21.95, "elapsed_time": "1:35:26", "remaining_time": "5:39:23"} +{"current_steps": 2370, "total_steps": 10798, "loss": 2.0129, "reward": null, "learning_rate": 0.0008858642067036424, "epoch": 0.44, "percentage": 21.95, "elapsed_time": "1:35:28", "remaining_time": "5:39:29"} +{"current_steps": 2370, "total_steps": 10798, "loss": 2.0129, "reward": null, "learning_rate": 0.0008858642067036424, "epoch": 0.44, "percentage": 21.95, "elapsed_time": "1:35:24", "remaining_time": "5:39:17"} +{"current_steps": 2370, "total_steps": 10798, "loss": 2.0129, "reward": null, "learning_rate": 0.0008858642067036424, "epoch": 0.44, "percentage": 21.95, "elapsed_time": "1:41:29", "remaining_time": "6:00:55"} +{"current_steps": 2380, "total_steps": 10798, "loss": 2.0264, "reward": null, "learning_rate": 0.0008849374485276715, "epoch": 0.44, "percentage": 22.04, "elapsed_time": "1:35:52", "remaining_time": "5:39:06"} +{"current_steps": 2380, "total_steps": 10798, "loss": 2.0264, "reward": null, "learning_rate": 0.0008849374485276715, "epoch": 0.44, "percentage": 22.04, "elapsed_time": "1:41:54", "remaining_time": "6:00:25"} +{"current_steps": 2380, "total_steps": 10798, "loss": 2.0264, "reward": null, "learning_rate": 0.0008849374485276715, "epoch": 0.44, "percentage": 22.04, "elapsed_time": "1:35:49", "remaining_time": "5:38:54"} +{"current_steps": 2380, "total_steps": 10798, "loss": 2.0264, "reward": null, "learning_rate": 0.0008849374485276715, "epoch": 0.44, "percentage": 22.04, "elapsed_time": "1:35:50", "remaining_time": "5:39:00"} +{"current_steps": 2390, "total_steps": 10798, "loss": 2.0211, "reward": null, "learning_rate": 0.000884007431962512, "epoch": 0.44, "percentage": 22.13, "elapsed_time": "1:36:15", "remaining_time": "5:38:38"} +{"current_steps": 2390, "total_steps": 10798, "loss": 2.0211, "reward": null, "learning_rate": 0.000884007431962512, "epoch": 0.44, "percentage": 22.13, "elapsed_time": "1:36:17", "remaining_time": "5:38:44"} +{"current_steps": 2390, "total_steps": 10798, "loss": 2.0211, "reward": null, "learning_rate": 0.000884007431962512, "epoch": 0.44, "percentage": 22.13, "elapsed_time": "1:42:18", "remaining_time": "5:59:56"} +{"current_steps": 2390, "total_steps": 10798, "loss": 2.0211, "reward": null, "learning_rate": 0.000884007431962512, "epoch": 0.44, "percentage": 22.13, "elapsed_time": "1:36:14", "remaining_time": "5:38:33"} +{"current_steps": 2400, "total_steps": 10798, "loss": 2.0175, "reward": null, "learning_rate": 0.0008830741648804967, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "1:42:44", "remaining_time": "5:59:30"} +{"current_steps": 2400, "total_steps": 10798, "loss": 2.0175, "reward": null, "learning_rate": 0.0008830741648804967, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "1:36:39", "remaining_time": "5:38:13"} +{"current_steps": 2400, "total_steps": 10798, "loss": 2.0175, "reward": null, "learning_rate": 0.0008830741648804967, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "1:36:41", "remaining_time": "5:38:19"} +{"current_steps": 2400, "total_steps": 10798, "loss": 2.0175, "reward": null, "learning_rate": 0.0008830741648804967, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "1:36:43", "remaining_time": "5:38:25"} +{"current_steps": 2410, "total_steps": 10798, "loss": 2.0423, "reward": null, "learning_rate": 0.0008821376551814739, "epoch": 0.45, "percentage": 22.32, "elapsed_time": "1:37:08", "remaining_time": "5:38:06"} +{"current_steps": 2410, "total_steps": 10798, "loss": 2.0423, "reward": null, "learning_rate": 0.0008821376551814739, "epoch": 0.45, "percentage": 22.32, "elapsed_time": "1:37:05", "remaining_time": "5:37:54"} +{"current_steps": 2410, "total_steps": 10798, "loss": 2.0423, "reward": null, "learning_rate": 0.0008821376551814739, "epoch": 0.45, "percentage": 22.32, "elapsed_time": "1:37:06", "remaining_time": "5:38:00"} +{"current_steps": 2410, "total_steps": 10798, "loss": 2.0423, "reward": null, "learning_rate": 0.0008821376551814739, "epoch": 0.45, "percentage": 22.32, "elapsed_time": "1:43:10", "remaining_time": "5:59:04"} +{"current_steps": 2420, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0008811979107927396, "epoch": 0.45, "percentage": 22.41, "elapsed_time": "1:43:33", "remaining_time": "5:58:31"} +{"current_steps": 2420, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0008811979107927396, "epoch": 0.45, "percentage": 22.41, "elapsed_time": "1:37:30", "remaining_time": "5:37:33"} +{"current_steps": 2420, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0008811979107927396, "epoch": 0.45, "percentage": 22.41, "elapsed_time": "1:37:32", "remaining_time": "5:37:39"} +{"current_steps": 2420, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0008811979107927396, "epoch": 0.45, "percentage": 22.41, "elapsed_time": "1:37:28", "remaining_time": "5:37:28"} +{"current_steps": 2430, "total_steps": 10798, "loss": 2.0422, "reward": null, "learning_rate": 0.0008802549396689705, "epoch": 0.45, "percentage": 22.5, "elapsed_time": "1:43:56", "remaining_time": "5:57:56"} +{"current_steps": 2430, "total_steps": 10798, "loss": 2.0422, "reward": null, "learning_rate": 0.0008802549396689705, "epoch": 0.45, "percentage": 22.5, "elapsed_time": "1:37:55", "remaining_time": "5:37:11"} +{"current_steps": 2430, "total_steps": 10798, "loss": 2.0422, "reward": null, "learning_rate": 0.0008802549396689705, "epoch": 0.45, "percentage": 22.5, "elapsed_time": "1:37:51", "remaining_time": "5:37:00"} +{"current_steps": 2430, "total_steps": 10798, "loss": 2.0422, "reward": null, "learning_rate": 0.0008802549396689705, "epoch": 0.45, "percentage": 22.5, "elapsed_time": "1:37:53", "remaining_time": "5:37:05"} +{"current_steps": 2440, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008793087497921566, "epoch": 0.45, "percentage": 22.6, "elapsed_time": "1:38:17", "remaining_time": "5:36:42"} +{"current_steps": 2440, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008793087497921566, "epoch": 0.45, "percentage": 22.6, "elapsed_time": "1:38:16", "remaining_time": "5:36:36"} +{"current_steps": 2440, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008793087497921566, "epoch": 0.45, "percentage": 22.6, "elapsed_time": "1:44:20", "remaining_time": "5:57:26"} +{"current_steps": 2440, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008793087497921566, "epoch": 0.45, "percentage": 22.6, "elapsed_time": "1:38:19", "remaining_time": "5:36:48"} +{"current_steps": 2450, "total_steps": 10798, "loss": 1.9958, "reward": null, "learning_rate": 0.0008784544334882426, "epoch": 0.45, "percentage": 22.69, "elapsed_time": "1:44:45", "remaining_time": "5:56:55"} +{"current_steps": 2450, "total_steps": 10798, "loss": 1.9958, "reward": null, "learning_rate": 0.0008784544334882426, "epoch": 0.45, "percentage": 22.69, "elapsed_time": "1:38:41", "remaining_time": "5:36:18"} +{"current_steps": 2450, "total_steps": 10798, "loss": 1.9958, "reward": null, "learning_rate": 0.0008784544334882426, "epoch": 0.45, "percentage": 22.69, "elapsed_time": "1:38:40", "remaining_time": "5:36:12"} +{"current_steps": 2450, "total_steps": 10798, "loss": 1.9958, "reward": null, "learning_rate": 0.0008784544334882426, "epoch": 0.45, "percentage": 22.69, "elapsed_time": "1:38:43", "remaining_time": "5:36:24"} +{"current_steps": 2460, "total_steps": 10798, "loss": 2.0348, "reward": null, "learning_rate": 0.000877502150068553, "epoch": 0.46, "percentage": 22.78, "elapsed_time": "1:45:08", "remaining_time": "5:56:23"} +{"current_steps": 2460, "total_steps": 10798, "loss": 2.0348, "reward": null, "learning_rate": 0.000877502150068553, "epoch": 0.46, "percentage": 22.78, "elapsed_time": "1:39:07", "remaining_time": "5:35:58"} +{"current_steps": 2460, "total_steps": 10798, "loss": 2.0348, "reward": null, "learning_rate": 0.000877502150068553, "epoch": 0.46, "percentage": 22.78, "elapsed_time": "1:39:05", "remaining_time": "5:35:52"} +{"current_steps": 2460, "total_steps": 10798, "loss": 2.0348, "reward": null, "learning_rate": 0.000877502150068553, "epoch": 0.46, "percentage": 22.78, "elapsed_time": "1:39:04", "remaining_time": "5:35:47"} +{"current_steps": 2470, "total_steps": 10798, "loss": 2.0232, "reward": null, "learning_rate": 0.0008765466711974225, "epoch": 0.46, "percentage": 22.87, "elapsed_time": "1:39:31", "remaining_time": "5:35:35"} +{"current_steps": 2470, "total_steps": 10798, "loss": 2.0232, "reward": null, "learning_rate": 0.0008765466711974225, "epoch": 0.46, "percentage": 22.87, "elapsed_time": "1:39:30", "remaining_time": "5:35:29"} +{"current_steps": 2470, "total_steps": 10798, "loss": 2.0232, "reward": null, "learning_rate": 0.0008765466711974225, "epoch": 0.46, "percentage": 22.87, "elapsed_time": "1:45:33", "remaining_time": "5:55:53"} +{"current_steps": 2470, "total_steps": 10798, "loss": 2.0232, "reward": null, "learning_rate": 0.0008765466711974225, "epoch": 0.46, "percentage": 22.87, "elapsed_time": "1:39:28", "remaining_time": "5:35:23"} +{"current_steps": 2480, "total_steps": 10798, "loss": 1.9953, "reward": null, "learning_rate": 0.0008755880049627157, "epoch": 0.46, "percentage": 22.97, "elapsed_time": "1:39:54", "remaining_time": "5:35:05"} +{"current_steps": 2480, "total_steps": 10798, "loss": 1.9953, "reward": null, "learning_rate": 0.0008755880049627157, "epoch": 0.46, "percentage": 22.97, "elapsed_time": "1:39:56", "remaining_time": "5:35:11"} +{"current_steps": 2480, "total_steps": 10798, "loss": 1.9953, "reward": null, "learning_rate": 0.0008755880049627157, "epoch": 0.46, "percentage": 22.97, "elapsed_time": "1:39:52", "remaining_time": "5:34:59"} +{"current_steps": 2480, "total_steps": 10798, "loss": 1.9953, "reward": null, "learning_rate": 0.0008755880049627157, "epoch": 0.46, "percentage": 22.97, "elapsed_time": "1:45:57", "remaining_time": "5:55:23"} +{"current_steps": 2490, "total_steps": 10798, "loss": 2.0223, "reward": null, "learning_rate": 0.0008746261594792776, "epoch": 0.46, "percentage": 23.06, "elapsed_time": "1:46:21", "remaining_time": "5:54:53"} +{"current_steps": 2490, "total_steps": 10798, "loss": 2.0223, "reward": null, "learning_rate": 0.0008746261594792776, "epoch": 0.46, "percentage": 23.06, "elapsed_time": "1:40:18", "remaining_time": "5:34:41"} +{"current_steps": 2490, "total_steps": 10798, "loss": 2.0223, "reward": null, "learning_rate": 0.0008746261594792776, "epoch": 0.46, "percentage": 23.06, "elapsed_time": "1:40:20", "remaining_time": "5:34:47"} +{"current_steps": 2490, "total_steps": 10798, "loss": 2.0223, "reward": null, "learning_rate": 0.0008746261594792776, "epoch": 0.46, "percentage": 23.06, "elapsed_time": "1:40:17", "remaining_time": "5:34:36"} +{"current_steps": 2500, "total_steps": 10798, "loss": 2.0332, "reward": null, "learning_rate": 0.0008736611428888644, "epoch": 0.46, "percentage": 23.15, "elapsed_time": "1:46:46", "remaining_time": "5:54:23"} +{"current_steps": 2500, "total_steps": 10798, "loss": 2.0332, "reward": null, "learning_rate": 0.0008736611428888644, "epoch": 0.46, "percentage": 23.15, "elapsed_time": "1:40:44", "remaining_time": "5:34:23"} +{"current_steps": 2500, "total_steps": 10798, "loss": 2.0332, "reward": null, "learning_rate": 0.0008736611428888644, "epoch": 0.46, "percentage": 23.15, "elapsed_time": "1:40:42", "remaining_time": "5:34:17"} +{"current_steps": 2500, "total_steps": 10798, "loss": 2.0332, "reward": null, "learning_rate": 0.0008736611428888644, "epoch": 0.46, "percentage": 23.15, "elapsed_time": "1:40:41", "remaining_time": "5:34:12"} +{"current_steps": 2510, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008726929633600753, "epoch": 0.46, "percentage": 23.25, "elapsed_time": "1:47:10", "remaining_time": "5:53:52"} +{"current_steps": 2510, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008726929633600753, "epoch": 0.46, "percentage": 23.25, "elapsed_time": "1:41:05", "remaining_time": "5:33:48"} +{"current_steps": 2510, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008726929633600753, "epoch": 0.46, "percentage": 23.25, "elapsed_time": "1:41:07", "remaining_time": "5:33:53"} +{"current_steps": 2510, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008726929633600753, "epoch": 0.46, "percentage": 23.25, "elapsed_time": "1:41:08", "remaining_time": "5:33:59"} +{"current_steps": 2520, "total_steps": 10798, "loss": 2.002, "reward": null, "learning_rate": 0.0008717216290882824, "epoch": 0.47, "percentage": 23.34, "elapsed_time": "1:41:32", "remaining_time": "5:33:33"} +{"current_steps": 2520, "total_steps": 10798, "loss": 2.002, "reward": null, "learning_rate": 0.0008717216290882824, "epoch": 0.47, "percentage": 23.34, "elapsed_time": "1:47:34", "remaining_time": "5:53:21"} +{"current_steps": 2520, "total_steps": 10798, "loss": 2.002, "reward": null, "learning_rate": 0.0008717216290882824, "epoch": 0.47, "percentage": 23.34, "elapsed_time": "1:41:29", "remaining_time": "5:33:22"} +{"current_steps": 2520, "total_steps": 10798, "loss": 2.002, "reward": null, "learning_rate": 0.0008717216290882824, "epoch": 0.47, "percentage": 23.34, "elapsed_time": "1:41:30", "remaining_time": "5:33:28"} +{"current_steps": 2530, "total_steps": 10798, "loss": 2.0594, "reward": null, "learning_rate": 0.0008707471482955622, "epoch": 0.47, "percentage": 23.43, "elapsed_time": "1:41:55", "remaining_time": "5:33:05"} +{"current_steps": 2530, "total_steps": 10798, "loss": 2.0594, "reward": null, "learning_rate": 0.0008707471482955622, "epoch": 0.47, "percentage": 23.43, "elapsed_time": "1:41:53", "remaining_time": "5:32:59"} +{"current_steps": 2530, "total_steps": 10798, "loss": 2.0594, "reward": null, "learning_rate": 0.0008707471482955622, "epoch": 0.47, "percentage": 23.43, "elapsed_time": "1:41:57", "remaining_time": "5:33:10"} +{"current_steps": 2530, "total_steps": 10798, "loss": 2.0594, "reward": null, "learning_rate": 0.0008707471482955622, "epoch": 0.47, "percentage": 23.43, "elapsed_time": "1:47:58", "remaining_time": "5:52:52"} +{"current_steps": 2540, "total_steps": 10798, "loss": 2.0214, "reward": null, "learning_rate": 0.0008697695292306253, "epoch": 0.47, "percentage": 23.52, "elapsed_time": "1:42:19", "remaining_time": "5:32:41"} +{"current_steps": 2540, "total_steps": 10798, "loss": 2.0214, "reward": null, "learning_rate": 0.0008697695292306253, "epoch": 0.47, "percentage": 23.52, "elapsed_time": "1:48:22", "remaining_time": "5:52:22"} +{"current_steps": 2540, "total_steps": 10798, "loss": 2.0214, "reward": null, "learning_rate": 0.0008697695292306253, "epoch": 0.47, "percentage": 23.52, "elapsed_time": "1:42:18", "remaining_time": "5:32:35"} +{"current_steps": 2540, "total_steps": 10798, "loss": 2.0214, "reward": null, "learning_rate": 0.0008697695292306253, "epoch": 0.47, "percentage": 23.52, "elapsed_time": "1:42:21", "remaining_time": "5:32:46"} +{"current_steps": 2550, "total_steps": 10798, "loss": 1.994, "reward": null, "learning_rate": 0.0008687887801687473, "epoch": 0.47, "percentage": 23.62, "elapsed_time": "1:42:43", "remaining_time": "5:32:16"} +{"current_steps": 2550, "total_steps": 10798, "loss": 1.994, "reward": null, "learning_rate": 0.0008687887801687473, "epoch": 0.47, "percentage": 23.62, "elapsed_time": "1:48:46", "remaining_time": "5:51:51"} +{"current_steps": 2550, "total_steps": 10798, "loss": 1.994, "reward": null, "learning_rate": 0.0008687887801687473, "epoch": 0.47, "percentage": 23.62, "elapsed_time": "1:42:42", "remaining_time": "5:32:11"} +{"current_steps": 2550, "total_steps": 10798, "loss": 1.994, "reward": null, "learning_rate": 0.0008687887801687473, "epoch": 0.47, "percentage": 23.62, "elapsed_time": "1:42:45", "remaining_time": "5:32:22"} +{"current_steps": 2560, "total_steps": 10798, "loss": 2.0338, "reward": null, "learning_rate": 0.0008678049094116979, "epoch": 0.47, "percentage": 23.71, "elapsed_time": "1:49:11", "remaining_time": "5:51:22"} +{"current_steps": 2560, "total_steps": 10798, "loss": 2.0338, "reward": null, "learning_rate": 0.0008678049094116979, "epoch": 0.47, "percentage": 23.71, "elapsed_time": "1:43:06", "remaining_time": "5:31:48"} +{"current_steps": 2560, "total_steps": 10798, "loss": 2.0338, "reward": null, "learning_rate": 0.0008678049094116979, "epoch": 0.47, "percentage": 23.71, "elapsed_time": "1:43:08", "remaining_time": "5:31:53"} +{"current_steps": 2560, "total_steps": 10798, "loss": 2.0338, "reward": null, "learning_rate": 0.0008678049094116979, "epoch": 0.47, "percentage": 23.71, "elapsed_time": "1:43:10", "remaining_time": "5:31:59"} +{"current_steps": 2570, "total_steps": 10798, "loss": 2.0176, "reward": null, "learning_rate": 0.0008668179252876714, "epoch": 0.48, "percentage": 23.8, "elapsed_time": "1:49:35", "remaining_time": "5:50:50"} +{"current_steps": 2570, "total_steps": 10798, "loss": 2.0176, "reward": null, "learning_rate": 0.0008668179252876714, "epoch": 0.48, "percentage": 23.8, "elapsed_time": "1:43:31", "remaining_time": "5:31:27"} +{"current_steps": 2570, "total_steps": 10798, "loss": 2.0176, "reward": null, "learning_rate": 0.0008668179252876714, "epoch": 0.48, "percentage": 23.8, "elapsed_time": "1:43:33", "remaining_time": "5:31:33"} +{"current_steps": 2570, "total_steps": 10798, "loss": 2.0176, "reward": null, "learning_rate": 0.0008668179252876714, "epoch": 0.48, "percentage": 23.8, "elapsed_time": "1:43:30", "remaining_time": "5:31:22"} +{"current_steps": 2580, "total_steps": 10798, "loss": 2.0013, "reward": null, "learning_rate": 0.0008658278361512161, "epoch": 0.48, "percentage": 23.89, "elapsed_time": "1:43:56", "remaining_time": "5:31:03"} +{"current_steps": 2580, "total_steps": 10798, "loss": 2.0013, "reward": null, "learning_rate": 0.0008658278361512161, "epoch": 0.48, "percentage": 23.89, "elapsed_time": "1:49:59", "remaining_time": "5:50:20"} +{"current_steps": 2580, "total_steps": 10798, "loss": 2.0013, "reward": null, "learning_rate": 0.0008658278361512161, "epoch": 0.48, "percentage": 23.89, "elapsed_time": "1:43:54", "remaining_time": "5:30:58"} +{"current_steps": 2580, "total_steps": 10798, "loss": 2.0013, "reward": null, "learning_rate": 0.0008658278361512161, "epoch": 0.48, "percentage": 23.89, "elapsed_time": "1:43:57", "remaining_time": "5:31:09"} +{"current_steps": 2590, "total_steps": 10798, "loss": 2.0141, "reward": null, "learning_rate": 0.0008648346503831627, "epoch": 0.48, "percentage": 23.99, "elapsed_time": "1:44:19", "remaining_time": "5:30:36"} +{"current_steps": 2590, "total_steps": 10798, "loss": 2.0141, "reward": null, "learning_rate": 0.0008648346503831627, "epoch": 0.48, "percentage": 23.99, "elapsed_time": "1:50:22", "remaining_time": "5:49:47"} +{"current_steps": 2590, "total_steps": 10798, "loss": 2.0141, "reward": null, "learning_rate": 0.0008648346503831627, "epoch": 0.48, "percentage": 23.99, "elapsed_time": "1:44:17", "remaining_time": "5:30:31"} +{"current_steps": 2590, "total_steps": 10798, "loss": 2.0141, "reward": null, "learning_rate": 0.0008648346503831627, "epoch": 0.48, "percentage": 23.99, "elapsed_time": "1:44:21", "remaining_time": "5:30:41"} +{"current_steps": 2600, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0008638383763905546, "epoch": 0.48, "percentage": 24.08, "elapsed_time": "1:50:46", "remaining_time": "5:49:17"} +{"current_steps": 2600, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0008638383763905546, "epoch": 0.48, "percentage": 24.08, "elapsed_time": "1:44:43", "remaining_time": "5:30:11"} +{"current_steps": 2600, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0008638383763905546, "epoch": 0.48, "percentage": 24.08, "elapsed_time": "1:44:45", "remaining_time": "5:30:17"} +{"current_steps": 2600, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0008638383763905546, "epoch": 0.48, "percentage": 24.08, "elapsed_time": "1:44:41", "remaining_time": "5:30:06"} +{"current_steps": 2610, "total_steps": 10798, "loss": 2.039, "reward": null, "learning_rate": 0.0008628390226065761, "epoch": 0.48, "percentage": 24.17, "elapsed_time": "1:45:10", "remaining_time": "5:29:58"} +{"current_steps": 2610, "total_steps": 10798, "loss": 2.039, "reward": null, "learning_rate": 0.0008628390226065761, "epoch": 0.48, "percentage": 24.17, "elapsed_time": "1:51:12", "remaining_time": "5:48:52"} +{"current_steps": 2610, "total_steps": 10798, "loss": 2.039, "reward": null, "learning_rate": 0.0008628390226065761, "epoch": 0.48, "percentage": 24.17, "elapsed_time": "1:45:07", "remaining_time": "5:29:47"} +{"current_steps": 2610, "total_steps": 10798, "loss": 2.039, "reward": null, "learning_rate": 0.0008628390226065761, "epoch": 0.48, "percentage": 24.17, "elapsed_time": "1:45:09", "remaining_time": "5:29:52"} +{"current_steps": 2620, "total_steps": 10798, "loss": 1.9418, "reward": null, "learning_rate": 0.0008618365974904808, "epoch": 0.49, "percentage": 24.26, "elapsed_time": "1:51:35", "remaining_time": "5:48:20"} +{"current_steps": 2620, "total_steps": 10798, "loss": 1.9418, "reward": null, "learning_rate": 0.0008618365974904808, "epoch": 0.49, "percentage": 24.26, "elapsed_time": "1:45:31", "remaining_time": "5:29:21"} +{"current_steps": 2620, "total_steps": 10798, "loss": 1.9418, "reward": null, "learning_rate": 0.0008618365974904808, "epoch": 0.49, "percentage": 24.26, "elapsed_time": "1:45:34", "remaining_time": "5:29:31"} +{"current_steps": 2620, "total_steps": 10798, "loss": 1.9418, "reward": null, "learning_rate": 0.0008618365974904808, "epoch": 0.49, "percentage": 24.26, "elapsed_time": "1:45:32", "remaining_time": "5:29:26"} +{"current_steps": 2630, "total_steps": 10798, "loss": 2.011, "reward": null, "learning_rate": 0.0008608311095275205, "epoch": 0.49, "percentage": 24.36, "elapsed_time": "1:45:55", "remaining_time": "5:28:58"} +{"current_steps": 2630, "total_steps": 10798, "loss": 2.011, "reward": null, "learning_rate": 0.0008608311095275205, "epoch": 0.49, "percentage": 24.36, "elapsed_time": "1:45:57", "remaining_time": "5:29:03"} +{"current_steps": 2630, "total_steps": 10798, "loss": 2.011, "reward": null, "learning_rate": 0.0008608311095275205, "epoch": 0.49, "percentage": 24.36, "elapsed_time": "1:45:58", "remaining_time": "5:29:09"} +{"current_steps": 2630, "total_steps": 10798, "loss": 2.011, "reward": null, "learning_rate": 0.0008608311095275205, "epoch": 0.49, "percentage": 24.36, "elapsed_time": "1:52:00", "remaining_time": "5:47:51"} +{"current_steps": 2640, "total_steps": 10798, "loss": 2.0174, "reward": null, "learning_rate": 0.0008598225672288731, "epoch": 0.49, "percentage": 24.45, "elapsed_time": "1:52:24", "remaining_time": "5:47:21"} +{"current_steps": 2640, "total_steps": 10798, "loss": 2.0174, "reward": null, "learning_rate": 0.0008598225672288731, "epoch": 0.49, "percentage": 24.45, "elapsed_time": "1:46:19", "remaining_time": "5:28:34"} +{"current_steps": 2640, "total_steps": 10798, "loss": 2.0174, "reward": null, "learning_rate": 0.0008598225672288731, "epoch": 0.49, "percentage": 24.45, "elapsed_time": "1:46:21", "remaining_time": "5:28:39"} +{"current_steps": 2640, "total_steps": 10798, "loss": 2.0174, "reward": null, "learning_rate": 0.0008598225672288731, "epoch": 0.49, "percentage": 24.45, "elapsed_time": "1:46:22", "remaining_time": "5:28:44"} +{"current_steps": 2650, "total_steps": 10798, "loss": 1.984, "reward": null, "learning_rate": 0.0008588109791315707, "epoch": 0.49, "percentage": 24.54, "elapsed_time": "1:46:43", "remaining_time": "5:28:08"} +{"current_steps": 2650, "total_steps": 10798, "loss": 1.984, "reward": null, "learning_rate": 0.0008588109791315707, "epoch": 0.49, "percentage": 24.54, "elapsed_time": "1:52:48", "remaining_time": "5:46:50"} +{"current_steps": 2650, "total_steps": 10798, "loss": 1.984, "reward": null, "learning_rate": 0.0008588109791315707, "epoch": 0.49, "percentage": 24.54, "elapsed_time": "1:46:46", "remaining_time": "5:28:18"} +{"current_steps": 2650, "total_steps": 10798, "loss": 1.984, "reward": null, "learning_rate": 0.0008588109791315707, "epoch": 0.49, "percentage": 24.54, "elapsed_time": "1:46:44", "remaining_time": "5:28:13"} +{"current_steps": 2660, "total_steps": 10798, "loss": 2.0437, "reward": null, "learning_rate": 0.000857796353798427, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "1:53:11", "remaining_time": "5:46:19"} +{"current_steps": 2660, "total_steps": 10798, "loss": 2.0437, "reward": null, "learning_rate": 0.000857796353798427, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "1:47:10", "remaining_time": "5:27:53"} +{"current_steps": 2660, "total_steps": 10798, "loss": 2.0437, "reward": null, "learning_rate": 0.000857796353798427, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "1:47:07", "remaining_time": "5:27:43"} +{"current_steps": 2660, "total_steps": 10798, "loss": 2.0437, "reward": null, "learning_rate": 0.000857796353798427, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "1:47:08", "remaining_time": "5:27:48"} +{"current_steps": 2670, "total_steps": 10798, "loss": 2.0255, "reward": null, "learning_rate": 0.0008567786998179654, "epoch": 0.49, "percentage": 24.73, "elapsed_time": "1:53:36", "remaining_time": "5:45:50"} +{"current_steps": 2670, "total_steps": 10798, "loss": 2.0255, "reward": null, "learning_rate": 0.0008567786998179654, "epoch": 0.49, "percentage": 24.73, "elapsed_time": "1:47:31", "remaining_time": "5:27:20"} +{"current_steps": 2670, "total_steps": 10798, "loss": 2.0255, "reward": null, "learning_rate": 0.0008567786998179654, "epoch": 0.49, "percentage": 24.73, "elapsed_time": "1:47:35", "remaining_time": "5:27:30"} +{"current_steps": 2670, "total_steps": 10798, "loss": 2.0255, "reward": null, "learning_rate": 0.0008567786998179654, "epoch": 0.49, "percentage": 24.73, "elapsed_time": "1:47:33", "remaining_time": "5:27:25"} +{"current_steps": 2680, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0008557580258043459, "epoch": 0.5, "percentage": 24.82, "elapsed_time": "1:47:56", "remaining_time": "5:26:57"} +{"current_steps": 2680, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0008557580258043459, "epoch": 0.5, "percentage": 24.82, "elapsed_time": "1:54:01", "remaining_time": "5:45:22"} +{"current_steps": 2680, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0008557580258043459, "epoch": 0.5, "percentage": 24.82, "elapsed_time": "1:47:57", "remaining_time": "5:27:02"} +{"current_steps": 2680, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0008557580258043459, "epoch": 0.5, "percentage": 24.82, "elapsed_time": "1:47:59", "remaining_time": "5:27:07"} +{"current_steps": 2690, "total_steps": 10798, "loss": 2.0201, "reward": null, "learning_rate": 0.0008547343403972918, "epoch": 0.5, "percentage": 24.91, "elapsed_time": "1:54:25", "remaining_time": "5:44:54"} +{"current_steps": 2690, "total_steps": 10798, "loss": 2.0201, "reward": null, "learning_rate": 0.0008547343403972918, "epoch": 0.5, "percentage": 24.91, "elapsed_time": "1:48:22", "remaining_time": "5:26:39"} +{"current_steps": 2690, "total_steps": 10798, "loss": 2.0201, "reward": null, "learning_rate": 0.0008547343403972918, "epoch": 0.5, "percentage": 24.91, "elapsed_time": "1:48:24", "remaining_time": "5:26:45"} +{"current_steps": 2690, "total_steps": 10798, "loss": 2.0201, "reward": null, "learning_rate": 0.0008547343403972918, "epoch": 0.5, "percentage": 24.91, "elapsed_time": "1:48:21", "remaining_time": "5:26:34"} +{"current_steps": 2700, "total_steps": 10798, "loss": 2.0258, "reward": null, "learning_rate": 0.0008537076522620175, "epoch": 0.5, "percentage": 25.0, "elapsed_time": "1:48:47", "remaining_time": "5:26:17"} +{"current_steps": 2700, "total_steps": 10798, "loss": 2.0258, "reward": null, "learning_rate": 0.0008537076522620175, "epoch": 0.5, "percentage": 25.0, "elapsed_time": "1:48:49", "remaining_time": "5:26:22"} +{"current_steps": 2700, "total_steps": 10798, "loss": 2.0258, "reward": null, "learning_rate": 0.0008537076522620175, "epoch": 0.5, "percentage": 25.0, "elapsed_time": "1:48:45", "remaining_time": "5:26:12"} +{"current_steps": 2700, "total_steps": 10798, "loss": 2.0258, "reward": null, "learning_rate": 0.0008537076522620175, "epoch": 0.5, "percentage": 25.0, "elapsed_time": "1:54:50", "remaining_time": "5:44:26"} +{"current_steps": 2710, "total_steps": 10798, "loss": 1.9977, "reward": null, "learning_rate": 0.0008526779700891545, "epoch": 0.5, "percentage": 25.1, "elapsed_time": "1:49:09", "remaining_time": "5:25:46"} +{"current_steps": 2710, "total_steps": 10798, "loss": 1.9977, "reward": null, "learning_rate": 0.0008526779700891545, "epoch": 0.5, "percentage": 25.1, "elapsed_time": "1:55:14", "remaining_time": "5:43:55"} +{"current_steps": 2710, "total_steps": 10798, "loss": 1.9977, "reward": null, "learning_rate": 0.0008526779700891545, "epoch": 0.5, "percentage": 25.1, "elapsed_time": "1:49:12", "remaining_time": "5:25:56"} +{"current_steps": 2710, "total_steps": 10798, "loss": 1.9977, "reward": null, "learning_rate": 0.0008526779700891545, "epoch": 0.5, "percentage": 25.1, "elapsed_time": "1:49:11", "remaining_time": "5:25:51"} +{"current_steps": 2720, "total_steps": 10798, "loss": 1.9835, "reward": null, "learning_rate": 0.0008516453025946781, "epoch": 0.5, "percentage": 25.19, "elapsed_time": "1:49:32", "remaining_time": "5:25:19"} +{"current_steps": 2720, "total_steps": 10798, "loss": 1.9835, "reward": null, "learning_rate": 0.0008516453025946781, "epoch": 0.5, "percentage": 25.19, "elapsed_time": "1:49:34", "remaining_time": "5:25:24"} +{"current_steps": 2720, "total_steps": 10798, "loss": 1.9835, "reward": null, "learning_rate": 0.0008516453025946781, "epoch": 0.5, "percentage": 25.19, "elapsed_time": "1:55:37", "remaining_time": "5:43:22"} +{"current_steps": 2720, "total_steps": 10798, "loss": 1.9835, "reward": null, "learning_rate": 0.0008516453025946781, "epoch": 0.5, "percentage": 25.19, "elapsed_time": "1:49:35", "remaining_time": "5:25:29"} +{"current_steps": 2730, "total_steps": 10798, "loss": 2.0428, "reward": null, "learning_rate": 0.0008506096585198333, "epoch": 0.51, "percentage": 25.28, "elapsed_time": "1:56:02", "remaining_time": "5:42:57"} +{"current_steps": 2730, "total_steps": 10798, "loss": 2.0428, "reward": null, "learning_rate": 0.0008506096585198333, "epoch": 0.51, "percentage": 25.28, "elapsed_time": "1:49:57", "remaining_time": "5:24:59"} +{"current_steps": 2730, "total_steps": 10798, "loss": 2.0428, "reward": null, "learning_rate": 0.0008506096585198333, "epoch": 0.51, "percentage": 25.28, "elapsed_time": "1:49:59", "remaining_time": "5:25:03"} +{"current_steps": 2730, "total_steps": 10798, "loss": 2.0428, "reward": null, "learning_rate": 0.0008506096585198333, "epoch": 0.51, "percentage": 25.28, "elapsed_time": "1:50:01", "remaining_time": "5:25:08"} +{"current_steps": 2740, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.0008495710466310613, "epoch": 0.51, "percentage": 25.38, "elapsed_time": "1:56:26", "remaining_time": "5:42:27"} +{"current_steps": 2740, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.0008495710466310613, "epoch": 0.51, "percentage": 25.38, "elapsed_time": "1:50:25", "remaining_time": "5:24:44"} +{"current_steps": 2740, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.0008495710466310613, "epoch": 0.51, "percentage": 25.38, "elapsed_time": "1:50:23", "remaining_time": "5:24:39"} +{"current_steps": 2740, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.0008495710466310613, "epoch": 0.51, "percentage": 25.38, "elapsed_time": "1:50:21", "remaining_time": "5:24:34"} +{"current_steps": 2750, "total_steps": 10798, "loss": 2.0497, "reward": null, "learning_rate": 0.0008485294757199248, "epoch": 0.51, "percentage": 25.47, "elapsed_time": "1:56:50", "remaining_time": "5:41:56"} +{"current_steps": 2750, "total_steps": 10798, "loss": 2.0497, "reward": null, "learning_rate": 0.0008485294757199248, "epoch": 0.51, "percentage": 25.47, "elapsed_time": "1:50:45", "remaining_time": "5:24:08"} +{"current_steps": 2750, "total_steps": 10798, "loss": 2.0497, "reward": null, "learning_rate": 0.0008485294757199248, "epoch": 0.51, "percentage": 25.47, "elapsed_time": "1:50:48", "remaining_time": "5:24:18"} +{"current_steps": 2750, "total_steps": 10798, "loss": 2.0497, "reward": null, "learning_rate": 0.0008485294757199248, "epoch": 0.51, "percentage": 25.47, "elapsed_time": "1:50:47", "remaining_time": "5:24:13"} +{"current_steps": 2760, "total_steps": 10798, "loss": 2.001, "reward": null, "learning_rate": 0.0008474849546030339, "epoch": 0.51, "percentage": 25.56, "elapsed_time": "1:51:10", "remaining_time": "5:23:46"} +{"current_steps": 2760, "total_steps": 10798, "loss": 2.001, "reward": null, "learning_rate": 0.0008474849546030339, "epoch": 0.51, "percentage": 25.56, "elapsed_time": "1:51:08", "remaining_time": "5:23:42"} +{"current_steps": 2760, "total_steps": 10798, "loss": 2.001, "reward": null, "learning_rate": 0.0008474849546030339, "epoch": 0.51, "percentage": 25.56, "elapsed_time": "1:51:12", "remaining_time": "5:23:51"} +{"current_steps": 2760, "total_steps": 10798, "loss": 2.001, "reward": null, "learning_rate": 0.0008474849546030339, "epoch": 0.51, "percentage": 25.56, "elapsed_time": "1:57:13", "remaining_time": "5:41:24"} +{"current_steps": 2770, "total_steps": 10798, "loss": 1.9824, "reward": null, "learning_rate": 0.0008464374921219714, "epoch": 0.51, "percentage": 25.65, "elapsed_time": "1:51:32", "remaining_time": "5:23:15"} +{"current_steps": 2770, "total_steps": 10798, "loss": 1.9824, "reward": null, "learning_rate": 0.0008464374921219714, "epoch": 0.51, "percentage": 25.65, "elapsed_time": "1:51:33", "remaining_time": "5:23:19"} +{"current_steps": 2770, "total_steps": 10798, "loss": 1.9824, "reward": null, "learning_rate": 0.0008464374921219714, "epoch": 0.51, "percentage": 25.65, "elapsed_time": "1:51:35", "remaining_time": "5:23:24"} +{"current_steps": 2770, "total_steps": 10798, "loss": 1.9824, "reward": null, "learning_rate": 0.0008464374921219714, "epoch": 0.51, "percentage": 25.65, "elapsed_time": "1:57:36", "remaining_time": "5:40:52"} +{"current_steps": 2780, "total_steps": 10798, "loss": 2.0378, "reward": null, "learning_rate": 0.0008453870971432179, "epoch": 0.51, "percentage": 25.75, "elapsed_time": "1:58:01", "remaining_time": "5:40:23"} +{"current_steps": 2780, "total_steps": 10798, "loss": 2.0378, "reward": null, "learning_rate": 0.0008453870971432179, "epoch": 0.51, "percentage": 25.75, "elapsed_time": "1:51:58", "remaining_time": "5:22:56"} +{"current_steps": 2780, "total_steps": 10798, "loss": 2.0378, "reward": null, "learning_rate": 0.0008453870971432179, "epoch": 0.51, "percentage": 25.75, "elapsed_time": "1:51:56", "remaining_time": "5:22:51"} +{"current_steps": 2780, "total_steps": 10798, "loss": 2.0378, "reward": null, "learning_rate": 0.0008453870971432179, "epoch": 0.51, "percentage": 25.75, "elapsed_time": "1:51:59", "remaining_time": "5:23:01"} +{"current_steps": 2790, "total_steps": 10798, "loss": 1.9756, "reward": null, "learning_rate": 0.0008443337785580769, "epoch": 0.52, "percentage": 25.84, "elapsed_time": "1:58:24", "remaining_time": "5:39:52"} +{"current_steps": 2790, "total_steps": 10798, "loss": 1.9756, "reward": null, "learning_rate": 0.0008443337785580769, "epoch": 0.52, "percentage": 25.84, "elapsed_time": "1:52:23", "remaining_time": "5:22:34"} +{"current_steps": 2790, "total_steps": 10798, "loss": 1.9756, "reward": null, "learning_rate": 0.0008443337785580769, "epoch": 0.52, "percentage": 25.84, "elapsed_time": "1:52:19", "remaining_time": "5:22:25"} +{"current_steps": 2790, "total_steps": 10798, "loss": 1.9756, "reward": null, "learning_rate": 0.0008443337785580769, "epoch": 0.52, "percentage": 25.84, "elapsed_time": "1:52:21", "remaining_time": "5:22:29"} +{"current_steps": 2800, "total_steps": 10798, "loss": 2.0563, "reward": null, "learning_rate": 0.0008432775452825992, "epoch": 0.52, "percentage": 25.93, "elapsed_time": "1:58:48", "remaining_time": "5:39:23"} +{"current_steps": 2800, "total_steps": 10798, "loss": 2.0563, "reward": null, "learning_rate": 0.0008432775452825992, "epoch": 0.52, "percentage": 25.93, "elapsed_time": "1:52:44", "remaining_time": "5:22:00"} +{"current_steps": 2800, "total_steps": 10798, "loss": 2.0563, "reward": null, "learning_rate": 0.0008432775452825992, "epoch": 0.52, "percentage": 25.93, "elapsed_time": "1:52:45", "remaining_time": "5:22:05"} +{"current_steps": 2800, "total_steps": 10798, "loss": 2.0563, "reward": null, "learning_rate": 0.0008432775452825992, "epoch": 0.52, "percentage": 25.93, "elapsed_time": "1:52:47", "remaining_time": "5:22:10"} +{"current_steps": 2810, "total_steps": 10798, "loss": 2.0115, "reward": null, "learning_rate": 0.0008422184062575077, "epoch": 0.52, "percentage": 26.02, "elapsed_time": "1:59:13", "remaining_time": "5:38:56"} +{"current_steps": 2810, "total_steps": 10798, "loss": 2.0115, "reward": null, "learning_rate": 0.0008422184062575077, "epoch": 0.52, "percentage": 26.02, "elapsed_time": "1:53:10", "remaining_time": "5:21:43"} +{"current_steps": 2810, "total_steps": 10798, "loss": 2.0115, "reward": null, "learning_rate": 0.0008422184062575077, "epoch": 0.52, "percentage": 26.02, "elapsed_time": "1:53:12", "remaining_time": "5:21:48"} +{"current_steps": 2810, "total_steps": 10798, "loss": 2.0115, "reward": null, "learning_rate": 0.0008422184062575077, "epoch": 0.52, "percentage": 26.02, "elapsed_time": "1:53:08", "remaining_time": "5:21:38"} +{"current_steps": 2820, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0008411563704481217, "epoch": 0.52, "percentage": 26.12, "elapsed_time": "1:53:34", "remaining_time": "5:21:18"} +{"current_steps": 2820, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0008411563704481217, "epoch": 0.52, "percentage": 26.12, "elapsed_time": "1:53:37", "remaining_time": "5:21:28"} +{"current_steps": 2820, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0008411563704481217, "epoch": 0.52, "percentage": 26.12, "elapsed_time": "1:59:39", "remaining_time": "5:38:31"} +{"current_steps": 2820, "total_steps": 10798, "loss": 2.0301, "reward": null, "learning_rate": 0.0008411563704481217, "epoch": 0.52, "percentage": 26.12, "elapsed_time": "1:53:36", "remaining_time": "5:21:23"} +{"current_steps": 2830, "total_steps": 10798, "loss": 1.9912, "reward": null, "learning_rate": 0.0008400914468442814, "epoch": 0.52, "percentage": 26.21, "elapsed_time": "2:00:02", "remaining_time": "5:38:00"} +{"current_steps": 2830, "total_steps": 10798, "loss": 1.9912, "reward": null, "learning_rate": 0.0008400914468442814, "epoch": 0.52, "percentage": 26.21, "elapsed_time": "1:53:59", "remaining_time": "5:20:57"} +{"current_steps": 2830, "total_steps": 10798, "loss": 1.9912, "reward": null, "learning_rate": 0.0008400914468442814, "epoch": 0.52, "percentage": 26.21, "elapsed_time": "1:54:01", "remaining_time": "5:21:02"} +{"current_steps": 2830, "total_steps": 10798, "loss": 1.9912, "reward": null, "learning_rate": 0.0008400914468442814, "epoch": 0.52, "percentage": 26.21, "elapsed_time": "1:53:58", "remaining_time": "5:20:52"} +{"current_steps": 2840, "total_steps": 10798, "loss": 2.0669, "reward": null, "learning_rate": 0.0008390236444602706, "epoch": 0.53, "percentage": 26.3, "elapsed_time": "2:00:27", "remaining_time": "5:37:33"} +{"current_steps": 2840, "total_steps": 10798, "loss": 2.0669, "reward": null, "learning_rate": 0.0008390236444602706, "epoch": 0.53, "percentage": 26.3, "elapsed_time": "1:54:26", "remaining_time": "5:20:40"} +{"current_steps": 2840, "total_steps": 10798, "loss": 2.0669, "reward": null, "learning_rate": 0.0008390236444602706, "epoch": 0.53, "percentage": 26.3, "elapsed_time": "1:54:24", "remaining_time": "5:20:35"} +{"current_steps": 2840, "total_steps": 10798, "loss": 2.0669, "reward": null, "learning_rate": 0.0008390236444602706, "epoch": 0.53, "percentage": 26.3, "elapsed_time": "1:54:22", "remaining_time": "5:20:30"} +{"current_steps": 2850, "total_steps": 10798, "loss": 2.0138, "reward": null, "learning_rate": 0.0008379529723347417, "epoch": 0.53, "percentage": 26.39, "elapsed_time": "2:00:52", "remaining_time": "5:37:05"} +{"current_steps": 2850, "total_steps": 10798, "loss": 2.0138, "reward": null, "learning_rate": 0.0008379529723347417, "epoch": 0.53, "percentage": 26.39, "elapsed_time": "1:54:47", "remaining_time": "5:20:08"} +{"current_steps": 2850, "total_steps": 10798, "loss": 2.0138, "reward": null, "learning_rate": 0.0008379529723347417, "epoch": 0.53, "percentage": 26.39, "elapsed_time": "1:54:49", "remaining_time": "5:20:12"} +{"current_steps": 2850, "total_steps": 10798, "loss": 2.0138, "reward": null, "learning_rate": 0.0008379529723347417, "epoch": 0.53, "percentage": 26.39, "elapsed_time": "1:54:51", "remaining_time": "5:20:17"} +{"current_steps": 2860, "total_steps": 10798, "loss": 2.0486, "reward": null, "learning_rate": 0.0008368794395306386, "epoch": 0.53, "percentage": 26.49, "elapsed_time": "1:55:13", "remaining_time": "5:19:48"} +{"current_steps": 2860, "total_steps": 10798, "loss": 2.0486, "reward": null, "learning_rate": 0.0008368794395306386, "epoch": 0.53, "percentage": 26.49, "elapsed_time": "1:55:11", "remaining_time": "5:19:44"} +{"current_steps": 2860, "total_steps": 10798, "loss": 2.0486, "reward": null, "learning_rate": 0.0008368794395306386, "epoch": 0.53, "percentage": 26.49, "elapsed_time": "2:01:16", "remaining_time": "5:36:36"} +{"current_steps": 2860, "total_steps": 10798, "loss": 2.0486, "reward": null, "learning_rate": 0.0008368794395306386, "epoch": 0.53, "percentage": 26.49, "elapsed_time": "1:55:15", "remaining_time": "5:19:53"} +{"current_steps": 2870, "total_steps": 10798, "loss": 2.0342, "reward": null, "learning_rate": 0.0008358030551351199, "epoch": 0.53, "percentage": 26.58, "elapsed_time": "2:01:41", "remaining_time": "5:36:08"} +{"current_steps": 2870, "total_steps": 10798, "loss": 2.0342, "reward": null, "learning_rate": 0.0008358030551351199, "epoch": 0.53, "percentage": 26.58, "elapsed_time": "1:55:38", "remaining_time": "5:19:25"} +{"current_steps": 2870, "total_steps": 10798, "loss": 2.0342, "reward": null, "learning_rate": 0.0008358030551351199, "epoch": 0.53, "percentage": 26.58, "elapsed_time": "1:55:39", "remaining_time": "5:19:30"} +{"current_steps": 2870, "total_steps": 10798, "loss": 2.0342, "reward": null, "learning_rate": 0.0008358030551351199, "epoch": 0.53, "percentage": 26.58, "elapsed_time": "1:55:36", "remaining_time": "5:19:21"} +{"current_steps": 2880, "total_steps": 10798, "loss": 2.0474, "reward": null, "learning_rate": 0.0008347238282594823, "epoch": 0.53, "percentage": 26.67, "elapsed_time": "2:02:05", "remaining_time": "5:35:40"} +{"current_steps": 2880, "total_steps": 10798, "loss": 2.0474, "reward": null, "learning_rate": 0.0008347238282594823, "epoch": 0.53, "percentage": 26.67, "elapsed_time": "1:56:04", "remaining_time": "5:19:06"} +{"current_steps": 2880, "total_steps": 10798, "loss": 2.0474, "reward": null, "learning_rate": 0.0008347238282594823, "epoch": 0.53, "percentage": 26.67, "elapsed_time": "1:56:00", "remaining_time": "5:18:57"} +{"current_steps": 2880, "total_steps": 10798, "loss": 2.0474, "reward": null, "learning_rate": 0.0008347238282594823, "epoch": 0.53, "percentage": 26.67, "elapsed_time": "1:56:02", "remaining_time": "5:19:01"} +{"current_steps": 2890, "total_steps": 10798, "loss": 2.006, "reward": null, "learning_rate": 0.0008336417680390829, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "1:56:28", "remaining_time": "5:18:41"} +{"current_steps": 2890, "total_steps": 10798, "loss": 2.006, "reward": null, "learning_rate": 0.0008336417680390829, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "1:56:26", "remaining_time": "5:18:37"} +{"current_steps": 2890, "total_steps": 10798, "loss": 2.006, "reward": null, "learning_rate": 0.0008336417680390829, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "2:02:29", "remaining_time": "5:35:11"} +{"current_steps": 2890, "total_steps": 10798, "loss": 2.006, "reward": null, "learning_rate": 0.0008336417680390829, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "1:56:24", "remaining_time": "5:18:32"} +{"current_steps": 2900, "total_steps": 10798, "loss": 1.99, "reward": null, "learning_rate": 0.0008325568836332633, "epoch": 0.54, "percentage": 26.86, "elapsed_time": "2:02:54", "remaining_time": "5:34:43"} +{"current_steps": 2900, "total_steps": 10798, "loss": 1.99, "reward": null, "learning_rate": 0.0008325568836332633, "epoch": 0.54, "percentage": 26.86, "elapsed_time": "1:56:52", "remaining_time": "5:18:19"} +{"current_steps": 2900, "total_steps": 10798, "loss": 1.99, "reward": null, "learning_rate": 0.0008325568836332633, "epoch": 0.54, "percentage": 26.86, "elapsed_time": "1:56:51", "remaining_time": "5:18:14"} +{"current_steps": 2900, "total_steps": 10798, "loss": 1.99, "reward": null, "learning_rate": 0.0008325568836332633, "epoch": 0.54, "percentage": 26.86, "elapsed_time": "1:56:49", "remaining_time": "5:18:10"} +{"current_steps": 2910, "total_steps": 10798, "loss": 2.0148, "reward": null, "learning_rate": 0.00083146918422527, "epoch": 0.54, "percentage": 26.95, "elapsed_time": "1:57:16", "remaining_time": "5:17:52"} +{"current_steps": 2910, "total_steps": 10798, "loss": 2.0148, "reward": null, "learning_rate": 0.00083146918422527, "epoch": 0.54, "percentage": 26.95, "elapsed_time": "1:57:14", "remaining_time": "5:17:48"} +{"current_steps": 2910, "total_steps": 10798, "loss": 2.0148, "reward": null, "learning_rate": 0.00083146918422527, "epoch": 0.54, "percentage": 26.95, "elapsed_time": "1:57:17", "remaining_time": "5:17:57"} +{"current_steps": 2910, "total_steps": 10798, "loss": 2.0148, "reward": null, "learning_rate": 0.00083146918422527, "epoch": 0.54, "percentage": 26.95, "elapsed_time": "2:03:19", "remaining_time": "5:34:17"} +{"current_steps": 2920, "total_steps": 10798, "loss": 2.0381, "reward": null, "learning_rate": 0.0008303786790221778, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "2:03:43", "remaining_time": "5:33:49"} +{"current_steps": 2920, "total_steps": 10798, "loss": 2.0381, "reward": null, "learning_rate": 0.0008303786790221778, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "1:57:40", "remaining_time": "5:17:29"} +{"current_steps": 2920, "total_steps": 10798, "loss": 2.0381, "reward": null, "learning_rate": 0.0008303786790221778, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "1:57:39", "remaining_time": "5:17:25"} +{"current_steps": 2920, "total_steps": 10798, "loss": 2.0381, "reward": null, "learning_rate": 0.0008303786790221778, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "1:57:42", "remaining_time": "5:17:34"} +{"current_steps": 2930, "total_steps": 10798, "loss": 2.0591, "reward": null, "learning_rate": 0.0008292853772548126, "epoch": 0.54, "percentage": 27.13, "elapsed_time": "2:04:08", "remaining_time": "5:33:22"} +{"current_steps": 2930, "total_steps": 10798, "loss": 2.0591, "reward": null, "learning_rate": 0.0008292853772548126, "epoch": 0.54, "percentage": 27.13, "elapsed_time": "1:58:04", "remaining_time": "5:17:02"} +{"current_steps": 2930, "total_steps": 10798, "loss": 2.0591, "reward": null, "learning_rate": 0.0008292853772548126, "epoch": 0.54, "percentage": 27.13, "elapsed_time": "1:58:05", "remaining_time": "5:17:07"} +{"current_steps": 2930, "total_steps": 10798, "loss": 2.0591, "reward": null, "learning_rate": 0.0008292853772548126, "epoch": 0.54, "percentage": 27.13, "elapsed_time": "1:58:07", "remaining_time": "5:17:11"} +{"current_steps": 2940, "total_steps": 10798, "loss": 2.0238, "reward": null, "learning_rate": 0.0008281892881776714, "epoch": 0.54, "percentage": 27.23, "elapsed_time": "2:04:32", "remaining_time": "5:32:52"} +{"current_steps": 2940, "total_steps": 10798, "loss": 2.0238, "reward": null, "learning_rate": 0.0008281892881776714, "epoch": 0.54, "percentage": 27.23, "elapsed_time": "1:58:27", "remaining_time": "5:16:37"} +{"current_steps": 2940, "total_steps": 10798, "loss": 2.0238, "reward": null, "learning_rate": 0.0008281892881776714, "epoch": 0.54, "percentage": 27.23, "elapsed_time": "1:58:30", "remaining_time": "5:16:46"} +{"current_steps": 2940, "total_steps": 10798, "loss": 2.0238, "reward": null, "learning_rate": 0.0008281892881776714, "epoch": 0.54, "percentage": 27.23, "elapsed_time": "1:58:29", "remaining_time": "5:16:41"} +{"current_steps": 2950, "total_steps": 10798, "loss": 1.9939, "reward": null, "learning_rate": 0.0008270904210688459, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "2:04:56", "remaining_time": "5:32:22"} +{"current_steps": 2950, "total_steps": 10798, "loss": 1.9939, "reward": null, "learning_rate": 0.0008270904210688459, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "1:58:54", "remaining_time": "5:16:21"} +{"current_steps": 2950, "total_steps": 10798, "loss": 1.9939, "reward": null, "learning_rate": 0.0008270904210688459, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "1:58:53", "remaining_time": "5:16:16"} +{"current_steps": 2950, "total_steps": 10798, "loss": 1.9939, "reward": null, "learning_rate": 0.0008270904210688459, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "1:58:51", "remaining_time": "5:16:12"} +{"current_steps": 2960, "total_steps": 10798, "loss": 1.9941, "reward": null, "learning_rate": 0.0008259887852299427, "epoch": 0.55, "percentage": 27.41, "elapsed_time": "1:59:18", "remaining_time": "5:15:55"} +{"current_steps": 2960, "total_steps": 10798, "loss": 1.9941, "reward": null, "learning_rate": 0.0008259887852299427, "epoch": 0.55, "percentage": 27.41, "elapsed_time": "2:05:19", "remaining_time": "5:31:52"} +{"current_steps": 2960, "total_steps": 10798, "loss": 1.9941, "reward": null, "learning_rate": 0.0008259887852299427, "epoch": 0.55, "percentage": 27.41, "elapsed_time": "1:59:16", "remaining_time": "5:15:50"} +{"current_steps": 2960, "total_steps": 10798, "loss": 1.9941, "reward": null, "learning_rate": 0.0008259887852299427, "epoch": 0.55, "percentage": 27.41, "elapsed_time": "1:59:15", "remaining_time": "5:15:46"} +{"current_steps": 2970, "total_steps": 10798, "loss": 2.0193, "reward": null, "learning_rate": 0.0008248843899860045, "epoch": 0.55, "percentage": 27.51, "elapsed_time": "1:59:39", "remaining_time": "5:15:23"} +{"current_steps": 2970, "total_steps": 10798, "loss": 2.0193, "reward": null, "learning_rate": 0.0008248843899860045, "epoch": 0.55, "percentage": 27.51, "elapsed_time": "1:59:42", "remaining_time": "5:15:32"} +{"current_steps": 2970, "total_steps": 10798, "loss": 2.0193, "reward": null, "learning_rate": 0.0008248843899860045, "epoch": 0.55, "percentage": 27.51, "elapsed_time": "1:59:41", "remaining_time": "5:15:27"} +{"current_steps": 2970, "total_steps": 10798, "loss": 2.0193, "reward": null, "learning_rate": 0.0008248843899860045, "epoch": 0.55, "percentage": 27.51, "elapsed_time": "2:05:44", "remaining_time": "5:31:24"} +{"current_steps": 2980, "total_steps": 10798, "loss": 2.0166, "reward": null, "learning_rate": 0.0008237772446854325, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "2:06:07", "remaining_time": "5:30:53"} +{"current_steps": 2980, "total_steps": 10798, "loss": 2.0166, "reward": null, "learning_rate": 0.0008237772446854325, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "2:00:02", "remaining_time": "5:14:55"} +{"current_steps": 2980, "total_steps": 10798, "loss": 2.0166, "reward": null, "learning_rate": 0.0008237772446854325, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "2:00:04", "remaining_time": "5:15:00"} +{"current_steps": 2980, "total_steps": 10798, "loss": 2.0166, "reward": null, "learning_rate": 0.0008237772446854325, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "2:00:05", "remaining_time": "5:15:04"} +{"current_steps": 2990, "total_steps": 10798, "loss": 2.0219, "reward": null, "learning_rate": 0.0008226673586999058, "epoch": 0.55, "percentage": 27.69, "elapsed_time": "2:06:31", "remaining_time": "5:30:24"} +{"current_steps": 2990, "total_steps": 10798, "loss": 2.0219, "reward": null, "learning_rate": 0.0008226673586999058, "epoch": 0.55, "percentage": 27.69, "elapsed_time": "2:00:30", "remaining_time": "5:14:40"} +{"current_steps": 2990, "total_steps": 10798, "loss": 2.0219, "reward": null, "learning_rate": 0.0008226673586999058, "epoch": 0.55, "percentage": 27.69, "elapsed_time": "2:00:28", "remaining_time": "5:14:35"} +{"current_steps": 2990, "total_steps": 10798, "loss": 2.0219, "reward": null, "learning_rate": 0.0008226673586999058, "epoch": 0.55, "percentage": 27.69, "elapsed_time": "2:00:26", "remaining_time": "5:14:31"} +{"current_steps": 3000, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0008215547414243025, "epoch": 0.56, "percentage": 27.78, "elapsed_time": "2:00:51", "remaining_time": "5:14:10"} +{"current_steps": 3000, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0008215547414243025, "epoch": 0.56, "percentage": 27.78, "elapsed_time": "2:00:50", "remaining_time": "5:14:06"} +{"current_steps": 3000, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0008215547414243025, "epoch": 0.56, "percentage": 27.78, "elapsed_time": "2:00:53", "remaining_time": "5:14:14"} +{"current_steps": 3000, "total_steps": 10798, "loss": 2.0078, "reward": null, "learning_rate": 0.0008215547414243025, "epoch": 0.56, "percentage": 27.78, "elapsed_time": "2:06:55", "remaining_time": "5:29:54"} +{"current_steps": 3010, "total_steps": 10798, "loss": 2.0022, "reward": null, "learning_rate": 0.0008204394022766208, "epoch": 0.56, "percentage": 27.88, "elapsed_time": "2:07:18", "remaining_time": "5:29:24"} +{"current_steps": 3010, "total_steps": 10798, "loss": 2.0022, "reward": null, "learning_rate": 0.0008204394022766208, "epoch": 0.56, "percentage": 27.88, "elapsed_time": "2:01:14", "remaining_time": "5:13:40"} +{"current_steps": 3010, "total_steps": 10798, "loss": 2.0022, "reward": null, "learning_rate": 0.0008204394022766208, "epoch": 0.56, "percentage": 27.88, "elapsed_time": "2:01:15", "remaining_time": "5:13:44"} +{"current_steps": 3010, "total_steps": 10798, "loss": 2.0022, "reward": null, "learning_rate": 0.0008204394022766208, "epoch": 0.56, "percentage": 27.88, "elapsed_time": "2:01:17", "remaining_time": "5:13:49"} +{"current_steps": 3020, "total_steps": 10798, "loss": 2.0009, "reward": null, "learning_rate": 0.0008193213506978983, "epoch": 0.56, "percentage": 27.97, "elapsed_time": "2:07:42", "remaining_time": "5:28:53"} +{"current_steps": 3020, "total_steps": 10798, "loss": 2.0009, "reward": null, "learning_rate": 0.0008193213506978983, "epoch": 0.56, "percentage": 27.97, "elapsed_time": "2:01:40", "remaining_time": "5:13:22"} +{"current_steps": 3020, "total_steps": 10798, "loss": 2.0009, "reward": null, "learning_rate": 0.0008193213506978983, "epoch": 0.56, "percentage": 27.97, "elapsed_time": "2:01:38", "remaining_time": "5:13:18"} +{"current_steps": 3020, "total_steps": 10798, "loss": 2.0009, "reward": null, "learning_rate": 0.0008193213506978983, "epoch": 0.56, "percentage": 27.97, "elapsed_time": "2:01:37", "remaining_time": "5:13:14"} +{"current_steps": 3030, "total_steps": 10798, "loss": 2.0197, "reward": null, "learning_rate": 0.0008182005961521331, "epoch": 0.56, "percentage": 28.06, "elapsed_time": "2:02:01", "remaining_time": "5:12:50"} +{"current_steps": 3030, "total_steps": 10798, "loss": 2.0197, "reward": null, "learning_rate": 0.0008182005961521331, "epoch": 0.56, "percentage": 28.06, "elapsed_time": "2:02:03", "remaining_time": "5:12:55"} +{"current_steps": 3030, "total_steps": 10798, "loss": 2.0197, "reward": null, "learning_rate": 0.0008182005961521331, "epoch": 0.56, "percentage": 28.06, "elapsed_time": "2:08:04", "remaining_time": "5:28:22"} +{"current_steps": 3030, "total_steps": 10798, "loss": 2.0197, "reward": null, "learning_rate": 0.0008182005961521331, "epoch": 0.56, "percentage": 28.06, "elapsed_time": "2:02:00", "remaining_time": "5:12:46"} +{"current_steps": 3040, "total_steps": 10798, "loss": 2.0101, "reward": null, "learning_rate": 0.0008170771481262027, "epoch": 0.56, "percentage": 28.15, "elapsed_time": "2:08:28", "remaining_time": "5:27:51"} +{"current_steps": 3040, "total_steps": 10798, "loss": 2.0101, "reward": null, "learning_rate": 0.0008170771481262027, "epoch": 0.56, "percentage": 28.15, "elapsed_time": "2:02:25", "remaining_time": "5:12:24"} +{"current_steps": 3040, "total_steps": 10798, "loss": 2.0101, "reward": null, "learning_rate": 0.0008170771481262027, "epoch": 0.56, "percentage": 28.15, "elapsed_time": "2:02:26", "remaining_time": "5:12:28"} +{"current_steps": 3040, "total_steps": 10798, "loss": 2.0101, "reward": null, "learning_rate": 0.0008170771481262027, "epoch": 0.56, "percentage": 28.15, "elapsed_time": "2:02:23", "remaining_time": "5:12:20"} +{"current_steps": 3050, "total_steps": 10798, "loss": 2.0307, "reward": null, "learning_rate": 0.0008159510161297846, "epoch": 0.56, "percentage": 28.25, "elapsed_time": "2:08:53", "remaining_time": "5:27:26"} +{"current_steps": 3050, "total_steps": 10798, "loss": 2.0307, "reward": null, "learning_rate": 0.0008159510161297846, "epoch": 0.56, "percentage": 28.25, "elapsed_time": "2:02:52", "remaining_time": "5:12:08"} +{"current_steps": 3050, "total_steps": 10798, "loss": 2.0307, "reward": null, "learning_rate": 0.0008159510161297846, "epoch": 0.56, "percentage": 28.25, "elapsed_time": "2:02:48", "remaining_time": "5:11:59"} +{"current_steps": 3050, "total_steps": 10798, "loss": 2.0307, "reward": null, "learning_rate": 0.0008159510161297846, "epoch": 0.56, "percentage": 28.25, "elapsed_time": "2:02:50", "remaining_time": "5:12:03"} +{"current_steps": 3060, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008148222096952748, "epoch": 0.57, "percentage": 28.34, "elapsed_time": "2:03:13", "remaining_time": "5:11:36"} +{"current_steps": 3060, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008148222096952748, "epoch": 0.57, "percentage": 28.34, "elapsed_time": "2:03:15", "remaining_time": "5:11:40"} +{"current_steps": 3060, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008148222096952748, "epoch": 0.57, "percentage": 28.34, "elapsed_time": "2:09:18", "remaining_time": "5:26:59"} +{"current_steps": 3060, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0008148222096952748, "epoch": 0.57, "percentage": 28.34, "elapsed_time": "2:03:16", "remaining_time": "5:11:45"} +{"current_steps": 3070, "total_steps": 10798, "loss": 2.0415, "reward": null, "learning_rate": 0.0008136907383777081, "epoch": 0.57, "percentage": 28.43, "elapsed_time": "2:03:39", "remaining_time": "5:11:17"} +{"current_steps": 3070, "total_steps": 10798, "loss": 2.0415, "reward": null, "learning_rate": 0.0008136907383777081, "epoch": 0.57, "percentage": 28.43, "elapsed_time": "2:03:38", "remaining_time": "5:11:13"} +{"current_steps": 3070, "total_steps": 10798, "loss": 2.0415, "reward": null, "learning_rate": 0.0008136907383777081, "epoch": 0.57, "percentage": 28.43, "elapsed_time": "2:03:41", "remaining_time": "5:11:22"} +{"current_steps": 3070, "total_steps": 10798, "loss": 2.0415, "reward": null, "learning_rate": 0.0008136907383777081, "epoch": 0.57, "percentage": 28.43, "elapsed_time": "2:09:43", "remaining_time": "5:26:31"} +{"current_steps": 3080, "total_steps": 10798, "loss": 2.0031, "reward": null, "learning_rate": 0.000812556611754677, "epoch": 0.57, "percentage": 28.52, "elapsed_time": "2:04:03", "remaining_time": "5:10:53"} +{"current_steps": 3080, "total_steps": 10798, "loss": 2.0031, "reward": null, "learning_rate": 0.000812556611754677, "epoch": 0.57, "percentage": 28.52, "elapsed_time": "2:04:02", "remaining_time": "5:10:49"} +{"current_steps": 3080, "total_steps": 10798, "loss": 2.0031, "reward": null, "learning_rate": 0.000812556611754677, "epoch": 0.57, "percentage": 28.52, "elapsed_time": "2:04:05", "remaining_time": "5:10:57"} +{"current_steps": 3080, "total_steps": 10798, "loss": 2.0031, "reward": null, "learning_rate": 0.000812556611754677, "epoch": 0.57, "percentage": 28.52, "elapsed_time": "2:10:07", "remaining_time": "5:26:03"} +{"current_steps": 3090, "total_steps": 10798, "loss": 2.0025, "reward": null, "learning_rate": 0.0008114198394262497, "epoch": 0.57, "percentage": 28.62, "elapsed_time": "2:10:31", "remaining_time": "5:25:36"} +{"current_steps": 3090, "total_steps": 10798, "loss": 2.0025, "reward": null, "learning_rate": 0.0008114198394262497, "epoch": 0.57, "percentage": 28.62, "elapsed_time": "2:04:30", "remaining_time": "5:10:34"} +{"current_steps": 3090, "total_steps": 10798, "loss": 2.0025, "reward": null, "learning_rate": 0.0008114198394262497, "epoch": 0.57, "percentage": 28.62, "elapsed_time": "2:04:26", "remaining_time": "5:10:26"} +{"current_steps": 3090, "total_steps": 10798, "loss": 2.0025, "reward": null, "learning_rate": 0.0008114198394262497, "epoch": 0.57, "percentage": 28.62, "elapsed_time": "2:04:28", "remaining_time": "5:10:30"} +{"current_steps": 3100, "total_steps": 10798, "loss": 1.983, "reward": null, "learning_rate": 0.0008102804310148905, "epoch": 0.57, "percentage": 28.71, "elapsed_time": "2:04:53", "remaining_time": "5:10:08"} +{"current_steps": 3100, "total_steps": 10798, "loss": 1.983, "reward": null, "learning_rate": 0.0008102804310148905, "epoch": 0.57, "percentage": 28.71, "elapsed_time": "2:04:52", "remaining_time": "5:10:04"} +{"current_steps": 3100, "total_steps": 10798, "loss": 1.983, "reward": null, "learning_rate": 0.0008102804310148905, "epoch": 0.57, "percentage": 28.71, "elapsed_time": "2:10:57", "remaining_time": "5:25:10"} +{"current_steps": 3100, "total_steps": 10798, "loss": 1.983, "reward": null, "learning_rate": 0.0008102804310148905, "epoch": 0.57, "percentage": 28.71, "elapsed_time": "2:04:55", "remaining_time": "5:10:13"} +{"current_steps": 3110, "total_steps": 10798, "loss": 2.0056, "reward": null, "learning_rate": 0.0008091383961653765, "epoch": 0.58, "percentage": 28.8, "elapsed_time": "2:05:18", "remaining_time": "5:09:45"} +{"current_steps": 3110, "total_steps": 10798, "loss": 2.0056, "reward": null, "learning_rate": 0.0008091383961653765, "epoch": 0.58, "percentage": 28.8, "elapsed_time": "2:05:16", "remaining_time": "5:09:41"} +{"current_steps": 3110, "total_steps": 10798, "loss": 2.0056, "reward": null, "learning_rate": 0.0008091383961653765, "epoch": 0.58, "percentage": 28.8, "elapsed_time": "2:05:20", "remaining_time": "5:09:49"} +{"current_steps": 3110, "total_steps": 10798, "loss": 2.0056, "reward": null, "learning_rate": 0.0008091383961653765, "epoch": 0.58, "percentage": 28.8, "elapsed_time": "2:11:21", "remaining_time": "5:24:43"} +{"current_steps": 3120, "total_steps": 10798, "loss": 1.9679, "reward": null, "learning_rate": 0.0008079937445447175, "epoch": 0.58, "percentage": 28.89, "elapsed_time": "2:05:40", "remaining_time": "5:09:16"} +{"current_steps": 3120, "total_steps": 10798, "loss": 1.9679, "reward": null, "learning_rate": 0.0008079937445447175, "epoch": 0.58, "percentage": 28.89, "elapsed_time": "2:05:42", "remaining_time": "5:09:20"} +{"current_steps": 3120, "total_steps": 10798, "loss": 1.9679, "reward": null, "learning_rate": 0.0008079937445447175, "epoch": 0.58, "percentage": 28.89, "elapsed_time": "2:05:43", "remaining_time": "5:09:24"} +{"current_steps": 3120, "total_steps": 10798, "loss": 1.9679, "reward": null, "learning_rate": 0.0008079937445447175, "epoch": 0.58, "percentage": 28.89, "elapsed_time": "2:11:45", "remaining_time": "5:24:14"} +{"current_steps": 3130, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.0008068464858420732, "epoch": 0.58, "percentage": 28.99, "elapsed_time": "2:06:08", "remaining_time": "5:09:01"} +{"current_steps": 3130, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.0008068464858420732, "epoch": 0.58, "percentage": 28.99, "elapsed_time": "2:06:05", "remaining_time": "5:08:53"} +{"current_steps": 3130, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.0008068464858420732, "epoch": 0.58, "percentage": 28.99, "elapsed_time": "2:06:06", "remaining_time": "5:08:57"} +{"current_steps": 3130, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.0008068464858420732, "epoch": 0.58, "percentage": 28.99, "elapsed_time": "2:12:10", "remaining_time": "5:23:47"} +{"current_steps": 3140, "total_steps": 10798, "loss": 1.9833, "reward": null, "learning_rate": 0.0008056966297686717, "epoch": 0.58, "percentage": 29.08, "elapsed_time": "2:06:33", "remaining_time": "5:08:39"} +{"current_steps": 3140, "total_steps": 10798, "loss": 1.9833, "reward": null, "learning_rate": 0.0008056966297686717, "epoch": 0.58, "percentage": 29.08, "elapsed_time": "2:12:35", "remaining_time": "5:23:21"} +{"current_steps": 3140, "total_steps": 10798, "loss": 1.9833, "reward": null, "learning_rate": 0.0008056966297686717, "epoch": 0.58, "percentage": 29.08, "elapsed_time": "2:06:31", "remaining_time": "5:08:35"} +{"current_steps": 3140, "total_steps": 10798, "loss": 1.9833, "reward": null, "learning_rate": 0.0008056966297686717, "epoch": 0.58, "percentage": 29.08, "elapsed_time": "2:06:30", "remaining_time": "5:08:31"} +{"current_steps": 3150, "total_steps": 10798, "loss": 2.0088, "reward": null, "learning_rate": 0.0008045441860577273, "epoch": 0.58, "percentage": 29.17, "elapsed_time": "2:12:59", "remaining_time": "5:22:53"} +{"current_steps": 3150, "total_steps": 10798, "loss": 2.0088, "reward": null, "learning_rate": 0.0008045441860577273, "epoch": 0.58, "percentage": 29.17, "elapsed_time": "2:06:54", "remaining_time": "5:08:07"} +{"current_steps": 3150, "total_steps": 10798, "loss": 2.0088, "reward": null, "learning_rate": 0.0008045441860577273, "epoch": 0.58, "percentage": 29.17, "elapsed_time": "2:06:56", "remaining_time": "5:08:11"} +{"current_steps": 3150, "total_steps": 10798, "loss": 2.0088, "reward": null, "learning_rate": 0.0008045441860577273, "epoch": 0.58, "percentage": 29.17, "elapsed_time": "2:06:57", "remaining_time": "5:08:15"} +{"current_steps": 3160, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.0008033891644643576, "epoch": 0.59, "percentage": 29.26, "elapsed_time": "2:07:20", "remaining_time": "5:07:47"} +{"current_steps": 3160, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.0008033891644643576, "epoch": 0.59, "percentage": 29.26, "elapsed_time": "2:07:18", "remaining_time": "5:07:43"} +{"current_steps": 3160, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.0008033891644643576, "epoch": 0.59, "percentage": 29.26, "elapsed_time": "2:07:22", "remaining_time": "5:07:51"} +{"current_steps": 3160, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.0008033891644643576, "epoch": 0.59, "percentage": 29.26, "elapsed_time": "2:13:23", "remaining_time": "5:22:25"} +{"current_steps": 3170, "total_steps": 10798, "loss": 2.013, "reward": null, "learning_rate": 0.0008022315747655011, "epoch": 0.59, "percentage": 29.36, "elapsed_time": "2:13:49", "remaining_time": "5:22:01"} +{"current_steps": 3170, "total_steps": 10798, "loss": 2.013, "reward": null, "learning_rate": 0.0008022315747655011, "epoch": 0.59, "percentage": 29.36, "elapsed_time": "2:07:46", "remaining_time": "5:07:27"} +{"current_steps": 3170, "total_steps": 10798, "loss": 2.013, "reward": null, "learning_rate": 0.0008022315747655011, "epoch": 0.59, "percentage": 29.36, "elapsed_time": "2:07:48", "remaining_time": "5:07:32"} +{"current_steps": 3170, "total_steps": 10798, "loss": 2.013, "reward": null, "learning_rate": 0.0008022315747655011, "epoch": 0.59, "percentage": 29.36, "elapsed_time": "2:07:44", "remaining_time": "5:07:24"} +{"current_steps": 3180, "total_steps": 10798, "loss": 1.9902, "reward": null, "learning_rate": 0.0008010714267598354, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "2:14:13", "remaining_time": "5:21:34"} +{"current_steps": 3180, "total_steps": 10798, "loss": 1.9902, "reward": null, "learning_rate": 0.0008010714267598354, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "2:08:10", "remaining_time": "5:07:03"} +{"current_steps": 3180, "total_steps": 10798, "loss": 1.9902, "reward": null, "learning_rate": 0.0008010714267598354, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "2:08:09", "remaining_time": "5:07:00"} +{"current_steps": 3180, "total_steps": 10798, "loss": 1.9902, "reward": null, "learning_rate": 0.0008010714267598354, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "2:08:12", "remaining_time": "5:07:08"} +{"current_steps": 3190, "total_steps": 10798, "loss": 2.0133, "reward": null, "learning_rate": 0.0007999087302676926, "epoch": 0.59, "percentage": 29.54, "elapsed_time": "2:08:33", "remaining_time": "5:06:35"} +{"current_steps": 3190, "total_steps": 10798, "loss": 2.0133, "reward": null, "learning_rate": 0.0007999087302676926, "epoch": 0.59, "percentage": 29.54, "elapsed_time": "2:14:37", "remaining_time": "5:21:05"} +{"current_steps": 3190, "total_steps": 10798, "loss": 2.0133, "reward": null, "learning_rate": 0.0007999087302676926, "epoch": 0.59, "percentage": 29.54, "elapsed_time": "2:08:34", "remaining_time": "5:06:39"} +{"current_steps": 3190, "total_steps": 10798, "loss": 2.0133, "reward": null, "learning_rate": 0.0007999087302676926, "epoch": 0.59, "percentage": 29.54, "elapsed_time": "2:08:36", "remaining_time": "5:06:43"} +{"current_steps": 3200, "total_steps": 10798, "loss": 2.0092, "reward": null, "learning_rate": 0.0007987434951309774, "epoch": 0.59, "percentage": 29.64, "elapsed_time": "2:09:00", "remaining_time": "5:06:18"} +{"current_steps": 3200, "total_steps": 10798, "loss": 2.0092, "reward": null, "learning_rate": 0.0007987434951309774, "epoch": 0.59, "percentage": 29.64, "elapsed_time": "2:08:56", "remaining_time": "5:06:10"} +{"current_steps": 3200, "total_steps": 10798, "loss": 2.0092, "reward": null, "learning_rate": 0.0007987434951309774, "epoch": 0.59, "percentage": 29.64, "elapsed_time": "2:15:01", "remaining_time": "5:20:36"} +{"current_steps": 3200, "total_steps": 10798, "loss": 2.0092, "reward": null, "learning_rate": 0.0007987434951309774, "epoch": 0.59, "percentage": 29.64, "elapsed_time": "2:08:58", "remaining_time": "5:06:14"} +{"current_steps": 3210, "total_steps": 10798, "loss": 1.9894, "reward": null, "learning_rate": 0.0007975757312130836, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "2:15:25", "remaining_time": "5:20:08"} +{"current_steps": 3210, "total_steps": 10798, "loss": 1.9894, "reward": null, "learning_rate": 0.0007975757312130836, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "2:09:21", "remaining_time": "5:05:45"} +{"current_steps": 3210, "total_steps": 10798, "loss": 1.9894, "reward": null, "learning_rate": 0.0007975757312130836, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "2:09:24", "remaining_time": "5:05:53"} +{"current_steps": 3210, "total_steps": 10798, "loss": 1.9894, "reward": null, "learning_rate": 0.0007975757312130836, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "2:09:22", "remaining_time": "5:05:49"} +{"current_steps": 3220, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0007964054483988103, "epoch": 0.6, "percentage": 29.82, "elapsed_time": "2:15:50", "remaining_time": "5:19:40"} +{"current_steps": 3220, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0007964054483988103, "epoch": 0.6, "percentage": 29.82, "elapsed_time": "2:09:46", "remaining_time": "5:05:25"} +{"current_steps": 3220, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0007964054483988103, "epoch": 0.6, "percentage": 29.82, "elapsed_time": "2:09:48", "remaining_time": "5:05:29"} +{"current_steps": 3220, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0007964054483988103, "epoch": 0.6, "percentage": 29.82, "elapsed_time": "2:09:45", "remaining_time": "5:05:21"} +{"current_steps": 3230, "total_steps": 10798, "loss": 2.016, "reward": null, "learning_rate": 0.000795232656594278, "epoch": 0.6, "percentage": 29.91, "elapsed_time": "2:10:12", "remaining_time": "5:05:06"} +{"current_steps": 3230, "total_steps": 10798, "loss": 2.016, "reward": null, "learning_rate": 0.000795232656594278, "epoch": 0.6, "percentage": 29.91, "elapsed_time": "2:10:11", "remaining_time": "5:05:01"} +{"current_steps": 3230, "total_steps": 10798, "loss": 2.016, "reward": null, "learning_rate": 0.000795232656594278, "epoch": 0.6, "percentage": 29.91, "elapsed_time": "2:16:14", "remaining_time": "5:19:12"} +{"current_steps": 3230, "total_steps": 10798, "loss": 2.016, "reward": null, "learning_rate": 0.000795232656594278, "epoch": 0.6, "percentage": 29.91, "elapsed_time": "2:10:09", "remaining_time": "5:04:58"} +{"current_steps": 3240, "total_steps": 10798, "loss": 2.0386, "reward": null, "learning_rate": 0.0007940573657268458, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "2:16:39", "remaining_time": "5:18:48"} +{"current_steps": 3240, "total_steps": 10798, "loss": 2.0386, "reward": null, "learning_rate": 0.0007940573657268458, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "2:10:35", "remaining_time": "5:04:37"} +{"current_steps": 3240, "total_steps": 10798, "loss": 2.0386, "reward": null, "learning_rate": 0.0007940573657268458, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "2:10:38", "remaining_time": "5:04:44"} +{"current_steps": 3240, "total_steps": 10798, "loss": 2.0386, "reward": null, "learning_rate": 0.0007940573657268458, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "2:10:36", "remaining_time": "5:04:40"} +{"current_steps": 3250, "total_steps": 10798, "loss": 1.9602, "reward": null, "learning_rate": 0.0007928795857450259, "epoch": 0.6, "percentage": 30.1, "elapsed_time": "2:10:59", "remaining_time": "5:04:12"} +{"current_steps": 3250, "total_steps": 10798, "loss": 1.9602, "reward": null, "learning_rate": 0.0007928795857450259, "epoch": 0.6, "percentage": 30.1, "elapsed_time": "2:11:02", "remaining_time": "5:04:20"} +{"current_steps": 3250, "total_steps": 10798, "loss": 1.9602, "reward": null, "learning_rate": 0.0007928795857450259, "epoch": 0.6, "percentage": 30.1, "elapsed_time": "2:11:00", "remaining_time": "5:04:16"} +{"current_steps": 3250, "total_steps": 10798, "loss": 1.9602, "reward": null, "learning_rate": 0.0007928795857450259, "epoch": 0.6, "percentage": 30.1, "elapsed_time": "2:17:03", "remaining_time": "5:18:19"} +{"current_steps": 3260, "total_steps": 10798, "loss": 1.9681, "reward": null, "learning_rate": 0.0007916993266184007, "epoch": 0.6, "percentage": 30.19, "elapsed_time": "2:11:23", "remaining_time": "5:03:49"} +{"current_steps": 3260, "total_steps": 10798, "loss": 1.9681, "reward": null, "learning_rate": 0.0007916993266184007, "epoch": 0.6, "percentage": 30.19, "elapsed_time": "2:11:25", "remaining_time": "5:03:53"} +{"current_steps": 3260, "total_steps": 10798, "loss": 1.9681, "reward": null, "learning_rate": 0.0007916993266184007, "epoch": 0.6, "percentage": 30.19, "elapsed_time": "2:11:22", "remaining_time": "5:03:45"} +{"current_steps": 3260, "total_steps": 10798, "loss": 1.9681, "reward": null, "learning_rate": 0.0007916993266184007, "epoch": 0.6, "percentage": 30.19, "elapsed_time": "2:17:26", "remaining_time": "5:17:49"} +{"current_steps": 3270, "total_steps": 10798, "loss": 2.0326, "reward": null, "learning_rate": 0.0007905165983375379, "epoch": 0.61, "percentage": 30.28, "elapsed_time": "2:11:47", "remaining_time": "5:03:24"} +{"current_steps": 3270, "total_steps": 10798, "loss": 2.0326, "reward": null, "learning_rate": 0.0007905165983375379, "epoch": 0.61, "percentage": 30.28, "elapsed_time": "2:11:46", "remaining_time": "5:03:20"} +{"current_steps": 3270, "total_steps": 10798, "loss": 2.0326, "reward": null, "learning_rate": 0.0007905165983375379, "epoch": 0.61, "percentage": 30.28, "elapsed_time": "2:17:50", "remaining_time": "5:17:20"} +{"current_steps": 3270, "total_steps": 10798, "loss": 2.0326, "reward": null, "learning_rate": 0.0007905165983375379, "epoch": 0.61, "percentage": 30.28, "elapsed_time": "2:11:49", "remaining_time": "5:03:28"} +{"current_steps": 3280, "total_steps": 10798, "loss": 1.9958, "reward": null, "learning_rate": 0.0007893314109139058, "epoch": 0.61, "percentage": 30.38, "elapsed_time": "2:18:15", "remaining_time": "5:16:53"} +{"current_steps": 3280, "total_steps": 10798, "loss": 1.9958, "reward": null, "learning_rate": 0.0007893314109139058, "epoch": 0.61, "percentage": 30.38, "elapsed_time": "2:12:12", "remaining_time": "5:03:01"} +{"current_steps": 3280, "total_steps": 10798, "loss": 1.9958, "reward": null, "learning_rate": 0.0007893314109139058, "epoch": 0.61, "percentage": 30.38, "elapsed_time": "2:12:13", "remaining_time": "5:03:05"} +{"current_steps": 3280, "total_steps": 10798, "loss": 1.9958, "reward": null, "learning_rate": 0.0007893314109139058, "epoch": 0.61, "percentage": 30.38, "elapsed_time": "2:12:10", "remaining_time": "5:02:57"} +{"current_steps": 3290, "total_steps": 10798, "loss": 2.0077, "reward": null, "learning_rate": 0.0007881437743797882, "epoch": 0.61, "percentage": 30.47, "elapsed_time": "2:18:39", "remaining_time": "5:16:25"} +{"current_steps": 3290, "total_steps": 10798, "loss": 2.0077, "reward": null, "learning_rate": 0.0007881437743797882, "epoch": 0.61, "percentage": 30.47, "elapsed_time": "2:12:36", "remaining_time": "5:02:36"} +{"current_steps": 3290, "total_steps": 10798, "loss": 2.0077, "reward": null, "learning_rate": 0.0007881437743797882, "epoch": 0.61, "percentage": 30.47, "elapsed_time": "2:12:37", "remaining_time": "5:02:40"} +{"current_steps": 3290, "total_steps": 10798, "loss": 2.0077, "reward": null, "learning_rate": 0.0007881437743797882, "epoch": 0.61, "percentage": 30.47, "elapsed_time": "2:12:34", "remaining_time": "5:02:32"} +{"current_steps": 3300, "total_steps": 10798, "loss": 1.9813, "reward": null, "learning_rate": 0.0007869536987882008, "epoch": 0.61, "percentage": 30.56, "elapsed_time": "2:19:03", "remaining_time": "5:15:57"} +{"current_steps": 3300, "total_steps": 10798, "loss": 1.9813, "reward": null, "learning_rate": 0.0007869536987882008, "epoch": 0.61, "percentage": 30.56, "elapsed_time": "2:13:01", "remaining_time": "5:02:15"} +{"current_steps": 3300, "total_steps": 10798, "loss": 1.9813, "reward": null, "learning_rate": 0.0007869536987882008, "epoch": 0.61, "percentage": 30.56, "elapsed_time": "2:12:58", "remaining_time": "5:02:08"} +{"current_steps": 3300, "total_steps": 10798, "loss": 1.9813, "reward": null, "learning_rate": 0.0007869536987882008, "epoch": 0.61, "percentage": 30.56, "elapsed_time": "2:13:00", "remaining_time": "5:02:11"} +{"current_steps": 3310, "total_steps": 10798, "loss": 1.9538, "reward": null, "learning_rate": 0.0007857611942128044, "epoch": 0.61, "percentage": 30.65, "elapsed_time": "2:19:26", "remaining_time": "5:15:27"} +{"current_steps": 3310, "total_steps": 10798, "loss": 1.9538, "reward": null, "learning_rate": 0.0007857611942128044, "epoch": 0.61, "percentage": 30.65, "elapsed_time": "2:13:23", "remaining_time": "5:01:45"} +{"current_steps": 3310, "total_steps": 10798, "loss": 1.9538, "reward": null, "learning_rate": 0.0007857611942128044, "epoch": 0.61, "percentage": 30.65, "elapsed_time": "2:13:21", "remaining_time": "5:01:42"} +{"current_steps": 3310, "total_steps": 10798, "loss": 1.9538, "reward": null, "learning_rate": 0.0007857611942128044, "epoch": 0.61, "percentage": 30.65, "elapsed_time": "2:13:25", "remaining_time": "5:01:49"} +{"current_steps": 3320, "total_steps": 10798, "loss": 1.9919, "reward": null, "learning_rate": 0.0007845662707478214, "epoch": 0.61, "percentage": 30.75, "elapsed_time": "2:13:47", "remaining_time": "5:01:21"} +{"current_steps": 3320, "total_steps": 10798, "loss": 1.9919, "reward": null, "learning_rate": 0.0007845662707478214, "epoch": 0.61, "percentage": 30.75, "elapsed_time": "2:13:46", "remaining_time": "5:01:18"} +{"current_steps": 3320, "total_steps": 10798, "loss": 1.9919, "reward": null, "learning_rate": 0.0007845662707478214, "epoch": 0.61, "percentage": 30.75, "elapsed_time": "2:19:50", "remaining_time": "5:14:59"} +{"current_steps": 3320, "total_steps": 10798, "loss": 1.9919, "reward": null, "learning_rate": 0.0007845662707478214, "epoch": 0.61, "percentage": 30.75, "elapsed_time": "2:13:49", "remaining_time": "5:01:25"} +{"current_steps": 3330, "total_steps": 10798, "loss": 1.9922, "reward": null, "learning_rate": 0.0007833689385079485, "epoch": 0.62, "percentage": 30.84, "elapsed_time": "2:20:14", "remaining_time": "5:14:31"} +{"current_steps": 3330, "total_steps": 10798, "loss": 1.9922, "reward": null, "learning_rate": 0.0007833689385079485, "epoch": 0.62, "percentage": 30.84, "elapsed_time": "2:14:11", "remaining_time": "5:00:56"} +{"current_steps": 3330, "total_steps": 10798, "loss": 1.9922, "reward": null, "learning_rate": 0.0007833689385079485, "epoch": 0.62, "percentage": 30.84, "elapsed_time": "2:14:09", "remaining_time": "5:00:53"} +{"current_steps": 3330, "total_steps": 10798, "loss": 1.9922, "reward": null, "learning_rate": 0.0007833689385079485, "epoch": 0.62, "percentage": 30.84, "elapsed_time": "2:14:13", "remaining_time": "5:01:00"} +{"current_steps": 3340, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0007821692076282725, "epoch": 0.62, "percentage": 30.93, "elapsed_time": "2:20:39", "remaining_time": "5:14:03"} +{"current_steps": 3340, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0007821692076282725, "epoch": 0.62, "percentage": 30.93, "elapsed_time": "2:14:37", "remaining_time": "5:00:36"} +{"current_steps": 3340, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0007821692076282725, "epoch": 0.62, "percentage": 30.93, "elapsed_time": "2:14:35", "remaining_time": "5:00:32"} +{"current_steps": 3340, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0007821692076282725, "epoch": 0.62, "percentage": 30.93, "elapsed_time": "2:14:34", "remaining_time": "5:00:29"} +{"current_steps": 3350, "total_steps": 10798, "loss": 2.0231, "reward": null, "learning_rate": 0.0007809670882641842, "epoch": 0.62, "percentage": 31.02, "elapsed_time": "2:14:57", "remaining_time": "5:00:03"} +{"current_steps": 3350, "total_steps": 10798, "loss": 2.0231, "reward": null, "learning_rate": 0.0007809670882641842, "epoch": 0.62, "percentage": 31.02, "elapsed_time": "2:21:02", "remaining_time": "5:13:34"} +{"current_steps": 3350, "total_steps": 10798, "loss": 2.0231, "reward": null, "learning_rate": 0.0007809670882641842, "epoch": 0.62, "percentage": 31.02, "elapsed_time": "2:14:59", "remaining_time": "5:00:07"} +{"current_steps": 3350, "total_steps": 10798, "loss": 2.0231, "reward": null, "learning_rate": 0.0007809670882641842, "epoch": 0.62, "percentage": 31.02, "elapsed_time": "2:15:01", "remaining_time": "5:00:10"} +{"current_steps": 3360, "total_steps": 10798, "loss": 1.9971, "reward": null, "learning_rate": 0.0007797625905912915, "epoch": 0.62, "percentage": 31.12, "elapsed_time": "2:15:23", "remaining_time": "4:59:43"} +{"current_steps": 3360, "total_steps": 10798, "loss": 1.9971, "reward": null, "learning_rate": 0.0007797625905912915, "epoch": 0.62, "percentage": 31.12, "elapsed_time": "2:21:27", "remaining_time": "5:13:07"} +{"current_steps": 3360, "total_steps": 10798, "loss": 1.9971, "reward": null, "learning_rate": 0.0007797625905912915, "epoch": 0.62, "percentage": 31.12, "elapsed_time": "2:15:25", "remaining_time": "4:59:47"} +{"current_steps": 3360, "total_steps": 10798, "loss": 1.9971, "reward": null, "learning_rate": 0.0007797625905912915, "epoch": 0.62, "percentage": 31.12, "elapsed_time": "2:15:22", "remaining_time": "4:59:40"} +{"current_steps": 3370, "total_steps": 10798, "loss": 1.9934, "reward": null, "learning_rate": 0.0007785557248053351, "epoch": 0.62, "percentage": 31.21, "elapsed_time": "2:15:46", "remaining_time": "4:59:15"} +{"current_steps": 3370, "total_steps": 10798, "loss": 1.9934, "reward": null, "learning_rate": 0.0007785557248053351, "epoch": 0.62, "percentage": 31.21, "elapsed_time": "2:15:48", "remaining_time": "4:59:19"} +{"current_steps": 3370, "total_steps": 10798, "loss": 1.9934, "reward": null, "learning_rate": 0.0007785557248053351, "epoch": 0.62, "percentage": 31.21, "elapsed_time": "2:15:49", "remaining_time": "4:59:23"} +{"current_steps": 3370, "total_steps": 10798, "loss": 1.9934, "reward": null, "learning_rate": 0.0007785557248053351, "epoch": 0.62, "percentage": 31.21, "elapsed_time": "2:21:51", "remaining_time": "5:12:40"} +{"current_steps": 3380, "total_steps": 10798, "loss": 1.9855, "reward": null, "learning_rate": 0.0007773465011221002, "epoch": 0.63, "percentage": 31.3, "elapsed_time": "2:16:14", "remaining_time": "4:59:00"} +{"current_steps": 3380, "total_steps": 10798, "loss": 1.9855, "reward": null, "learning_rate": 0.0007773465011221002, "epoch": 0.63, "percentage": 31.3, "elapsed_time": "2:16:12", "remaining_time": "4:58:56"} +{"current_steps": 3380, "total_steps": 10798, "loss": 1.9855, "reward": null, "learning_rate": 0.0007773465011221002, "epoch": 0.63, "percentage": 31.3, "elapsed_time": "2:22:15", "remaining_time": "5:12:13"} +{"current_steps": 3380, "total_steps": 10798, "loss": 1.9855, "reward": null, "learning_rate": 0.0007773465011221002, "epoch": 0.63, "percentage": 31.3, "elapsed_time": "2:16:11", "remaining_time": "4:58:52"} +{"current_steps": 3390, "total_steps": 10798, "loss": 2.0421, "reward": null, "learning_rate": 0.0007761349297773315, "epoch": 0.63, "percentage": 31.39, "elapsed_time": "2:16:35", "remaining_time": "4:58:29"} +{"current_steps": 3390, "total_steps": 10798, "loss": 2.0421, "reward": null, "learning_rate": 0.0007761349297773315, "epoch": 0.63, "percentage": 31.39, "elapsed_time": "2:16:37", "remaining_time": "4:58:32"} +{"current_steps": 3390, "total_steps": 10798, "loss": 2.0421, "reward": null, "learning_rate": 0.0007761349297773315, "epoch": 0.63, "percentage": 31.39, "elapsed_time": "2:22:40", "remaining_time": "5:11:46"} +{"current_steps": 3390, "total_steps": 10798, "loss": 2.0421, "reward": null, "learning_rate": 0.0007761349297773315, "epoch": 0.63, "percentage": 31.39, "elapsed_time": "2:16:38", "remaining_time": "4:58:36"} +{"current_steps": 3400, "total_steps": 10798, "loss": 1.9795, "reward": null, "learning_rate": 0.0007749210210266457, "epoch": 0.63, "percentage": 31.49, "elapsed_time": "2:23:04", "remaining_time": "5:11:19"} +{"current_steps": 3400, "total_steps": 10798, "loss": 1.9795, "reward": null, "learning_rate": 0.0007749210210266457, "epoch": 0.63, "percentage": 31.49, "elapsed_time": "2:17:00", "remaining_time": "4:58:05"} +{"current_steps": 3400, "total_steps": 10798, "loss": 1.9795, "reward": null, "learning_rate": 0.0007749210210266457, "epoch": 0.63, "percentage": 31.49, "elapsed_time": "2:17:03", "remaining_time": "4:58:13"} +{"current_steps": 3400, "total_steps": 10798, "loss": 1.9795, "reward": null, "learning_rate": 0.0007749210210266457, "epoch": 0.63, "percentage": 31.49, "elapsed_time": "2:17:01", "remaining_time": "4:58:09"} +{"current_steps": 3410, "total_steps": 10798, "loss": 2.0006, "reward": null, "learning_rate": 0.0007737047851454451, "epoch": 0.63, "percentage": 31.58, "elapsed_time": "2:23:29", "remaining_time": "5:10:52"} +{"current_steps": 3410, "total_steps": 10798, "loss": 2.0006, "reward": null, "learning_rate": 0.0007737047851454451, "epoch": 0.63, "percentage": 31.58, "elapsed_time": "2:17:24", "remaining_time": "4:57:42"} +{"current_steps": 3410, "total_steps": 10798, "loss": 2.0006, "reward": null, "learning_rate": 0.0007737047851454451, "epoch": 0.63, "percentage": 31.58, "elapsed_time": "2:17:27", "remaining_time": "4:57:49"} +{"current_steps": 3410, "total_steps": 10798, "loss": 2.0006, "reward": null, "learning_rate": 0.0007737047851454451, "epoch": 0.63, "percentage": 31.58, "elapsed_time": "2:17:26", "remaining_time": "4:57:45"} +{"current_steps": 3420, "total_steps": 10798, "loss": 2.011, "reward": null, "learning_rate": 0.0007724862324288309, "epoch": 0.63, "percentage": 31.67, "elapsed_time": "2:17:53", "remaining_time": "4:57:27"} +{"current_steps": 3420, "total_steps": 10798, "loss": 2.011, "reward": null, "learning_rate": 0.0007724862324288309, "epoch": 0.63, "percentage": 31.67, "elapsed_time": "2:17:51", "remaining_time": "4:57:23"} +{"current_steps": 3420, "total_steps": 10798, "loss": 2.011, "reward": null, "learning_rate": 0.0007724862324288309, "epoch": 0.63, "percentage": 31.67, "elapsed_time": "2:17:49", "remaining_time": "4:57:20"} +{"current_steps": 3420, "total_steps": 10798, "loss": 2.011, "reward": null, "learning_rate": 0.0007724862324288309, "epoch": 0.63, "percentage": 31.67, "elapsed_time": "2:23:54", "remaining_time": "5:10:27"} +{"current_steps": 3430, "total_steps": 10798, "loss": 1.9969, "reward": null, "learning_rate": 0.0007712653731915147, "epoch": 0.64, "percentage": 31.77, "elapsed_time": "2:24:19", "remaining_time": "5:10:00"} +{"current_steps": 3430, "total_steps": 10798, "loss": 1.9969, "reward": null, "learning_rate": 0.0007712653731915147, "epoch": 0.64, "percentage": 31.77, "elapsed_time": "2:18:17", "remaining_time": "4:57:03"} +{"current_steps": 3430, "total_steps": 10798, "loss": 1.9969, "reward": null, "learning_rate": 0.0007712653731915147, "epoch": 0.64, "percentage": 31.77, "elapsed_time": "2:18:15", "remaining_time": "4:57:00"} +{"current_steps": 3430, "total_steps": 10798, "loss": 1.9969, "reward": null, "learning_rate": 0.0007712653731915147, "epoch": 0.64, "percentage": 31.77, "elapsed_time": "2:18:14", "remaining_time": "4:56:56"} +{"current_steps": 3440, "total_steps": 10798, "loss": 1.9581, "reward": null, "learning_rate": 0.0007700422177677331, "epoch": 0.64, "percentage": 31.86, "elapsed_time": "2:24:43", "remaining_time": "5:09:33"} +{"current_steps": 3440, "total_steps": 10798, "loss": 1.9581, "reward": null, "learning_rate": 0.0007700422177677331, "epoch": 0.64, "percentage": 31.86, "elapsed_time": "2:18:40", "remaining_time": "4:56:36"} +{"current_steps": 3440, "total_steps": 10798, "loss": 1.9581, "reward": null, "learning_rate": 0.0007700422177677331, "epoch": 0.64, "percentage": 31.86, "elapsed_time": "2:18:42", "remaining_time": "4:56:40"} +{"current_steps": 3440, "total_steps": 10798, "loss": 1.9581, "reward": null, "learning_rate": 0.0007700422177677331, "epoch": 0.64, "percentage": 31.86, "elapsed_time": "2:18:38", "remaining_time": "4:56:33"} +{"current_steps": 3450, "total_steps": 10798, "loss": 1.9858, "reward": null, "learning_rate": 0.0007688167765111592, "epoch": 0.64, "percentage": 31.95, "elapsed_time": "2:19:02", "remaining_time": "4:56:07"} +{"current_steps": 3450, "total_steps": 10798, "loss": 1.9858, "reward": null, "learning_rate": 0.0007688167765111592, "epoch": 0.64, "percentage": 31.95, "elapsed_time": "2:25:06", "remaining_time": "5:09:04"} +{"current_steps": 3450, "total_steps": 10798, "loss": 1.9858, "reward": null, "learning_rate": 0.0007688167765111592, "epoch": 0.64, "percentage": 31.95, "elapsed_time": "2:19:05", "remaining_time": "4:56:14"} +{"current_steps": 3450, "total_steps": 10798, "loss": 1.9858, "reward": null, "learning_rate": 0.0007688167765111592, "epoch": 0.64, "percentage": 31.95, "elapsed_time": "2:19:03", "remaining_time": "4:56:10"} +{"current_steps": 3460, "total_steps": 10798, "loss": 1.9945, "reward": null, "learning_rate": 0.0007675890597948141, "epoch": 0.64, "percentage": 32.04, "elapsed_time": "2:25:30", "remaining_time": "5:08:36"} +{"current_steps": 3460, "total_steps": 10798, "loss": 1.9945, "reward": null, "learning_rate": 0.0007675890597948141, "epoch": 0.64, "percentage": 32.04, "elapsed_time": "2:19:29", "remaining_time": "4:55:50"} +{"current_steps": 3460, "total_steps": 10798, "loss": 1.9945, "reward": null, "learning_rate": 0.0007675890597948141, "epoch": 0.64, "percentage": 32.04, "elapsed_time": "2:19:27", "remaining_time": "4:55:46"} +{"current_steps": 3460, "total_steps": 10798, "loss": 1.9945, "reward": null, "learning_rate": 0.0007675890597948141, "epoch": 0.64, "percentage": 32.04, "elapsed_time": "2:19:26", "remaining_time": "4:55:42"} +{"current_steps": 3470, "total_steps": 10798, "loss": 2.0116, "reward": null, "learning_rate": 0.0007663590780109814, "epoch": 0.64, "percentage": 32.14, "elapsed_time": "2:19:50", "remaining_time": "4:55:18"} +{"current_steps": 3470, "total_steps": 10798, "loss": 2.0116, "reward": null, "learning_rate": 0.0007663590780109814, "epoch": 0.64, "percentage": 32.14, "elapsed_time": "2:19:53", "remaining_time": "4:55:25"} +{"current_steps": 3470, "total_steps": 10798, "loss": 2.0116, "reward": null, "learning_rate": 0.0007663590780109814, "epoch": 0.64, "percentage": 32.14, "elapsed_time": "2:25:55", "remaining_time": "5:08:09"} +{"current_steps": 3470, "total_steps": 10798, "loss": 2.0116, "reward": null, "learning_rate": 0.0007663590780109814, "epoch": 0.64, "percentage": 32.14, "elapsed_time": "2:19:51", "remaining_time": "4:55:22"} +{"current_steps": 3480, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.0007651268415711168, "epoch": 0.64, "percentage": 32.23, "elapsed_time": "2:26:20", "remaining_time": "5:07:44"} +{"current_steps": 3480, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.0007651268415711168, "epoch": 0.64, "percentage": 32.23, "elapsed_time": "2:20:19", "remaining_time": "4:55:04"} +{"current_steps": 3480, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.0007651268415711168, "epoch": 0.64, "percentage": 32.23, "elapsed_time": "2:20:15", "remaining_time": "4:54:57"} +{"current_steps": 3480, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.0007651268415711168, "epoch": 0.64, "percentage": 32.23, "elapsed_time": "2:20:17", "remaining_time": "4:55:00"} +{"current_steps": 3490, "total_steps": 10798, "loss": 2.0113, "reward": null, "learning_rate": 0.0007638923609057616, "epoch": 0.65, "percentage": 32.32, "elapsed_time": "2:20:39", "remaining_time": "4:54:32"} +{"current_steps": 3490, "total_steps": 10798, "loss": 2.0113, "reward": null, "learning_rate": 0.0007638923609057616, "epoch": 0.65, "percentage": 32.32, "elapsed_time": "2:20:41", "remaining_time": "4:54:36"} +{"current_steps": 3490, "total_steps": 10798, "loss": 2.0113, "reward": null, "learning_rate": 0.0007638923609057616, "epoch": 0.65, "percentage": 32.32, "elapsed_time": "2:26:44", "remaining_time": "5:07:16"} +{"current_steps": 3490, "total_steps": 10798, "loss": 2.0113, "reward": null, "learning_rate": 0.0007638923609057616, "epoch": 0.65, "percentage": 32.32, "elapsed_time": "2:20:43", "remaining_time": "4:54:39"} +{"current_steps": 3500, "total_steps": 10798, "loss": 1.9927, "reward": null, "learning_rate": 0.0007626556464644538, "epoch": 0.65, "percentage": 32.41, "elapsed_time": "2:21:06", "remaining_time": "4:54:14"} +{"current_steps": 3500, "total_steps": 10798, "loss": 1.9927, "reward": null, "learning_rate": 0.0007626556464644538, "epoch": 0.65, "percentage": 32.41, "elapsed_time": "2:21:04", "remaining_time": "4:54:10"} +{"current_steps": 3500, "total_steps": 10798, "loss": 1.9927, "reward": null, "learning_rate": 0.0007626556464644538, "epoch": 0.65, "percentage": 32.41, "elapsed_time": "2:27:08", "remaining_time": "5:06:47"} +{"current_steps": 3500, "total_steps": 10798, "loss": 1.9927, "reward": null, "learning_rate": 0.0007626556464644538, "epoch": 0.65, "percentage": 32.41, "elapsed_time": "2:21:03", "remaining_time": "4:54:07"} +{"current_steps": 3510, "total_steps": 10798, "loss": 2.0209, "reward": null, "learning_rate": 0.0007614167087156393, "epoch": 0.65, "percentage": 32.51, "elapsed_time": "2:21:27", "remaining_time": "4:53:43"} +{"current_steps": 3510, "total_steps": 10798, "loss": 2.0209, "reward": null, "learning_rate": 0.0007614167087156393, "epoch": 0.65, "percentage": 32.51, "elapsed_time": "2:21:26", "remaining_time": "4:53:40"} +{"current_steps": 3510, "total_steps": 10798, "loss": 2.0209, "reward": null, "learning_rate": 0.0007614167087156393, "epoch": 0.65, "percentage": 32.51, "elapsed_time": "2:21:29", "remaining_time": "4:53:47"} +{"current_steps": 3510, "total_steps": 10798, "loss": 2.0209, "reward": null, "learning_rate": 0.0007614167087156393, "epoch": 0.65, "percentage": 32.51, "elapsed_time": "2:27:31", "remaining_time": "5:06:18"} +{"current_steps": 3520, "total_steps": 10798, "loss": 1.9941, "reward": null, "learning_rate": 0.0007601755581465844, "epoch": 0.65, "percentage": 32.6, "elapsed_time": "2:21:51", "remaining_time": "4:53:18"} +{"current_steps": 3520, "total_steps": 10798, "loss": 1.9941, "reward": null, "learning_rate": 0.0007601755581465844, "epoch": 0.65, "percentage": 32.6, "elapsed_time": "2:21:53", "remaining_time": "4:53:21"} +{"current_steps": 3520, "total_steps": 10798, "loss": 1.9941, "reward": null, "learning_rate": 0.0007601755581465844, "epoch": 0.65, "percentage": 32.6, "elapsed_time": "2:21:49", "remaining_time": "4:53:14"} +{"current_steps": 3520, "total_steps": 10798, "loss": 1.9941, "reward": null, "learning_rate": 0.0007601755581465844, "epoch": 0.65, "percentage": 32.6, "elapsed_time": "2:27:54", "remaining_time": "5:05:49"} +{"current_steps": 3530, "total_steps": 10798, "loss": 2.0443, "reward": null, "learning_rate": 0.0007589322052632855, "epoch": 0.65, "percentage": 32.69, "elapsed_time": "2:22:15", "remaining_time": "4:52:53"} +{"current_steps": 3530, "total_steps": 10798, "loss": 2.0443, "reward": null, "learning_rate": 0.0007589322052632855, "epoch": 0.65, "percentage": 32.69, "elapsed_time": "2:22:13", "remaining_time": "4:52:49"} +{"current_steps": 3530, "total_steps": 10798, "loss": 2.0443, "reward": null, "learning_rate": 0.0007589322052632855, "epoch": 0.65, "percentage": 32.69, "elapsed_time": "2:28:18", "remaining_time": "5:05:20"} +{"current_steps": 3530, "total_steps": 10798, "loss": 2.0443, "reward": null, "learning_rate": 0.0007589322052632855, "epoch": 0.65, "percentage": 32.69, "elapsed_time": "2:22:16", "remaining_time": "4:52:56"} +{"current_steps": 3540, "total_steps": 10798, "loss": 1.975, "reward": null, "learning_rate": 0.0007576866605903812, "epoch": 0.66, "percentage": 32.78, "elapsed_time": "2:22:38", "remaining_time": "4:52:26"} +{"current_steps": 3540, "total_steps": 10798, "loss": 1.975, "reward": null, "learning_rate": 0.0007576866605903812, "epoch": 0.66, "percentage": 32.78, "elapsed_time": "2:22:39", "remaining_time": "4:52:29"} +{"current_steps": 3540, "total_steps": 10798, "loss": 1.975, "reward": null, "learning_rate": 0.0007576866605903812, "epoch": 0.66, "percentage": 32.78, "elapsed_time": "2:22:41", "remaining_time": "4:52:33"} +{"current_steps": 3540, "total_steps": 10798, "loss": 1.975, "reward": null, "learning_rate": 0.0007576866605903812, "epoch": 0.66, "percentage": 32.78, "elapsed_time": "2:28:42", "remaining_time": "5:04:54"} +{"current_steps": 3550, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0007564389346710638, "epoch": 0.66, "percentage": 32.88, "elapsed_time": "2:23:04", "remaining_time": "4:52:07"} +{"current_steps": 3550, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0007564389346710638, "epoch": 0.66, "percentage": 32.88, "elapsed_time": "2:29:07", "remaining_time": "5:04:28"} +{"current_steps": 3550, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0007564389346710638, "epoch": 0.66, "percentage": 32.88, "elapsed_time": "2:23:02", "remaining_time": "4:52:03"} +{"current_steps": 3550, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0007564389346710638, "epoch": 0.66, "percentage": 32.88, "elapsed_time": "2:23:06", "remaining_time": "4:52:10"} +{"current_steps": 3560, "total_steps": 10798, "loss": 2.0034, "reward": null, "learning_rate": 0.0007551890380669879, "epoch": 0.66, "percentage": 32.97, "elapsed_time": "2:23:30", "remaining_time": "4:51:46"} +{"current_steps": 3560, "total_steps": 10798, "loss": 2.0034, "reward": null, "learning_rate": 0.0007551890380669879, "epoch": 0.66, "percentage": 32.97, "elapsed_time": "2:23:27", "remaining_time": "4:51:39"} +{"current_steps": 3560, "total_steps": 10798, "loss": 2.0034, "reward": null, "learning_rate": 0.0007551890380669879, "epoch": 0.66, "percentage": 32.97, "elapsed_time": "2:29:31", "remaining_time": "5:04:01"} +{"current_steps": 3560, "total_steps": 10798, "loss": 2.0034, "reward": null, "learning_rate": 0.0007551890380669879, "epoch": 0.66, "percentage": 32.97, "elapsed_time": "2:23:28", "remaining_time": "4:51:42"} +{"current_steps": 3570, "total_steps": 10798, "loss": 1.953, "reward": null, "learning_rate": 0.0007539369813581836, "epoch": 0.66, "percentage": 33.06, "elapsed_time": "2:29:56", "remaining_time": "5:03:35"} +{"current_steps": 3570, "total_steps": 10798, "loss": 1.953, "reward": null, "learning_rate": 0.0007539369813581836, "epoch": 0.66, "percentage": 33.06, "elapsed_time": "2:23:55", "remaining_time": "4:51:23"} +{"current_steps": 3570, "total_steps": 10798, "loss": 1.953, "reward": null, "learning_rate": 0.0007539369813581836, "epoch": 0.66, "percentage": 33.06, "elapsed_time": "2:23:53", "remaining_time": "4:51:19"} +{"current_steps": 3570, "total_steps": 10798, "loss": 1.953, "reward": null, "learning_rate": 0.0007539369813581836, "epoch": 0.66, "percentage": 33.06, "elapsed_time": "2:23:51", "remaining_time": "4:51:16"} +{"current_steps": 3580, "total_steps": 10798, "loss": 2.0162, "reward": null, "learning_rate": 0.000752682775142965, "epoch": 0.66, "percentage": 33.15, "elapsed_time": "2:30:21", "remaining_time": "5:03:10"} +{"current_steps": 3580, "total_steps": 10798, "loss": 2.0162, "reward": null, "learning_rate": 0.000752682775142965, "epoch": 0.66, "percentage": 33.15, "elapsed_time": "2:24:18", "remaining_time": "4:50:57"} +{"current_steps": 3580, "total_steps": 10798, "loss": 2.0162, "reward": null, "learning_rate": 0.000752682775142965, "epoch": 0.66, "percentage": 33.15, "elapsed_time": "2:24:17", "remaining_time": "4:50:54"} +{"current_steps": 3580, "total_steps": 10798, "loss": 2.0162, "reward": null, "learning_rate": 0.000752682775142965, "epoch": 0.66, "percentage": 33.15, "elapsed_time": "2:24:20", "remaining_time": "4:51:01"} +{"current_steps": 3590, "total_steps": 10798, "loss": 2.0096, "reward": null, "learning_rate": 0.0007514264300378411, "epoch": 0.66, "percentage": 33.25, "elapsed_time": "2:24:40", "remaining_time": "4:50:28"} +{"current_steps": 3590, "total_steps": 10798, "loss": 2.0096, "reward": null, "learning_rate": 0.0007514264300378411, "epoch": 0.66, "percentage": 33.25, "elapsed_time": "2:24:43", "remaining_time": "4:50:35"} +{"current_steps": 3590, "total_steps": 10798, "loss": 2.0096, "reward": null, "learning_rate": 0.0007514264300378411, "epoch": 0.66, "percentage": 33.25, "elapsed_time": "2:30:45", "remaining_time": "5:02:41"} +{"current_steps": 3590, "total_steps": 10798, "loss": 2.0096, "reward": null, "learning_rate": 0.0007514264300378411, "epoch": 0.66, "percentage": 33.25, "elapsed_time": "2:24:42", "remaining_time": "4:50:32"} +{"current_steps": 3600, "total_steps": 10798, "loss": 2.0431, "reward": null, "learning_rate": 0.0007501679566774267, "epoch": 0.67, "percentage": 33.34, "elapsed_time": "2:25:08", "remaining_time": "4:50:11"} +{"current_steps": 3600, "total_steps": 10798, "loss": 2.0431, "reward": null, "learning_rate": 0.0007501679566774267, "epoch": 0.67, "percentage": 33.34, "elapsed_time": "2:25:05", "remaining_time": "4:50:05"} +{"current_steps": 3600, "total_steps": 10798, "loss": 2.0431, "reward": null, "learning_rate": 0.0007501679566774267, "epoch": 0.67, "percentage": 33.34, "elapsed_time": "2:31:09", "remaining_time": "5:02:14"} +{"current_steps": 3600, "total_steps": 10798, "loss": 2.0431, "reward": null, "learning_rate": 0.0007501679566774267, "epoch": 0.67, "percentage": 33.34, "elapsed_time": "2:25:06", "remaining_time": "4:50:08"} +{"current_steps": 3610, "total_steps": 10798, "loss": 1.961, "reward": null, "learning_rate": 0.0007489073657143506, "epoch": 0.67, "percentage": 33.43, "elapsed_time": "2:31:33", "remaining_time": "5:01:46"} +{"current_steps": 3610, "total_steps": 10798, "loss": 1.961, "reward": null, "learning_rate": 0.0007489073657143506, "epoch": 0.67, "percentage": 33.43, "elapsed_time": "2:25:28", "remaining_time": "4:49:40"} +{"current_steps": 3610, "total_steps": 10798, "loss": 1.961, "reward": null, "learning_rate": 0.0007489073657143506, "epoch": 0.67, "percentage": 33.43, "elapsed_time": "2:25:30", "remaining_time": "4:49:43"} +{"current_steps": 3610, "total_steps": 10798, "loss": 1.961, "reward": null, "learning_rate": 0.0007489073657143506, "epoch": 0.67, "percentage": 33.43, "elapsed_time": "2:25:32", "remaining_time": "4:49:47"} +{"current_steps": 3620, "total_steps": 10798, "loss": 2.0179, "reward": null, "learning_rate": 0.0007476446678191676, "epoch": 0.67, "percentage": 33.52, "elapsed_time": "2:25:54", "remaining_time": "4:49:18"} +{"current_steps": 3620, "total_steps": 10798, "loss": 2.0179, "reward": null, "learning_rate": 0.0007476446678191676, "epoch": 0.67, "percentage": 33.52, "elapsed_time": "2:25:55", "remaining_time": "4:49:21"} +{"current_steps": 3620, "total_steps": 10798, "loss": 2.0179, "reward": null, "learning_rate": 0.0007476446678191676, "epoch": 0.67, "percentage": 33.52, "elapsed_time": "2:31:58", "remaining_time": "5:01:21"} +{"current_steps": 3620, "total_steps": 10798, "loss": 2.0179, "reward": null, "learning_rate": 0.0007476446678191676, "epoch": 0.67, "percentage": 33.52, "elapsed_time": "2:25:57", "remaining_time": "4:49:25"} +{"current_steps": 3630, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.0007463798736802665, "epoch": 0.67, "percentage": 33.62, "elapsed_time": "2:26:19", "remaining_time": "4:48:56"} +{"current_steps": 3630, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.0007463798736802665, "epoch": 0.67, "percentage": 33.62, "elapsed_time": "2:26:17", "remaining_time": "4:48:53"} +{"current_steps": 3630, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.0007463798736802665, "epoch": 0.67, "percentage": 33.62, "elapsed_time": "2:32:22", "remaining_time": "5:00:53"} +{"current_steps": 3630, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.0007463798736802665, "epoch": 0.67, "percentage": 33.62, "elapsed_time": "2:26:21", "remaining_time": "4:48:59"} +{"current_steps": 3640, "total_steps": 10798, "loss": 1.9955, "reward": null, "learning_rate": 0.0007451129940037804, "epoch": 0.67, "percentage": 33.71, "elapsed_time": "2:32:46", "remaining_time": "5:00:25"} +{"current_steps": 3640, "total_steps": 10798, "loss": 1.9955, "reward": null, "learning_rate": 0.0007451129940037804, "epoch": 0.67, "percentage": 33.71, "elapsed_time": "2:26:41", "remaining_time": "4:48:28"} +{"current_steps": 3640, "total_steps": 10798, "loss": 1.9955, "reward": null, "learning_rate": 0.0007451129940037804, "epoch": 0.67, "percentage": 33.71, "elapsed_time": "2:26:43", "remaining_time": "4:48:31"} +{"current_steps": 3640, "total_steps": 10798, "loss": 1.9955, "reward": null, "learning_rate": 0.0007451129940037804, "epoch": 0.67, "percentage": 33.71, "elapsed_time": "2:26:44", "remaining_time": "4:48:34"} +{"current_steps": 3650, "total_steps": 10798, "loss": 1.9671, "reward": null, "learning_rate": 0.000743844039513496, "epoch": 0.68, "percentage": 33.8, "elapsed_time": "2:27:05", "remaining_time": "4:48:04"} +{"current_steps": 3650, "total_steps": 10798, "loss": 1.9671, "reward": null, "learning_rate": 0.000743844039513496, "epoch": 0.68, "percentage": 33.8, "elapsed_time": "2:27:09", "remaining_time": "4:48:10"} +{"current_steps": 3650, "total_steps": 10798, "loss": 1.9671, "reward": null, "learning_rate": 0.000743844039513496, "epoch": 0.68, "percentage": 33.8, "elapsed_time": "2:27:07", "remaining_time": "4:48:07"} +{"current_steps": 3650, "total_steps": 10798, "loss": 1.9671, "reward": null, "learning_rate": 0.000743844039513496, "epoch": 0.68, "percentage": 33.8, "elapsed_time": "2:33:10", "remaining_time": "4:59:58"} +{"current_steps": 3660, "total_steps": 10798, "loss": 1.9866, "reward": null, "learning_rate": 0.0007425730209507622, "epoch": 0.68, "percentage": 33.9, "elapsed_time": "2:27:31", "remaining_time": "4:47:43"} +{"current_steps": 3660, "total_steps": 10798, "loss": 1.9866, "reward": null, "learning_rate": 0.0007425730209507622, "epoch": 0.68, "percentage": 33.9, "elapsed_time": "2:27:30", "remaining_time": "4:47:40"} +{"current_steps": 3660, "total_steps": 10798, "loss": 1.9866, "reward": null, "learning_rate": 0.0007425730209507622, "epoch": 0.68, "percentage": 33.9, "elapsed_time": "2:27:33", "remaining_time": "4:47:46"} +{"current_steps": 3660, "total_steps": 10798, "loss": 1.9866, "reward": null, "learning_rate": 0.0007425730209507622, "epoch": 0.68, "percentage": 33.9, "elapsed_time": "2:33:34", "remaining_time": "4:59:31"} +{"current_steps": 3670, "total_steps": 10798, "loss": 1.9508, "reward": null, "learning_rate": 0.0007412999490744008, "epoch": 0.68, "percentage": 33.99, "elapsed_time": "2:27:56", "remaining_time": "4:47:20"} +{"current_steps": 3670, "total_steps": 10798, "loss": 1.9508, "reward": null, "learning_rate": 0.0007412999490744008, "epoch": 0.68, "percentage": 33.99, "elapsed_time": "2:27:54", "remaining_time": "4:47:17"} +{"current_steps": 3670, "total_steps": 10798, "loss": 1.9508, "reward": null, "learning_rate": 0.0007412999490744008, "epoch": 0.68, "percentage": 33.99, "elapsed_time": "2:27:58", "remaining_time": "4:47:23"} +{"current_steps": 3670, "total_steps": 10798, "loss": 1.9508, "reward": null, "learning_rate": 0.0007412999490744008, "epoch": 0.68, "percentage": 33.99, "elapsed_time": "2:33:59", "remaining_time": "4:59:05"} +{"current_steps": 3680, "total_steps": 10798, "loss": 2.0261, "reward": null, "learning_rate": 0.0007400248346606129, "epoch": 0.68, "percentage": 34.08, "elapsed_time": "2:34:23", "remaining_time": "4:58:38"} +{"current_steps": 3680, "total_steps": 10798, "loss": 2.0261, "reward": null, "learning_rate": 0.0007400248346606129, "epoch": 0.68, "percentage": 34.08, "elapsed_time": "2:28:20", "remaining_time": "4:46:55"} +{"current_steps": 3680, "total_steps": 10798, "loss": 2.0261, "reward": null, "learning_rate": 0.0007400248346606129, "epoch": 0.68, "percentage": 34.08, "elapsed_time": "2:28:22", "remaining_time": "4:46:59"} +{"current_steps": 3680, "total_steps": 10798, "loss": 2.0261, "reward": null, "learning_rate": 0.0007400248346606129, "epoch": 0.68, "percentage": 34.08, "elapsed_time": "2:28:18", "remaining_time": "4:46:52"} +{"current_steps": 3690, "total_steps": 10798, "loss": 1.9946, "reward": null, "learning_rate": 0.0007387476885028902, "epoch": 0.68, "percentage": 34.17, "elapsed_time": "2:34:47", "remaining_time": "4:58:09"} +{"current_steps": 3690, "total_steps": 10798, "loss": 1.9946, "reward": null, "learning_rate": 0.0007387476885028902, "epoch": 0.68, "percentage": 34.17, "elapsed_time": "2:28:42", "remaining_time": "4:46:27"} +{"current_steps": 3690, "total_steps": 10798, "loss": 1.9946, "reward": null, "learning_rate": 0.0007387476885028902, "epoch": 0.68, "percentage": 34.17, "elapsed_time": "2:28:44", "remaining_time": "4:46:30"} +{"current_steps": 3690, "total_steps": 10798, "loss": 1.9946, "reward": null, "learning_rate": 0.0007387476885028902, "epoch": 0.68, "percentage": 34.17, "elapsed_time": "2:28:45", "remaining_time": "4:46:33"} +{"current_steps": 3700, "total_steps": 10798, "loss": 1.969, "reward": null, "learning_rate": 0.0007374685214119221, "epoch": 0.69, "percentage": 34.27, "elapsed_time": "2:29:05", "remaining_time": "4:46:01"} +{"current_steps": 3700, "total_steps": 10798, "loss": 1.969, "reward": null, "learning_rate": 0.0007374685214119221, "epoch": 0.69, "percentage": 34.27, "elapsed_time": "2:35:10", "remaining_time": "4:57:41"} +{"current_steps": 3700, "total_steps": 10798, "loss": 1.969, "reward": null, "learning_rate": 0.0007374685214119221, "epoch": 0.69, "percentage": 34.27, "elapsed_time": "2:29:07", "remaining_time": "4:46:04"} +{"current_steps": 3700, "total_steps": 10798, "loss": 1.969, "reward": null, "learning_rate": 0.0007374685214119221, "epoch": 0.69, "percentage": 34.27, "elapsed_time": "2:29:09", "remaining_time": "4:46:08"} +{"current_steps": 3710, "total_steps": 10798, "loss": 1.9802, "reward": null, "learning_rate": 0.0007361873442155049, "epoch": 0.69, "percentage": 34.36, "elapsed_time": "2:35:35", "remaining_time": "4:57:16"} +{"current_steps": 3710, "total_steps": 10798, "loss": 1.9802, "reward": null, "learning_rate": 0.0007361873442155049, "epoch": 0.69, "percentage": 34.36, "elapsed_time": "2:29:32", "remaining_time": "4:45:42"} +{"current_steps": 3710, "total_steps": 10798, "loss": 1.9802, "reward": null, "learning_rate": 0.0007361873442155049, "epoch": 0.69, "percentage": 34.36, "elapsed_time": "2:29:34", "remaining_time": "4:45:45"} +{"current_steps": 3710, "total_steps": 10798, "loss": 1.9802, "reward": null, "learning_rate": 0.0007361873442155049, "epoch": 0.69, "percentage": 34.36, "elapsed_time": "2:29:31", "remaining_time": "4:45:39"} +{"current_steps": 3720, "total_steps": 10798, "loss": 1.9739, "reward": null, "learning_rate": 0.0007349041677584496, "epoch": 0.69, "percentage": 34.45, "elapsed_time": "2:29:59", "remaining_time": "4:45:22"} +{"current_steps": 3720, "total_steps": 10798, "loss": 1.9739, "reward": null, "learning_rate": 0.0007349041677584496, "epoch": 0.69, "percentage": 34.45, "elapsed_time": "2:29:57", "remaining_time": "4:45:19"} +{"current_steps": 3720, "total_steps": 10798, "loss": 1.9739, "reward": null, "learning_rate": 0.0007349041677584496, "epoch": 0.69, "percentage": 34.45, "elapsed_time": "2:36:00", "remaining_time": "4:56:50"} +{"current_steps": 3720, "total_steps": 10798, "loss": 1.9739, "reward": null, "learning_rate": 0.0007349041677584496, "epoch": 0.69, "percentage": 34.45, "elapsed_time": "2:29:55", "remaining_time": "4:45:16"} +{"current_steps": 3730, "total_steps": 10798, "loss": 1.964, "reward": null, "learning_rate": 0.0007336190029024907, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "2:36:26", "remaining_time": "4:56:25"} +{"current_steps": 3730, "total_steps": 10798, "loss": 1.964, "reward": null, "learning_rate": 0.0007336190029024907, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "2:30:21", "remaining_time": "4:44:54"} +{"current_steps": 3730, "total_steps": 10798, "loss": 1.964, "reward": null, "learning_rate": 0.0007336190029024907, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "2:30:24", "remaining_time": "4:45:00"} +{"current_steps": 3730, "total_steps": 10798, "loss": 1.964, "reward": null, "learning_rate": 0.0007336190029024907, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "2:30:22", "remaining_time": "4:44:57"} +{"current_steps": 3740, "total_steps": 10798, "loss": 2.0009, "reward": null, "learning_rate": 0.0007323318605261933, "epoch": 0.69, "percentage": 34.64, "elapsed_time": "2:36:49", "remaining_time": "4:55:57"} +{"current_steps": 3740, "total_steps": 10798, "loss": 2.0009, "reward": null, "learning_rate": 0.0007323318605261933, "epoch": 0.69, "percentage": 34.64, "elapsed_time": "2:30:46", "remaining_time": "4:44:31"} +{"current_steps": 3740, "total_steps": 10798, "loss": 2.0009, "reward": null, "learning_rate": 0.0007323318605261933, "epoch": 0.69, "percentage": 34.64, "elapsed_time": "2:30:44", "remaining_time": "4:44:28"} +{"current_steps": 3740, "total_steps": 10798, "loss": 2.0009, "reward": null, "learning_rate": 0.0007323318605261933, "epoch": 0.69, "percentage": 34.64, "elapsed_time": "2:30:47", "remaining_time": "4:44:35"} +{"current_steps": 3750, "total_steps": 10798, "loss": 1.9825, "reward": null, "learning_rate": 0.0007310427515248626, "epoch": 0.69, "percentage": 34.73, "elapsed_time": "2:37:12", "remaining_time": "4:55:28"} +{"current_steps": 3750, "total_steps": 10798, "loss": 1.9825, "reward": null, "learning_rate": 0.0007310427515248626, "epoch": 0.69, "percentage": 34.73, "elapsed_time": "2:31:09", "remaining_time": "4:44:06"} +{"current_steps": 3750, "total_steps": 10798, "loss": 1.9825, "reward": null, "learning_rate": 0.0007310427515248626, "epoch": 0.69, "percentage": 34.73, "elapsed_time": "2:31:11", "remaining_time": "4:44:09"} +{"current_steps": 3750, "total_steps": 10798, "loss": 1.9825, "reward": null, "learning_rate": 0.0007310427515248626, "epoch": 0.69, "percentage": 34.73, "elapsed_time": "2:31:08", "remaining_time": "4:44:03"} +{"current_steps": 3760, "total_steps": 10798, "loss": 1.9744, "reward": null, "learning_rate": 0.0007297516868104501, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "2:31:34", "remaining_time": "4:43:44"} +{"current_steps": 3760, "total_steps": 10798, "loss": 1.9744, "reward": null, "learning_rate": 0.0007297516868104501, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "2:37:36", "remaining_time": "4:55:00"} +{"current_steps": 3760, "total_steps": 10798, "loss": 1.9744, "reward": null, "learning_rate": 0.0007297516868104501, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "2:31:31", "remaining_time": "4:43:37"} +{"current_steps": 3760, "total_steps": 10798, "loss": 1.9744, "reward": null, "learning_rate": 0.0007297516868104501, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "2:31:33", "remaining_time": "4:43:40"} +{"current_steps": 3770, "total_steps": 10798, "loss": 2.0197, "reward": null, "learning_rate": 0.000728458677311462, "epoch": 0.7, "percentage": 34.91, "elapsed_time": "2:31:58", "remaining_time": "4:43:19"} +{"current_steps": 3770, "total_steps": 10798, "loss": 2.0197, "reward": null, "learning_rate": 0.000728458677311462, "epoch": 0.7, "percentage": 34.91, "elapsed_time": "2:31:55", "remaining_time": "4:43:13"} +{"current_steps": 3770, "total_steps": 10798, "loss": 2.0197, "reward": null, "learning_rate": 0.000728458677311462, "epoch": 0.7, "percentage": 34.91, "elapsed_time": "2:38:00", "remaining_time": "4:54:33"} +{"current_steps": 3770, "total_steps": 10798, "loss": 2.0197, "reward": null, "learning_rate": 0.000728458677311462, "epoch": 0.7, "percentage": 34.91, "elapsed_time": "2:31:57", "remaining_time": "4:43:16"} +{"current_steps": 3780, "total_steps": 10798, "loss": 2.0016, "reward": null, "learning_rate": 0.0007271637339728667, "epoch": 0.7, "percentage": 35.01, "elapsed_time": "2:32:21", "remaining_time": "4:42:52"} +{"current_steps": 3780, "total_steps": 10798, "loss": 2.0016, "reward": null, "learning_rate": 0.0007271637339728667, "epoch": 0.7, "percentage": 35.01, "elapsed_time": "2:38:23", "remaining_time": "4:54:04"} +{"current_steps": 3780, "total_steps": 10798, "loss": 2.0016, "reward": null, "learning_rate": 0.0007271637339728667, "epoch": 0.7, "percentage": 35.01, "elapsed_time": "2:32:20", "remaining_time": "4:42:49"} +{"current_steps": 3780, "total_steps": 10798, "loss": 2.0016, "reward": null, "learning_rate": 0.0007271637339728667, "epoch": 0.7, "percentage": 35.01, "elapsed_time": "2:32:18", "remaining_time": "4:42:46"} +{"current_steps": 3790, "total_steps": 10798, "loss": 1.9721, "reward": null, "learning_rate": 0.0007258668677560019, "epoch": 0.7, "percentage": 35.1, "elapsed_time": "2:38:47", "remaining_time": "4:53:37"} +{"current_steps": 3790, "total_steps": 10798, "loss": 1.9721, "reward": null, "learning_rate": 0.0007258668677560019, "epoch": 0.7, "percentage": 35.1, "elapsed_time": "2:32:43", "remaining_time": "4:42:23"} +{"current_steps": 3790, "total_steps": 10798, "loss": 1.9721, "reward": null, "learning_rate": 0.0007258668677560019, "epoch": 0.7, "percentage": 35.1, "elapsed_time": "2:32:44", "remaining_time": "4:42:26"} +{"current_steps": 3790, "total_steps": 10798, "loss": 1.9721, "reward": null, "learning_rate": 0.0007258668677560019, "epoch": 0.7, "percentage": 35.1, "elapsed_time": "2:32:46", "remaining_time": "4:42:29"} +{"current_steps": 3800, "total_steps": 10798, "loss": 1.9591, "reward": null, "learning_rate": 0.0007245680896384818, "epoch": 0.7, "percentage": 35.19, "elapsed_time": "2:33:08", "remaining_time": "4:42:00"} +{"current_steps": 3800, "total_steps": 10798, "loss": 1.9591, "reward": null, "learning_rate": 0.0007245680896384818, "epoch": 0.7, "percentage": 35.19, "elapsed_time": "2:33:11", "remaining_time": "4:42:06"} +{"current_steps": 3800, "total_steps": 10798, "loss": 1.9591, "reward": null, "learning_rate": 0.0007245680896384818, "epoch": 0.7, "percentage": 35.19, "elapsed_time": "2:39:12", "remaining_time": "4:53:12"} +{"current_steps": 3800, "total_steps": 10798, "loss": 1.9591, "reward": null, "learning_rate": 0.0007245680896384818, "epoch": 0.7, "percentage": 35.19, "elapsed_time": "2:33:09", "remaining_time": "4:42:03"} +{"current_steps": 3810, "total_steps": 10798, "loss": 1.9762, "reward": null, "learning_rate": 0.0007232674106141048, "epoch": 0.71, "percentage": 35.28, "elapsed_time": "2:39:37", "remaining_time": "4:52:45"} +{"current_steps": 3810, "total_steps": 10798, "loss": 1.9762, "reward": null, "learning_rate": 0.0007232674106141048, "epoch": 0.71, "percentage": 35.28, "elapsed_time": "2:33:33", "remaining_time": "4:41:39"} +{"current_steps": 3810, "total_steps": 10798, "loss": 1.9762, "reward": null, "learning_rate": 0.0007232674106141048, "epoch": 0.71, "percentage": 35.28, "elapsed_time": "2:33:35", "remaining_time": "4:41:42"} +{"current_steps": 3810, "total_steps": 10798, "loss": 1.9762, "reward": null, "learning_rate": 0.0007232674106141048, "epoch": 0.71, "percentage": 35.28, "elapsed_time": "2:33:32", "remaining_time": "4:41:36"} +{"current_steps": 3820, "total_steps": 10798, "loss": 2.0026, "reward": null, "learning_rate": 0.0007219648416927592, "epoch": 0.71, "percentage": 35.38, "elapsed_time": "2:33:58", "remaining_time": "4:41:16"} +{"current_steps": 3820, "total_steps": 10798, "loss": 2.0026, "reward": null, "learning_rate": 0.0007219648416927592, "epoch": 0.71, "percentage": 35.38, "elapsed_time": "2:40:00", "remaining_time": "4:52:17"} +{"current_steps": 3820, "total_steps": 10798, "loss": 2.0026, "reward": null, "learning_rate": 0.0007219648416927592, "epoch": 0.71, "percentage": 35.38, "elapsed_time": "2:33:57", "remaining_time": "4:41:13"} +{"current_steps": 3820, "total_steps": 10798, "loss": 2.0026, "reward": null, "learning_rate": 0.0007219648416927592, "epoch": 0.71, "percentage": 35.38, "elapsed_time": "2:33:55", "remaining_time": "4:41:10"} +{"current_steps": 3830, "total_steps": 10798, "loss": 1.9876, "reward": null, "learning_rate": 0.0007206603939003314, "epoch": 0.71, "percentage": 35.47, "elapsed_time": "2:34:19", "remaining_time": "4:40:46"} +{"current_steps": 3830, "total_steps": 10798, "loss": 1.9876, "reward": null, "learning_rate": 0.0007206603939003314, "epoch": 0.71, "percentage": 35.47, "elapsed_time": "2:34:22", "remaining_time": "4:40:52"} +{"current_steps": 3830, "total_steps": 10798, "loss": 1.9876, "reward": null, "learning_rate": 0.0007206603939003314, "epoch": 0.71, "percentage": 35.47, "elapsed_time": "2:40:24", "remaining_time": "4:51:49"} +{"current_steps": 3830, "total_steps": 10798, "loss": 1.9876, "reward": null, "learning_rate": 0.0007206603939003314, "epoch": 0.71, "percentage": 35.47, "elapsed_time": "2:34:21", "remaining_time": "4:40:49"} +{"current_steps": 3840, "total_steps": 10798, "loss": 1.9991, "reward": null, "learning_rate": 0.0007193540782786117, "epoch": 0.71, "percentage": 35.56, "elapsed_time": "2:40:48", "remaining_time": "4:51:22"} +{"current_steps": 3840, "total_steps": 10798, "loss": 1.9991, "reward": null, "learning_rate": 0.0007193540782786117, "epoch": 0.71, "percentage": 35.56, "elapsed_time": "2:34:45", "remaining_time": "4:40:24"} +{"current_steps": 3840, "total_steps": 10798, "loss": 1.9991, "reward": null, "learning_rate": 0.0007193540782786117, "epoch": 0.71, "percentage": 35.56, "elapsed_time": "2:34:43", "remaining_time": "4:40:21"} +{"current_steps": 3840, "total_steps": 10798, "loss": 1.9991, "reward": null, "learning_rate": 0.0007193540782786117, "epoch": 0.71, "percentage": 35.56, "elapsed_time": "2:34:46", "remaining_time": "4:40:27"} +{"current_steps": 3850, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.0007180459058852011, "epoch": 0.71, "percentage": 35.65, "elapsed_time": "2:35:09", "remaining_time": "4:40:00"} +{"current_steps": 3850, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.0007180459058852011, "epoch": 0.71, "percentage": 35.65, "elapsed_time": "2:35:11", "remaining_time": "4:40:03"} +{"current_steps": 3850, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.0007180459058852011, "epoch": 0.71, "percentage": 35.65, "elapsed_time": "2:41:12", "remaining_time": "4:50:55"} +{"current_steps": 3850, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.0007180459058852011, "epoch": 0.71, "percentage": 35.65, "elapsed_time": "2:35:07", "remaining_time": "4:39:57"} +{"current_steps": 3860, "total_steps": 10798, "loss": 2.0581, "reward": null, "learning_rate": 0.0007167358877934176, "epoch": 0.71, "percentage": 35.75, "elapsed_time": "2:35:35", "remaining_time": "4:39:39"} +{"current_steps": 3860, "total_steps": 10798, "loss": 2.0581, "reward": null, "learning_rate": 0.0007167358877934176, "epoch": 0.71, "percentage": 35.75, "elapsed_time": "2:35:31", "remaining_time": "4:39:33"} +{"current_steps": 3860, "total_steps": 10798, "loss": 2.0581, "reward": null, "learning_rate": 0.0007167358877934176, "epoch": 0.71, "percentage": 35.75, "elapsed_time": "2:41:36", "remaining_time": "4:50:28"} +{"current_steps": 3860, "total_steps": 10798, "loss": 2.0581, "reward": null, "learning_rate": 0.0007167358877934176, "epoch": 0.71, "percentage": 35.75, "elapsed_time": "2:35:33", "remaining_time": "4:39:36"} +{"current_steps": 3870, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 0.0007154240350922025, "epoch": 0.72, "percentage": 35.84, "elapsed_time": "2:35:59", "remaining_time": "4:39:15"} +{"current_steps": 3870, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 0.0007154240350922025, "epoch": 0.72, "percentage": 35.84, "elapsed_time": "2:35:56", "remaining_time": "4:39:09"} +{"current_steps": 3870, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 0.0007154240350922025, "epoch": 0.72, "percentage": 35.84, "elapsed_time": "2:42:01", "remaining_time": "4:50:02"} +{"current_steps": 3870, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 0.0007154240350922025, "epoch": 0.72, "percentage": 35.84, "elapsed_time": "2:35:58", "remaining_time": "4:39:12"} +{"current_steps": 3880, "total_steps": 10798, "loss": 2.0151, "reward": null, "learning_rate": 0.0007141103588860265, "epoch": 0.72, "percentage": 35.93, "elapsed_time": "2:36:20", "remaining_time": "4:38:44"} +{"current_steps": 3880, "total_steps": 10798, "loss": 2.0151, "reward": null, "learning_rate": 0.0007141103588860265, "epoch": 0.72, "percentage": 35.93, "elapsed_time": "2:36:21", "remaining_time": "4:38:47"} +{"current_steps": 3880, "total_steps": 10798, "loss": 2.0151, "reward": null, "learning_rate": 0.0007141103588860265, "epoch": 0.72, "percentage": 35.93, "elapsed_time": "2:42:24", "remaining_time": "4:49:34"} +{"current_steps": 3880, "total_steps": 10798, "loss": 2.0151, "reward": null, "learning_rate": 0.0007141103588860265, "epoch": 0.72, "percentage": 35.93, "elapsed_time": "2:36:23", "remaining_time": "4:38:50"} +{"current_steps": 3890, "total_steps": 10798, "loss": 1.9494, "reward": null, "learning_rate": 0.000712794870294796, "epoch": 0.72, "percentage": 36.03, "elapsed_time": "2:36:45", "remaining_time": "4:38:23"} +{"current_steps": 3890, "total_steps": 10798, "loss": 1.9494, "reward": null, "learning_rate": 0.000712794870294796, "epoch": 0.72, "percentage": 36.03, "elapsed_time": "2:42:49", "remaining_time": "4:49:08"} +{"current_steps": 3890, "total_steps": 10798, "loss": 1.9494, "reward": null, "learning_rate": 0.000712794870294796, "epoch": 0.72, "percentage": 36.03, "elapsed_time": "2:36:47", "remaining_time": "4:38:26"} +{"current_steps": 3890, "total_steps": 10798, "loss": 1.9494, "reward": null, "learning_rate": 0.000712794870294796, "epoch": 0.72, "percentage": 36.03, "elapsed_time": "2:36:44", "remaining_time": "4:38:20"} +{"current_steps": 3900, "total_steps": 10798, "loss": 1.9936, "reward": null, "learning_rate": 0.0007114775804537586, "epoch": 0.72, "percentage": 36.12, "elapsed_time": "2:37:09", "remaining_time": "4:37:57"} +{"current_steps": 3900, "total_steps": 10798, "loss": 1.9936, "reward": null, "learning_rate": 0.0007114775804537586, "epoch": 0.72, "percentage": 36.12, "elapsed_time": "2:43:14", "remaining_time": "4:48:42"} +{"current_steps": 3900, "total_steps": 10798, "loss": 1.9936, "reward": null, "learning_rate": 0.0007114775804537586, "epoch": 0.72, "percentage": 36.12, "elapsed_time": "2:37:10", "remaining_time": "4:38:00"} +{"current_steps": 3900, "total_steps": 10798, "loss": 1.9936, "reward": null, "learning_rate": 0.0007114775804537586, "epoch": 0.72, "percentage": 36.12, "elapsed_time": "2:37:12", "remaining_time": "4:38:03"} +{"current_steps": 3910, "total_steps": 10798, "loss": 2.0016, "reward": null, "learning_rate": 0.0007101585005134088, "epoch": 0.72, "percentage": 36.21, "elapsed_time": "2:43:37", "remaining_time": "4:48:15"} +{"current_steps": 3910, "total_steps": 10798, "loss": 2.0016, "reward": null, "learning_rate": 0.0007101585005134088, "epoch": 0.72, "percentage": 36.21, "elapsed_time": "2:37:33", "remaining_time": "4:37:32"} +{"current_steps": 3910, "total_steps": 10798, "loss": 2.0016, "reward": null, "learning_rate": 0.0007101585005134088, "epoch": 0.72, "percentage": 36.21, "elapsed_time": "2:37:34", "remaining_time": "4:37:35"} +{"current_steps": 3910, "total_steps": 10798, "loss": 2.0016, "reward": null, "learning_rate": 0.0007101585005134088, "epoch": 0.72, "percentage": 36.21, "elapsed_time": "2:37:36", "remaining_time": "4:37:38"} +{"current_steps": 3920, "total_steps": 10798, "loss": 1.9628, "reward": null, "learning_rate": 0.0007088376416393944, "epoch": 0.73, "percentage": 36.3, "elapsed_time": "2:37:59", "remaining_time": "4:37:13"} +{"current_steps": 3920, "total_steps": 10798, "loss": 1.9628, "reward": null, "learning_rate": 0.0007088376416393944, "epoch": 0.73, "percentage": 36.3, "elapsed_time": "2:37:56", "remaining_time": "4:37:07"} +{"current_steps": 3920, "total_steps": 10798, "loss": 1.9628, "reward": null, "learning_rate": 0.0007088376416393944, "epoch": 0.73, "percentage": 36.3, "elapsed_time": "2:37:58", "remaining_time": "4:37:10"} +{"current_steps": 3920, "total_steps": 10798, "loss": 1.9628, "reward": null, "learning_rate": 0.0007088376416393944, "epoch": 0.73, "percentage": 36.3, "elapsed_time": "2:44:01", "remaining_time": "4:47:47"} +{"current_steps": 3930, "total_steps": 10798, "loss": 1.9955, "reward": null, "learning_rate": 0.0007075150150124208, "epoch": 0.73, "percentage": 36.4, "elapsed_time": "2:38:23", "remaining_time": "4:36:48"} +{"current_steps": 3930, "total_steps": 10798, "loss": 1.9955, "reward": null, "learning_rate": 0.0007075150150124208, "epoch": 0.73, "percentage": 36.4, "elapsed_time": "2:44:25", "remaining_time": "4:47:20"} +{"current_steps": 3930, "total_steps": 10798, "loss": 1.9955, "reward": null, "learning_rate": 0.0007075150150124208, "epoch": 0.73, "percentage": 36.4, "elapsed_time": "2:38:21", "remaining_time": "4:36:45"} +{"current_steps": 3930, "total_steps": 10798, "loss": 1.9955, "reward": null, "learning_rate": 0.0007075150150124208, "epoch": 0.73, "percentage": 36.4, "elapsed_time": "2:38:20", "remaining_time": "4:36:42"} +{"current_steps": 3940, "total_steps": 10798, "loss": 1.9731, "reward": null, "learning_rate": 0.0007061906318281568, "epoch": 0.73, "percentage": 36.49, "elapsed_time": "2:44:47", "remaining_time": "4:46:50"} +{"current_steps": 3940, "total_steps": 10798, "loss": 1.9731, "reward": null, "learning_rate": 0.0007061906318281568, "epoch": 0.73, "percentage": 36.49, "elapsed_time": "2:38:42", "remaining_time": "4:36:15"} +{"current_steps": 3940, "total_steps": 10798, "loss": 1.9731, "reward": null, "learning_rate": 0.0007061906318281568, "epoch": 0.73, "percentage": 36.49, "elapsed_time": "2:38:44", "remaining_time": "4:36:18"} +{"current_steps": 3940, "total_steps": 10798, "loss": 1.9731, "reward": null, "learning_rate": 0.0007061906318281568, "epoch": 0.73, "percentage": 36.49, "elapsed_time": "2:38:46", "remaining_time": "4:36:21"} +{"current_steps": 3950, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.0007048645032971407, "epoch": 0.73, "percentage": 36.58, "elapsed_time": "2:39:08", "remaining_time": "4:35:53"} +{"current_steps": 3950, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.0007048645032971407, "epoch": 0.73, "percentage": 36.58, "elapsed_time": "2:45:11", "remaining_time": "4:46:23"} +{"current_steps": 3950, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.0007048645032971407, "epoch": 0.73, "percentage": 36.58, "elapsed_time": "2:39:10", "remaining_time": "4:35:56"} +{"current_steps": 3950, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.0007048645032971407, "epoch": 0.73, "percentage": 36.58, "elapsed_time": "2:39:06", "remaining_time": "4:35:51"} +{"current_steps": 3960, "total_steps": 10798, "loss": 1.985, "reward": null, "learning_rate": 0.0007035366406446839, "epoch": 0.73, "percentage": 36.67, "elapsed_time": "2:39:31", "remaining_time": "4:35:27"} +{"current_steps": 3960, "total_steps": 10798, "loss": 1.985, "reward": null, "learning_rate": 0.0007035366406446839, "epoch": 0.73, "percentage": 36.67, "elapsed_time": "2:39:33", "remaining_time": "4:35:30"} +{"current_steps": 3960, "total_steps": 10798, "loss": 1.985, "reward": null, "learning_rate": 0.0007035366406446839, "epoch": 0.73, "percentage": 36.67, "elapsed_time": "2:45:36", "remaining_time": "4:45:57"} +{"current_steps": 3960, "total_steps": 10798, "loss": 1.985, "reward": null, "learning_rate": 0.0007035366406446839, "epoch": 0.73, "percentage": 36.67, "elapsed_time": "2:39:34", "remaining_time": "4:35:33"} +{"current_steps": 3970, "total_steps": 10798, "loss": 1.9961, "reward": null, "learning_rate": 0.0007022070551107774, "epoch": 0.74, "percentage": 36.77, "elapsed_time": "2:46:00", "remaining_time": "4:45:30"} +{"current_steps": 3970, "total_steps": 10798, "loss": 1.9961, "reward": null, "learning_rate": 0.0007022070551107774, "epoch": 0.74, "percentage": 36.77, "elapsed_time": "2:39:56", "remaining_time": "4:35:05"} +{"current_steps": 3970, "total_steps": 10798, "loss": 1.9961, "reward": null, "learning_rate": 0.0007022070551107774, "epoch": 0.74, "percentage": 36.77, "elapsed_time": "2:39:58", "remaining_time": "4:35:08"} +{"current_steps": 3970, "total_steps": 10798, "loss": 1.9961, "reward": null, "learning_rate": 0.0007022070551107774, "epoch": 0.74, "percentage": 36.77, "elapsed_time": "2:39:55", "remaining_time": "4:35:02"} +{"current_steps": 3980, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0007008757579499954, "epoch": 0.74, "percentage": 36.86, "elapsed_time": "2:40:23", "remaining_time": "4:34:44"} +{"current_steps": 3980, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0007008757579499954, "epoch": 0.74, "percentage": 36.86, "elapsed_time": "2:46:24", "remaining_time": "4:45:04"} +{"current_steps": 3980, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0007008757579499954, "epoch": 0.74, "percentage": 36.86, "elapsed_time": "2:40:21", "remaining_time": "4:34:41"} +{"current_steps": 3980, "total_steps": 10798, "loss": 2.0112, "reward": null, "learning_rate": 0.0007008757579499954, "epoch": 0.74, "percentage": 36.86, "elapsed_time": "2:40:19", "remaining_time": "4:34:39"} +{"current_steps": 3990, "total_steps": 10798, "loss": 2.0086, "reward": null, "learning_rate": 0.0006995427604314004, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "2:40:43", "remaining_time": "4:34:14"} +{"current_steps": 3990, "total_steps": 10798, "loss": 2.0086, "reward": null, "learning_rate": 0.0006995427604314004, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "2:40:47", "remaining_time": "4:34:20"} +{"current_steps": 3990, "total_steps": 10798, "loss": 2.0086, "reward": null, "learning_rate": 0.0006995427604314004, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "2:40:45", "remaining_time": "4:34:17"} +{"current_steps": 3990, "total_steps": 10798, "loss": 2.0086, "reward": null, "learning_rate": 0.0006995427604314004, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "2:46:48", "remaining_time": "4:44:37"} +{"current_steps": 4000, "total_steps": 10798, "loss": 2.019, "reward": null, "learning_rate": 0.0006982080738384487, "epoch": 0.74, "percentage": 37.04, "elapsed_time": "2:41:10", "remaining_time": "4:33:54"} +{"current_steps": 4000, "total_steps": 10798, "loss": 2.019, "reward": null, "learning_rate": 0.0006982080738384487, "epoch": 0.74, "percentage": 37.04, "elapsed_time": "2:47:13", "remaining_time": "4:44:11"} +{"current_steps": 4000, "total_steps": 10798, "loss": 2.019, "reward": null, "learning_rate": 0.0006982080738384487, "epoch": 0.74, "percentage": 37.04, "elapsed_time": "2:41:08", "remaining_time": "4:33:51"} +{"current_steps": 4000, "total_steps": 10798, "loss": 2.019, "reward": null, "learning_rate": 0.0006982080738384487, "epoch": 0.74, "percentage": 37.04, "elapsed_time": "2:41:12", "remaining_time": "4:33:57"} +{"current_steps": 4010, "total_steps": 10798, "loss": 1.9983, "reward": null, "learning_rate": 0.0006968717094688933, "epoch": 0.74, "percentage": 37.14, "elapsed_time": "2:41:33", "remaining_time": "4:33:28"} +{"current_steps": 4010, "total_steps": 10798, "loss": 1.9983, "reward": null, "learning_rate": 0.0006968717094688933, "epoch": 0.74, "percentage": 37.14, "elapsed_time": "2:47:38", "remaining_time": "4:43:46"} +{"current_steps": 4010, "total_steps": 10798, "loss": 1.9983, "reward": null, "learning_rate": 0.0006968717094688933, "epoch": 0.74, "percentage": 37.14, "elapsed_time": "2:41:36", "remaining_time": "4:33:34"} +{"current_steps": 4010, "total_steps": 10798, "loss": 1.9983, "reward": null, "learning_rate": 0.0006968717094688933, "epoch": 0.74, "percentage": 37.14, "elapsed_time": "2:41:35", "remaining_time": "4:33:31"} +{"current_steps": 4020, "total_steps": 10798, "loss": 1.981, "reward": null, "learning_rate": 0.0006955336786346898, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "2:48:03", "remaining_time": "4:43:21"} +{"current_steps": 4020, "total_steps": 10798, "loss": 1.981, "reward": null, "learning_rate": 0.0006955336786346898, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "2:42:01", "remaining_time": "4:33:11"} +{"current_steps": 4020, "total_steps": 10798, "loss": 1.981, "reward": null, "learning_rate": 0.0006955336786346898, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "2:42:00", "remaining_time": "4:33:08"} +{"current_steps": 4020, "total_steps": 10798, "loss": 1.981, "reward": null, "learning_rate": 0.0006955336786346898, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "2:41:58", "remaining_time": "4:33:06"} +{"current_steps": 4030, "total_steps": 10798, "loss": 1.9878, "reward": null, "learning_rate": 0.0006941939926618997, "epoch": 0.75, "percentage": 37.32, "elapsed_time": "2:42:25", "remaining_time": "4:32:46"} +{"current_steps": 4030, "total_steps": 10798, "loss": 1.9878, "reward": null, "learning_rate": 0.0006941939926618997, "epoch": 0.75, "percentage": 37.32, "elapsed_time": "2:42:23", "remaining_time": "4:32:43"} +{"current_steps": 4030, "total_steps": 10798, "loss": 1.9878, "reward": null, "learning_rate": 0.0006941939926618997, "epoch": 0.75, "percentage": 37.32, "elapsed_time": "2:42:22", "remaining_time": "4:32:41"} +{"current_steps": 4030, "total_steps": 10798, "loss": 1.9878, "reward": null, "learning_rate": 0.0006941939926618997, "epoch": 0.75, "percentage": 37.32, "elapsed_time": "2:48:26", "remaining_time": "4:42:53"} +{"current_steps": 4040, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0006928526628905942, "epoch": 0.75, "percentage": 37.41, "elapsed_time": "2:48:50", "remaining_time": "4:42:26"} +{"current_steps": 4040, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0006928526628905942, "epoch": 0.75, "percentage": 37.41, "elapsed_time": "2:42:46", "remaining_time": "4:32:16"} +{"current_steps": 4040, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0006928526628905942, "epoch": 0.75, "percentage": 37.41, "elapsed_time": "2:42:49", "remaining_time": "4:32:22"} +{"current_steps": 4040, "total_steps": 10798, "loss": 2.0067, "reward": null, "learning_rate": 0.0006928526628905942, "epoch": 0.75, "percentage": 37.41, "elapsed_time": "2:42:47", "remaining_time": "4:32:19"} +{"current_steps": 4050, "total_steps": 10798, "loss": 2.035, "reward": null, "learning_rate": 0.0006915097006747601, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "2:43:10", "remaining_time": "4:31:51"} +{"current_steps": 4050, "total_steps": 10798, "loss": 2.035, "reward": null, "learning_rate": 0.0006915097006747601, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "2:43:11", "remaining_time": "4:31:54"} +{"current_steps": 4050, "total_steps": 10798, "loss": 2.035, "reward": null, "learning_rate": 0.0006915097006747601, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "2:49:14", "remaining_time": "4:41:59"} +{"current_steps": 4050, "total_steps": 10798, "loss": 2.035, "reward": null, "learning_rate": 0.0006915097006747601, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "2:43:13", "remaining_time": "4:31:57"} +{"current_steps": 4060, "total_steps": 10798, "loss": 1.9614, "reward": null, "learning_rate": 0.0006901651173822013, "epoch": 0.75, "percentage": 37.6, "elapsed_time": "2:43:37", "remaining_time": "4:31:33"} +{"current_steps": 4060, "total_steps": 10798, "loss": 1.9614, "reward": null, "learning_rate": 0.0006901651173822013, "epoch": 0.75, "percentage": 37.6, "elapsed_time": "2:49:39", "remaining_time": "4:41:33"} +{"current_steps": 4060, "total_steps": 10798, "loss": 1.9614, "reward": null, "learning_rate": 0.0006901651173822013, "epoch": 0.75, "percentage": 37.6, "elapsed_time": "2:43:34", "remaining_time": "4:31:28"} +{"current_steps": 4060, "total_steps": 10798, "loss": 1.9614, "reward": null, "learning_rate": 0.0006901651173822013, "epoch": 0.75, "percentage": 37.6, "elapsed_time": "2:43:36", "remaining_time": "4:31:30"} +{"current_steps": 4070, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0006888189243944439, "epoch": 0.75, "percentage": 37.69, "elapsed_time": "2:43:58", "remaining_time": "4:31:04"} +{"current_steps": 4070, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0006888189243944439, "epoch": 0.75, "percentage": 37.69, "elapsed_time": "2:44:02", "remaining_time": "4:31:09"} +{"current_steps": 4070, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0006888189243944439, "epoch": 0.75, "percentage": 37.69, "elapsed_time": "2:44:00", "remaining_time": "4:31:06"} +{"current_steps": 4070, "total_steps": 10798, "loss": 1.9655, "reward": null, "learning_rate": 0.0006888189243944439, "epoch": 0.75, "percentage": 37.69, "elapsed_time": "2:50:03", "remaining_time": "4:41:07"} +{"current_steps": 4080, "total_steps": 10798, "loss": 1.9692, "reward": null, "learning_rate": 0.0006874711331066401, "epoch": 0.76, "percentage": 37.78, "elapsed_time": "2:44:27", "remaining_time": "4:30:47"} +{"current_steps": 4080, "total_steps": 10798, "loss": 1.9692, "reward": null, "learning_rate": 0.0006874711331066401, "epoch": 0.76, "percentage": 37.78, "elapsed_time": "2:44:25", "remaining_time": "4:30:44"} +{"current_steps": 4080, "total_steps": 10798, "loss": 1.9692, "reward": null, "learning_rate": 0.0006874711331066401, "epoch": 0.76, "percentage": 37.78, "elapsed_time": "2:50:28", "remaining_time": "4:40:42"} +{"current_steps": 4080, "total_steps": 10798, "loss": 1.9692, "reward": null, "learning_rate": 0.0006874711331066401, "epoch": 0.76, "percentage": 37.78, "elapsed_time": "2:44:23", "remaining_time": "4:30:41"} +{"current_steps": 4090, "total_steps": 10798, "loss": 1.9791, "reward": null, "learning_rate": 0.0006861217549274705, "epoch": 0.76, "percentage": 37.88, "elapsed_time": "2:50:53", "remaining_time": "4:40:16"} +{"current_steps": 4090, "total_steps": 10798, "loss": 1.9791, "reward": null, "learning_rate": 0.0006861217549274705, "epoch": 0.76, "percentage": 37.88, "elapsed_time": "2:44:48", "remaining_time": "4:30:17"} +{"current_steps": 4090, "total_steps": 10798, "loss": 1.9791, "reward": null, "learning_rate": 0.0006861217549274705, "epoch": 0.76, "percentage": 37.88, "elapsed_time": "2:44:49", "remaining_time": "4:30:20"} +{"current_steps": 4090, "total_steps": 10798, "loss": 1.9791, "reward": null, "learning_rate": 0.0006861217549274705, "epoch": 0.76, "percentage": 37.88, "elapsed_time": "2:44:51", "remaining_time": "4:30:23"} +{"current_steps": 4100, "total_steps": 10798, "loss": 1.9804, "reward": null, "learning_rate": 0.0006847708012790492, "epoch": 0.76, "percentage": 37.97, "elapsed_time": "2:45:13", "remaining_time": "4:29:55"} +{"current_steps": 4100, "total_steps": 10798, "loss": 1.9804, "reward": null, "learning_rate": 0.0006847708012790492, "epoch": 0.76, "percentage": 37.97, "elapsed_time": "2:51:18", "remaining_time": "4:39:51"} +{"current_steps": 4100, "total_steps": 10798, "loss": 1.9804, "reward": null, "learning_rate": 0.0006847708012790492, "epoch": 0.76, "percentage": 37.97, "elapsed_time": "2:45:16", "remaining_time": "4:30:00"} +{"current_steps": 4100, "total_steps": 10798, "loss": 1.9804, "reward": null, "learning_rate": 0.0006847708012790492, "epoch": 0.76, "percentage": 37.97, "elapsed_time": "2:45:15", "remaining_time": "4:29:57"} +{"current_steps": 4110, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0006834182835968253, "epoch": 0.76, "percentage": 38.06, "elapsed_time": "2:51:42", "remaining_time": "4:39:24"} +{"current_steps": 4110, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0006834182835968253, "epoch": 0.76, "percentage": 38.06, "elapsed_time": "2:45:37", "remaining_time": "4:29:30"} +{"current_steps": 4110, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0006834182835968253, "epoch": 0.76, "percentage": 38.06, "elapsed_time": "2:45:39", "remaining_time": "4:29:33"} +{"current_steps": 4110, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0006834182835968253, "epoch": 0.76, "percentage": 38.06, "elapsed_time": "2:45:40", "remaining_time": "4:29:36"} +{"current_steps": 4120, "total_steps": 10798, "loss": 2.0153, "reward": null, "learning_rate": 0.0006820642133294876, "epoch": 0.76, "percentage": 38.16, "elapsed_time": "2:46:01", "remaining_time": "4:29:06"} +{"current_steps": 4120, "total_steps": 10798, "loss": 2.0153, "reward": null, "learning_rate": 0.0006820642133294876, "epoch": 0.76, "percentage": 38.16, "elapsed_time": "2:46:04", "remaining_time": "4:29:11"} +{"current_steps": 4120, "total_steps": 10798, "loss": 2.0153, "reward": null, "learning_rate": 0.0006820642133294876, "epoch": 0.76, "percentage": 38.16, "elapsed_time": "2:46:03", "remaining_time": "4:29:08"} +{"current_steps": 4120, "total_steps": 10798, "loss": 2.0153, "reward": null, "learning_rate": 0.0006820642133294876, "epoch": 0.76, "percentage": 38.16, "elapsed_time": "2:52:06", "remaining_time": "4:38:57"} +{"current_steps": 4130, "total_steps": 10798, "loss": 1.9639, "reward": null, "learning_rate": 0.0006807086019388669, "epoch": 0.76, "percentage": 38.25, "elapsed_time": "2:46:27", "remaining_time": "4:28:44"} +{"current_steps": 4130, "total_steps": 10798, "loss": 1.9639, "reward": null, "learning_rate": 0.0006807086019388669, "epoch": 0.76, "percentage": 38.25, "elapsed_time": "2:52:30", "remaining_time": "4:38:30"} +{"current_steps": 4130, "total_steps": 10798, "loss": 1.9639, "reward": null, "learning_rate": 0.0006807086019388669, "epoch": 0.76, "percentage": 38.25, "elapsed_time": "2:46:25", "remaining_time": "4:28:41"} +{"current_steps": 4130, "total_steps": 10798, "loss": 1.9639, "reward": null, "learning_rate": 0.0006807086019388669, "epoch": 0.76, "percentage": 38.25, "elapsed_time": "2:46:28", "remaining_time": "4:28:47"} +{"current_steps": 4140, "total_steps": 10798, "loss": 2.0162, "reward": null, "learning_rate": 0.0006793514608998393, "epoch": 0.77, "percentage": 38.34, "elapsed_time": "2:52:54", "remaining_time": "4:38:04"} +{"current_steps": 4140, "total_steps": 10798, "loss": 2.0162, "reward": null, "learning_rate": 0.0006793514608998393, "epoch": 0.77, "percentage": 38.34, "elapsed_time": "2:46:51", "remaining_time": "4:28:20"} +{"current_steps": 4140, "total_steps": 10798, "loss": 2.0162, "reward": null, "learning_rate": 0.0006793514608998393, "epoch": 0.77, "percentage": 38.34, "elapsed_time": "2:46:53", "remaining_time": "4:28:23"} +{"current_steps": 4140, "total_steps": 10798, "loss": 2.0162, "reward": null, "learning_rate": 0.0006793514608998393, "epoch": 0.77, "percentage": 38.34, "elapsed_time": "2:46:49", "remaining_time": "4:28:18"} +{"current_steps": 4150, "total_steps": 10798, "loss": 1.994, "reward": null, "learning_rate": 0.000677992801700229, "epoch": 0.77, "percentage": 38.43, "elapsed_time": "2:47:13", "remaining_time": "4:27:52"} +{"current_steps": 4150, "total_steps": 10798, "loss": 1.994, "reward": null, "learning_rate": 0.000677992801700229, "epoch": 0.77, "percentage": 38.43, "elapsed_time": "2:47:14", "remaining_time": "4:27:54"} +{"current_steps": 4150, "total_steps": 10798, "loss": 1.994, "reward": null, "learning_rate": 0.000677992801700229, "epoch": 0.77, "percentage": 38.43, "elapsed_time": "2:47:16", "remaining_time": "4:27:57"} +{"current_steps": 4150, "total_steps": 10798, "loss": 1.994, "reward": null, "learning_rate": 0.000677992801700229, "epoch": 0.77, "percentage": 38.43, "elapsed_time": "2:53:17", "remaining_time": "4:37:36"} +{"current_steps": 4160, "total_steps": 10798, "loss": 1.9992, "reward": null, "learning_rate": 0.0006766326358407104, "epoch": 0.77, "percentage": 38.53, "elapsed_time": "2:47:36", "remaining_time": "4:27:26"} +{"current_steps": 4160, "total_steps": 10798, "loss": 1.9992, "reward": null, "learning_rate": 0.0006766326358407104, "epoch": 0.77, "percentage": 38.53, "elapsed_time": "2:53:41", "remaining_time": "4:37:08"} +{"current_steps": 4160, "total_steps": 10798, "loss": 1.9992, "reward": null, "learning_rate": 0.0006766326358407104, "epoch": 0.77, "percentage": 38.53, "elapsed_time": "2:47:38", "remaining_time": "4:27:29"} +{"current_steps": 4160, "total_steps": 10798, "loss": 1.9992, "reward": null, "learning_rate": 0.0006766326358407104, "epoch": 0.77, "percentage": 38.53, "elapsed_time": "2:47:39", "remaining_time": "4:27:32"} +{"current_steps": 4170, "total_steps": 10798, "loss": 1.976, "reward": null, "learning_rate": 0.0006752709748347125, "epoch": 0.77, "percentage": 38.62, "elapsed_time": "2:54:04", "remaining_time": "4:36:41"} +{"current_steps": 4170, "total_steps": 10798, "loss": 1.976, "reward": null, "learning_rate": 0.0006752709748347125, "epoch": 0.77, "percentage": 38.62, "elapsed_time": "2:47:59", "remaining_time": "4:27:01"} +{"current_steps": 4170, "total_steps": 10798, "loss": 1.976, "reward": null, "learning_rate": 0.0006752709748347125, "epoch": 0.77, "percentage": 38.62, "elapsed_time": "2:48:01", "remaining_time": "4:27:04"} +{"current_steps": 4170, "total_steps": 10798, "loss": 1.976, "reward": null, "learning_rate": 0.0006752709748347125, "epoch": 0.77, "percentage": 38.62, "elapsed_time": "2:48:03", "remaining_time": "4:27:06"} +{"current_steps": 4180, "total_steps": 10798, "loss": 1.9452, "reward": null, "learning_rate": 0.000673907830208319, "epoch": 0.77, "percentage": 38.71, "elapsed_time": "2:54:29", "remaining_time": "4:36:15"} +{"current_steps": 4180, "total_steps": 10798, "loss": 1.9452, "reward": null, "learning_rate": 0.000673907830208319, "epoch": 0.77, "percentage": 38.71, "elapsed_time": "2:48:24", "remaining_time": "4:26:37"} +{"current_steps": 4180, "total_steps": 10798, "loss": 1.9452, "reward": null, "learning_rate": 0.000673907830208319, "epoch": 0.77, "percentage": 38.71, "elapsed_time": "2:48:25", "remaining_time": "4:26:40"} +{"current_steps": 4180, "total_steps": 10798, "loss": 1.9452, "reward": null, "learning_rate": 0.000673907830208319, "epoch": 0.77, "percentage": 38.71, "elapsed_time": "2:48:27", "remaining_time": "4:26:43"} +{"current_steps": 4190, "total_steps": 10798, "loss": 1.9982, "reward": null, "learning_rate": 0.0006725432135001732, "epoch": 0.78, "percentage": 38.8, "elapsed_time": "2:54:53", "remaining_time": "4:35:48"} +{"current_steps": 4190, "total_steps": 10798, "loss": 1.9982, "reward": null, "learning_rate": 0.0006725432135001732, "epoch": 0.78, "percentage": 38.8, "elapsed_time": "2:48:48", "remaining_time": "4:26:13"} +{"current_steps": 4190, "total_steps": 10798, "loss": 1.9982, "reward": null, "learning_rate": 0.0006725432135001732, "epoch": 0.78, "percentage": 38.8, "elapsed_time": "2:48:50", "remaining_time": "4:26:15"} +{"current_steps": 4190, "total_steps": 10798, "loss": 1.9982, "reward": null, "learning_rate": 0.0006725432135001732, "epoch": 0.78, "percentage": 38.8, "elapsed_time": "2:48:51", "remaining_time": "4:26:18"} +{"current_steps": 4200, "total_steps": 10798, "loss": 1.9766, "reward": null, "learning_rate": 0.0006711771362613785, "epoch": 0.78, "percentage": 38.9, "elapsed_time": "2:49:13", "remaining_time": "4:25:50"} +{"current_steps": 4200, "total_steps": 10798, "loss": 1.9766, "reward": null, "learning_rate": 0.0006711771362613785, "epoch": 0.78, "percentage": 38.9, "elapsed_time": "2:49:12", "remaining_time": "4:25:48"} +{"current_steps": 4200, "total_steps": 10798, "loss": 1.9766, "reward": null, "learning_rate": 0.0006711771362613785, "epoch": 0.78, "percentage": 38.9, "elapsed_time": "2:55:16", "remaining_time": "4:35:21"} +{"current_steps": 4200, "total_steps": 10798, "loss": 1.9766, "reward": null, "learning_rate": 0.0006711771362613785, "epoch": 0.78, "percentage": 38.9, "elapsed_time": "2:49:15", "remaining_time": "4:25:53"} +{"current_steps": 4210, "total_steps": 10798, "loss": 1.9838, "reward": null, "learning_rate": 0.0006698096100554014, "epoch": 0.78, "percentage": 38.99, "elapsed_time": "2:55:40", "remaining_time": "4:34:54"} +{"current_steps": 4210, "total_steps": 10798, "loss": 1.9838, "reward": null, "learning_rate": 0.0006698096100554014, "epoch": 0.78, "percentage": 38.99, "elapsed_time": "2:49:35", "remaining_time": "4:25:23"} +{"current_steps": 4210, "total_steps": 10798, "loss": 1.9838, "reward": null, "learning_rate": 0.0006698096100554014, "epoch": 0.78, "percentage": 38.99, "elapsed_time": "2:49:37", "remaining_time": "4:25:26"} +{"current_steps": 4210, "total_steps": 10798, "loss": 1.9838, "reward": null, "learning_rate": 0.0006698096100554014, "epoch": 0.78, "percentage": 38.99, "elapsed_time": "2:49:39", "remaining_time": "4:25:29"} +{"current_steps": 4220, "total_steps": 10798, "loss": 1.9746, "reward": null, "learning_rate": 0.0006684406464579735, "epoch": 0.78, "percentage": 39.08, "elapsed_time": "2:50:00", "remaining_time": "4:25:00"} +{"current_steps": 4220, "total_steps": 10798, "loss": 1.9746, "reward": null, "learning_rate": 0.0006684406464579735, "epoch": 0.78, "percentage": 39.08, "elapsed_time": "2:50:03", "remaining_time": "4:25:05"} +{"current_steps": 4220, "total_steps": 10798, "loss": 1.9746, "reward": null, "learning_rate": 0.0006684406464579735, "epoch": 0.78, "percentage": 39.08, "elapsed_time": "2:50:02", "remaining_time": "4:25:02"} +{"current_steps": 4220, "total_steps": 10798, "loss": 1.9746, "reward": null, "learning_rate": 0.0006684406464579735, "epoch": 0.78, "percentage": 39.08, "elapsed_time": "2:56:05", "remaining_time": "4:34:28"} +{"current_steps": 4230, "total_steps": 10798, "loss": 1.9838, "reward": null, "learning_rate": 0.0006670702570569937, "epoch": 0.78, "percentage": 39.17, "elapsed_time": "2:56:29", "remaining_time": "4:34:02"} +{"current_steps": 4230, "total_steps": 10798, "loss": 1.9838, "reward": null, "learning_rate": 0.0006670702570569937, "epoch": 0.78, "percentage": 39.17, "elapsed_time": "2:50:26", "remaining_time": "4:24:38"} +{"current_steps": 4230, "total_steps": 10798, "loss": 1.9838, "reward": null, "learning_rate": 0.0006670702570569937, "epoch": 0.78, "percentage": 39.17, "elapsed_time": "2:50:24", "remaining_time": "4:24:36"} +{"current_steps": 4230, "total_steps": 10798, "loss": 1.9838, "reward": null, "learning_rate": 0.0006670702570569937, "epoch": 0.78, "percentage": 39.17, "elapsed_time": "2:50:28", "remaining_time": "4:24:41"} +{"current_steps": 4240, "total_steps": 10798, "loss": 1.9747, "reward": null, "learning_rate": 0.0006656984534524296, "epoch": 0.79, "percentage": 39.27, "elapsed_time": "2:50:50", "remaining_time": "4:24:14"} +{"current_steps": 4240, "total_steps": 10798, "loss": 1.9747, "reward": null, "learning_rate": 0.0006656984534524296, "epoch": 0.79, "percentage": 39.27, "elapsed_time": "2:50:49", "remaining_time": "4:24:12"} +{"current_steps": 4240, "total_steps": 10798, "loss": 1.9747, "reward": null, "learning_rate": 0.0006656984534524296, "epoch": 0.79, "percentage": 39.27, "elapsed_time": "2:50:52", "remaining_time": "4:24:17"} +{"current_steps": 4240, "total_steps": 10798, "loss": 1.9747, "reward": null, "learning_rate": 0.0006656984534524296, "epoch": 0.79, "percentage": 39.27, "elapsed_time": "2:56:54", "remaining_time": "4:33:36"} +{"current_steps": 4250, "total_steps": 10798, "loss": 1.9896, "reward": null, "learning_rate": 0.0006643252472562201, "epoch": 0.79, "percentage": 39.36, "elapsed_time": "2:51:15", "remaining_time": "4:23:51"} +{"current_steps": 4250, "total_steps": 10798, "loss": 1.9896, "reward": null, "learning_rate": 0.0006643252472562201, "epoch": 0.79, "percentage": 39.36, "elapsed_time": "2:51:17", "remaining_time": "4:23:53"} +{"current_steps": 4250, "total_steps": 10798, "loss": 1.9896, "reward": null, "learning_rate": 0.0006643252472562201, "epoch": 0.79, "percentage": 39.36, "elapsed_time": "2:57:18", "remaining_time": "4:33:10"} +{"current_steps": 4250, "total_steps": 10798, "loss": 1.9896, "reward": null, "learning_rate": 0.0006643252472562201, "epoch": 0.79, "percentage": 39.36, "elapsed_time": "2:51:13", "remaining_time": "4:23:48"} +{"current_steps": 4260, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.000662950650092176, "epoch": 0.79, "percentage": 39.45, "elapsed_time": "2:51:37", "remaining_time": "4:23:24"} +{"current_steps": 4260, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.000662950650092176, "epoch": 0.79, "percentage": 39.45, "elapsed_time": "2:51:39", "remaining_time": "4:23:26"} +{"current_steps": 4260, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.000662950650092176, "epoch": 0.79, "percentage": 39.45, "elapsed_time": "2:51:41", "remaining_time": "4:23:29"} +{"current_steps": 4260, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.000662950650092176, "epoch": 0.79, "percentage": 39.45, "elapsed_time": "2:57:42", "remaining_time": "4:32:44"} +{"current_steps": 4270, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0006615746735958832, "epoch": 0.79, "percentage": 39.54, "elapsed_time": "2:58:07", "remaining_time": "4:32:19"} +{"current_steps": 4270, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0006615746735958832, "epoch": 0.79, "percentage": 39.54, "elapsed_time": "2:52:02", "remaining_time": "4:23:01"} +{"current_steps": 4270, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0006615746735958832, "epoch": 0.79, "percentage": 39.54, "elapsed_time": "2:52:04", "remaining_time": "4:23:04"} +{"current_steps": 4270, "total_steps": 10798, "loss": 2.0075, "reward": null, "learning_rate": 0.0006615746735958832, "epoch": 0.79, "percentage": 39.54, "elapsed_time": "2:52:06", "remaining_time": "4:23:06"} +{"current_steps": 4280, "total_steps": 10798, "loss": 1.9918, "reward": null, "learning_rate": 0.0006603351250463683, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "2:52:26", "remaining_time": "4:22:36"} +{"current_steps": 4280, "total_steps": 10798, "loss": 1.9918, "reward": null, "learning_rate": 0.0006603351250463683, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "2:52:27", "remaining_time": "4:22:38"} +{"current_steps": 4280, "total_steps": 10798, "loss": 1.9918, "reward": null, "learning_rate": 0.0006603351250463683, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "2:58:31", "remaining_time": "4:31:51"} +{"current_steps": 4280, "total_steps": 10798, "loss": 1.9918, "reward": null, "learning_rate": 0.0006603351250463683, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "2:52:29", "remaining_time": "4:22:41"} +{"current_steps": 4290, "total_steps": 10798, "loss": 1.9669, "reward": null, "learning_rate": 0.000658956559916577, "epoch": 0.79, "percentage": 39.73, "elapsed_time": "2:58:54", "remaining_time": "4:31:25"} +{"current_steps": 4290, "total_steps": 10798, "loss": 1.9669, "reward": null, "learning_rate": 0.000658956559916577, "epoch": 0.79, "percentage": 39.73, "elapsed_time": "2:52:51", "remaining_time": "4:22:14"} +{"current_steps": 4290, "total_steps": 10798, "loss": 1.9669, "reward": null, "learning_rate": 0.000658956559916577, "epoch": 0.79, "percentage": 39.73, "elapsed_time": "2:52:50", "remaining_time": "4:22:11"} +{"current_steps": 4290, "total_steps": 10798, "loss": 1.9669, "reward": null, "learning_rate": 0.000658956559916577, "epoch": 0.79, "percentage": 39.73, "elapsed_time": "2:52:53", "remaining_time": "4:22:16"} +{"current_steps": 4300, "total_steps": 10798, "loss": 1.9645, "reward": null, "learning_rate": 0.0006575766492634068, "epoch": 0.8, "percentage": 39.82, "elapsed_time": "2:59:18", "remaining_time": "4:30:58"} +{"current_steps": 4300, "total_steps": 10798, "loss": 1.9645, "reward": null, "learning_rate": 0.0006575766492634068, "epoch": 0.8, "percentage": 39.82, "elapsed_time": "2:53:15", "remaining_time": "4:21:49"} +{"current_steps": 4300, "total_steps": 10798, "loss": 1.9645, "reward": null, "learning_rate": 0.0006575766492634068, "epoch": 0.8, "percentage": 39.82, "elapsed_time": "2:53:17", "remaining_time": "4:21:51"} +{"current_steps": 4300, "total_steps": 10798, "loss": 1.9645, "reward": null, "learning_rate": 0.0006575766492634068, "epoch": 0.8, "percentage": 39.82, "elapsed_time": "2:53:13", "remaining_time": "4:21:46"} +{"current_steps": 4310, "total_steps": 10798, "loss": 1.9511, "reward": null, "learning_rate": 0.0006561954047674206, "epoch": 0.8, "percentage": 39.91, "elapsed_time": "2:53:37", "remaining_time": "4:21:22"} +{"current_steps": 4310, "total_steps": 10798, "loss": 1.9511, "reward": null, "learning_rate": 0.0006561954047674206, "epoch": 0.8, "percentage": 39.91, "elapsed_time": "2:53:39", "remaining_time": "4:21:24"} +{"current_steps": 4310, "total_steps": 10798, "loss": 1.9511, "reward": null, "learning_rate": 0.0006561954047674206, "epoch": 0.8, "percentage": 39.91, "elapsed_time": "2:59:42", "remaining_time": "4:30:31"} +{"current_steps": 4310, "total_steps": 10798, "loss": 1.9511, "reward": null, "learning_rate": 0.0006561954047674206, "epoch": 0.8, "percentage": 39.91, "elapsed_time": "2:53:41", "remaining_time": "4:21:27"} +{"current_steps": 4320, "total_steps": 10798, "loss": 1.9934, "reward": null, "learning_rate": 0.0006548128381204714, "epoch": 0.8, "percentage": 40.01, "elapsed_time": "2:54:03", "remaining_time": "4:21:00"} +{"current_steps": 4320, "total_steps": 10798, "loss": 1.9934, "reward": null, "learning_rate": 0.0006548128381204714, "epoch": 0.8, "percentage": 40.01, "elapsed_time": "3:00:06", "remaining_time": "4:30:05"} +{"current_steps": 4320, "total_steps": 10798, "loss": 1.9934, "reward": null, "learning_rate": 0.0006548128381204714, "epoch": 0.8, "percentage": 40.01, "elapsed_time": "2:54:05", "remaining_time": "4:21:03"} +{"current_steps": 4320, "total_steps": 10798, "loss": 1.9934, "reward": null, "learning_rate": 0.0006548128381204714, "epoch": 0.8, "percentage": 40.01, "elapsed_time": "2:54:01", "remaining_time": "4:20:57"} +{"current_steps": 4330, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0006534289610256039, "epoch": 0.8, "percentage": 40.1, "elapsed_time": "3:00:30", "remaining_time": "4:29:38"} +{"current_steps": 4330, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0006534289610256039, "epoch": 0.8, "percentage": 40.1, "elapsed_time": "2:54:26", "remaining_time": "4:20:33"} +{"current_steps": 4330, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0006534289610256039, "epoch": 0.8, "percentage": 40.1, "elapsed_time": "2:54:29", "remaining_time": "4:20:38"} +{"current_steps": 4330, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.0006534289610256039, "epoch": 0.8, "percentage": 40.1, "elapsed_time": "2:54:27", "remaining_time": "4:20:36"} +{"current_steps": 4340, "total_steps": 10798, "loss": 1.9983, "reward": null, "learning_rate": 0.0006520437851969557, "epoch": 0.8, "percentage": 40.19, "elapsed_time": "2:54:50", "remaining_time": "4:20:09"} +{"current_steps": 4340, "total_steps": 10798, "loss": 1.9983, "reward": null, "learning_rate": 0.0006520437851969557, "epoch": 0.8, "percentage": 40.19, "elapsed_time": "3:00:54", "remaining_time": "4:29:12"} +{"current_steps": 4340, "total_steps": 10798, "loss": 1.9983, "reward": null, "learning_rate": 0.0006520437851969557, "epoch": 0.8, "percentage": 40.19, "elapsed_time": "2:54:51", "remaining_time": "4:20:11"} +{"current_steps": 4340, "total_steps": 10798, "loss": 1.9983, "reward": null, "learning_rate": 0.0006520437851969557, "epoch": 0.8, "percentage": 40.19, "elapsed_time": "2:54:53", "remaining_time": "4:20:14"} +{"current_steps": 4350, "total_steps": 10798, "loss": 1.9906, "reward": null, "learning_rate": 0.0006506573223596575, "epoch": 0.81, "percentage": 40.29, "elapsed_time": "2:55:14", "remaining_time": "4:19:46"} +{"current_steps": 4350, "total_steps": 10798, "loss": 1.9906, "reward": null, "learning_rate": 0.0006506573223596575, "epoch": 0.81, "percentage": 40.29, "elapsed_time": "3:01:18", "remaining_time": "4:28:44"} +{"current_steps": 4350, "total_steps": 10798, "loss": 1.9906, "reward": null, "learning_rate": 0.0006506573223596575, "epoch": 0.81, "percentage": 40.29, "elapsed_time": "2:55:13", "remaining_time": "4:19:43"} +{"current_steps": 4350, "total_steps": 10798, "loss": 1.9906, "reward": null, "learning_rate": 0.0006506573223596575, "epoch": 0.81, "percentage": 40.29, "elapsed_time": "2:55:16", "remaining_time": "4:19:48"} +{"current_steps": 4360, "total_steps": 10798, "loss": 1.9392, "reward": null, "learning_rate": 0.0006492695842497347, "epoch": 0.81, "percentage": 40.38, "elapsed_time": "3:01:42", "remaining_time": "4:28:18"} +{"current_steps": 4360, "total_steps": 10798, "loss": 1.9392, "reward": null, "learning_rate": 0.0006492695842497347, "epoch": 0.81, "percentage": 40.38, "elapsed_time": "2:55:39", "remaining_time": "4:19:21"} +{"current_steps": 4360, "total_steps": 10798, "loss": 1.9392, "reward": null, "learning_rate": 0.0006492695842497347, "epoch": 0.81, "percentage": 40.38, "elapsed_time": "2:55:40", "remaining_time": "4:19:24"} +{"current_steps": 4360, "total_steps": 10798, "loss": 1.9392, "reward": null, "learning_rate": 0.0006492695842497347, "epoch": 0.81, "percentage": 40.38, "elapsed_time": "2:55:37", "remaining_time": "4:19:19"} +{"current_steps": 4370, "total_steps": 10798, "loss": 2.0015, "reward": null, "learning_rate": 0.0006478805826140066, "epoch": 0.81, "percentage": 40.47, "elapsed_time": "3:02:05", "remaining_time": "4:27:50"} +{"current_steps": 4370, "total_steps": 10798, "loss": 2.0015, "reward": null, "learning_rate": 0.0006478805826140066, "epoch": 0.81, "percentage": 40.47, "elapsed_time": "2:56:00", "remaining_time": "4:18:54"} +{"current_steps": 4370, "total_steps": 10798, "loss": 2.0015, "reward": null, "learning_rate": 0.0006478805826140066, "epoch": 0.81, "percentage": 40.47, "elapsed_time": "2:56:04", "remaining_time": "4:18:59"} +{"current_steps": 4370, "total_steps": 10798, "loss": 2.0015, "reward": null, "learning_rate": 0.0006478805826140066, "epoch": 0.81, "percentage": 40.47, "elapsed_time": "2:56:02", "remaining_time": "4:18:56"} +{"current_steps": 4380, "total_steps": 10798, "loss": 2.0168, "reward": null, "learning_rate": 0.0006464903292099886, "epoch": 0.81, "percentage": 40.56, "elapsed_time": "2:56:24", "remaining_time": "4:18:29"} +{"current_steps": 4380, "total_steps": 10798, "loss": 2.0168, "reward": null, "learning_rate": 0.0006464903292099886, "epoch": 0.81, "percentage": 40.56, "elapsed_time": "2:56:26", "remaining_time": "4:18:32"} +{"current_steps": 4380, "total_steps": 10798, "loss": 2.0168, "reward": null, "learning_rate": 0.0006464903292099886, "epoch": 0.81, "percentage": 40.56, "elapsed_time": "3:02:29", "remaining_time": "4:27:24"} +{"current_steps": 4380, "total_steps": 10798, "loss": 2.0168, "reward": null, "learning_rate": 0.0006464903292099886, "epoch": 0.81, "percentage": 40.56, "elapsed_time": "2:56:28", "remaining_time": "4:18:34"} +{"current_steps": 4390, "total_steps": 10798, "loss": 1.9676, "reward": null, "learning_rate": 0.0006450988358057919, "epoch": 0.81, "percentage": 40.66, "elapsed_time": "2:56:49", "remaining_time": "4:18:06"} +{"current_steps": 4390, "total_steps": 10798, "loss": 1.9676, "reward": null, "learning_rate": 0.0006450988358057919, "epoch": 0.81, "percentage": 40.66, "elapsed_time": "3:02:54", "remaining_time": "4:26:58"} +{"current_steps": 4390, "total_steps": 10798, "loss": 1.9676, "reward": null, "learning_rate": 0.0006450988358057919, "epoch": 0.81, "percentage": 40.66, "elapsed_time": "2:56:50", "remaining_time": "4:18:08"} +{"current_steps": 4390, "total_steps": 10798, "loss": 1.9676, "reward": null, "learning_rate": 0.0006450988358057919, "epoch": 0.81, "percentage": 40.66, "elapsed_time": "2:56:52", "remaining_time": "4:18:11"} +{"current_steps": 4400, "total_steps": 10798, "loss": 1.9798, "reward": null, "learning_rate": 0.0006437061141800238, "epoch": 0.81, "percentage": 40.75, "elapsed_time": "2:57:16", "remaining_time": "4:17:46"} +{"current_steps": 4400, "total_steps": 10798, "loss": 1.9798, "reward": null, "learning_rate": 0.0006437061141800238, "epoch": 0.81, "percentage": 40.75, "elapsed_time": "3:03:18", "remaining_time": "4:26:32"} +{"current_steps": 4400, "total_steps": 10798, "loss": 1.9798, "reward": null, "learning_rate": 0.0006437061141800238, "epoch": 0.81, "percentage": 40.75, "elapsed_time": "2:57:15", "remaining_time": "4:17:44"} +{"current_steps": 4400, "total_steps": 10798, "loss": 1.9798, "reward": null, "learning_rate": 0.0006437061141800238, "epoch": 0.81, "percentage": 40.75, "elapsed_time": "2:57:13", "remaining_time": "4:17:42"} +{"current_steps": 4410, "total_steps": 10798, "loss": 1.9753, "reward": null, "learning_rate": 0.0006423121761216881, "epoch": 0.82, "percentage": 40.84, "elapsed_time": "3:03:43", "remaining_time": "4:26:08"} +{"current_steps": 4410, "total_steps": 10798, "loss": 1.9753, "reward": null, "learning_rate": 0.0006423121761216881, "epoch": 0.82, "percentage": 40.84, "elapsed_time": "2:57:42", "remaining_time": "4:17:24"} +{"current_steps": 4410, "total_steps": 10798, "loss": 1.9753, "reward": null, "learning_rate": 0.0006423121761216881, "epoch": 0.82, "percentage": 40.84, "elapsed_time": "2:57:40", "remaining_time": "4:17:22"} +{"current_steps": 4410, "total_steps": 10798, "loss": 1.9753, "reward": null, "learning_rate": 0.0006423121761216881, "epoch": 0.82, "percentage": 40.84, "elapsed_time": "2:57:38", "remaining_time": "4:17:19"} +{"current_steps": 4420, "total_steps": 10798, "loss": 1.9965, "reward": null, "learning_rate": 0.0006409170334300858, "epoch": 0.82, "percentage": 40.93, "elapsed_time": "3:04:07", "remaining_time": "4:25:40"} +{"current_steps": 4420, "total_steps": 10798, "loss": 1.9965, "reward": null, "learning_rate": 0.0006409170334300858, "epoch": 0.82, "percentage": 40.93, "elapsed_time": "2:58:03", "remaining_time": "4:16:56"} +{"current_steps": 4420, "total_steps": 10798, "loss": 1.9965, "reward": null, "learning_rate": 0.0006409170334300858, "epoch": 0.82, "percentage": 40.93, "elapsed_time": "2:58:02", "remaining_time": "4:16:54"} +{"current_steps": 4420, "total_steps": 10798, "loss": 1.9965, "reward": null, "learning_rate": 0.0006409170334300858, "epoch": 0.82, "percentage": 40.93, "elapsed_time": "2:58:05", "remaining_time": "4:16:59"} +{"current_steps": 4430, "total_steps": 10798, "loss": 1.9532, "reward": null, "learning_rate": 0.0006395206979147141, "epoch": 0.82, "percentage": 41.03, "elapsed_time": "2:58:25", "remaining_time": "4:16:29"} +{"current_steps": 4430, "total_steps": 10798, "loss": 1.9532, "reward": null, "learning_rate": 0.0006395206979147141, "epoch": 0.82, "percentage": 41.03, "elapsed_time": "3:04:30", "remaining_time": "4:25:13"} +{"current_steps": 4430, "total_steps": 10798, "loss": 1.9532, "reward": null, "learning_rate": 0.0006395206979147141, "epoch": 0.82, "percentage": 41.03, "elapsed_time": "2:58:29", "remaining_time": "4:16:34"} +{"current_steps": 4430, "total_steps": 10798, "loss": 1.9532, "reward": null, "learning_rate": 0.0006395206979147141, "epoch": 0.82, "percentage": 41.03, "elapsed_time": "2:58:27", "remaining_time": "4:16:31"} +{"current_steps": 4440, "total_steps": 10798, "loss": 1.9962, "reward": null, "learning_rate": 0.0006381231813951678, "epoch": 0.82, "percentage": 41.12, "elapsed_time": "2:58:51", "remaining_time": "4:16:07"} +{"current_steps": 4440, "total_steps": 10798, "loss": 1.9962, "reward": null, "learning_rate": 0.0006381231813951678, "epoch": 0.82, "percentage": 41.12, "elapsed_time": "2:58:53", "remaining_time": "4:16:09"} +{"current_steps": 4440, "total_steps": 10798, "loss": 1.9962, "reward": null, "learning_rate": 0.0006381231813951678, "epoch": 0.82, "percentage": 41.12, "elapsed_time": "2:58:49", "remaining_time": "4:16:04"} +{"current_steps": 4440, "total_steps": 10798, "loss": 1.9962, "reward": null, "learning_rate": 0.0006381231813951678, "epoch": 0.82, "percentage": 41.12, "elapsed_time": "3:04:54", "remaining_time": "4:24:47"} +{"current_steps": 4450, "total_steps": 10798, "loss": 1.9758, "reward": null, "learning_rate": 0.0006367244957010379, "epoch": 0.82, "percentage": 41.21, "elapsed_time": "3:05:18", "remaining_time": "4:24:20"} +{"current_steps": 4450, "total_steps": 10798, "loss": 1.9758, "reward": null, "learning_rate": 0.0006367244957010379, "epoch": 0.82, "percentage": 41.21, "elapsed_time": "2:59:16", "remaining_time": "4:15:44"} +{"current_steps": 4450, "total_steps": 10798, "loss": 1.9758, "reward": null, "learning_rate": 0.0006367244957010379, "epoch": 0.82, "percentage": 41.21, "elapsed_time": "2:59:14", "remaining_time": "4:15:42"} +{"current_steps": 4450, "total_steps": 10798, "loss": 1.9758, "reward": null, "learning_rate": 0.0006367244957010379, "epoch": 0.82, "percentage": 41.21, "elapsed_time": "2:59:13", "remaining_time": "4:15:39"} +{"current_steps": 4460, "total_steps": 10798, "loss": 1.9606, "reward": null, "learning_rate": 0.000635324652671813, "epoch": 0.83, "percentage": 41.3, "elapsed_time": "3:05:42", "remaining_time": "4:23:54"} +{"current_steps": 4460, "total_steps": 10798, "loss": 1.9606, "reward": null, "learning_rate": 0.000635324652671813, "epoch": 0.83, "percentage": 41.3, "elapsed_time": "2:59:40", "remaining_time": "4:15:20"} +{"current_steps": 4460, "total_steps": 10798, "loss": 1.9606, "reward": null, "learning_rate": 0.000635324652671813, "epoch": 0.83, "percentage": 41.3, "elapsed_time": "2:59:39", "remaining_time": "4:15:17"} +{"current_steps": 4460, "total_steps": 10798, "loss": 1.9606, "reward": null, "learning_rate": 0.000635324652671813, "epoch": 0.83, "percentage": 41.3, "elapsed_time": "2:59:37", "remaining_time": "4:15:15"} +{"current_steps": 4470, "total_steps": 10798, "loss": 1.9785, "reward": null, "learning_rate": 0.0006339236641567774, "epoch": 0.83, "percentage": 41.4, "elapsed_time": "3:00:01", "remaining_time": "4:14:50"} +{"current_steps": 4470, "total_steps": 10798, "loss": 1.9785, "reward": null, "learning_rate": 0.0006339236641567774, "epoch": 0.83, "percentage": 41.4, "elapsed_time": "3:06:05", "remaining_time": "4:23:27"} +{"current_steps": 4470, "total_steps": 10798, "loss": 1.9785, "reward": null, "learning_rate": 0.0006339236641567774, "epoch": 0.83, "percentage": 41.4, "elapsed_time": "3:00:04", "remaining_time": "4:14:55"} +{"current_steps": 4470, "total_steps": 10798, "loss": 1.9785, "reward": null, "learning_rate": 0.0006339236641567774, "epoch": 0.83, "percentage": 41.4, "elapsed_time": "3:00:02", "remaining_time": "4:14:52"} +{"current_steps": 4480, "total_steps": 10798, "loss": 1.9334, "reward": null, "learning_rate": 0.0006325215420149119, "epoch": 0.83, "percentage": 41.49, "elapsed_time": "3:00:24", "remaining_time": "4:14:26"} +{"current_steps": 4480, "total_steps": 10798, "loss": 1.9334, "reward": null, "learning_rate": 0.0006325215420149119, "epoch": 0.83, "percentage": 41.49, "elapsed_time": "3:00:26", "remaining_time": "4:14:28"} +{"current_steps": 4480, "total_steps": 10798, "loss": 1.9334, "reward": null, "learning_rate": 0.0006325215420149119, "epoch": 0.83, "percentage": 41.49, "elapsed_time": "3:06:29", "remaining_time": "4:23:00"} +{"current_steps": 4480, "total_steps": 10798, "loss": 1.9334, "reward": null, "learning_rate": 0.0006325215420149119, "epoch": 0.83, "percentage": 41.49, "elapsed_time": "3:00:28", "remaining_time": "4:14:30"} +{"current_steps": 4490, "total_steps": 10798, "loss": 1.9829, "reward": null, "learning_rate": 0.0006311182981147935, "epoch": 0.83, "percentage": 41.58, "elapsed_time": "3:06:53", "remaining_time": "4:22:33"} +{"current_steps": 4490, "total_steps": 10798, "loss": 1.9829, "reward": null, "learning_rate": 0.0006311182981147935, "epoch": 0.83, "percentage": 41.58, "elapsed_time": "3:00:52", "remaining_time": "4:14:06"} +{"current_steps": 4490, "total_steps": 10798, "loss": 1.9829, "reward": null, "learning_rate": 0.0006311182981147935, "epoch": 0.83, "percentage": 41.58, "elapsed_time": "3:00:48", "remaining_time": "4:14:01"} +{"current_steps": 4490, "total_steps": 10798, "loss": 1.9829, "reward": null, "learning_rate": 0.0006311182981147935, "epoch": 0.83, "percentage": 41.58, "elapsed_time": "3:00:50", "remaining_time": "4:14:03"} +{"current_steps": 4500, "total_steps": 10798, "loss": 1.9671, "reward": null, "learning_rate": 0.000629713944334494, "epoch": 0.83, "percentage": 41.67, "elapsed_time": "3:07:18", "remaining_time": "4:22:09"} +{"current_steps": 4500, "total_steps": 10798, "loss": 1.9671, "reward": null, "learning_rate": 0.000629713944334494, "epoch": 0.83, "percentage": 41.67, "elapsed_time": "3:01:15", "remaining_time": "4:13:41"} +{"current_steps": 4500, "total_steps": 10798, "loss": 1.9671, "reward": null, "learning_rate": 0.000629713944334494, "epoch": 0.83, "percentage": 41.67, "elapsed_time": "3:01:17", "remaining_time": "4:13:43"} +{"current_steps": 4500, "total_steps": 10798, "loss": 1.9671, "reward": null, "learning_rate": 0.000629713944334494, "epoch": 0.83, "percentage": 41.67, "elapsed_time": "3:01:14", "remaining_time": "4:13:38"} +{"current_steps": 4510, "total_steps": 10798, "loss": 2.0108, "reward": null, "learning_rate": 0.0006283084925614805, "epoch": 0.84, "percentage": 41.77, "elapsed_time": "3:01:37", "remaining_time": "4:13:13"} +{"current_steps": 4510, "total_steps": 10798, "loss": 2.0108, "reward": null, "learning_rate": 0.0006283084925614805, "epoch": 0.84, "percentage": 41.77, "elapsed_time": "3:07:42", "remaining_time": "4:21:42"} +{"current_steps": 4510, "total_steps": 10798, "loss": 2.0108, "reward": null, "learning_rate": 0.0006283084925614805, "epoch": 0.84, "percentage": 41.77, "elapsed_time": "3:01:40", "remaining_time": "4:13:18"} +{"current_steps": 4510, "total_steps": 10798, "loss": 2.0108, "reward": null, "learning_rate": 0.0006283084925614805, "epoch": 0.84, "percentage": 41.77, "elapsed_time": "3:01:39", "remaining_time": "4:13:16"} +{"current_steps": 4520, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 0.0006269019546925139, "epoch": 0.84, "percentage": 41.86, "elapsed_time": "3:08:05", "remaining_time": "4:21:15"} +{"current_steps": 4520, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 0.0006269019546925139, "epoch": 0.84, "percentage": 41.86, "elapsed_time": "3:02:00", "remaining_time": "4:12:48"} +{"current_steps": 4520, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 0.0006269019546925139, "epoch": 0.84, "percentage": 41.86, "elapsed_time": "3:02:02", "remaining_time": "4:12:50"} +{"current_steps": 4520, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 0.0006269019546925139, "epoch": 0.84, "percentage": 41.86, "elapsed_time": "3:02:04", "remaining_time": "4:12:53"} +{"current_steps": 4530, "total_steps": 10798, "loss": 1.9378, "reward": null, "learning_rate": 0.0006254943426335488, "epoch": 0.84, "percentage": 41.95, "elapsed_time": "3:08:30", "remaining_time": "4:20:50"} +{"current_steps": 4530, "total_steps": 10798, "loss": 1.9378, "reward": null, "learning_rate": 0.0006254943426335488, "epoch": 0.84, "percentage": 41.95, "elapsed_time": "3:02:26", "remaining_time": "4:12:25"} +{"current_steps": 4530, "total_steps": 10798, "loss": 1.9378, "reward": null, "learning_rate": 0.0006254943426335488, "epoch": 0.84, "percentage": 41.95, "elapsed_time": "3:02:27", "remaining_time": "4:12:27"} +{"current_steps": 4530, "total_steps": 10798, "loss": 1.9378, "reward": null, "learning_rate": 0.0006254943426335488, "epoch": 0.84, "percentage": 41.95, "elapsed_time": "3:02:29", "remaining_time": "4:12:30"} +{"current_steps": 4540, "total_steps": 10798, "loss": 1.9619, "reward": null, "learning_rate": 0.0006240856682996326, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "3:02:49", "remaining_time": "4:12:00"} +{"current_steps": 4540, "total_steps": 10798, "loss": 1.9619, "reward": null, "learning_rate": 0.0006240856682996326, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "3:02:51", "remaining_time": "4:12:02"} +{"current_steps": 4540, "total_steps": 10798, "loss": 1.9619, "reward": null, "learning_rate": 0.0006240856682996326, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "3:08:54", "remaining_time": "4:20:23"} +{"current_steps": 4540, "total_steps": 10798, "loss": 1.9619, "reward": null, "learning_rate": 0.0006240856682996326, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "3:02:52", "remaining_time": "4:12:05"} +{"current_steps": 4550, "total_steps": 10798, "loss": 1.9516, "reward": null, "learning_rate": 0.0006226759436148044, "epoch": 0.84, "percentage": 42.14, "elapsed_time": "3:03:15", "remaining_time": "4:11:39"} +{"current_steps": 4550, "total_steps": 10798, "loss": 1.9516, "reward": null, "learning_rate": 0.0006226759436148044, "epoch": 0.84, "percentage": 42.14, "elapsed_time": "3:03:14", "remaining_time": "4:11:36"} +{"current_steps": 4550, "total_steps": 10798, "loss": 1.9516, "reward": null, "learning_rate": 0.0006226759436148044, "epoch": 0.84, "percentage": 42.14, "elapsed_time": "3:03:17", "remaining_time": "4:11:41"} +{"current_steps": 4550, "total_steps": 10798, "loss": 1.9516, "reward": null, "learning_rate": 0.0006226759436148044, "epoch": 0.84, "percentage": 42.14, "elapsed_time": "3:09:18", "remaining_time": "4:19:57"} +{"current_steps": 4560, "total_steps": 10798, "loss": 1.9882, "reward": null, "learning_rate": 0.0006212651805119946, "epoch": 0.84, "percentage": 42.23, "elapsed_time": "3:09:44", "remaining_time": "4:19:33"} +{"current_steps": 4560, "total_steps": 10798, "loss": 1.9882, "reward": null, "learning_rate": 0.0006212651805119946, "epoch": 0.84, "percentage": 42.23, "elapsed_time": "3:03:43", "remaining_time": "4:11:19"} +{"current_steps": 4560, "total_steps": 10798, "loss": 1.9882, "reward": null, "learning_rate": 0.0006212651805119946, "epoch": 0.84, "percentage": 42.23, "elapsed_time": "3:03:39", "remaining_time": "4:11:14"} +{"current_steps": 4560, "total_steps": 10798, "loss": 1.9882, "reward": null, "learning_rate": 0.0006212651805119946, "epoch": 0.84, "percentage": 42.23, "elapsed_time": "3:03:41", "remaining_time": "4:11:16"} +{"current_steps": 4570, "total_steps": 10798, "loss": 1.9636, "reward": null, "learning_rate": 0.000619853390932923, "epoch": 0.85, "percentage": 42.32, "elapsed_time": "3:04:04", "remaining_time": "4:10:52"} +{"current_steps": 4570, "total_steps": 10798, "loss": 1.9636, "reward": null, "learning_rate": 0.000619853390932923, "epoch": 0.85, "percentage": 42.32, "elapsed_time": "3:04:03", "remaining_time": "4:10:49"} +{"current_steps": 4570, "total_steps": 10798, "loss": 1.9636, "reward": null, "learning_rate": 0.000619853390932923, "epoch": 0.85, "percentage": 42.32, "elapsed_time": "3:10:08", "remaining_time": "4:19:07"} +{"current_steps": 4570, "total_steps": 10798, "loss": 1.9636, "reward": null, "learning_rate": 0.000619853390932923, "epoch": 0.85, "percentage": 42.32, "elapsed_time": "3:04:06", "remaining_time": "4:10:54"} +{"current_steps": 4580, "total_steps": 10798, "loss": 1.9894, "reward": null, "learning_rate": 0.0006184405868279985, "epoch": 0.85, "percentage": 42.42, "elapsed_time": "3:10:31", "remaining_time": "4:18:39"} +{"current_steps": 4580, "total_steps": 10798, "loss": 1.9894, "reward": null, "learning_rate": 0.0006184405868279985, "epoch": 0.85, "percentage": 42.42, "elapsed_time": "3:04:29", "remaining_time": "4:10:28"} +{"current_steps": 4580, "total_steps": 10798, "loss": 1.9894, "reward": null, "learning_rate": 0.0006184405868279985, "epoch": 0.85, "percentage": 42.42, "elapsed_time": "3:04:26", "remaining_time": "4:10:24"} +{"current_steps": 4580, "total_steps": 10798, "loss": 1.9894, "reward": null, "learning_rate": 0.0006184405868279985, "epoch": 0.85, "percentage": 42.42, "elapsed_time": "3:04:27", "remaining_time": "4:10:26"} +{"current_steps": 4590, "total_steps": 10798, "loss": 1.9365, "reward": null, "learning_rate": 0.0006170267801562176, "epoch": 0.85, "percentage": 42.51, "elapsed_time": "3:10:55", "remaining_time": "4:18:13"} +{"current_steps": 4590, "total_steps": 10798, "loss": 1.9365, "reward": null, "learning_rate": 0.0006170267801562176, "epoch": 0.85, "percentage": 42.51, "elapsed_time": "3:04:53", "remaining_time": "4:10:04"} +{"current_steps": 4590, "total_steps": 10798, "loss": 1.9365, "reward": null, "learning_rate": 0.0006170267801562176, "epoch": 0.85, "percentage": 42.51, "elapsed_time": "3:04:51", "remaining_time": "4:10:01"} +{"current_steps": 4590, "total_steps": 10798, "loss": 1.9365, "reward": null, "learning_rate": 0.0006170267801562176, "epoch": 0.85, "percentage": 42.51, "elapsed_time": "3:04:50", "remaining_time": "4:09:59"} +{"current_steps": 4600, "total_steps": 10798, "loss": 2.0264, "reward": null, "learning_rate": 0.0006156119828850633, "epoch": 0.85, "percentage": 42.6, "elapsed_time": "3:05:17", "remaining_time": "4:09:40"} +{"current_steps": 4600, "total_steps": 10798, "loss": 2.0264, "reward": null, "learning_rate": 0.0006156119828850633, "epoch": 0.85, "percentage": 42.6, "elapsed_time": "3:05:14", "remaining_time": "4:09:35"} +{"current_steps": 4600, "total_steps": 10798, "loss": 2.0264, "reward": null, "learning_rate": 0.0006156119828850633, "epoch": 0.85, "percentage": 42.6, "elapsed_time": "3:11:19", "remaining_time": "4:17:47"} +{"current_steps": 4600, "total_steps": 10798, "loss": 2.0264, "reward": null, "learning_rate": 0.0006156119828850633, "epoch": 0.85, "percentage": 42.6, "elapsed_time": "3:05:16", "remaining_time": "4:09:37"} +{"current_steps": 4610, "total_steps": 10798, "loss": 1.9659, "reward": null, "learning_rate": 0.0006141962069904041, "epoch": 0.85, "percentage": 42.69, "elapsed_time": "3:11:43", "remaining_time": "4:17:21"} +{"current_steps": 4610, "total_steps": 10798, "loss": 1.9659, "reward": null, "learning_rate": 0.0006141962069904041, "epoch": 0.85, "percentage": 42.69, "elapsed_time": "3:05:42", "remaining_time": "4:09:16"} +{"current_steps": 4610, "total_steps": 10798, "loss": 1.9659, "reward": null, "learning_rate": 0.0006141962069904041, "epoch": 0.85, "percentage": 42.69, "elapsed_time": "3:05:40", "remaining_time": "4:09:14"} +{"current_steps": 4610, "total_steps": 10798, "loss": 1.9659, "reward": null, "learning_rate": 0.0006141962069904041, "epoch": 0.85, "percentage": 42.69, "elapsed_time": "3:05:39", "remaining_time": "4:09:11"} +{"current_steps": 4620, "total_steps": 10798, "loss": 1.9368, "reward": null, "learning_rate": 0.0006127794644563915, "epoch": 0.86, "percentage": 42.79, "elapsed_time": "3:06:01", "remaining_time": "4:08:45"} +{"current_steps": 4620, "total_steps": 10798, "loss": 1.9368, "reward": null, "learning_rate": 0.0006127794644563915, "epoch": 0.86, "percentage": 42.79, "elapsed_time": "3:06:04", "remaining_time": "4:08:50"} +{"current_steps": 4620, "total_steps": 10798, "loss": 1.9368, "reward": null, "learning_rate": 0.0006127794644563915, "epoch": 0.86, "percentage": 42.79, "elapsed_time": "3:12:06", "remaining_time": "4:16:53"} +{"current_steps": 4620, "total_steps": 10798, "loss": 1.9368, "reward": null, "learning_rate": 0.0006127794644563915, "epoch": 0.86, "percentage": 42.79, "elapsed_time": "3:06:03", "remaining_time": "4:08:47"} +{"current_steps": 4630, "total_steps": 10798, "loss": 1.959, "reward": null, "learning_rate": 0.0006113617672753598, "epoch": 0.86, "percentage": 42.88, "elapsed_time": "3:06:27", "remaining_time": "4:08:24"} +{"current_steps": 4630, "total_steps": 10798, "loss": 1.959, "reward": null, "learning_rate": 0.0006113617672753598, "epoch": 0.86, "percentage": 42.88, "elapsed_time": "3:06:26", "remaining_time": "4:08:22"} +{"current_steps": 4630, "total_steps": 10798, "loss": 1.959, "reward": null, "learning_rate": 0.0006113617672753598, "epoch": 0.86, "percentage": 42.88, "elapsed_time": "3:12:31", "remaining_time": "4:16:28"} +{"current_steps": 4630, "total_steps": 10798, "loss": 1.959, "reward": null, "learning_rate": 0.0006113617672753598, "epoch": 0.86, "percentage": 42.88, "elapsed_time": "3:06:29", "remaining_time": "4:08:26"} +{"current_steps": 4640, "total_steps": 10798, "loss": 1.9832, "reward": null, "learning_rate": 0.0006099431274477245, "epoch": 0.86, "percentage": 42.97, "elapsed_time": "3:06:52", "remaining_time": "4:08:01"} +{"current_steps": 4640, "total_steps": 10798, "loss": 1.9832, "reward": null, "learning_rate": 0.0006099431274477245, "epoch": 0.86, "percentage": 42.97, "elapsed_time": "3:12:54", "remaining_time": "4:16:00"} +{"current_steps": 4640, "total_steps": 10798, "loss": 1.9832, "reward": null, "learning_rate": 0.0006099431274477245, "epoch": 0.86, "percentage": 42.97, "elapsed_time": "3:06:51", "remaining_time": "4:07:58"} +{"current_steps": 4640, "total_steps": 10798, "loss": 1.9832, "reward": null, "learning_rate": 0.0006099431274477245, "epoch": 0.86, "percentage": 42.97, "elapsed_time": "3:06:49", "remaining_time": "4:07:56"} +{"current_steps": 4650, "total_steps": 10798, "loss": 1.9572, "reward": null, "learning_rate": 0.0006085235569818795, "epoch": 0.86, "percentage": 43.06, "elapsed_time": "3:07:12", "remaining_time": "4:07:31"} +{"current_steps": 4650, "total_steps": 10798, "loss": 1.9572, "reward": null, "learning_rate": 0.0006085235569818795, "epoch": 0.86, "percentage": 43.06, "elapsed_time": "3:07:15", "remaining_time": "4:07:35"} +{"current_steps": 4650, "total_steps": 10798, "loss": 1.9572, "reward": null, "learning_rate": 0.0006085235569818795, "epoch": 0.86, "percentage": 43.06, "elapsed_time": "3:07:14", "remaining_time": "4:07:33"} +{"current_steps": 4650, "total_steps": 10798, "loss": 1.9572, "reward": null, "learning_rate": 0.0006085235569818795, "epoch": 0.86, "percentage": 43.06, "elapsed_time": "3:13:17", "remaining_time": "4:15:33"} +{"current_steps": 4660, "total_steps": 10798, "loss": 1.99, "reward": null, "learning_rate": 0.0006071030678940969, "epoch": 0.86, "percentage": 43.16, "elapsed_time": "3:07:37", "remaining_time": "4:07:07"} +{"current_steps": 4660, "total_steps": 10798, "loss": 1.99, "reward": null, "learning_rate": 0.0006071030678940969, "epoch": 0.86, "percentage": 43.16, "elapsed_time": "3:07:40", "remaining_time": "4:07:12"} +{"current_steps": 4660, "total_steps": 10798, "loss": 1.99, "reward": null, "learning_rate": 0.0006071030678940969, "epoch": 0.86, "percentage": 43.16, "elapsed_time": "3:07:38", "remaining_time": "4:07:09"} +{"current_steps": 4660, "total_steps": 10798, "loss": 1.99, "reward": null, "learning_rate": 0.0006071030678940969, "epoch": 0.86, "percentage": 43.16, "elapsed_time": "3:13:42", "remaining_time": "4:15:08"} +{"current_steps": 4670, "total_steps": 10798, "loss": 1.9963, "reward": null, "learning_rate": 0.0006056816722084248, "epoch": 0.86, "percentage": 43.25, "elapsed_time": "3:14:05", "remaining_time": "4:14:40"} +{"current_steps": 4670, "total_steps": 10798, "loss": 1.9963, "reward": null, "learning_rate": 0.0006056816722084248, "epoch": 0.86, "percentage": 43.25, "elapsed_time": "3:08:01", "remaining_time": "4:06:44"} +{"current_steps": 4670, "total_steps": 10798, "loss": 1.9963, "reward": null, "learning_rate": 0.0006056816722084248, "epoch": 0.86, "percentage": 43.25, "elapsed_time": "3:08:00", "remaining_time": "4:06:42"} +{"current_steps": 4670, "total_steps": 10798, "loss": 1.9963, "reward": null, "learning_rate": 0.0006056816722084248, "epoch": 0.86, "percentage": 43.25, "elapsed_time": "3:08:03", "remaining_time": "4:06:46"} +{"current_steps": 4680, "total_steps": 10798, "loss": 1.9997, "reward": null, "learning_rate": 0.0006042593819565846, "epoch": 0.87, "percentage": 43.34, "elapsed_time": "3:08:24", "remaining_time": "4:06:18"} +{"current_steps": 4680, "total_steps": 10798, "loss": 1.9997, "reward": null, "learning_rate": 0.0006042593819565846, "epoch": 0.87, "percentage": 43.34, "elapsed_time": "3:14:29", "remaining_time": "4:14:15"} +{"current_steps": 4680, "total_steps": 10798, "loss": 1.9997, "reward": null, "learning_rate": 0.0006042593819565846, "epoch": 0.87, "percentage": 43.34, "elapsed_time": "3:08:28", "remaining_time": "4:06:22"} +{"current_steps": 4680, "total_steps": 10798, "loss": 1.9997, "reward": null, "learning_rate": 0.0006042593819565846, "epoch": 0.87, "percentage": 43.34, "elapsed_time": "3:08:26", "remaining_time": "4:06:20"} +{"current_steps": 4690, "total_steps": 10798, "loss": 1.9221, "reward": null, "learning_rate": 0.0006028362091778706, "epoch": 0.87, "percentage": 43.43, "elapsed_time": "3:08:50", "remaining_time": "4:05:55"} +{"current_steps": 4690, "total_steps": 10798, "loss": 1.9221, "reward": null, "learning_rate": 0.0006028362091778706, "epoch": 0.87, "percentage": 43.43, "elapsed_time": "3:08:48", "remaining_time": "4:05:53"} +{"current_steps": 4690, "total_steps": 10798, "loss": 1.9221, "reward": null, "learning_rate": 0.0006028362091778706, "epoch": 0.87, "percentage": 43.43, "elapsed_time": "3:14:53", "remaining_time": "4:13:48"} +{"current_steps": 4690, "total_steps": 10798, "loss": 1.9221, "reward": null, "learning_rate": 0.0006028362091778706, "epoch": 0.87, "percentage": 43.43, "elapsed_time": "3:08:51", "remaining_time": "4:05:58"} +{"current_steps": 4700, "total_steps": 10798, "loss": 1.9623, "reward": null, "learning_rate": 0.0006014121659190476, "epoch": 0.87, "percentage": 43.53, "elapsed_time": "3:15:17", "remaining_time": "4:13:22"} +{"current_steps": 4700, "total_steps": 10798, "loss": 1.9623, "reward": null, "learning_rate": 0.0006014121659190476, "epoch": 0.87, "percentage": 43.53, "elapsed_time": "3:09:16", "remaining_time": "4:05:33"} +{"current_steps": 4700, "total_steps": 10798, "loss": 1.9623, "reward": null, "learning_rate": 0.0006014121659190476, "epoch": 0.87, "percentage": 43.53, "elapsed_time": "3:09:12", "remaining_time": "4:05:29"} +{"current_steps": 4700, "total_steps": 10798, "loss": 1.9623, "reward": null, "learning_rate": 0.0006014121659190476, "epoch": 0.87, "percentage": 43.53, "elapsed_time": "3:09:14", "remaining_time": "4:05:31"} +{"current_steps": 4710, "total_steps": 10798, "loss": 1.9949, "reward": null, "learning_rate": 0.0005999872642342484, "epoch": 0.87, "percentage": 43.62, "elapsed_time": "3:15:41", "remaining_time": "4:12:56"} +{"current_steps": 4710, "total_steps": 10798, "loss": 1.9949, "reward": null, "learning_rate": 0.0005999872642342484, "epoch": 0.87, "percentage": 43.62, "elapsed_time": "3:09:40", "remaining_time": "4:05:09"} +{"current_steps": 4710, "total_steps": 10798, "loss": 1.9949, "reward": null, "learning_rate": 0.0005999872642342484, "epoch": 0.87, "percentage": 43.62, "elapsed_time": "3:09:38", "remaining_time": "4:05:07"} +{"current_steps": 4710, "total_steps": 10798, "loss": 1.9949, "reward": null, "learning_rate": 0.0005999872642342484, "epoch": 0.87, "percentage": 43.62, "elapsed_time": "3:09:36", "remaining_time": "4:05:05"} +{"current_steps": 4720, "total_steps": 10798, "loss": 1.9688, "reward": null, "learning_rate": 0.0005985615161848721, "epoch": 0.87, "percentage": 43.71, "elapsed_time": "3:16:05", "remaining_time": "4:12:29"} +{"current_steps": 4720, "total_steps": 10798, "loss": 1.9688, "reward": null, "learning_rate": 0.0005985615161848721, "epoch": 0.87, "percentage": 43.71, "elapsed_time": "3:10:00", "remaining_time": "4:04:40"} +{"current_steps": 4720, "total_steps": 10798, "loss": 1.9688, "reward": null, "learning_rate": 0.0005985615161848721, "epoch": 0.87, "percentage": 43.71, "elapsed_time": "3:10:01", "remaining_time": "4:04:42"} +{"current_steps": 4720, "total_steps": 10798, "loss": 1.9688, "reward": null, "learning_rate": 0.0005985615161848721, "epoch": 0.87, "percentage": 43.71, "elapsed_time": "3:10:03", "remaining_time": "4:04:44"} +{"current_steps": 4730, "total_steps": 10798, "loss": 1.975, "reward": null, "learning_rate": 0.000597134933839482, "epoch": 0.88, "percentage": 43.8, "elapsed_time": "3:16:29", "remaining_time": "4:12:04"} +{"current_steps": 4730, "total_steps": 10798, "loss": 1.975, "reward": null, "learning_rate": 0.000597134933839482, "epoch": 0.88, "percentage": 43.8, "elapsed_time": "3:10:26", "remaining_time": "4:04:18"} +{"current_steps": 4730, "total_steps": 10798, "loss": 1.975, "reward": null, "learning_rate": 0.000597134933839482, "epoch": 0.88, "percentage": 43.8, "elapsed_time": "3:10:28", "remaining_time": "4:04:21"} +{"current_steps": 4730, "total_steps": 10798, "loss": 1.975, "reward": null, "learning_rate": 0.000597134933839482, "epoch": 0.88, "percentage": 43.8, "elapsed_time": "3:10:24", "remaining_time": "4:04:16"} +{"current_steps": 4740, "total_steps": 10798, "loss": 2.0048, "reward": null, "learning_rate": 0.0005957075292737042, "epoch": 0.88, "percentage": 43.9, "elapsed_time": "3:16:54", "remaining_time": "4:11:39"} +{"current_steps": 4740, "total_steps": 10798, "loss": 2.0048, "reward": null, "learning_rate": 0.0005957075292737042, "epoch": 0.88, "percentage": 43.9, "elapsed_time": "3:10:51", "remaining_time": "4:03:55"} +{"current_steps": 4740, "total_steps": 10798, "loss": 2.0048, "reward": null, "learning_rate": 0.0005957075292737042, "epoch": 0.88, "percentage": 43.9, "elapsed_time": "3:10:52", "remaining_time": "4:03:57"} +{"current_steps": 4740, "total_steps": 10798, "loss": 2.0048, "reward": null, "learning_rate": 0.0005957075292737042, "epoch": 0.88, "percentage": 43.9, "elapsed_time": "3:10:49", "remaining_time": "4:03:53"} +{"current_steps": 4750, "total_steps": 10798, "loss": 1.9591, "reward": null, "learning_rate": 0.0005942793145701235, "epoch": 0.88, "percentage": 43.99, "elapsed_time": "3:11:14", "remaining_time": "4:03:30"} +{"current_steps": 4750, "total_steps": 10798, "loss": 1.9591, "reward": null, "learning_rate": 0.0005942793145701235, "epoch": 0.88, "percentage": 43.99, "elapsed_time": "3:11:16", "remaining_time": "4:03:32"} +{"current_steps": 4750, "total_steps": 10798, "loss": 1.9591, "reward": null, "learning_rate": 0.0005942793145701235, "epoch": 0.88, "percentage": 43.99, "elapsed_time": "3:17:17", "remaining_time": "4:11:12"} +{"current_steps": 4750, "total_steps": 10798, "loss": 1.9591, "reward": null, "learning_rate": 0.0005942793145701235, "epoch": 0.88, "percentage": 43.99, "elapsed_time": "3:11:12", "remaining_time": "4:03:27"} +{"current_steps": 4760, "total_steps": 10798, "loss": 1.9957, "reward": null, "learning_rate": 0.0005928503018181833, "epoch": 0.88, "percentage": 44.08, "elapsed_time": "3:11:37", "remaining_time": "4:03:04"} +{"current_steps": 4760, "total_steps": 10798, "loss": 1.9957, "reward": null, "learning_rate": 0.0005928503018181833, "epoch": 0.88, "percentage": 44.08, "elapsed_time": "3:11:38", "remaining_time": "4:03:06"} +{"current_steps": 4760, "total_steps": 10798, "loss": 1.9957, "reward": null, "learning_rate": 0.0005928503018181833, "epoch": 0.88, "percentage": 44.08, "elapsed_time": "3:17:42", "remaining_time": "4:10:46"} +{"current_steps": 4760, "total_steps": 10798, "loss": 1.9957, "reward": null, "learning_rate": 0.0005928503018181833, "epoch": 0.88, "percentage": 44.08, "elapsed_time": "3:11:40", "remaining_time": "4:03:08"} +{"current_steps": 4770, "total_steps": 10798, "loss": 1.9823, "reward": null, "learning_rate": 0.0005914205031140819, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "3:12:04", "remaining_time": "4:02:44"} +{"current_steps": 4770, "total_steps": 10798, "loss": 1.9823, "reward": null, "learning_rate": 0.0005914205031140819, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "3:12:01", "remaining_time": "4:02:39"} +{"current_steps": 4770, "total_steps": 10798, "loss": 1.9823, "reward": null, "learning_rate": 0.0005914205031140819, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "3:12:02", "remaining_time": "4:02:41"} +{"current_steps": 4770, "total_steps": 10798, "loss": 1.9823, "reward": null, "learning_rate": 0.0005914205031140819, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "3:18:06", "remaining_time": "4:10:20"} +{"current_steps": 4780, "total_steps": 10798, "loss": 2.0032, "reward": null, "learning_rate": 0.0005899899305606703, "epoch": 0.89, "percentage": 44.27, "elapsed_time": "3:12:26", "remaining_time": "4:02:16"} +{"current_steps": 4780, "total_steps": 10798, "loss": 2.0032, "reward": null, "learning_rate": 0.0005899899305606703, "epoch": 0.89, "percentage": 44.27, "elapsed_time": "3:12:27", "remaining_time": "4:02:18"} +{"current_steps": 4780, "total_steps": 10798, "loss": 2.0032, "reward": null, "learning_rate": 0.0005899899305606703, "epoch": 0.89, "percentage": 44.27, "elapsed_time": "3:12:29", "remaining_time": "4:02:21"} +{"current_steps": 4780, "total_steps": 10798, "loss": 2.0032, "reward": null, "learning_rate": 0.0005899899305606703, "epoch": 0.89, "percentage": 44.27, "elapsed_time": "3:18:31", "remaining_time": "4:09:56"} +{"current_steps": 4790, "total_steps": 10798, "loss": 1.9722, "reward": null, "learning_rate": 0.0005885585962673501, "epoch": 0.89, "percentage": 44.36, "elapsed_time": "3:12:50", "remaining_time": "4:01:52"} +{"current_steps": 4790, "total_steps": 10798, "loss": 1.9722, "reward": null, "learning_rate": 0.0005885585962673501, "epoch": 0.89, "percentage": 44.36, "elapsed_time": "3:18:54", "remaining_time": "4:09:29"} +{"current_steps": 4790, "total_steps": 10798, "loss": 1.9722, "reward": null, "learning_rate": 0.0005885585962673501, "epoch": 0.89, "percentage": 44.36, "elapsed_time": "3:12:53", "remaining_time": "4:01:56"} +{"current_steps": 4790, "total_steps": 10798, "loss": 1.9722, "reward": null, "learning_rate": 0.0005885585962673501, "epoch": 0.89, "percentage": 44.36, "elapsed_time": "3:12:51", "remaining_time": "4:01:54"} +{"current_steps": 4800, "total_steps": 10798, "loss": 1.9903, "reward": null, "learning_rate": 0.0005871265123499708, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "3:19:20", "remaining_time": "4:09:05"} +{"current_steps": 4800, "total_steps": 10798, "loss": 1.9903, "reward": null, "learning_rate": 0.0005871265123499708, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "3:13:15", "remaining_time": "4:01:29"} +{"current_steps": 4800, "total_steps": 10798, "loss": 1.9903, "reward": null, "learning_rate": 0.0005871265123499708, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "3:13:16", "remaining_time": "4:01:31"} +{"current_steps": 4800, "total_steps": 10798, "loss": 1.9903, "reward": null, "learning_rate": 0.0005871265123499708, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "3:13:18", "remaining_time": "4:01:33"} +{"current_steps": 4810, "total_steps": 10798, "loss": 2.0258, "reward": null, "learning_rate": 0.0005856936909307273, "epoch": 0.89, "percentage": 44.55, "elapsed_time": "3:13:42", "remaining_time": "4:01:08"} +{"current_steps": 4810, "total_steps": 10798, "loss": 2.0258, "reward": null, "learning_rate": 0.0005856936909307273, "epoch": 0.89, "percentage": 44.55, "elapsed_time": "3:19:43", "remaining_time": "4:08:38"} +{"current_steps": 4810, "total_steps": 10798, "loss": 2.0258, "reward": null, "learning_rate": 0.0005856936909307273, "epoch": 0.89, "percentage": 44.55, "elapsed_time": "3:13:40", "remaining_time": "4:01:06"} +{"current_steps": 4810, "total_steps": 10798, "loss": 2.0258, "reward": null, "learning_rate": 0.0005856936909307273, "epoch": 0.89, "percentage": 44.55, "elapsed_time": "3:13:38", "remaining_time": "4:01:04"} +{"current_steps": 4820, "total_steps": 10798, "loss": 2.0444, "reward": null, "learning_rate": 0.000584260144138057, "epoch": 0.89, "percentage": 44.64, "elapsed_time": "3:14:04", "remaining_time": "4:00:41"} +{"current_steps": 4820, "total_steps": 10798, "loss": 2.0444, "reward": null, "learning_rate": 0.000584260144138057, "epoch": 0.89, "percentage": 44.64, "elapsed_time": "3:20:07", "remaining_time": "4:08:12"} +{"current_steps": 4820, "total_steps": 10798, "loss": 2.0444, "reward": null, "learning_rate": 0.000584260144138057, "epoch": 0.89, "percentage": 44.64, "elapsed_time": "3:14:02", "remaining_time": "4:00:39"} +{"current_steps": 4820, "total_steps": 10798, "loss": 2.0444, "reward": null, "learning_rate": 0.000584260144138057, "epoch": 0.89, "percentage": 44.64, "elapsed_time": "3:14:06", "remaining_time": "4:00:44"} +{"current_steps": 4830, "total_steps": 10798, "loss": 1.968, "reward": null, "learning_rate": 0.0005828258841065377, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "3:20:30", "remaining_time": "4:07:45"} +{"current_steps": 4830, "total_steps": 10798, "loss": 1.968, "reward": null, "learning_rate": 0.0005828258841065377, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "3:14:26", "remaining_time": "4:00:14"} +{"current_steps": 4830, "total_steps": 10798, "loss": 1.968, "reward": null, "learning_rate": 0.0005828258841065377, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "3:14:27", "remaining_time": "4:00:16"} +{"current_steps": 4830, "total_steps": 10798, "loss": 1.968, "reward": null, "learning_rate": 0.0005828258841065377, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "3:14:29", "remaining_time": "4:00:18"} +{"current_steps": 4840, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 0.0005813909229767846, "epoch": 0.9, "percentage": 44.82, "elapsed_time": "3:20:55", "remaining_time": "4:07:20"} +{"current_steps": 4840, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 0.0005813909229767846, "epoch": 0.9, "percentage": 44.82, "elapsed_time": "3:14:54", "remaining_time": "3:59:55"} +{"current_steps": 4840, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 0.0005813909229767846, "epoch": 0.9, "percentage": 44.82, "elapsed_time": "3:14:50", "remaining_time": "3:59:51"} +{"current_steps": 4840, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 0.0005813909229767846, "epoch": 0.9, "percentage": 44.82, "elapsed_time": "3:14:52", "remaining_time": "3:59:53"} +{"current_steps": 4850, "total_steps": 10798, "loss": 2.0047, "reward": null, "learning_rate": 0.0005799552728953472, "epoch": 0.9, "percentage": 44.92, "elapsed_time": "3:15:15", "remaining_time": "3:59:27"} +{"current_steps": 4850, "total_steps": 10798, "loss": 2.0047, "reward": null, "learning_rate": 0.0005799552728953472, "epoch": 0.9, "percentage": 44.92, "elapsed_time": "3:15:16", "remaining_time": "3:59:29"} +{"current_steps": 4850, "total_steps": 10798, "loss": 2.0047, "reward": null, "learning_rate": 0.0005799552728953472, "epoch": 0.9, "percentage": 44.92, "elapsed_time": "3:21:19", "remaining_time": "4:06:54"} +{"current_steps": 4850, "total_steps": 10798, "loss": 2.0047, "reward": null, "learning_rate": 0.0005799552728953472, "epoch": 0.9, "percentage": 44.92, "elapsed_time": "3:15:18", "remaining_time": "3:59:31"} +{"current_steps": 4860, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.000578518946014607, "epoch": 0.9, "percentage": 45.01, "elapsed_time": "3:21:44", "remaining_time": "4:06:29"} +{"current_steps": 4860, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.000578518946014607, "epoch": 0.9, "percentage": 45.01, "elapsed_time": "3:15:40", "remaining_time": "3:59:04"} +{"current_steps": 4860, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.000578518946014607, "epoch": 0.9, "percentage": 45.01, "elapsed_time": "3:15:43", "remaining_time": "3:59:08"} +{"current_steps": 4860, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.000578518946014607, "epoch": 0.9, "percentage": 45.01, "elapsed_time": "3:15:41", "remaining_time": "3:59:06"} +{"current_steps": 4870, "total_steps": 10798, "loss": 1.9835, "reward": null, "learning_rate": 0.0005770819544926741, "epoch": 0.9, "percentage": 45.1, "elapsed_time": "3:22:08", "remaining_time": "4:06:03"} +{"current_steps": 4870, "total_steps": 10798, "loss": 1.9835, "reward": null, "learning_rate": 0.0005770819544926741, "epoch": 0.9, "percentage": 45.1, "elapsed_time": "3:16:07", "remaining_time": "3:58:43"} +{"current_steps": 4870, "total_steps": 10798, "loss": 1.9835, "reward": null, "learning_rate": 0.0005770819544926741, "epoch": 0.9, "percentage": 45.1, "elapsed_time": "3:16:05", "remaining_time": "3:58:41"} +{"current_steps": 4870, "total_steps": 10798, "loss": 1.9835, "reward": null, "learning_rate": 0.0005770819544926741, "epoch": 0.9, "percentage": 45.1, "elapsed_time": "3:16:03", "remaining_time": "3:58:39"} +{"current_steps": 4880, "total_steps": 10798, "loss": 2.028, "reward": null, "learning_rate": 0.0005756443104932852, "epoch": 0.9, "percentage": 45.19, "elapsed_time": "3:22:33", "remaining_time": "4:05:38"} +{"current_steps": 4880, "total_steps": 10798, "loss": 2.028, "reward": null, "learning_rate": 0.0005756443104932852, "epoch": 0.9, "percentage": 45.19, "elapsed_time": "3:16:28", "remaining_time": "3:58:16"} +{"current_steps": 4880, "total_steps": 10798, "loss": 2.028, "reward": null, "learning_rate": 0.0005756443104932852, "epoch": 0.9, "percentage": 45.19, "elapsed_time": "3:16:32", "remaining_time": "3:58:20"} +{"current_steps": 4880, "total_steps": 10798, "loss": 2.028, "reward": null, "learning_rate": 0.0005756443104932852, "epoch": 0.9, "percentage": 45.19, "elapsed_time": "3:16:30", "remaining_time": "3:58:18"} +{"current_steps": 4890, "total_steps": 10798, "loss": 1.973, "reward": null, "learning_rate": 0.0005742060261856996, "epoch": 0.91, "percentage": 45.29, "elapsed_time": "3:16:57", "remaining_time": "3:57:57"} +{"current_steps": 4890, "total_steps": 10798, "loss": 1.973, "reward": null, "learning_rate": 0.0005742060261856996, "epoch": 0.91, "percentage": 45.29, "elapsed_time": "3:16:55", "remaining_time": "3:57:55"} +{"current_steps": 4890, "total_steps": 10798, "loss": 1.973, "reward": null, "learning_rate": 0.0005742060261856996, "epoch": 0.91, "percentage": 45.29, "elapsed_time": "3:22:58", "remaining_time": "4:05:14"} +{"current_steps": 4890, "total_steps": 10798, "loss": 1.973, "reward": null, "learning_rate": 0.0005742060261856996, "epoch": 0.91, "percentage": 45.29, "elapsed_time": "3:16:53", "remaining_time": "3:57:53"} +{"current_steps": 4900, "total_steps": 10798, "loss": 1.9734, "reward": null, "learning_rate": 0.0005727671137445967, "epoch": 0.91, "percentage": 45.38, "elapsed_time": "3:23:23", "remaining_time": "4:04:48"} +{"current_steps": 4900, "total_steps": 10798, "loss": 1.9734, "reward": null, "learning_rate": 0.0005727671137445967, "epoch": 0.91, "percentage": 45.38, "elapsed_time": "3:17:20", "remaining_time": "3:57:31"} +{"current_steps": 4900, "total_steps": 10798, "loss": 1.9734, "reward": null, "learning_rate": 0.0005727671137445967, "epoch": 0.91, "percentage": 45.38, "elapsed_time": "3:17:18", "remaining_time": "3:57:29"} +{"current_steps": 4900, "total_steps": 10798, "loss": 1.9734, "reward": null, "learning_rate": 0.0005727671137445967, "epoch": 0.91, "percentage": 45.38, "elapsed_time": "3:17:21", "remaining_time": "3:57:33"} +{"current_steps": 4910, "total_steps": 10798, "loss": 1.9921, "reward": null, "learning_rate": 0.0005713275853499729, "epoch": 0.91, "percentage": 45.47, "elapsed_time": "3:17:44", "remaining_time": "3:57:08"} +{"current_steps": 4910, "total_steps": 10798, "loss": 1.9921, "reward": null, "learning_rate": 0.0005713275853499729, "epoch": 0.91, "percentage": 45.47, "elapsed_time": "3:17:43", "remaining_time": "3:57:06"} +{"current_steps": 4910, "total_steps": 10798, "loss": 1.9921, "reward": null, "learning_rate": 0.0005713275853499729, "epoch": 0.91, "percentage": 45.47, "elapsed_time": "3:17:46", "remaining_time": "3:57:10"} +{"current_steps": 4910, "total_steps": 10798, "loss": 1.9921, "reward": null, "learning_rate": 0.0005713275853499729, "epoch": 0.91, "percentage": 45.47, "elapsed_time": "3:23:48", "remaining_time": "4:04:23"} +{"current_steps": 4920, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.0005698874531870386, "epoch": 0.91, "percentage": 45.56, "elapsed_time": "3:24:12", "remaining_time": "4:03:57"} +{"current_steps": 4920, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.0005698874531870386, "epoch": 0.91, "percentage": 45.56, "elapsed_time": "3:18:10", "remaining_time": "3:56:45"} +{"current_steps": 4920, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.0005698874531870386, "epoch": 0.91, "percentage": 45.56, "elapsed_time": "3:18:07", "remaining_time": "3:56:41"} +{"current_steps": 4920, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.0005698874531870386, "epoch": 0.91, "percentage": 45.56, "elapsed_time": "3:18:08", "remaining_time": "3:56:43"} +{"current_steps": 4930, "total_steps": 10798, "loss": 1.9468, "reward": null, "learning_rate": 0.0005684467294461146, "epoch": 0.91, "percentage": 45.66, "elapsed_time": "3:18:34", "remaining_time": "3:56:21"} +{"current_steps": 4930, "total_steps": 10798, "loss": 1.9468, "reward": null, "learning_rate": 0.0005684467294461146, "epoch": 0.91, "percentage": 45.66, "elapsed_time": "3:24:36", "remaining_time": "4:03:32"} +{"current_steps": 4930, "total_steps": 10798, "loss": 1.9468, "reward": null, "learning_rate": 0.0005684467294461146, "epoch": 0.91, "percentage": 45.66, "elapsed_time": "3:18:33", "remaining_time": "3:56:19"} +{"current_steps": 4930, "total_steps": 10798, "loss": 1.9468, "reward": null, "learning_rate": 0.0005684467294461146, "epoch": 0.91, "percentage": 45.66, "elapsed_time": "3:18:31", "remaining_time": "3:56:17"} +{"current_steps": 4940, "total_steps": 10798, "loss": 1.9524, "reward": null, "learning_rate": 0.0005670054263225297, "epoch": 0.91, "percentage": 45.75, "elapsed_time": "3:25:00", "remaining_time": "4:03:06"} +{"current_steps": 4940, "total_steps": 10798, "loss": 1.9524, "reward": null, "learning_rate": 0.0005670054263225297, "epoch": 0.91, "percentage": 45.75, "elapsed_time": "3:18:55", "remaining_time": "3:55:53"} +{"current_steps": 4940, "total_steps": 10798, "loss": 1.9524, "reward": null, "learning_rate": 0.0005670054263225297, "epoch": 0.91, "percentage": 45.75, "elapsed_time": "3:18:57", "remaining_time": "3:55:55"} +{"current_steps": 4940, "total_steps": 10798, "loss": 1.9524, "reward": null, "learning_rate": 0.0005670054263225297, "epoch": 0.91, "percentage": 45.75, "elapsed_time": "3:18:59", "remaining_time": "3:55:57"} +{"current_steps": 4950, "total_steps": 10798, "loss": 1.9737, "reward": null, "learning_rate": 0.0005655635560165166, "epoch": 0.92, "percentage": 45.84, "elapsed_time": "3:25:25", "remaining_time": "4:02:41"} +{"current_steps": 4950, "total_steps": 10798, "loss": 1.9737, "reward": null, "learning_rate": 0.0005655635560165166, "epoch": 0.92, "percentage": 45.84, "elapsed_time": "3:19:20", "remaining_time": "3:55:30"} +{"current_steps": 4950, "total_steps": 10798, "loss": 1.9737, "reward": null, "learning_rate": 0.0005655635560165166, "epoch": 0.92, "percentage": 45.84, "elapsed_time": "3:19:21", "remaining_time": "3:55:31"} +{"current_steps": 4950, "total_steps": 10798, "loss": 1.9737, "reward": null, "learning_rate": 0.0005655635560165166, "epoch": 0.92, "percentage": 45.84, "elapsed_time": "3:19:23", "remaining_time": "3:55:34"} +{"current_steps": 4960, "total_steps": 10798, "loss": 1.9532, "reward": null, "learning_rate": 0.0005641211307331093, "epoch": 0.92, "percentage": 45.93, "elapsed_time": "3:25:48", "remaining_time": "4:02:14"} +{"current_steps": 4960, "total_steps": 10798, "loss": 1.9532, "reward": null, "learning_rate": 0.0005641211307331093, "epoch": 0.92, "percentage": 45.93, "elapsed_time": "3:19:45", "remaining_time": "3:55:06"} +{"current_steps": 4960, "total_steps": 10798, "loss": 1.9532, "reward": null, "learning_rate": 0.0005641211307331093, "epoch": 0.92, "percentage": 45.93, "elapsed_time": "3:19:43", "remaining_time": "3:55:04"} +{"current_steps": 4960, "total_steps": 10798, "loss": 1.9532, "reward": null, "learning_rate": 0.0005641211307331093, "epoch": 0.92, "percentage": 45.93, "elapsed_time": "3:19:46", "remaining_time": "3:55:08"} +{"current_steps": 4970, "total_steps": 10798, "loss": 2.0048, "reward": null, "learning_rate": 0.0005626781626820395, "epoch": 0.92, "percentage": 46.03, "elapsed_time": "3:20:09", "remaining_time": "3:54:42"} +{"current_steps": 4970, "total_steps": 10798, "loss": 2.0048, "reward": null, "learning_rate": 0.0005626781626820395, "epoch": 0.92, "percentage": 46.03, "elapsed_time": "3:20:07", "remaining_time": "3:54:40"} +{"current_steps": 4970, "total_steps": 10798, "loss": 2.0048, "reward": null, "learning_rate": 0.0005626781626820395, "epoch": 0.92, "percentage": 46.03, "elapsed_time": "3:20:11", "remaining_time": "3:54:44"} +{"current_steps": 4970, "total_steps": 10798, "loss": 2.0048, "reward": null, "learning_rate": 0.0005626781626820395, "epoch": 0.92, "percentage": 46.03, "elapsed_time": "3:26:12", "remaining_time": "4:01:48"} +{"current_steps": 4980, "total_steps": 10798, "loss": 2.0276, "reward": null, "learning_rate": 0.0005612346640776331, "epoch": 0.92, "percentage": 46.12, "elapsed_time": "3:20:33", "remaining_time": "3:54:18"} +{"current_steps": 4980, "total_steps": 10798, "loss": 2.0276, "reward": null, "learning_rate": 0.0005612346640776331, "epoch": 0.92, "percentage": 46.12, "elapsed_time": "3:26:37", "remaining_time": "4:01:23"} +{"current_steps": 4980, "total_steps": 10798, "loss": 2.0276, "reward": null, "learning_rate": 0.0005612346640776331, "epoch": 0.92, "percentage": 46.12, "elapsed_time": "3:20:32", "remaining_time": "3:54:17"} +{"current_steps": 4980, "total_steps": 10798, "loss": 2.0276, "reward": null, "learning_rate": 0.0005612346640776331, "epoch": 0.92, "percentage": 46.12, "elapsed_time": "3:20:35", "remaining_time": "3:54:21"} +{"current_steps": 4990, "total_steps": 10798, "loss": 1.9476, "reward": null, "learning_rate": 0.0005597906471387074, "epoch": 0.92, "percentage": 46.21, "elapsed_time": "3:21:00", "remaining_time": "3:53:57"} +{"current_steps": 4990, "total_steps": 10798, "loss": 1.9476, "reward": null, "learning_rate": 0.0005597906471387074, "epoch": 0.92, "percentage": 46.21, "elapsed_time": "3:27:02", "remaining_time": "4:00:58"} +{"current_steps": 4990, "total_steps": 10798, "loss": 1.9476, "reward": null, "learning_rate": 0.0005597906471387074, "epoch": 0.92, "percentage": 46.21, "elapsed_time": "3:20:57", "remaining_time": "3:53:53"} +{"current_steps": 4990, "total_steps": 10798, "loss": 1.9476, "reward": null, "learning_rate": 0.0005597906471387074, "epoch": 0.92, "percentage": 46.21, "elapsed_time": "3:20:58", "remaining_time": "3:53:55"} +{"current_steps": 5000, "total_steps": 10798, "loss": 1.943, "reward": null, "learning_rate": 0.0005583461240884666, "epoch": 0.93, "percentage": 46.3, "elapsed_time": "3:27:27", "remaining_time": "4:00:33"} +{"current_steps": 5000, "total_steps": 10798, "loss": 1.943, "reward": null, "learning_rate": 0.0005583461240884666, "epoch": 0.93, "percentage": 46.3, "elapsed_time": "3:21:24", "remaining_time": "3:53:32"} +{"current_steps": 5000, "total_steps": 10798, "loss": 1.943, "reward": null, "learning_rate": 0.0005583461240884666, "epoch": 0.93, "percentage": 46.3, "elapsed_time": "3:21:25", "remaining_time": "3:53:34"} +{"current_steps": 5000, "total_steps": 10798, "loss": 1.943, "reward": null, "learning_rate": 0.0005583461240884666, "epoch": 0.93, "percentage": 46.3, "elapsed_time": "3:21:22", "remaining_time": "3:53:30"} +{"current_steps": 5010, "total_steps": 10798, "loss": 1.9859, "reward": null, "learning_rate": 0.0005569011071543997, "epoch": 0.93, "percentage": 46.4, "elapsed_time": "3:27:51", "remaining_time": "4:00:08"} +{"current_steps": 5010, "total_steps": 10798, "loss": 1.9859, "reward": null, "learning_rate": 0.0005569011071543997, "epoch": 0.93, "percentage": 46.4, "elapsed_time": "3:21:49", "remaining_time": "3:53:10"} +{"current_steps": 5010, "total_steps": 10798, "loss": 1.9859, "reward": null, "learning_rate": 0.0005569011071543997, "epoch": 0.93, "percentage": 46.4, "elapsed_time": "3:21:46", "remaining_time": "3:53:06"} +{"current_steps": 5010, "total_steps": 10798, "loss": 1.9859, "reward": null, "learning_rate": 0.0005569011071543997, "epoch": 0.93, "percentage": 46.4, "elapsed_time": "3:21:48", "remaining_time": "3:53:08"} +{"current_steps": 5020, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.0005554556085681757, "epoch": 0.93, "percentage": 46.49, "elapsed_time": "3:22:14", "remaining_time": "3:52:46"} +{"current_steps": 5020, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.0005554556085681757, "epoch": 0.93, "percentage": 46.49, "elapsed_time": "3:22:12", "remaining_time": "3:52:44"} +{"current_steps": 5020, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.0005554556085681757, "epoch": 0.93, "percentage": 46.49, "elapsed_time": "3:22:10", "remaining_time": "3:52:42"} +{"current_steps": 5020, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.0005554556085681757, "epoch": 0.93, "percentage": 46.49, "elapsed_time": "3:28:15", "remaining_time": "3:59:42"} +{"current_steps": 5030, "total_steps": 10798, "loss": 1.9825, "reward": null, "learning_rate": 0.0005540096405655409, "epoch": 0.93, "percentage": 46.58, "elapsed_time": "3:28:39", "remaining_time": "3:59:16"} +{"current_steps": 5030, "total_steps": 10798, "loss": 1.9825, "reward": null, "learning_rate": 0.0005540096405655409, "epoch": 0.93, "percentage": 46.58, "elapsed_time": "3:22:35", "remaining_time": "3:52:18"} +{"current_steps": 5030, "total_steps": 10798, "loss": 1.9825, "reward": null, "learning_rate": 0.0005540096405655409, "epoch": 0.93, "percentage": 46.58, "elapsed_time": "3:22:36", "remaining_time": "3:52:20"} +{"current_steps": 5030, "total_steps": 10798, "loss": 1.9825, "reward": null, "learning_rate": 0.0005540096405655409, "epoch": 0.93, "percentage": 46.58, "elapsed_time": "3:22:38", "remaining_time": "3:52:22"} +{"current_steps": 5040, "total_steps": 10798, "loss": 1.9875, "reward": null, "learning_rate": 0.0005525632153862152, "epoch": 0.93, "percentage": 46.68, "elapsed_time": "3:29:03", "remaining_time": "3:58:50"} +{"current_steps": 5040, "total_steps": 10798, "loss": 1.9875, "reward": null, "learning_rate": 0.0005525632153862152, "epoch": 0.93, "percentage": 46.68, "elapsed_time": "3:22:58", "remaining_time": "3:51:53"} +{"current_steps": 5040, "total_steps": 10798, "loss": 1.9875, "reward": null, "learning_rate": 0.0005525632153862152, "epoch": 0.93, "percentage": 46.68, "elapsed_time": "3:23:01", "remaining_time": "3:51:57"} +{"current_steps": 5040, "total_steps": 10798, "loss": 1.9875, "reward": null, "learning_rate": 0.0005525632153862152, "epoch": 0.93, "percentage": 46.68, "elapsed_time": "3:23:00", "remaining_time": "3:51:55"} +{"current_steps": 5050, "total_steps": 10798, "loss": 2.0051, "reward": null, "learning_rate": 0.0005511163452737884, "epoch": 0.94, "percentage": 46.77, "elapsed_time": "3:23:21", "remaining_time": "3:51:27"} +{"current_steps": 5050, "total_steps": 10798, "loss": 2.0051, "reward": null, "learning_rate": 0.0005511163452737884, "epoch": 0.94, "percentage": 46.77, "elapsed_time": "3:23:24", "remaining_time": "3:51:31"} +{"current_steps": 5050, "total_steps": 10798, "loss": 2.0051, "reward": null, "learning_rate": 0.0005511163452737884, "epoch": 0.94, "percentage": 46.77, "elapsed_time": "3:23:23", "remaining_time": "3:51:29"} +{"current_steps": 5050, "total_steps": 10798, "loss": 2.0051, "reward": null, "learning_rate": 0.0005511163452737884, "epoch": 0.94, "percentage": 46.77, "elapsed_time": "3:29:26", "remaining_time": "3:58:23"} +{"current_steps": 5060, "total_steps": 10798, "loss": 2.0089, "reward": null, "learning_rate": 0.0005496690424756164, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "3:23:46", "remaining_time": "3:51:05"} +{"current_steps": 5060, "total_steps": 10798, "loss": 2.0089, "reward": null, "learning_rate": 0.0005496690424756164, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "3:23:45", "remaining_time": "3:51:03"} +{"current_steps": 5060, "total_steps": 10798, "loss": 2.0089, "reward": null, "learning_rate": 0.0005496690424756164, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "3:23:48", "remaining_time": "3:51:07"} +{"current_steps": 5060, "total_steps": 10798, "loss": 2.0089, "reward": null, "learning_rate": 0.0005496690424756164, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "3:29:50", "remaining_time": "3:57:57"} +{"current_steps": 5070, "total_steps": 10798, "loss": 1.9495, "reward": null, "learning_rate": 0.0005482213192427174, "epoch": 0.94, "percentage": 46.95, "elapsed_time": "3:30:15", "remaining_time": "3:57:32"} +{"current_steps": 5070, "total_steps": 10798, "loss": 1.9495, "reward": null, "learning_rate": 0.0005482213192427174, "epoch": 0.94, "percentage": 46.95, "elapsed_time": "3:24:12", "remaining_time": "3:50:42"} +{"current_steps": 5070, "total_steps": 10798, "loss": 1.9495, "reward": null, "learning_rate": 0.0005482213192427174, "epoch": 0.94, "percentage": 46.95, "elapsed_time": "3:24:10", "remaining_time": "3:50:40"} +{"current_steps": 5070, "total_steps": 10798, "loss": 1.9495, "reward": null, "learning_rate": 0.0005482213192427174, "epoch": 0.94, "percentage": 46.95, "elapsed_time": "3:24:14", "remaining_time": "3:50:44"} +{"current_steps": 5080, "total_steps": 10798, "loss": 1.9701, "reward": null, "learning_rate": 0.0005467731878296688, "epoch": 0.94, "percentage": 47.05, "elapsed_time": "3:24:35", "remaining_time": "3:50:16"} +{"current_steps": 5080, "total_steps": 10798, "loss": 1.9701, "reward": null, "learning_rate": 0.0005467731878296688, "epoch": 0.94, "percentage": 47.05, "elapsed_time": "3:24:33", "remaining_time": "3:50:15"} +{"current_steps": 5080, "total_steps": 10798, "loss": 1.9701, "reward": null, "learning_rate": 0.0005467731878296688, "epoch": 0.94, "percentage": 47.05, "elapsed_time": "3:24:37", "remaining_time": "3:50:18"} +{"current_steps": 5080, "total_steps": 10798, "loss": 1.9701, "reward": null, "learning_rate": 0.0005467731878296688, "epoch": 0.94, "percentage": 47.05, "elapsed_time": "3:30:38", "remaining_time": "3:57:05"} +{"current_steps": 5090, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 0.0005453246604945034, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "3:31:04", "remaining_time": "3:56:41"} +{"current_steps": 5090, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 0.0005453246604945034, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "3:24:59", "remaining_time": "3:49:52"} +{"current_steps": 5090, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 0.0005453246604945034, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "3:25:02", "remaining_time": "3:49:56"} +{"current_steps": 5090, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 0.0005453246604945034, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "3:25:00", "remaining_time": "3:49:54"} +{"current_steps": 5100, "total_steps": 10798, "loss": 1.9833, "reward": null, "learning_rate": 0.0005438757494986044, "epoch": 0.94, "percentage": 47.23, "elapsed_time": "3:31:27", "remaining_time": "3:56:14"} +{"current_steps": 5100, "total_steps": 10798, "loss": 1.9833, "reward": null, "learning_rate": 0.0005438757494986044, "epoch": 0.94, "percentage": 47.23, "elapsed_time": "3:25:22", "remaining_time": "3:49:27"} +{"current_steps": 5100, "total_steps": 10798, "loss": 1.9833, "reward": null, "learning_rate": 0.0005438757494986044, "epoch": 0.94, "percentage": 47.23, "elapsed_time": "3:25:24", "remaining_time": "3:49:29"} +{"current_steps": 5100, "total_steps": 10798, "loss": 1.9833, "reward": null, "learning_rate": 0.0005438757494986044, "epoch": 0.94, "percentage": 47.23, "elapsed_time": "3:25:25", "remaining_time": "3:49:31"} +{"current_steps": 5110, "total_steps": 10798, "loss": 1.9974, "reward": null, "learning_rate": 0.0005424264671066038, "epoch": 0.95, "percentage": 47.32, "elapsed_time": "3:25:49", "remaining_time": "3:49:06"} +{"current_steps": 5110, "total_steps": 10798, "loss": 1.9974, "reward": null, "learning_rate": 0.0005424264671066038, "epoch": 0.95, "percentage": 47.32, "elapsed_time": "3:25:45", "remaining_time": "3:49:02"} +{"current_steps": 5110, "total_steps": 10798, "loss": 1.9974, "reward": null, "learning_rate": 0.0005424264671066038, "epoch": 0.95, "percentage": 47.32, "elapsed_time": "3:25:47", "remaining_time": "3:49:04"} +{"current_steps": 5110, "total_steps": 10798, "loss": 1.9974, "reward": null, "learning_rate": 0.0005424264671066038, "epoch": 0.95, "percentage": 47.32, "elapsed_time": "3:31:50", "remaining_time": "3:55:48"} +{"current_steps": 5120, "total_steps": 10798, "loss": 1.9746, "reward": null, "learning_rate": 0.0005409768255862766, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "3:32:14", "remaining_time": "3:55:22"} +{"current_steps": 5120, "total_steps": 10798, "loss": 1.9746, "reward": null, "learning_rate": 0.0005409768255862766, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "3:26:11", "remaining_time": "3:48:39"} +{"current_steps": 5120, "total_steps": 10798, "loss": 1.9746, "reward": null, "learning_rate": 0.0005409768255862766, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "3:26:13", "remaining_time": "3:48:41"} +{"current_steps": 5120, "total_steps": 10798, "loss": 1.9746, "reward": null, "learning_rate": 0.0005409768255862766, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "3:26:09", "remaining_time": "3:48:37"} +{"current_steps": 5130, "total_steps": 10798, "loss": 1.9757, "reward": null, "learning_rate": 0.0005395268372084378, "epoch": 0.95, "percentage": 47.51, "elapsed_time": "3:26:35", "remaining_time": "3:48:15"} +{"current_steps": 5130, "total_steps": 10798, "loss": 1.9757, "reward": null, "learning_rate": 0.0005395268372084378, "epoch": 0.95, "percentage": 47.51, "elapsed_time": "3:26:37", "remaining_time": "3:48:17"} +{"current_steps": 5130, "total_steps": 10798, "loss": 1.9757, "reward": null, "learning_rate": 0.0005395268372084378, "epoch": 0.95, "percentage": 47.51, "elapsed_time": "3:26:33", "remaining_time": "3:48:13"} +{"current_steps": 5130, "total_steps": 10798, "loss": 1.9757, "reward": null, "learning_rate": 0.0005395268372084378, "epoch": 0.95, "percentage": 47.51, "elapsed_time": "3:32:38", "remaining_time": "3:54:56"} +{"current_steps": 5140, "total_steps": 10798, "loss": 1.9908, "reward": null, "learning_rate": 0.0005380765142468387, "epoch": 0.95, "percentage": 47.6, "elapsed_time": "3:26:59", "remaining_time": "3:47:51"} +{"current_steps": 5140, "total_steps": 10798, "loss": 1.9908, "reward": null, "learning_rate": 0.0005380765142468387, "epoch": 0.95, "percentage": 47.6, "elapsed_time": "3:26:57", "remaining_time": "3:47:49"} +{"current_steps": 5140, "total_steps": 10798, "loss": 1.9908, "reward": null, "learning_rate": 0.0005380765142468387, "epoch": 0.95, "percentage": 47.6, "elapsed_time": "3:27:01", "remaining_time": "3:47:53"} +{"current_steps": 5140, "total_steps": 10798, "loss": 1.9908, "reward": null, "learning_rate": 0.0005380765142468387, "epoch": 0.95, "percentage": 47.6, "elapsed_time": "3:33:02", "remaining_time": "3:54:30"} +{"current_steps": 5150, "total_steps": 10798, "loss": 2.006, "reward": null, "learning_rate": 0.0005366258689780625, "epoch": 0.95, "percentage": 47.69, "elapsed_time": "3:27:25", "remaining_time": "3:47:28"} +{"current_steps": 5150, "total_steps": 10798, "loss": 2.006, "reward": null, "learning_rate": 0.0005366258689780625, "epoch": 0.95, "percentage": 47.69, "elapsed_time": "3:27:27", "remaining_time": "3:47:30"} +{"current_steps": 5150, "total_steps": 10798, "loss": 2.006, "reward": null, "learning_rate": 0.0005366258689780625, "epoch": 0.95, "percentage": 47.69, "elapsed_time": "3:27:23", "remaining_time": "3:47:27"} +{"current_steps": 5150, "total_steps": 10798, "loss": 2.006, "reward": null, "learning_rate": 0.0005366258689780625, "epoch": 0.95, "percentage": 47.69, "elapsed_time": "3:33:28", "remaining_time": "3:54:07"} +{"current_steps": 5160, "total_steps": 10798, "loss": 1.9957, "reward": null, "learning_rate": 0.0005351749136814208, "epoch": 0.96, "percentage": 47.79, "elapsed_time": "3:27:51", "remaining_time": "3:47:07"} +{"current_steps": 5160, "total_steps": 10798, "loss": 1.9957, "reward": null, "learning_rate": 0.0005351749136814208, "epoch": 0.96, "percentage": 47.79, "elapsed_time": "3:33:53", "remaining_time": "3:53:42"} +{"current_steps": 5160, "total_steps": 10798, "loss": 1.9957, "reward": null, "learning_rate": 0.0005351749136814208, "epoch": 0.96, "percentage": 47.79, "elapsed_time": "3:27:48", "remaining_time": "3:47:03"} +{"current_steps": 5160, "total_steps": 10798, "loss": 1.9957, "reward": null, "learning_rate": 0.0005351749136814208, "epoch": 0.96, "percentage": 47.79, "elapsed_time": "3:27:50", "remaining_time": "3:47:05"} +{"current_steps": 5170, "total_steps": 10798, "loss": 1.959, "reward": null, "learning_rate": 0.0005337236606388495, "epoch": 0.96, "percentage": 47.88, "elapsed_time": "3:28:13", "remaining_time": "3:46:40"} +{"current_steps": 5170, "total_steps": 10798, "loss": 1.959, "reward": null, "learning_rate": 0.0005337236606388495, "epoch": 0.96, "percentage": 47.88, "elapsed_time": "3:34:17", "remaining_time": "3:53:16"} +{"current_steps": 5170, "total_steps": 10798, "loss": 1.959, "reward": null, "learning_rate": 0.0005337236606388495, "epoch": 0.96, "percentage": 47.88, "elapsed_time": "3:28:12", "remaining_time": "3:46:39"} +{"current_steps": 5170, "total_steps": 10798, "loss": 1.959, "reward": null, "learning_rate": 0.0005337236606388495, "epoch": 0.96, "percentage": 47.88, "elapsed_time": "3:28:15", "remaining_time": "3:46:42"} +{"current_steps": 5180, "total_steps": 10798, "loss": 2.0027, "reward": null, "learning_rate": 0.0005322721221348047, "epoch": 0.96, "percentage": 47.97, "elapsed_time": "3:34:42", "remaining_time": "3:52:51"} +{"current_steps": 5180, "total_steps": 10798, "loss": 2.0027, "reward": null, "learning_rate": 0.0005322721221348047, "epoch": 0.96, "percentage": 47.97, "elapsed_time": "3:28:37", "remaining_time": "3:46:15"} +{"current_steps": 5180, "total_steps": 10798, "loss": 2.0027, "reward": null, "learning_rate": 0.0005322721221348047, "epoch": 0.96, "percentage": 47.97, "elapsed_time": "3:28:38", "remaining_time": "3:46:17"} +{"current_steps": 5180, "total_steps": 10798, "loss": 2.0027, "reward": null, "learning_rate": 0.0005322721221348047, "epoch": 0.96, "percentage": 47.97, "elapsed_time": "3:28:40", "remaining_time": "3:46:19"} +{"current_steps": 5190, "total_steps": 10798, "loss": 1.9248, "reward": null, "learning_rate": 0.000530820310456159, "epoch": 0.96, "percentage": 48.06, "elapsed_time": "3:35:05", "remaining_time": "3:52:24"} +{"current_steps": 5190, "total_steps": 10798, "loss": 1.9248, "reward": null, "learning_rate": 0.000530820310456159, "epoch": 0.96, "percentage": 48.06, "elapsed_time": "3:29:02", "remaining_time": "3:45:52"} +{"current_steps": 5190, "total_steps": 10798, "loss": 1.9248, "reward": null, "learning_rate": 0.000530820310456159, "epoch": 0.96, "percentage": 48.06, "elapsed_time": "3:29:04", "remaining_time": "3:45:54"} +{"current_steps": 5190, "total_steps": 10798, "loss": 1.9248, "reward": null, "learning_rate": 0.000530820310456159, "epoch": 0.96, "percentage": 48.06, "elapsed_time": "3:29:00", "remaining_time": "3:45:50"} +{"current_steps": 5200, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0005293682378920974, "epoch": 0.96, "percentage": 48.16, "elapsed_time": "3:29:27", "remaining_time": "3:45:29"} +{"current_steps": 5200, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0005293682378920974, "epoch": 0.96, "percentage": 48.16, "elapsed_time": "3:29:24", "remaining_time": "3:45:26"} +{"current_steps": 5200, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0005293682378920974, "epoch": 0.96, "percentage": 48.16, "elapsed_time": "3:35:29", "remaining_time": "3:51:58"} +{"current_steps": 5200, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0005293682378920974, "epoch": 0.96, "percentage": 48.16, "elapsed_time": "3:29:26", "remaining_time": "3:45:27"} +{"current_steps": 5210, "total_steps": 10798, "loss": 1.9844, "reward": null, "learning_rate": 0.000527915916734013, "epoch": 0.96, "percentage": 48.25, "elapsed_time": "3:29:48", "remaining_time": "3:45:01"} +{"current_steps": 5210, "total_steps": 10798, "loss": 1.9844, "reward": null, "learning_rate": 0.000527915916734013, "epoch": 0.96, "percentage": 48.25, "elapsed_time": "3:35:53", "remaining_time": "3:51:33"} +{"current_steps": 5210, "total_steps": 10798, "loss": 1.9844, "reward": null, "learning_rate": 0.000527915916734013, "epoch": 0.96, "percentage": 48.25, "elapsed_time": "3:29:50", "remaining_time": "3:45:03"} +{"current_steps": 5210, "total_steps": 10798, "loss": 1.9844, "reward": null, "learning_rate": 0.000527915916734013, "epoch": 0.96, "percentage": 48.25, "elapsed_time": "3:29:51", "remaining_time": "3:45:05"} +{"current_steps": 5220, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.0005264633592754035, "epoch": 0.97, "percentage": 48.34, "elapsed_time": "3:36:17", "remaining_time": "3:51:07"} +{"current_steps": 5220, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.0005264633592754035, "epoch": 0.97, "percentage": 48.34, "elapsed_time": "3:30:12", "remaining_time": "3:44:37"} +{"current_steps": 5220, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.0005264633592754035, "epoch": 0.97, "percentage": 48.34, "elapsed_time": "3:30:14", "remaining_time": "3:44:39"} +{"current_steps": 5220, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.0005264633592754035, "epoch": 0.97, "percentage": 48.34, "elapsed_time": "3:30:16", "remaining_time": "3:44:41"} +{"current_steps": 5230, "total_steps": 10798, "loss": 2.0074, "reward": null, "learning_rate": 0.0005250105778117661, "epoch": 0.97, "percentage": 48.43, "elapsed_time": "3:36:41", "remaining_time": "3:50:42"} +{"current_steps": 5230, "total_steps": 10798, "loss": 2.0074, "reward": null, "learning_rate": 0.0005250105778117661, "epoch": 0.97, "percentage": 48.43, "elapsed_time": "3:30:38", "remaining_time": "3:44:15"} +{"current_steps": 5230, "total_steps": 10798, "loss": 2.0074, "reward": null, "learning_rate": 0.0005250105778117661, "epoch": 0.97, "percentage": 48.43, "elapsed_time": "3:30:40", "remaining_time": "3:44:17"} +{"current_steps": 5230, "total_steps": 10798, "loss": 2.0074, "reward": null, "learning_rate": 0.0005250105778117661, "epoch": 0.97, "percentage": 48.43, "elapsed_time": "3:30:36", "remaining_time": "3:44:13"} +{"current_steps": 5240, "total_steps": 10798, "loss": 1.9901, "reward": null, "learning_rate": 0.0005235575846404952, "epoch": 0.97, "percentage": 48.53, "elapsed_time": "3:37:06", "remaining_time": "3:50:17"} +{"current_steps": 5240, "total_steps": 10798, "loss": 1.9901, "reward": null, "learning_rate": 0.0005235575846404952, "epoch": 0.97, "percentage": 48.53, "elapsed_time": "3:31:03", "remaining_time": "3:43:51"} +{"current_steps": 5240, "total_steps": 10798, "loss": 1.9901, "reward": null, "learning_rate": 0.0005235575846404952, "epoch": 0.97, "percentage": 48.53, "elapsed_time": "3:31:01", "remaining_time": "3:43:50"} +{"current_steps": 5240, "total_steps": 10798, "loss": 1.9901, "reward": null, "learning_rate": 0.0005235575846404952, "epoch": 0.97, "percentage": 48.53, "elapsed_time": "3:31:05", "remaining_time": "3:43:53"} +{"current_steps": 5250, "total_steps": 10798, "loss": 1.9861, "reward": null, "learning_rate": 0.0005221043920607763, "epoch": 0.97, "percentage": 48.62, "elapsed_time": "3:31:29", "remaining_time": "3:43:29"} +{"current_steps": 5250, "total_steps": 10798, "loss": 1.9861, "reward": null, "learning_rate": 0.0005221043920607763, "epoch": 0.97, "percentage": 48.62, "elapsed_time": "3:31:27", "remaining_time": "3:43:27"} +{"current_steps": 5250, "total_steps": 10798, "loss": 1.9861, "reward": null, "learning_rate": 0.0005221043920607763, "epoch": 0.97, "percentage": 48.62, "elapsed_time": "3:31:26", "remaining_time": "3:43:26"} +{"current_steps": 5250, "total_steps": 10798, "loss": 1.9861, "reward": null, "learning_rate": 0.0005221043920607763, "epoch": 0.97, "percentage": 48.62, "elapsed_time": "3:37:30", "remaining_time": "3:49:51"} +{"current_steps": 5260, "total_steps": 10798, "loss": 1.9576, "reward": null, "learning_rate": 0.0005206510123734837, "epoch": 0.97, "percentage": 48.71, "elapsed_time": "3:31:50", "remaining_time": "3:43:01"} +{"current_steps": 5260, "total_steps": 10798, "loss": 1.9576, "reward": null, "learning_rate": 0.0005206510123734837, "epoch": 0.97, "percentage": 48.71, "elapsed_time": "3:31:53", "remaining_time": "3:43:05"} +{"current_steps": 5260, "total_steps": 10798, "loss": 1.9576, "reward": null, "learning_rate": 0.0005206510123734837, "epoch": 0.97, "percentage": 48.71, "elapsed_time": "3:31:51", "remaining_time": "3:43:03"} +{"current_steps": 5260, "total_steps": 10798, "loss": 1.9576, "reward": null, "learning_rate": 0.0005206510123734837, "epoch": 0.97, "percentage": 48.71, "elapsed_time": "3:37:54", "remaining_time": "3:49:25"} +{"current_steps": 5270, "total_steps": 10798, "loss": 1.9741, "reward": null, "learning_rate": 0.0005191974578810746, "epoch": 0.98, "percentage": 48.81, "elapsed_time": "3:38:17", "remaining_time": "3:48:59"} +{"current_steps": 5270, "total_steps": 10798, "loss": 1.9741, "reward": null, "learning_rate": 0.0005191974578810746, "epoch": 0.98, "percentage": 48.81, "elapsed_time": "3:32:14", "remaining_time": "3:42:38"} +{"current_steps": 5270, "total_steps": 10798, "loss": 1.9741, "reward": null, "learning_rate": 0.0005191974578810746, "epoch": 0.98, "percentage": 48.81, "elapsed_time": "3:32:16", "remaining_time": "3:42:40"} +{"current_steps": 5270, "total_steps": 10798, "loss": 1.9741, "reward": null, "learning_rate": 0.0005191974578810746, "epoch": 0.98, "percentage": 48.81, "elapsed_time": "3:32:13", "remaining_time": "3:42:36"} +{"current_steps": 5280, "total_steps": 10798, "loss": 1.9794, "reward": null, "learning_rate": 0.0005177437408874868, "epoch": 0.98, "percentage": 48.9, "elapsed_time": "3:32:39", "remaining_time": "3:42:14"} +{"current_steps": 5280, "total_steps": 10798, "loss": 1.9794, "reward": null, "learning_rate": 0.0005177437408874868, "epoch": 0.98, "percentage": 48.9, "elapsed_time": "3:32:37", "remaining_time": "3:42:12"} +{"current_steps": 5280, "total_steps": 10798, "loss": 1.9794, "reward": null, "learning_rate": 0.0005177437408874868, "epoch": 0.98, "percentage": 48.9, "elapsed_time": "3:32:40", "remaining_time": "3:42:16"} +{"current_steps": 5280, "total_steps": 10798, "loss": 1.9794, "reward": null, "learning_rate": 0.0005177437408874868, "epoch": 0.98, "percentage": 48.9, "elapsed_time": "3:38:42", "remaining_time": "3:48:33"} +{"current_steps": 5290, "total_steps": 10798, "loss": 1.9883, "reward": null, "learning_rate": 0.0005162898736980327, "epoch": 0.98, "percentage": 48.99, "elapsed_time": "3:33:05", "remaining_time": "3:41:52"} +{"current_steps": 5290, "total_steps": 10798, "loss": 1.9883, "reward": null, "learning_rate": 0.0005162898736980327, "epoch": 0.98, "percentage": 48.99, "elapsed_time": "3:39:07", "remaining_time": "3:48:09"} +{"current_steps": 5290, "total_steps": 10798, "loss": 1.9883, "reward": null, "learning_rate": 0.0005162898736980327, "epoch": 0.98, "percentage": 48.99, "elapsed_time": "3:33:04", "remaining_time": "3:41:50"} +{"current_steps": 5290, "total_steps": 10798, "loss": 1.9883, "reward": null, "learning_rate": 0.0005162898736980327, "epoch": 0.98, "percentage": 48.99, "elapsed_time": "3:33:02", "remaining_time": "3:41:49"} +{"current_steps": 5300, "total_steps": 10798, "loss": 1.969, "reward": null, "learning_rate": 0.0005148358686192967, "epoch": 0.98, "percentage": 49.08, "elapsed_time": "3:33:29", "remaining_time": "3:41:28"} +{"current_steps": 5300, "total_steps": 10798, "loss": 1.969, "reward": null, "learning_rate": 0.0005148358686192967, "epoch": 0.98, "percentage": 49.08, "elapsed_time": "3:39:31", "remaining_time": "3:47:43"} +{"current_steps": 5300, "total_steps": 10798, "loss": 1.969, "reward": null, "learning_rate": 0.0005148358686192967, "epoch": 0.98, "percentage": 49.08, "elapsed_time": "3:33:26", "remaining_time": "3:41:24"} +{"current_steps": 5300, "total_steps": 10798, "loss": 1.969, "reward": null, "learning_rate": 0.0005148358686192967, "epoch": 0.98, "percentage": 49.08, "elapsed_time": "3:33:27", "remaining_time": "3:41:26"} +{"current_steps": 5310, "total_steps": 10798, "loss": 2.0018, "reward": null, "learning_rate": 0.0005133817379590302, "epoch": 0.98, "percentage": 49.18, "elapsed_time": "3:33:52", "remaining_time": "3:41:02"} +{"current_steps": 5310, "total_steps": 10798, "loss": 2.0018, "reward": null, "learning_rate": 0.0005133817379590302, "epoch": 0.98, "percentage": 49.18, "elapsed_time": "3:33:51", "remaining_time": "3:41:01"} +{"current_steps": 5310, "total_steps": 10798, "loss": 2.0018, "reward": null, "learning_rate": 0.0005133817379590302, "epoch": 0.98, "percentage": 49.18, "elapsed_time": "3:33:54", "remaining_time": "3:41:04"} +{"current_steps": 5310, "total_steps": 10798, "loss": 2.0018, "reward": null, "learning_rate": 0.0005133817379590302, "epoch": 0.98, "percentage": 49.18, "elapsed_time": "3:39:55", "remaining_time": "3:47:18"} +{"current_steps": 5320, "total_steps": 10798, "loss": 1.971, "reward": null, "learning_rate": 0.0005119274940260476, "epoch": 0.99, "percentage": 49.27, "elapsed_time": "3:34:17", "remaining_time": "3:40:39"} +{"current_steps": 5320, "total_steps": 10798, "loss": 1.971, "reward": null, "learning_rate": 0.0005119274940260476, "epoch": 0.99, "percentage": 49.27, "elapsed_time": "3:34:16", "remaining_time": "3:40:37"} +{"current_steps": 5320, "total_steps": 10798, "loss": 1.971, "reward": null, "learning_rate": 0.0005119274940260476, "epoch": 0.99, "percentage": 49.27, "elapsed_time": "3:34:19", "remaining_time": "3:40:41"} +{"current_steps": 5320, "total_steps": 10798, "loss": 1.971, "reward": null, "learning_rate": 0.0005119274940260476, "epoch": 0.99, "percentage": 49.27, "elapsed_time": "3:40:20", "remaining_time": "3:46:53"} +{"current_steps": 5330, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 0.0005104731491301225, "epoch": 0.99, "percentage": 49.36, "elapsed_time": "3:40:44", "remaining_time": "3:46:27"} +{"current_steps": 5330, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 0.0005104731491301225, "epoch": 0.99, "percentage": 49.36, "elapsed_time": "3:34:41", "remaining_time": "3:40:14"} +{"current_steps": 5330, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 0.0005104731491301225, "epoch": 0.99, "percentage": 49.36, "elapsed_time": "3:34:39", "remaining_time": "3:40:13"} +{"current_steps": 5330, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 0.0005104731491301225, "epoch": 0.99, "percentage": 49.36, "elapsed_time": "3:34:43", "remaining_time": "3:40:16"} +{"current_steps": 5340, "total_steps": 10798, "loss": 1.9798, "reward": null, "learning_rate": 0.0005090187155818823, "epoch": 0.99, "percentage": 49.45, "elapsed_time": "3:41:08", "remaining_time": "3:46:01"} +{"current_steps": 5340, "total_steps": 10798, "loss": 1.9798, "reward": null, "learning_rate": 0.0005090187155818823, "epoch": 0.99, "percentage": 49.45, "elapsed_time": "3:35:07", "remaining_time": "3:39:52"} +{"current_steps": 5340, "total_steps": 10798, "loss": 1.9798, "reward": null, "learning_rate": 0.0005090187155818823, "epoch": 0.99, "percentage": 49.45, "elapsed_time": "3:35:03", "remaining_time": "3:39:48"} +{"current_steps": 5340, "total_steps": 10798, "loss": 1.9798, "reward": null, "learning_rate": 0.0005090187155818823, "epoch": 0.99, "percentage": 49.45, "elapsed_time": "3:35:05", "remaining_time": "3:39:50"} +{"current_steps": 5350, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0005075642056927057, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "3:41:33", "remaining_time": "3:45:37"} +{"current_steps": 5350, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0005075642056927057, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "3:35:32", "remaining_time": "3:39:29"} +{"current_steps": 5350, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0005075642056927057, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "3:35:30", "remaining_time": "3:39:27"} +{"current_steps": 5350, "total_steps": 10798, "loss": 2.0331, "reward": null, "learning_rate": 0.0005075642056927057, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "3:35:29", "remaining_time": "3:39:25"} +{"current_steps": 5360, "total_steps": 10798, "loss": 1.9505, "reward": null, "learning_rate": 0.000506109631774617, "epoch": 0.99, "percentage": 49.64, "elapsed_time": "3:41:57", "remaining_time": "3:45:11"} +{"current_steps": 5360, "total_steps": 10798, "loss": 1.9505, "reward": null, "learning_rate": 0.000506109631774617, "epoch": 0.99, "percentage": 49.64, "elapsed_time": "3:35:54", "remaining_time": "3:39:02"} +{"current_steps": 5360, "total_steps": 10798, "loss": 1.9505, "reward": null, "learning_rate": 0.000506109631774617, "epoch": 0.99, "percentage": 49.64, "elapsed_time": "3:35:55", "remaining_time": "3:39:04"} +{"current_steps": 5360, "total_steps": 10798, "loss": 1.9505, "reward": null, "learning_rate": 0.000506109631774617, "epoch": 0.99, "percentage": 49.64, "elapsed_time": "3:35:52", "remaining_time": "3:39:00"} +{"current_steps": 5370, "total_steps": 10798, "loss": 1.9348, "reward": null, "learning_rate": 0.0005046550061401825, "epoch": 0.99, "percentage": 49.73, "elapsed_time": "3:42:21", "remaining_time": "3:44:45"} +{"current_steps": 5370, "total_steps": 10798, "loss": 1.9348, "reward": null, "learning_rate": 0.0005046550061401825, "epoch": 0.99, "percentage": 49.73, "elapsed_time": "3:36:16", "remaining_time": "3:38:36"} +{"current_steps": 5370, "total_steps": 10798, "loss": 1.9348, "reward": null, "learning_rate": 0.0005046550061401825, "epoch": 0.99, "percentage": 49.73, "elapsed_time": "3:36:19", "remaining_time": "3:38:40"} +{"current_steps": 5370, "total_steps": 10798, "loss": 1.9348, "reward": null, "learning_rate": 0.0005046550061401825, "epoch": 0.99, "percentage": 49.73, "elapsed_time": "3:36:18", "remaining_time": "3:38:38"} +{"current_steps": 5380, "total_steps": 10798, "loss": 2.0099, "reward": null, "learning_rate": 0.0005032003411024067, "epoch": 1.0, "percentage": 49.82, "elapsed_time": "3:42:46", "remaining_time": "3:44:20"} +{"current_steps": 5380, "total_steps": 10798, "loss": 2.0099, "reward": null, "learning_rate": 0.0005032003411024067, "epoch": 1.0, "percentage": 49.82, "elapsed_time": "3:36:44", "remaining_time": "3:38:16"} +{"current_steps": 5380, "total_steps": 10798, "loss": 2.0099, "reward": null, "learning_rate": 0.0005032003411024067, "epoch": 1.0, "percentage": 49.82, "elapsed_time": "3:36:41", "remaining_time": "3:38:13"} +{"current_steps": 5380, "total_steps": 10798, "loss": 2.0099, "reward": null, "learning_rate": 0.0005032003411024067, "epoch": 1.0, "percentage": 49.82, "elapsed_time": "3:36:43", "remaining_time": "3:38:14"} +{"current_steps": 5390, "total_steps": 10798, "loss": 1.9756, "reward": null, "learning_rate": 0.0005017456489746275, "epoch": 1.0, "percentage": 49.92, "elapsed_time": "3:37:06", "remaining_time": "3:37:49"} +{"current_steps": 5390, "total_steps": 10798, "loss": 1.9756, "reward": null, "learning_rate": 0.0005017456489746275, "epoch": 1.0, "percentage": 49.92, "elapsed_time": "3:37:04", "remaining_time": "3:37:47"} +{"current_steps": 5390, "total_steps": 10798, "loss": 1.9756, "reward": null, "learning_rate": 0.0005017456489746275, "epoch": 1.0, "percentage": 49.92, "elapsed_time": "3:43:09", "remaining_time": "3:43:53"} +{"current_steps": 5390, "total_steps": 10798, "loss": 1.9756, "reward": null, "learning_rate": 0.0005017456489746275, "epoch": 1.0, "percentage": 49.92, "elapsed_time": "3:37:07", "remaining_time": "3:37:51"} +{"current_steps": 5400, "total_steps": 10798, "loss": 1.9444, "reward": null, "learning_rate": 0.0005002909420704116, "epoch": 1.0, "percentage": 50.01, "elapsed_time": "3:37:28", "remaining_time": "3:37:23"} +{"current_steps": 5400, "total_steps": 10798, "loss": 1.9444, "reward": null, "learning_rate": 0.0005002909420704116, "epoch": 1.0, "percentage": 50.01, "elapsed_time": "3:43:33", "remaining_time": "3:43:28"} +{"current_steps": 5400, "total_steps": 10798, "loss": 1.9444, "reward": null, "learning_rate": 0.0005002909420704116, "epoch": 1.0, "percentage": 50.01, "elapsed_time": "3:37:31", "remaining_time": "3:37:26"} +{"current_steps": 5400, "total_steps": 10798, "loss": 1.9444, "reward": null, "learning_rate": 0.0005002909420704116, "epoch": 1.0, "percentage": 50.01, "elapsed_time": "3:37:30", "remaining_time": "3:37:25"} +{"current_steps": 5410, "total_steps": 10798, "loss": 1.976, "reward": null, "learning_rate": 0.0004988362327034516, "epoch": 1.0, "percentage": 50.1, "elapsed_time": "3:43:58", "remaining_time": "3:43:03"} +{"current_steps": 5410, "total_steps": 10798, "loss": 1.976, "reward": null, "learning_rate": 0.0004988362327034516, "epoch": 1.0, "percentage": 50.1, "elapsed_time": "3:37:53", "remaining_time": "3:37:00"} +{"current_steps": 5410, "total_steps": 10798, "loss": 1.976, "reward": null, "learning_rate": 0.0004988362327034516, "epoch": 1.0, "percentage": 50.1, "elapsed_time": "3:37:56", "remaining_time": "3:37:03"} +{"current_steps": 5410, "total_steps": 10798, "loss": 1.976, "reward": null, "learning_rate": 0.0004988362327034516, "epoch": 1.0, "percentage": 50.1, "elapsed_time": "3:37:55", "remaining_time": "3:37:01"} +{"current_steps": 5420, "total_steps": 10798, "loss": 1.9593, "reward": null, "learning_rate": 0.0004973815331874603, "epoch": 1.0, "percentage": 50.19, "elapsed_time": "3:38:17", "remaining_time": "3:36:36"} +{"current_steps": 5420, "total_steps": 10798, "loss": 1.9593, "reward": null, "learning_rate": 0.0004973815331874603, "epoch": 1.0, "percentage": 50.19, "elapsed_time": "3:38:19", "remaining_time": "3:36:37"} +{"current_steps": 5420, "total_steps": 10798, "loss": 1.9593, "reward": null, "learning_rate": 0.0004973815331874603, "epoch": 1.0, "percentage": 50.19, "elapsed_time": "3:44:22", "remaining_time": "3:42:38"} +{"current_steps": 5420, "total_steps": 10798, "loss": 1.9593, "reward": null, "learning_rate": 0.0004973815331874603, "epoch": 1.0, "percentage": 50.19, "elapsed_time": "3:38:20", "remaining_time": "3:36:39"} +{"current_steps": 5430, "total_steps": 10798, "loss": 1.9251, "reward": null, "learning_rate": 0.0004959268558360675, "epoch": 1.01, "percentage": 50.29, "elapsed_time": "3:38:45", "remaining_time": "3:36:15"} +{"current_steps": 5430, "total_steps": 10798, "loss": 1.9251, "reward": null, "learning_rate": 0.0004959268558360675, "epoch": 1.01, "percentage": 50.29, "elapsed_time": "3:44:46", "remaining_time": "3:42:12"} +{"current_steps": 5430, "total_steps": 10798, "loss": 1.9251, "reward": null, "learning_rate": 0.0004959268558360675, "epoch": 1.01, "percentage": 50.29, "elapsed_time": "3:38:43", "remaining_time": "3:36:13"} +{"current_steps": 5430, "total_steps": 10798, "loss": 1.9251, "reward": null, "learning_rate": 0.0004959268558360675, "epoch": 1.01, "percentage": 50.29, "elapsed_time": "3:38:41", "remaining_time": "3:36:12"} +{"current_steps": 5440, "total_steps": 10798, "loss": 1.972, "reward": null, "learning_rate": 0.0004944722129627151, "epoch": 1.01, "percentage": 50.38, "elapsed_time": "3:45:10", "remaining_time": "3:41:47"} +{"current_steps": 5440, "total_steps": 10798, "loss": 1.972, "reward": null, "learning_rate": 0.0004944722129627151, "epoch": 1.01, "percentage": 50.38, "elapsed_time": "3:39:07", "remaining_time": "3:35:49"} +{"current_steps": 5440, "total_steps": 10798, "loss": 1.972, "reward": null, "learning_rate": 0.0004944722129627151, "epoch": 1.01, "percentage": 50.38, "elapsed_time": "3:39:06", "remaining_time": "3:35:47"} +{"current_steps": 5440, "total_steps": 10798, "loss": 1.972, "reward": null, "learning_rate": 0.0004944722129627151, "epoch": 1.01, "percentage": 50.38, "elapsed_time": "3:39:09", "remaining_time": "3:35:51"} +{"current_steps": 5450, "total_steps": 10798, "loss": 1.9307, "reward": null, "learning_rate": 0.0004930176168805531, "epoch": 1.01, "percentage": 50.47, "elapsed_time": "3:45:34", "remaining_time": "3:41:20"} +{"current_steps": 5450, "total_steps": 10798, "loss": 1.9307, "reward": null, "learning_rate": 0.0004930176168805531, "epoch": 1.01, "percentage": 50.47, "elapsed_time": "3:39:29", "remaining_time": "3:35:22"} +{"current_steps": 5450, "total_steps": 10798, "loss": 1.9307, "reward": null, "learning_rate": 0.0004930176168805531, "epoch": 1.01, "percentage": 50.47, "elapsed_time": "3:39:32", "remaining_time": "3:35:26"} +{"current_steps": 5450, "total_steps": 10798, "loss": 1.9307, "reward": null, "learning_rate": 0.0004930176168805531, "epoch": 1.01, "percentage": 50.47, "elapsed_time": "3:39:30", "remaining_time": "3:35:24"} +{"current_steps": 5460, "total_steps": 10798, "loss": 1.9541, "reward": null, "learning_rate": 0.0004915630799023359, "epoch": 1.01, "percentage": 50.56, "elapsed_time": "3:39:56", "remaining_time": "3:35:01"} +{"current_steps": 5460, "total_steps": 10798, "loss": 1.9541, "reward": null, "learning_rate": 0.0004915630799023359, "epoch": 1.01, "percentage": 50.56, "elapsed_time": "3:39:52", "remaining_time": "3:34:58"} +{"current_steps": 5460, "total_steps": 10798, "loss": 1.9541, "reward": null, "learning_rate": 0.0004915630799023359, "epoch": 1.01, "percentage": 50.56, "elapsed_time": "3:39:54", "remaining_time": "3:34:59"} +{"current_steps": 5460, "total_steps": 10798, "loss": 1.9541, "reward": null, "learning_rate": 0.0004915630799023359, "epoch": 1.01, "percentage": 50.56, "elapsed_time": "3:45:57", "remaining_time": "3:40:54"} +{"current_steps": 5470, "total_steps": 10798, "loss": 1.9212, "reward": null, "learning_rate": 0.0004901086143403172, "epoch": 1.01, "percentage": 50.66, "elapsed_time": "3:46:20", "remaining_time": "3:40:28"} +{"current_steps": 5470, "total_steps": 10798, "loss": 1.9212, "reward": null, "learning_rate": 0.0004901086143403172, "epoch": 1.01, "percentage": 50.66, "elapsed_time": "3:40:19", "remaining_time": "3:34:36"} +{"current_steps": 5470, "total_steps": 10798, "loss": 1.9212, "reward": null, "learning_rate": 0.0004901086143403172, "epoch": 1.01, "percentage": 50.66, "elapsed_time": "3:40:17", "remaining_time": "3:34:34"} +{"current_steps": 5470, "total_steps": 10798, "loss": 1.9212, "reward": null, "learning_rate": 0.0004901086143403172, "epoch": 1.01, "percentage": 50.66, "elapsed_time": "3:40:15", "remaining_time": "3:34:32"} +{"current_steps": 5480, "total_steps": 10798, "loss": 1.965, "reward": null, "learning_rate": 0.0004886542325061464, "epoch": 1.02, "percentage": 50.75, "elapsed_time": "3:40:43", "remaining_time": "3:34:11"} +{"current_steps": 5480, "total_steps": 10798, "loss": 1.965, "reward": null, "learning_rate": 0.0004886542325061464, "epoch": 1.02, "percentage": 50.75, "elapsed_time": "3:46:44", "remaining_time": "3:40:02"} +{"current_steps": 5480, "total_steps": 10798, "loss": 1.965, "reward": null, "learning_rate": 0.0004886542325061464, "epoch": 1.02, "percentage": 50.75, "elapsed_time": "3:40:41", "remaining_time": "3:34:09"} +{"current_steps": 5480, "total_steps": 10798, "loss": 1.965, "reward": null, "learning_rate": 0.0004886542325061464, "epoch": 1.02, "percentage": 50.75, "elapsed_time": "3:40:39", "remaining_time": "3:34:08"} +{"current_steps": 5490, "total_steps": 10798, "loss": 2.0083, "reward": null, "learning_rate": 0.0004871999467107639, "epoch": 1.02, "percentage": 50.84, "elapsed_time": "3:41:05", "remaining_time": "3:33:45"} +{"current_steps": 5490, "total_steps": 10798, "loss": 2.0083, "reward": null, "learning_rate": 0.0004871999467107639, "epoch": 1.02, "percentage": 50.84, "elapsed_time": "3:41:04", "remaining_time": "3:33:44"} +{"current_steps": 5490, "total_steps": 10798, "loss": 2.0083, "reward": null, "learning_rate": 0.0004871999467107639, "epoch": 1.02, "percentage": 50.84, "elapsed_time": "3:47:08", "remaining_time": "3:39:37"} +{"current_steps": 5490, "total_steps": 10798, "loss": 2.0083, "reward": null, "learning_rate": 0.0004871999467107639, "epoch": 1.02, "percentage": 50.84, "elapsed_time": "3:41:07", "remaining_time": "3:33:47"} +{"current_steps": 5500, "total_steps": 10798, "loss": 1.9676, "reward": null, "learning_rate": 0.0004857457692642974, "epoch": 1.02, "percentage": 50.94, "elapsed_time": "3:47:33", "remaining_time": "3:39:11"} +{"current_steps": 5500, "total_steps": 10798, "loss": 1.9676, "reward": null, "learning_rate": 0.0004857457692642974, "epoch": 1.02, "percentage": 50.94, "elapsed_time": "3:41:30", "remaining_time": "3:33:21"} +{"current_steps": 5500, "total_steps": 10798, "loss": 1.9676, "reward": null, "learning_rate": 0.0004857457692642974, "epoch": 1.02, "percentage": 50.94, "elapsed_time": "3:41:28", "remaining_time": "3:33:20"} +{"current_steps": 5500, "total_steps": 10798, "loss": 1.9676, "reward": null, "learning_rate": 0.0004857457692642974, "epoch": 1.02, "percentage": 50.94, "elapsed_time": "3:41:31", "remaining_time": "3:33:23"} +{"current_steps": 5510, "total_steps": 10798, "loss": 1.9384, "reward": null, "learning_rate": 0.000484291712475957, "epoch": 1.02, "percentage": 51.03, "elapsed_time": "3:41:53", "remaining_time": "3:32:56"} +{"current_steps": 5510, "total_steps": 10798, "loss": 1.9384, "reward": null, "learning_rate": 0.000484291712475957, "epoch": 1.02, "percentage": 51.03, "elapsed_time": "3:41:56", "remaining_time": "3:32:59"} +{"current_steps": 5510, "total_steps": 10798, "loss": 1.9384, "reward": null, "learning_rate": 0.000484291712475957, "epoch": 1.02, "percentage": 51.03, "elapsed_time": "3:41:54", "remaining_time": "3:32:58"} +{"current_steps": 5510, "total_steps": 10798, "loss": 1.9384, "reward": null, "learning_rate": 0.000484291712475957, "epoch": 1.02, "percentage": 51.03, "elapsed_time": "3:47:57", "remaining_time": "3:38:46"} +{"current_steps": 5520, "total_steps": 10798, "loss": 1.9339, "reward": null, "learning_rate": 0.00048283778865393243, "epoch": 1.02, "percentage": 51.12, "elapsed_time": "3:42:17", "remaining_time": "3:32:33"} +{"current_steps": 5520, "total_steps": 10798, "loss": 1.9339, "reward": null, "learning_rate": 0.00048283778865393243, "epoch": 1.02, "percentage": 51.12, "elapsed_time": "3:42:19", "remaining_time": "3:32:34"} +{"current_steps": 5520, "total_steps": 10798, "loss": 1.9339, "reward": null, "learning_rate": 0.00048283778865393243, "epoch": 1.02, "percentage": 51.12, "elapsed_time": "3:42:16", "remaining_time": "3:32:31"} +{"current_steps": 5520, "total_steps": 10798, "loss": 1.9339, "reward": null, "learning_rate": 0.00048283778865393243, "epoch": 1.02, "percentage": 51.12, "elapsed_time": "3:48:21", "remaining_time": "3:38:20"} +{"current_steps": 5530, "total_steps": 10798, "loss": 2.0182, "reward": null, "learning_rate": 0.0004813840101052869, "epoch": 1.02, "percentage": 51.21, "elapsed_time": "3:48:45", "remaining_time": "3:37:55"} +{"current_steps": 5530, "total_steps": 10798, "loss": 2.0182, "reward": null, "learning_rate": 0.0004813840101052869, "epoch": 1.02, "percentage": 51.21, "elapsed_time": "3:42:42", "remaining_time": "3:32:09"} +{"current_steps": 5530, "total_steps": 10798, "loss": 2.0182, "reward": null, "learning_rate": 0.0004813840101052869, "epoch": 1.02, "percentage": 51.21, "elapsed_time": "3:42:44", "remaining_time": "3:32:11"} +{"current_steps": 5530, "total_steps": 10798, "loss": 2.0182, "reward": null, "learning_rate": 0.0004813840101052869, "epoch": 1.02, "percentage": 51.21, "elapsed_time": "3:42:40", "remaining_time": "3:32:07"} +{"current_steps": 5540, "total_steps": 10798, "loss": 1.9262, "reward": null, "learning_rate": 0.0004799303891358545, "epoch": 1.03, "percentage": 51.31, "elapsed_time": "3:43:04", "remaining_time": "3:31:43"} +{"current_steps": 5540, "total_steps": 10798, "loss": 1.9262, "reward": null, "learning_rate": 0.0004799303891358545, "epoch": 1.03, "percentage": 51.31, "elapsed_time": "3:49:09", "remaining_time": "3:37:29"} +{"current_steps": 5540, "total_steps": 10798, "loss": 1.9262, "reward": null, "learning_rate": 0.0004799303891358545, "epoch": 1.03, "percentage": 51.31, "elapsed_time": "3:43:08", "remaining_time": "3:31:46"} +{"current_steps": 5540, "total_steps": 10798, "loss": 1.9262, "reward": null, "learning_rate": 0.0004799303891358545, "epoch": 1.03, "percentage": 51.31, "elapsed_time": "3:43:06", "remaining_time": "3:31:45"} +{"current_steps": 5550, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 0.0004784769380501352, "epoch": 1.03, "percentage": 51.4, "elapsed_time": "3:49:33", "remaining_time": "3:37:03"} +{"current_steps": 5550, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 0.0004784769380501352, "epoch": 1.03, "percentage": 51.4, "elapsed_time": "3:43:31", "remaining_time": "3:31:21"} +{"current_steps": 5550, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 0.0004784769380501352, "epoch": 1.03, "percentage": 51.4, "elapsed_time": "3:43:30", "remaining_time": "3:31:20"} +{"current_steps": 5550, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 0.0004784769380501352, "epoch": 1.03, "percentage": 51.4, "elapsed_time": "3:43:28", "remaining_time": "3:31:18"} +{"current_steps": 5560, "total_steps": 10798, "loss": 1.9404, "reward": null, "learning_rate": 0.0004770236691511908, "epoch": 1.03, "percentage": 51.49, "elapsed_time": "3:43:51", "remaining_time": "3:30:53"} +{"current_steps": 5560, "total_steps": 10798, "loss": 1.9404, "reward": null, "learning_rate": 0.0004770236691511908, "epoch": 1.03, "percentage": 51.49, "elapsed_time": "3:43:54", "remaining_time": "3:30:56"} +{"current_steps": 5560, "total_steps": 10798, "loss": 1.9404, "reward": null, "learning_rate": 0.0004770236691511908, "epoch": 1.03, "percentage": 51.49, "elapsed_time": "3:49:56", "remaining_time": "3:36:37"} +{"current_steps": 5560, "total_steps": 10798, "loss": 1.9404, "reward": null, "learning_rate": 0.0004770236691511908, "epoch": 1.03, "percentage": 51.49, "elapsed_time": "3:43:53", "remaining_time": "3:30:55"} +{"current_steps": 5570, "total_steps": 10798, "loss": 1.9415, "reward": null, "learning_rate": 0.0004755705947405417, "epoch": 1.03, "percentage": 51.58, "elapsed_time": "3:44:18", "remaining_time": "3:30:31"} +{"current_steps": 5570, "total_steps": 10798, "loss": 1.9415, "reward": null, "learning_rate": 0.0004755705947405417, "epoch": 1.03, "percentage": 51.58, "elapsed_time": "3:44:14", "remaining_time": "3:30:28"} +{"current_steps": 5570, "total_steps": 10798, "loss": 1.9415, "reward": null, "learning_rate": 0.0004755705947405417, "epoch": 1.03, "percentage": 51.58, "elapsed_time": "3:50:19", "remaining_time": "3:36:11"} +{"current_steps": 5570, "total_steps": 10798, "loss": 1.9415, "reward": null, "learning_rate": 0.0004755705947405417, "epoch": 1.03, "percentage": 51.58, "elapsed_time": "3:44:16", "remaining_time": "3:30:30"} +{"current_steps": 5580, "total_steps": 10798, "loss": 1.9292, "reward": null, "learning_rate": 0.00047411772711806105, "epoch": 1.03, "percentage": 51.68, "elapsed_time": "3:50:42", "remaining_time": "3:35:44"} +{"current_steps": 5580, "total_steps": 10798, "loss": 1.9292, "reward": null, "learning_rate": 0.00047411772711806105, "epoch": 1.03, "percentage": 51.68, "elapsed_time": "3:44:41", "remaining_time": "3:30:06"} +{"current_steps": 5580, "total_steps": 10798, "loss": 1.9292, "reward": null, "learning_rate": 0.00047411772711806105, "epoch": 1.03, "percentage": 51.68, "elapsed_time": "3:44:39", "remaining_time": "3:30:04"} +{"current_steps": 5580, "total_steps": 10798, "loss": 1.9292, "reward": null, "learning_rate": 0.00047411772711806105, "epoch": 1.03, "percentage": 51.68, "elapsed_time": "3:44:37", "remaining_time": "3:30:03"} +{"current_steps": 5590, "total_steps": 10798, "loss": 1.9487, "reward": null, "learning_rate": 0.000472665078581872, "epoch": 1.04, "percentage": 51.77, "elapsed_time": "3:51:06", "remaining_time": "3:35:19"} +{"current_steps": 5590, "total_steps": 10798, "loss": 1.9487, "reward": null, "learning_rate": 0.000472665078581872, "epoch": 1.04, "percentage": 51.77, "elapsed_time": "3:45:01", "remaining_time": "3:29:39"} +{"current_steps": 5590, "total_steps": 10798, "loss": 1.9487, "reward": null, "learning_rate": 0.000472665078581872, "epoch": 1.04, "percentage": 51.77, "elapsed_time": "3:45:03", "remaining_time": "3:29:40"} +{"current_steps": 5590, "total_steps": 10798, "loss": 1.9487, "reward": null, "learning_rate": 0.000472665078581872, "epoch": 1.04, "percentage": 51.77, "elapsed_time": "3:45:05", "remaining_time": "3:29:42"} +{"current_steps": 5600, "total_steps": 10798, "loss": 1.9435, "reward": null, "learning_rate": 0.00047121266142824354, "epoch": 1.04, "percentage": 51.86, "elapsed_time": "3:51:31", "remaining_time": "3:34:53"} +{"current_steps": 5600, "total_steps": 10798, "loss": 1.9435, "reward": null, "learning_rate": 0.00047121266142824354, "epoch": 1.04, "percentage": 51.86, "elapsed_time": "3:45:27", "remaining_time": "3:29:16"} +{"current_steps": 5600, "total_steps": 10798, "loss": 1.9435, "reward": null, "learning_rate": 0.00047121266142824354, "epoch": 1.04, "percentage": 51.86, "elapsed_time": "3:45:26", "remaining_time": "3:29:15"} +{"current_steps": 5600, "total_steps": 10798, "loss": 1.9435, "reward": null, "learning_rate": 0.00047121266142824354, "epoch": 1.04, "percentage": 51.86, "elapsed_time": "3:45:29", "remaining_time": "3:29:18"} +{"current_steps": 5610, "total_steps": 10798, "loss": 1.9145, "reward": null, "learning_rate": 0.0004697604879514853, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "3:45:53", "remaining_time": "3:28:53"} +{"current_steps": 5610, "total_steps": 10798, "loss": 1.9145, "reward": null, "learning_rate": 0.0004697604879514853, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "3:45:50", "remaining_time": "3:28:50"} +{"current_steps": 5610, "total_steps": 10798, "loss": 1.9145, "reward": null, "learning_rate": 0.0004697604879514853, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "3:45:51", "remaining_time": "3:28:52"} +{"current_steps": 5610, "total_steps": 10798, "loss": 1.9145, "reward": null, "learning_rate": 0.0004697604879514853, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "3:51:54", "remaining_time": "3:34:28"} +{"current_steps": 5620, "total_steps": 10798, "loss": 1.9975, "reward": null, "learning_rate": 0.0004683085704438451, "epoch": 1.04, "percentage": 52.05, "elapsed_time": "3:46:18", "remaining_time": "3:28:30"} +{"current_steps": 5620, "total_steps": 10798, "loss": 1.9975, "reward": null, "learning_rate": 0.0004683085704438451, "epoch": 1.04, "percentage": 52.05, "elapsed_time": "3:46:16", "remaining_time": "3:28:29"} +{"current_steps": 5620, "total_steps": 10798, "loss": 1.9975, "reward": null, "learning_rate": 0.0004683085704438451, "epoch": 1.04, "percentage": 52.05, "elapsed_time": "3:52:20", "remaining_time": "3:34:03"} +{"current_steps": 5620, "total_steps": 10798, "loss": 1.9975, "reward": null, "learning_rate": 0.0004683085704438451, "epoch": 1.04, "percentage": 52.05, "elapsed_time": "3:46:15", "remaining_time": "3:28:27"} +{"current_steps": 5630, "total_steps": 10798, "loss": 1.9696, "reward": null, "learning_rate": 0.00046685692119540357, "epoch": 1.04, "percentage": 52.14, "elapsed_time": "3:46:43", "remaining_time": "3:28:06"} +{"current_steps": 5630, "total_steps": 10798, "loss": 1.9696, "reward": null, "learning_rate": 0.00046685692119540357, "epoch": 1.04, "percentage": 52.14, "elapsed_time": "3:46:39", "remaining_time": "3:28:03"} +{"current_steps": 5630, "total_steps": 10798, "loss": 1.9696, "reward": null, "learning_rate": 0.00046685692119540357, "epoch": 1.04, "percentage": 52.14, "elapsed_time": "3:46:41", "remaining_time": "3:28:05"} +{"current_steps": 5630, "total_steps": 10798, "loss": 1.9696, "reward": null, "learning_rate": 0.00046685692119540357, "epoch": 1.04, "percentage": 52.14, "elapsed_time": "3:52:44", "remaining_time": "3:33:38"} +{"current_steps": 5640, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 0.00046540555249397056, "epoch": 1.04, "percentage": 52.23, "elapsed_time": "3:47:07", "remaining_time": "3:27:42"} +{"current_steps": 5640, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 0.00046540555249397056, "epoch": 1.04, "percentage": 52.23, "elapsed_time": "3:53:08", "remaining_time": "3:33:13"} +{"current_steps": 5640, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 0.00046540555249397056, "epoch": 1.04, "percentage": 52.23, "elapsed_time": "3:47:05", "remaining_time": "3:27:40"} +{"current_steps": 5640, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 0.00046540555249397056, "epoch": 1.04, "percentage": 52.23, "elapsed_time": "3:47:03", "remaining_time": "3:27:39"} +{"current_steps": 5650, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 0.00046395447662498117, "epoch": 1.05, "percentage": 52.32, "elapsed_time": "3:47:28", "remaining_time": "3:27:16"} +{"current_steps": 5650, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 0.00046395447662498117, "epoch": 1.05, "percentage": 52.32, "elapsed_time": "3:53:32", "remaining_time": "3:32:47"} +{"current_steps": 5650, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 0.00046395447662498117, "epoch": 1.05, "percentage": 52.32, "elapsed_time": "3:47:27", "remaining_time": "3:27:14"} +{"current_steps": 5650, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 0.00046395447662498117, "epoch": 1.05, "percentage": 52.32, "elapsed_time": "3:47:30", "remaining_time": "3:27:17"} +{"current_steps": 5660, "total_steps": 10798, "loss": 1.9748, "reward": null, "learning_rate": 0.00046250370587139206, "epoch": 1.05, "percentage": 52.42, "elapsed_time": "3:53:56", "remaining_time": "3:32:21"} +{"current_steps": 5660, "total_steps": 10798, "loss": 1.9748, "reward": null, "learning_rate": 0.00046250370587139206, "epoch": 1.05, "percentage": 52.42, "elapsed_time": "3:47:53", "remaining_time": "3:26:52"} +{"current_steps": 5660, "total_steps": 10798, "loss": 1.9748, "reward": null, "learning_rate": 0.00046250370587139206, "epoch": 1.05, "percentage": 52.42, "elapsed_time": "3:47:55", "remaining_time": "3:26:53"} +{"current_steps": 5660, "total_steps": 10798, "loss": 1.9748, "reward": null, "learning_rate": 0.00046250370587139206, "epoch": 1.05, "percentage": 52.42, "elapsed_time": "3:47:51", "remaining_time": "3:26:50"} +{"current_steps": 5670, "total_steps": 10798, "loss": 1.9125, "reward": null, "learning_rate": 0.00046105325251357695, "epoch": 1.05, "percentage": 52.51, "elapsed_time": "3:54:20", "remaining_time": "3:31:56"} +{"current_steps": 5670, "total_steps": 10798, "loss": 1.9125, "reward": null, "learning_rate": 0.00046105325251357695, "epoch": 1.05, "percentage": 52.51, "elapsed_time": "3:48:18", "remaining_time": "3:26:29"} +{"current_steps": 5670, "total_steps": 10798, "loss": 1.9125, "reward": null, "learning_rate": 0.00046105325251357695, "epoch": 1.05, "percentage": 52.51, "elapsed_time": "3:48:16", "remaining_time": "3:26:27"} +{"current_steps": 5670, "total_steps": 10798, "loss": 1.9125, "reward": null, "learning_rate": 0.00046105325251357695, "epoch": 1.05, "percentage": 52.51, "elapsed_time": "3:48:15", "remaining_time": "3:26:26"} +{"current_steps": 5680, "total_steps": 10798, "loss": 1.9595, "reward": null, "learning_rate": 0.00045960312882922306, "epoch": 1.05, "percentage": 52.6, "elapsed_time": "3:48:40", "remaining_time": "3:26:02"} +{"current_steps": 5680, "total_steps": 10798, "loss": 1.9595, "reward": null, "learning_rate": 0.00045960312882922306, "epoch": 1.05, "percentage": 52.6, "elapsed_time": "3:48:42", "remaining_time": "3:26:04"} +{"current_steps": 5680, "total_steps": 10798, "loss": 1.9595, "reward": null, "learning_rate": 0.00045960312882922306, "epoch": 1.05, "percentage": 52.6, "elapsed_time": "3:54:45", "remaining_time": "3:31:31"} +{"current_steps": 5680, "total_steps": 10798, "loss": 1.9595, "reward": null, "learning_rate": 0.00045960312882922306, "epoch": 1.05, "percentage": 52.6, "elapsed_time": "3:48:43", "remaining_time": "3:26:05"} +{"current_steps": 5690, "total_steps": 10798, "loss": 1.9369, "reward": null, "learning_rate": 0.00045815334709322665, "epoch": 1.05, "percentage": 52.69, "elapsed_time": "3:55:08", "remaining_time": "3:31:05"} +{"current_steps": 5690, "total_steps": 10798, "loss": 1.9369, "reward": null, "learning_rate": 0.00045815334709322665, "epoch": 1.05, "percentage": 52.69, "elapsed_time": "3:49:05", "remaining_time": "3:25:39"} +{"current_steps": 5690, "total_steps": 10798, "loss": 1.9369, "reward": null, "learning_rate": 0.00045815334709322665, "epoch": 1.05, "percentage": 52.69, "elapsed_time": "3:49:07", "remaining_time": "3:25:41"} +{"current_steps": 5690, "total_steps": 10798, "loss": 1.9369, "reward": null, "learning_rate": 0.00045815334709322665, "epoch": 1.05, "percentage": 52.69, "elapsed_time": "3:49:03", "remaining_time": "3:25:38"} +{"current_steps": 5700, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 0.0004567039195775899, "epoch": 1.06, "percentage": 52.79, "elapsed_time": "3:49:32", "remaining_time": "3:25:17"} +{"current_steps": 5700, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 0.0004567039195775899, "epoch": 1.06, "percentage": 52.79, "elapsed_time": "3:49:28", "remaining_time": "3:25:14"} +{"current_steps": 5700, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 0.0004567039195775899, "epoch": 1.06, "percentage": 52.79, "elapsed_time": "3:49:30", "remaining_time": "3:25:16"} +{"current_steps": 5700, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 0.0004567039195775899, "epoch": 1.06, "percentage": 52.79, "elapsed_time": "3:55:33", "remaining_time": "3:30:41"} +{"current_steps": 5710, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 0.000455254858551316, "epoch": 1.06, "percentage": 52.88, "elapsed_time": "3:49:55", "remaining_time": "3:24:53"} +{"current_steps": 5710, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 0.000455254858551316, "epoch": 1.06, "percentage": 52.88, "elapsed_time": "3:49:54", "remaining_time": "3:24:51"} +{"current_steps": 5710, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 0.000455254858551316, "epoch": 1.06, "percentage": 52.88, "elapsed_time": "3:49:57", "remaining_time": "3:24:54"} +{"current_steps": 5710, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 0.000455254858551316, "epoch": 1.06, "percentage": 52.88, "elapsed_time": "3:55:59", "remaining_time": "3:30:16"} +{"current_steps": 5720, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 0.00045380617628030693, "epoch": 1.06, "percentage": 52.97, "elapsed_time": "3:56:22", "remaining_time": "3:29:50"} +{"current_steps": 5720, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 0.00045380617628030693, "epoch": 1.06, "percentage": 52.97, "elapsed_time": "3:50:21", "remaining_time": "3:24:29"} +{"current_steps": 5720, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 0.00045380617628030693, "epoch": 1.06, "percentage": 52.97, "elapsed_time": "3:50:17", "remaining_time": "3:24:26"} +{"current_steps": 5720, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 0.00045380617628030693, "epoch": 1.06, "percentage": 52.97, "elapsed_time": "3:50:19", "remaining_time": "3:24:28"} +{"current_steps": 5730, "total_steps": 10798, "loss": 1.9446, "reward": null, "learning_rate": 0.00045235788502725777, "epoch": 1.06, "percentage": 53.07, "elapsed_time": "3:50:43", "remaining_time": "3:24:03"} +{"current_steps": 5730, "total_steps": 10798, "loss": 1.9446, "reward": null, "learning_rate": 0.00045235788502725777, "epoch": 1.06, "percentage": 53.07, "elapsed_time": "3:50:46", "remaining_time": "3:24:06"} +{"current_steps": 5730, "total_steps": 10798, "loss": 1.9446, "reward": null, "learning_rate": 0.00045235788502725777, "epoch": 1.06, "percentage": 53.07, "elapsed_time": "3:50:44", "remaining_time": "3:24:05"} +{"current_steps": 5730, "total_steps": 10798, "loss": 1.9446, "reward": null, "learning_rate": 0.00045235788502725777, "epoch": 1.06, "percentage": 53.07, "elapsed_time": "3:56:47", "remaining_time": "3:29:26"} +{"current_steps": 5740, "total_steps": 10798, "loss": 1.9236, "reward": null, "learning_rate": 0.00045090999705155383, "epoch": 1.06, "percentage": 53.16, "elapsed_time": "3:51:06", "remaining_time": "3:23:38"} +{"current_steps": 5740, "total_steps": 10798, "loss": 1.9236, "reward": null, "learning_rate": 0.00045090999705155383, "epoch": 1.06, "percentage": 53.16, "elapsed_time": "3:57:11", "remaining_time": "3:29:00"} +{"current_steps": 5740, "total_steps": 10798, "loss": 1.9236, "reward": null, "learning_rate": 0.00045090999705155383, "epoch": 1.06, "percentage": 53.16, "elapsed_time": "3:51:07", "remaining_time": "3:23:40"} +{"current_steps": 5740, "total_steps": 10798, "loss": 1.9236, "reward": null, "learning_rate": 0.00045090999705155383, "epoch": 1.06, "percentage": 53.16, "elapsed_time": "3:51:09", "remaining_time": "3:23:41"} +{"current_steps": 5750, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 0.0004494625246091672, "epoch": 1.07, "percentage": 53.25, "elapsed_time": "3:51:30", "remaining_time": "3:23:15"} +{"current_steps": 5750, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 0.0004494625246091672, "epoch": 1.07, "percentage": 53.25, "elapsed_time": "3:57:35", "remaining_time": "3:28:35"} +{"current_steps": 5750, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 0.0004494625246091672, "epoch": 1.07, "percentage": 53.25, "elapsed_time": "3:51:34", "remaining_time": "3:23:17"} +{"current_steps": 5750, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 0.0004494625246091672, "epoch": 1.07, "percentage": 53.25, "elapsed_time": "3:51:32", "remaining_time": "3:23:16"} +{"current_steps": 5760, "total_steps": 10798, "loss": 1.9849, "reward": null, "learning_rate": 0.00044801547995255194, "epoch": 1.07, "percentage": 53.34, "elapsed_time": "3:51:57", "remaining_time": "3:22:53"} +{"current_steps": 5760, "total_steps": 10798, "loss": 1.9849, "reward": null, "learning_rate": 0.00044801547995255194, "epoch": 1.07, "percentage": 53.34, "elapsed_time": "3:58:01", "remaining_time": "3:28:11"} +{"current_steps": 5760, "total_steps": 10798, "loss": 1.9849, "reward": null, "learning_rate": 0.00044801547995255194, "epoch": 1.07, "percentage": 53.34, "elapsed_time": "3:51:59", "remaining_time": "3:22:54"} +{"current_steps": 5760, "total_steps": 10798, "loss": 1.9849, "reward": null, "learning_rate": 0.00044801547995255194, "epoch": 1.07, "percentage": 53.34, "elapsed_time": "3:51:56", "remaining_time": "3:22:52"} +{"current_steps": 5770, "total_steps": 10798, "loss": 1.9367, "reward": null, "learning_rate": 0.00044656887533054193, "epoch": 1.07, "percentage": 53.44, "elapsed_time": "3:58:25", "remaining_time": "3:27:45"} +{"current_steps": 5770, "total_steps": 10798, "loss": 1.9367, "reward": null, "learning_rate": 0.00044656887533054193, "epoch": 1.07, "percentage": 53.44, "elapsed_time": "3:52:23", "remaining_time": "3:22:30"} +{"current_steps": 5770, "total_steps": 10798, "loss": 1.9367, "reward": null, "learning_rate": 0.00044656887533054193, "epoch": 1.07, "percentage": 53.44, "elapsed_time": "3:52:21", "remaining_time": "3:22:29"} +{"current_steps": 5770, "total_steps": 10798, "loss": 1.9367, "reward": null, "learning_rate": 0.00044656887533054193, "epoch": 1.07, "percentage": 53.44, "elapsed_time": "3:52:20", "remaining_time": "3:22:27"} +{"current_steps": 5780, "total_steps": 10798, "loss": 1.9451, "reward": null, "learning_rate": 0.0004451227229882455, "epoch": 1.07, "percentage": 53.53, "elapsed_time": "3:52:47", "remaining_time": "3:22:05"} +{"current_steps": 5780, "total_steps": 10798, "loss": 1.9451, "reward": null, "learning_rate": 0.0004451227229882455, "epoch": 1.07, "percentage": 53.53, "elapsed_time": "3:52:45", "remaining_time": "3:22:04"} +{"current_steps": 5780, "total_steps": 10798, "loss": 1.9451, "reward": null, "learning_rate": 0.0004451227229882455, "epoch": 1.07, "percentage": 53.53, "elapsed_time": "3:52:43", "remaining_time": "3:22:02"} +{"current_steps": 5780, "total_steps": 10798, "loss": 1.9451, "reward": null, "learning_rate": 0.0004451227229882455, "epoch": 1.07, "percentage": 53.53, "elapsed_time": "3:58:48", "remaining_time": "3:27:19"} +{"current_steps": 5790, "total_steps": 10798, "loss": 1.9578, "reward": null, "learning_rate": 0.0004436770351669429, "epoch": 1.07, "percentage": 53.62, "elapsed_time": "3:53:10", "remaining_time": "3:21:40"} +{"current_steps": 5790, "total_steps": 10798, "loss": 1.9578, "reward": null, "learning_rate": 0.0004436770351669429, "epoch": 1.07, "percentage": 53.62, "elapsed_time": "3:53:08", "remaining_time": "3:21:39"} +{"current_steps": 5790, "total_steps": 10798, "loss": 1.9578, "reward": null, "learning_rate": 0.0004436770351669429, "epoch": 1.07, "percentage": 53.62, "elapsed_time": "3:59:13", "remaining_time": "3:26:54"} +{"current_steps": 5790, "total_steps": 10798, "loss": 1.9578, "reward": null, "learning_rate": 0.0004436770351669429, "epoch": 1.07, "percentage": 53.62, "elapsed_time": "3:53:11", "remaining_time": "3:21:42"} +{"current_steps": 5800, "total_steps": 10798, "loss": 1.9095, "reward": null, "learning_rate": 0.0004422318241039821, "epoch": 1.07, "percentage": 53.71, "elapsed_time": "3:53:32", "remaining_time": "3:21:14"} +{"current_steps": 5800, "total_steps": 10798, "loss": 1.9095, "reward": null, "learning_rate": 0.0004422318241039821, "epoch": 1.07, "percentage": 53.71, "elapsed_time": "3:53:35", "remaining_time": "3:21:17"} +{"current_steps": 5800, "total_steps": 10798, "loss": 1.9095, "reward": null, "learning_rate": 0.0004422318241039821, "epoch": 1.07, "percentage": 53.71, "elapsed_time": "3:59:36", "remaining_time": "3:26:28"} +{"current_steps": 5800, "total_steps": 10798, "loss": 1.9095, "reward": null, "learning_rate": 0.0004422318241039821, "epoch": 1.07, "percentage": 53.71, "elapsed_time": "3:53:33", "remaining_time": "3:21:15"} +{"current_steps": 5810, "total_steps": 10798, "loss": 1.9337, "reward": null, "learning_rate": 0.00044078710203267576, "epoch": 1.08, "percentage": 53.81, "elapsed_time": "3:53:56", "remaining_time": "3:20:50"} +{"current_steps": 5810, "total_steps": 10798, "loss": 1.9337, "reward": null, "learning_rate": 0.00044078710203267576, "epoch": 1.08, "percentage": 53.81, "elapsed_time": "4:00:01", "remaining_time": "3:26:03"} +{"current_steps": 5810, "total_steps": 10798, "loss": 1.9337, "reward": null, "learning_rate": 0.00044078710203267576, "epoch": 1.08, "percentage": 53.81, "elapsed_time": "3:53:58", "remaining_time": "3:20:52"} +{"current_steps": 5810, "total_steps": 10798, "loss": 1.9337, "reward": null, "learning_rate": 0.00044078710203267576, "epoch": 1.08, "percentage": 53.81, "elapsed_time": "3:53:59", "remaining_time": "3:20:53"} +{"current_steps": 5820, "total_steps": 10798, "loss": 1.9904, "reward": null, "learning_rate": 0.0004393428811821971, "epoch": 1.08, "percentage": 53.9, "elapsed_time": "3:54:24", "remaining_time": "3:20:29"} +{"current_steps": 5820, "total_steps": 10798, "loss": 1.9904, "reward": null, "learning_rate": 0.0004393428811821971, "epoch": 1.08, "percentage": 53.9, "elapsed_time": "3:54:22", "remaining_time": "3:20:27"} +{"current_steps": 5820, "total_steps": 10798, "loss": 1.9904, "reward": null, "learning_rate": 0.0004393428811821971, "epoch": 1.08, "percentage": 53.9, "elapsed_time": "4:00:25", "remaining_time": "3:25:38"} +{"current_steps": 5820, "total_steps": 10798, "loss": 1.9904, "reward": null, "learning_rate": 0.0004393428811821971, "epoch": 1.08, "percentage": 53.9, "elapsed_time": "3:54:20", "remaining_time": "3:20:26"} +{"current_steps": 5830, "total_steps": 10798, "loss": 1.9569, "reward": null, "learning_rate": 0.00043789917377747695, "epoch": 1.08, "percentage": 53.99, "elapsed_time": "3:54:45", "remaining_time": "3:20:03"} +{"current_steps": 5830, "total_steps": 10798, "loss": 1.9569, "reward": null, "learning_rate": 0.00043789917377747695, "epoch": 1.08, "percentage": 53.99, "elapsed_time": "3:54:47", "remaining_time": "3:20:04"} +{"current_steps": 5830, "total_steps": 10798, "loss": 1.9569, "reward": null, "learning_rate": 0.00043789917377747695, "epoch": 1.08, "percentage": 53.99, "elapsed_time": "3:54:49", "remaining_time": "3:20:05"} +{"current_steps": 5830, "total_steps": 10798, "loss": 1.9569, "reward": null, "learning_rate": 0.00043789917377747695, "epoch": 1.08, "percentage": 53.99, "elapsed_time": "4:00:50", "remaining_time": "3:25:14"} +{"current_steps": 5840, "total_steps": 10798, "loss": 1.9423, "reward": null, "learning_rate": 0.0004364559920390996, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "4:01:14", "remaining_time": "3:24:48"} +{"current_steps": 5840, "total_steps": 10798, "loss": 1.9423, "reward": null, "learning_rate": 0.0004364559920390996, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "3:55:09", "remaining_time": "3:19:38"} +{"current_steps": 5840, "total_steps": 10798, "loss": 1.9423, "reward": null, "learning_rate": 0.0004364559920390996, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "3:55:10", "remaining_time": "3:19:39"} +{"current_steps": 5840, "total_steps": 10798, "loss": 1.9423, "reward": null, "learning_rate": 0.0004364559920390996, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "3:55:12", "remaining_time": "3:19:41"} +{"current_steps": 5850, "total_steps": 10798, "loss": 2.0013, "reward": null, "learning_rate": 0.00043501334818320004, "epoch": 1.08, "percentage": 54.18, "elapsed_time": "4:01:38", "remaining_time": "3:24:22"} +{"current_steps": 5850, "total_steps": 10798, "loss": 2.0013, "reward": null, "learning_rate": 0.00043501334818320004, "epoch": 1.08, "percentage": 54.18, "elapsed_time": "3:55:34", "remaining_time": "3:19:15"} +{"current_steps": 5850, "total_steps": 10798, "loss": 2.0013, "reward": null, "learning_rate": 0.00043501334818320004, "epoch": 1.08, "percentage": 54.18, "elapsed_time": "3:55:36", "remaining_time": "3:19:16"} +{"current_steps": 5850, "total_steps": 10798, "loss": 2.0013, "reward": null, "learning_rate": 0.00043501334818320004, "epoch": 1.08, "percentage": 54.18, "elapsed_time": "3:55:33", "remaining_time": "3:19:14"} +{"current_steps": 5860, "total_steps": 10798, "loss": 1.9585, "reward": null, "learning_rate": 0.0004335712544213597, "epoch": 1.09, "percentage": 54.27, "elapsed_time": "3:56:00", "remaining_time": "3:18:52"} +{"current_steps": 5860, "total_steps": 10798, "loss": 1.9585, "reward": null, "learning_rate": 0.0004335712544213597, "epoch": 1.09, "percentage": 54.27, "elapsed_time": "3:55:58", "remaining_time": "3:18:50"} +{"current_steps": 5860, "total_steps": 10798, "loss": 1.9585, "reward": null, "learning_rate": 0.0004335712544213597, "epoch": 1.09, "percentage": 54.27, "elapsed_time": "3:56:01", "remaining_time": "3:18:53"} +{"current_steps": 5860, "total_steps": 10798, "loss": 1.9585, "reward": null, "learning_rate": 0.0004335712544213597, "epoch": 1.09, "percentage": 54.27, "elapsed_time": "4:02:03", "remaining_time": "3:23:58"} +{"current_steps": 5870, "total_steps": 10798, "loss": 1.9148, "reward": null, "learning_rate": 0.0004321297229605044, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "4:02:27", "remaining_time": "3:23:32"} +{"current_steps": 5870, "total_steps": 10798, "loss": 1.9148, "reward": null, "learning_rate": 0.0004321297229605044, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "3:56:24", "remaining_time": "3:18:27"} +{"current_steps": 5870, "total_steps": 10798, "loss": 1.9148, "reward": null, "learning_rate": 0.0004321297229605044, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "3:56:25", "remaining_time": "3:18:29"} +{"current_steps": 5870, "total_steps": 10798, "loss": 1.9148, "reward": null, "learning_rate": 0.0004321297229605044, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "3:56:22", "remaining_time": "3:18:26"} +{"current_steps": 5880, "total_steps": 10798, "loss": 1.9558, "reward": null, "learning_rate": 0.00043068876600279964, "epoch": 1.09, "percentage": 54.45, "elapsed_time": "3:56:49", "remaining_time": "3:18:04"} +{"current_steps": 5880, "total_steps": 10798, "loss": 1.9558, "reward": null, "learning_rate": 0.00043068876600279964, "epoch": 1.09, "percentage": 54.45, "elapsed_time": "3:56:47", "remaining_time": "3:18:03"} +{"current_steps": 5880, "total_steps": 10798, "loss": 1.9558, "reward": null, "learning_rate": 0.00043068876600279964, "epoch": 1.09, "percentage": 54.45, "elapsed_time": "4:02:50", "remaining_time": "3:23:07"} +{"current_steps": 5880, "total_steps": 10798, "loss": 1.9558, "reward": null, "learning_rate": 0.00043068876600279964, "epoch": 1.09, "percentage": 54.45, "elapsed_time": "3:56:46", "remaining_time": "3:18:01"} +{"current_steps": 5890, "total_steps": 10798, "loss": 1.9899, "reward": null, "learning_rate": 0.0004292483957455482, "epoch": 1.09, "percentage": 54.55, "elapsed_time": "4:03:13", "remaining_time": "3:22:40"} +{"current_steps": 5890, "total_steps": 10798, "loss": 1.9899, "reward": null, "learning_rate": 0.0004292483957455482, "epoch": 1.09, "percentage": 54.55, "elapsed_time": "3:57:12", "remaining_time": "3:17:39"} +{"current_steps": 5890, "total_steps": 10798, "loss": 1.9899, "reward": null, "learning_rate": 0.0004292483957455482, "epoch": 1.09, "percentage": 54.55, "elapsed_time": "3:57:10", "remaining_time": "3:17:37"} +{"current_steps": 5890, "total_steps": 10798, "loss": 1.9899, "reward": null, "learning_rate": 0.0004292483957455482, "epoch": 1.09, "percentage": 54.55, "elapsed_time": "3:57:08", "remaining_time": "3:17:36"} +{"current_steps": 5900, "total_steps": 10798, "loss": 1.9597, "reward": null, "learning_rate": 0.00042780862438108655, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "4:03:37", "remaining_time": "3:22:15"} +{"current_steps": 5900, "total_steps": 10798, "loss": 1.9597, "reward": null, "learning_rate": 0.00042780862438108655, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "3:57:36", "remaining_time": "3:17:15"} +{"current_steps": 5900, "total_steps": 10798, "loss": 1.9597, "reward": null, "learning_rate": 0.00042780862438108655, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "3:57:34", "remaining_time": "3:17:13"} +{"current_steps": 5900, "total_steps": 10798, "loss": 1.9597, "reward": null, "learning_rate": 0.00042780862438108655, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "3:57:33", "remaining_time": "3:17:12"} +{"current_steps": 5910, "total_steps": 10798, "loss": 1.9603, "reward": null, "learning_rate": 0.00042636946409668123, "epoch": 1.09, "percentage": 54.73, "elapsed_time": "3:57:58", "remaining_time": "3:16:49"} +{"current_steps": 5910, "total_steps": 10798, "loss": 1.9603, "reward": null, "learning_rate": 0.00042636946409668123, "epoch": 1.09, "percentage": 54.73, "elapsed_time": "3:57:56", "remaining_time": "3:16:48"} +{"current_steps": 5910, "total_steps": 10798, "loss": 1.9603, "reward": null, "learning_rate": 0.00042636946409668123, "epoch": 1.09, "percentage": 54.73, "elapsed_time": "3:58:00", "remaining_time": "3:16:50"} +{"current_steps": 5910, "total_steps": 10798, "loss": 1.9603, "reward": null, "learning_rate": 0.00042636946409668123, "epoch": 1.09, "percentage": 54.73, "elapsed_time": "4:04:01", "remaining_time": "3:21:49"} +{"current_steps": 5920, "total_steps": 10798, "loss": 1.9771, "reward": null, "learning_rate": 0.00042493092707442717, "epoch": 1.1, "percentage": 54.82, "elapsed_time": "3:58:25", "remaining_time": "3:16:27"} +{"current_steps": 5920, "total_steps": 10798, "loss": 1.9771, "reward": null, "learning_rate": 0.00042493092707442717, "epoch": 1.1, "percentage": 54.82, "elapsed_time": "4:04:26", "remaining_time": "3:21:25"} +{"current_steps": 5920, "total_steps": 10798, "loss": 1.9771, "reward": null, "learning_rate": 0.00042493092707442717, "epoch": 1.1, "percentage": 54.82, "elapsed_time": "3:58:22", "remaining_time": "3:16:24"} +{"current_steps": 5920, "total_steps": 10798, "loss": 1.9771, "reward": null, "learning_rate": 0.00042493092707442717, "epoch": 1.1, "percentage": 54.82, "elapsed_time": "3:58:23", "remaining_time": "3:16:26"} +{"current_steps": 5930, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 0.0004234930254911427, "epoch": 1.1, "percentage": 54.92, "elapsed_time": "4:04:50", "remaining_time": "3:20:59"} +{"current_steps": 5930, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 0.0004234930254911427, "epoch": 1.1, "percentage": 54.92, "elapsed_time": "3:58:48", "remaining_time": "3:16:02"} +{"current_steps": 5930, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 0.0004234930254911427, "epoch": 1.1, "percentage": 54.92, "elapsed_time": "3:58:47", "remaining_time": "3:16:01"} +{"current_steps": 5930, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 0.0004234930254911427, "epoch": 1.1, "percentage": 54.92, "elapsed_time": "3:58:45", "remaining_time": "3:15:59"} +{"current_steps": 5940, "total_steps": 10798, "loss": 1.9417, "reward": null, "learning_rate": 0.00042205577151826747, "epoch": 1.1, "percentage": 55.01, "elapsed_time": "4:05:14", "remaining_time": "3:20:34"} +{"current_steps": 5940, "total_steps": 10798, "loss": 1.9417, "reward": null, "learning_rate": 0.00042205577151826747, "epoch": 1.1, "percentage": 55.01, "elapsed_time": "3:59:12", "remaining_time": "3:15:38"} +{"current_steps": 5940, "total_steps": 10798, "loss": 1.9417, "reward": null, "learning_rate": 0.00042205577151826747, "epoch": 1.1, "percentage": 55.01, "elapsed_time": "3:59:11", "remaining_time": "3:15:37"} +{"current_steps": 5940, "total_steps": 10798, "loss": 1.9417, "reward": null, "learning_rate": 0.00042205577151826747, "epoch": 1.1, "percentage": 55.01, "elapsed_time": "3:59:09", "remaining_time": "3:15:35"} +{"current_steps": 5950, "total_steps": 10798, "loss": 1.9636, "reward": null, "learning_rate": 0.00042061917732175966, "epoch": 1.1, "percentage": 55.1, "elapsed_time": "3:59:33", "remaining_time": "3:15:11"} +{"current_steps": 5950, "total_steps": 10798, "loss": 1.9636, "reward": null, "learning_rate": 0.00042061917732175966, "epoch": 1.1, "percentage": 55.1, "elapsed_time": "4:05:38", "remaining_time": "3:20:08"} +{"current_steps": 5950, "total_steps": 10798, "loss": 1.9636, "reward": null, "learning_rate": 0.00042061917732175966, "epoch": 1.1, "percentage": 55.1, "elapsed_time": "3:59:35", "remaining_time": "3:15:12"} +{"current_steps": 5950, "total_steps": 10798, "loss": 1.9636, "reward": null, "learning_rate": 0.00042061917732175966, "epoch": 1.1, "percentage": 55.1, "elapsed_time": "3:59:36", "remaining_time": "3:15:14"} +{"current_steps": 5960, "total_steps": 10798, "loss": 1.966, "reward": null, "learning_rate": 0.000419183255061992, "epoch": 1.1, "percentage": 55.2, "elapsed_time": "3:59:58", "remaining_time": "3:14:47"} +{"current_steps": 5960, "total_steps": 10798, "loss": 1.966, "reward": null, "learning_rate": 0.000419183255061992, "epoch": 1.1, "percentage": 55.2, "elapsed_time": "4:00:00", "remaining_time": "3:14:49"} +{"current_steps": 5960, "total_steps": 10798, "loss": 1.966, "reward": null, "learning_rate": 0.000419183255061992, "epoch": 1.1, "percentage": 55.2, "elapsed_time": "4:00:01", "remaining_time": "3:14:50"} +{"current_steps": 5960, "total_steps": 10798, "loss": 1.966, "reward": null, "learning_rate": 0.000419183255061992, "epoch": 1.1, "percentage": 55.2, "elapsed_time": "4:06:03", "remaining_time": "3:19:44"} +{"current_steps": 5970, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.0004177480168936504, "epoch": 1.11, "percentage": 55.29, "elapsed_time": "4:00:24", "remaining_time": "3:14:25"} +{"current_steps": 5970, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.0004177480168936504, "epoch": 1.11, "percentage": 55.29, "elapsed_time": "4:00:26", "remaining_time": "3:14:26"} +{"current_steps": 5970, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.0004177480168936504, "epoch": 1.11, "percentage": 55.29, "elapsed_time": "4:06:27", "remaining_time": "3:19:18"} +{"current_steps": 5970, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.0004177480168936504, "epoch": 1.11, "percentage": 55.29, "elapsed_time": "4:00:22", "remaining_time": "3:14:23"} +{"current_steps": 5980, "total_steps": 10798, "loss": 1.9525, "reward": null, "learning_rate": 0.00041631347496562913, "epoch": 1.11, "percentage": 55.38, "elapsed_time": "4:00:46", "remaining_time": "3:13:59"} +{"current_steps": 5980, "total_steps": 10798, "loss": 1.9525, "reward": null, "learning_rate": 0.00041631347496562913, "epoch": 1.11, "percentage": 55.38, "elapsed_time": "4:06:51", "remaining_time": "3:18:53"} +{"current_steps": 5980, "total_steps": 10798, "loss": 1.9525, "reward": null, "learning_rate": 0.00041631347496562913, "epoch": 1.11, "percentage": 55.38, "elapsed_time": "4:00:48", "remaining_time": "3:14:00"} +{"current_steps": 5980, "total_steps": 10798, "loss": 1.9525, "reward": null, "learning_rate": 0.00041631347496562913, "epoch": 1.11, "percentage": 55.38, "elapsed_time": "4:00:50", "remaining_time": "3:14:02"} +{"current_steps": 5990, "total_steps": 10798, "loss": 1.9809, "reward": null, "learning_rate": 0.0004148796414209297, "epoch": 1.11, "percentage": 55.47, "elapsed_time": "4:01:10", "remaining_time": "3:13:35"} +{"current_steps": 5990, "total_steps": 10798, "loss": 1.9809, "reward": null, "learning_rate": 0.0004148796414209297, "epoch": 1.11, "percentage": 55.47, "elapsed_time": "4:01:14", "remaining_time": "3:13:37"} +{"current_steps": 5990, "total_steps": 10798, "loss": 1.9809, "reward": null, "learning_rate": 0.0004148796414209297, "epoch": 1.11, "percentage": 55.47, "elapsed_time": "4:01:12", "remaining_time": "3:13:36"} +{"current_steps": 5990, "total_steps": 10798, "loss": 1.9809, "reward": null, "learning_rate": 0.0004148796414209297, "epoch": 1.11, "percentage": 55.47, "elapsed_time": "4:07:15", "remaining_time": "3:18:28"} +{"current_steps": 6000, "total_steps": 10798, "loss": 1.8982, "reward": null, "learning_rate": 0.0004134465283965568, "epoch": 1.11, "percentage": 55.57, "elapsed_time": "4:01:35", "remaining_time": "3:13:11"} +{"current_steps": 6000, "total_steps": 10798, "loss": 1.8982, "reward": null, "learning_rate": 0.0004134465283965568, "epoch": 1.11, "percentage": 55.57, "elapsed_time": "4:01:36", "remaining_time": "3:13:12"} +{"current_steps": 6000, "total_steps": 10798, "loss": 1.8982, "reward": null, "learning_rate": 0.0004134465283965568, "epoch": 1.11, "percentage": 55.57, "elapsed_time": "4:07:40", "remaining_time": "3:18:03"} +{"current_steps": 6000, "total_steps": 10798, "loss": 1.8982, "reward": null, "learning_rate": 0.0004134465283965568, "epoch": 1.11, "percentage": 55.57, "elapsed_time": "4:01:38", "remaining_time": "3:13:14"} +{"current_steps": 6010, "total_steps": 10798, "loss": 1.8978, "reward": null, "learning_rate": 0.00041201414802341643, "epoch": 1.11, "percentage": 55.66, "elapsed_time": "4:02:00", "remaining_time": "3:12:47"} +{"current_steps": 6010, "total_steps": 10798, "loss": 1.8978, "reward": null, "learning_rate": 0.00041201414802341643, "epoch": 1.11, "percentage": 55.66, "elapsed_time": "4:02:02", "remaining_time": "3:12:49"} +{"current_steps": 6010, "total_steps": 10798, "loss": 1.8978, "reward": null, "learning_rate": 0.00041201414802341643, "epoch": 1.11, "percentage": 55.66, "elapsed_time": "4:08:03", "remaining_time": "3:17:37"} +{"current_steps": 6010, "total_steps": 10798, "loss": 1.8978, "reward": null, "learning_rate": 0.00041201414802341643, "epoch": 1.11, "percentage": 55.66, "elapsed_time": "4:01:58", "remaining_time": "3:12:46"} +{"current_steps": 6020, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.00041058251242621295, "epoch": 1.12, "percentage": 55.75, "elapsed_time": "4:02:26", "remaining_time": "3:12:25"} +{"current_steps": 6020, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.00041058251242621295, "epoch": 1.12, "percentage": 55.75, "elapsed_time": "4:02:24", "remaining_time": "3:12:24"} +{"current_steps": 6020, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.00041058251242621295, "epoch": 1.12, "percentage": 55.75, "elapsed_time": "4:02:23", "remaining_time": "3:12:22"} +{"current_steps": 6020, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.00041058251242621295, "epoch": 1.12, "percentage": 55.75, "elapsed_time": "4:08:28", "remaining_time": "3:17:12"} +{"current_steps": 6030, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 0.0004091516337233464, "epoch": 1.12, "percentage": 55.84, "elapsed_time": "4:02:46", "remaining_time": "3:11:57"} +{"current_steps": 6030, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 0.0004091516337233464, "epoch": 1.12, "percentage": 55.84, "elapsed_time": "4:02:49", "remaining_time": "3:12:00"} +{"current_steps": 6030, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 0.0004091516337233464, "epoch": 1.12, "percentage": 55.84, "elapsed_time": "4:08:51", "remaining_time": "3:16:46"} +{"current_steps": 6030, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 0.0004091516337233464, "epoch": 1.12, "percentage": 55.84, "elapsed_time": "4:02:47", "remaining_time": "3:11:58"} +{"current_steps": 6040, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.00040772152402680973, "epoch": 1.12, "percentage": 55.94, "elapsed_time": "4:03:10", "remaining_time": "3:11:33"} +{"current_steps": 6040, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.00040772152402680973, "epoch": 1.12, "percentage": 55.94, "elapsed_time": "4:03:13", "remaining_time": "3:11:36"} +{"current_steps": 6040, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.00040772152402680973, "epoch": 1.12, "percentage": 55.94, "elapsed_time": "4:03:11", "remaining_time": "3:11:34"} +{"current_steps": 6040, "total_steps": 10798, "loss": 1.9897, "reward": null, "learning_rate": 0.00040772152402680973, "epoch": 1.12, "percentage": 55.94, "elapsed_time": "4:09:15", "remaining_time": "3:16:20"} +{"current_steps": 6050, "total_steps": 10798, "loss": 1.9473, "reward": null, "learning_rate": 0.00040629219544208644, "epoch": 1.12, "percentage": 56.03, "elapsed_time": "4:09:39", "remaining_time": "3:15:56"} +{"current_steps": 6050, "total_steps": 10798, "loss": 1.9473, "reward": null, "learning_rate": 0.00040629219544208644, "epoch": 1.12, "percentage": 56.03, "elapsed_time": "4:03:36", "remaining_time": "3:11:10"} +{"current_steps": 6050, "total_steps": 10798, "loss": 1.9473, "reward": null, "learning_rate": 0.00040629219544208644, "epoch": 1.12, "percentage": 56.03, "elapsed_time": "4:03:38", "remaining_time": "3:11:12"} +{"current_steps": 6050, "total_steps": 10798, "loss": 1.9473, "reward": null, "learning_rate": 0.00040629219544208644, "epoch": 1.12, "percentage": 56.03, "elapsed_time": "4:03:34", "remaining_time": "3:11:09"} +{"current_steps": 6060, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 0.00040486366006804817, "epoch": 1.12, "percentage": 56.12, "elapsed_time": "4:03:59", "remaining_time": "3:10:45"} +{"current_steps": 6060, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 0.00040486366006804817, "epoch": 1.12, "percentage": 56.12, "elapsed_time": "4:04:02", "remaining_time": "3:10:48"} +{"current_steps": 6060, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 0.00040486366006804817, "epoch": 1.12, "percentage": 56.12, "elapsed_time": "4:10:04", "remaining_time": "3:15:31"} +{"current_steps": 6060, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 0.00040486366006804817, "epoch": 1.12, "percentage": 56.12, "elapsed_time": "4:04:01", "remaining_time": "3:10:47"} +{"current_steps": 6070, "total_steps": 10798, "loss": 1.8972, "reward": null, "learning_rate": 0.00040343592999685264, "epoch": 1.12, "percentage": 56.21, "elapsed_time": "4:04:26", "remaining_time": "3:10:24"} +{"current_steps": 6070, "total_steps": 10798, "loss": 1.8972, "reward": null, "learning_rate": 0.00040343592999685264, "epoch": 1.12, "percentage": 56.21, "elapsed_time": "4:10:28", "remaining_time": "3:15:05"} +{"current_steps": 6070, "total_steps": 10798, "loss": 1.8972, "reward": null, "learning_rate": 0.00040343592999685264, "epoch": 1.12, "percentage": 56.21, "elapsed_time": "4:04:23", "remaining_time": "3:10:21"} +{"current_steps": 6070, "total_steps": 10798, "loss": 1.8972, "reward": null, "learning_rate": 0.00040343592999685264, "epoch": 1.12, "percentage": 56.21, "elapsed_time": "4:04:24", "remaining_time": "3:10:22"} +{"current_steps": 6080, "total_steps": 10798, "loss": 1.9611, "reward": null, "learning_rate": 0.0004020090173138404, "epoch": 1.13, "percentage": 56.31, "elapsed_time": "4:04:48", "remaining_time": "3:09:58"} +{"current_steps": 6080, "total_steps": 10798, "loss": 1.9611, "reward": null, "learning_rate": 0.0004020090173138404, "epoch": 1.13, "percentage": 56.31, "elapsed_time": "4:04:50", "remaining_time": "3:09:59"} +{"current_steps": 6080, "total_steps": 10798, "loss": 1.9611, "reward": null, "learning_rate": 0.0004020090173138404, "epoch": 1.13, "percentage": 56.31, "elapsed_time": "4:04:47", "remaining_time": "3:09:57"} +{"current_steps": 6080, "total_steps": 10798, "loss": 1.9611, "reward": null, "learning_rate": 0.0004020090173138404, "epoch": 1.13, "percentage": 56.31, "elapsed_time": "4:10:52", "remaining_time": "3:14:40"} +{"current_steps": 6090, "total_steps": 10798, "loss": 1.9164, "reward": null, "learning_rate": 0.00040058293409743316, "epoch": 1.13, "percentage": 56.4, "elapsed_time": "4:11:14", "remaining_time": "3:14:14"} +{"current_steps": 6090, "total_steps": 10798, "loss": 1.9164, "reward": null, "learning_rate": 0.00040058293409743316, "epoch": 1.13, "percentage": 56.4, "elapsed_time": "4:05:11", "remaining_time": "3:09:33"} +{"current_steps": 6090, "total_steps": 10798, "loss": 1.9164, "reward": null, "learning_rate": 0.00040058293409743316, "epoch": 1.13, "percentage": 56.4, "elapsed_time": "4:05:13", "remaining_time": "3:09:34"} +{"current_steps": 6090, "total_steps": 10798, "loss": 1.9164, "reward": null, "learning_rate": 0.00040058293409743316, "epoch": 1.13, "percentage": 56.4, "elapsed_time": "4:05:10", "remaining_time": "3:09:32"} +{"current_steps": 6100, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.00039915769241903175, "epoch": 1.13, "percentage": 56.49, "elapsed_time": "4:11:40", "remaining_time": "3:13:49"} +{"current_steps": 6100, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.00039915769241903175, "epoch": 1.13, "percentage": 56.49, "elapsed_time": "4:05:38", "remaining_time": "3:09:11"} +{"current_steps": 6100, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.00039915769241903175, "epoch": 1.13, "percentage": 56.49, "elapsed_time": "4:05:36", "remaining_time": "3:09:09"} +{"current_steps": 6100, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.00039915769241903175, "epoch": 1.13, "percentage": 56.49, "elapsed_time": "4:05:35", "remaining_time": "3:09:08"} +{"current_steps": 6110, "total_steps": 10798, "loss": 1.9233, "reward": null, "learning_rate": 0.0003977333043429129, "epoch": 1.13, "percentage": 56.58, "elapsed_time": "4:05:59", "remaining_time": "3:08:44"} +{"current_steps": 6110, "total_steps": 10798, "loss": 1.9233, "reward": null, "learning_rate": 0.0003977333043429129, "epoch": 1.13, "percentage": 56.58, "elapsed_time": "4:06:00", "remaining_time": "3:08:45"} +{"current_steps": 6110, "total_steps": 10798, "loss": 1.9233, "reward": null, "learning_rate": 0.0003977333043429129, "epoch": 1.13, "percentage": 56.58, "elapsed_time": "4:06:02", "remaining_time": "3:08:46"} +{"current_steps": 6110, "total_steps": 10798, "loss": 1.9233, "reward": null, "learning_rate": 0.0003977333043429129, "epoch": 1.13, "percentage": 56.58, "elapsed_time": "4:12:04", "remaining_time": "3:13:24"} +{"current_steps": 6120, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0003963097819261288, "epoch": 1.13, "percentage": 56.68, "elapsed_time": "4:12:28", "remaining_time": "3:12:59"} +{"current_steps": 6120, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0003963097819261288, "epoch": 1.13, "percentage": 56.68, "elapsed_time": "4:06:27", "remaining_time": "3:08:22"} +{"current_steps": 6120, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0003963097819261288, "epoch": 1.13, "percentage": 56.68, "elapsed_time": "4:06:23", "remaining_time": "3:08:20"} +{"current_steps": 6120, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0003963097819261288, "epoch": 1.13, "percentage": 56.68, "elapsed_time": "4:06:25", "remaining_time": "3:08:21"} +{"current_steps": 6130, "total_steps": 10798, "loss": 1.9719, "reward": null, "learning_rate": 0.0003948871372184033, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "4:06:48", "remaining_time": "3:07:56"} +{"current_steps": 6130, "total_steps": 10798, "loss": 1.9719, "reward": null, "learning_rate": 0.0003948871372184033, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "4:06:51", "remaining_time": "3:07:58"} +{"current_steps": 6130, "total_steps": 10798, "loss": 1.9719, "reward": null, "learning_rate": 0.0003948871372184033, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "4:06:49", "remaining_time": "3:07:57"} +{"current_steps": 6130, "total_steps": 10798, "loss": 1.9719, "reward": null, "learning_rate": 0.0003948871372184033, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "4:12:52", "remaining_time": "3:12:34"} +{"current_steps": 6140, "total_steps": 10798, "loss": 1.9861, "reward": null, "learning_rate": 0.0003934653822620309, "epoch": 1.14, "percentage": 56.86, "elapsed_time": "4:07:12", "remaining_time": "3:07:32"} +{"current_steps": 6140, "total_steps": 10798, "loss": 1.9861, "reward": null, "learning_rate": 0.0003934653822620309, "epoch": 1.14, "percentage": 56.86, "elapsed_time": "4:07:15", "remaining_time": "3:07:35"} +{"current_steps": 6140, "total_steps": 10798, "loss": 1.9861, "reward": null, "learning_rate": 0.0003934653822620309, "epoch": 1.14, "percentage": 56.86, "elapsed_time": "4:13:17", "remaining_time": "3:12:09"} +{"current_steps": 6140, "total_steps": 10798, "loss": 1.9861, "reward": null, "learning_rate": 0.0003934653822620309, "epoch": 1.14, "percentage": 56.86, "elapsed_time": "4:07:14", "remaining_time": "3:07:33"} +{"current_steps": 6150, "total_steps": 10798, "loss": 1.9514, "reward": null, "learning_rate": 0.0003920445290917747, "epoch": 1.14, "percentage": 56.95, "elapsed_time": "4:13:43", "remaining_time": "3:11:45"} +{"current_steps": 6150, "total_steps": 10798, "loss": 1.9514, "reward": null, "learning_rate": 0.0003920445290917747, "epoch": 1.14, "percentage": 56.95, "elapsed_time": "4:07:39", "remaining_time": "3:07:10"} +{"current_steps": 6150, "total_steps": 10798, "loss": 1.9514, "reward": null, "learning_rate": 0.0003920445290917747, "epoch": 1.14, "percentage": 56.95, "elapsed_time": "4:07:41", "remaining_time": "3:07:11"} +{"current_steps": 6150, "total_steps": 10798, "loss": 1.9514, "reward": null, "learning_rate": 0.0003920445290917747, "epoch": 1.14, "percentage": 56.95, "elapsed_time": "4:07:38", "remaining_time": "3:07:09"} +{"current_steps": 6160, "total_steps": 10798, "loss": 2.0047, "reward": null, "learning_rate": 0.0003906245897347643, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "4:14:07", "remaining_time": "3:11:19"} +{"current_steps": 6160, "total_steps": 10798, "loss": 2.0047, "reward": null, "learning_rate": 0.0003906245897347643, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "4:08:02", "remaining_time": "3:06:45"} +{"current_steps": 6160, "total_steps": 10798, "loss": 2.0047, "reward": null, "learning_rate": 0.0003906245897347643, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "4:08:03", "remaining_time": "3:06:46"} +{"current_steps": 6160, "total_steps": 10798, "loss": 2.0047, "reward": null, "learning_rate": 0.0003906245897347643, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "4:08:05", "remaining_time": "3:06:47"} +{"current_steps": 6170, "total_steps": 10798, "loss": 1.934, "reward": null, "learning_rate": 0.0003892055762103943, "epoch": 1.14, "percentage": 57.14, "elapsed_time": "4:08:25", "remaining_time": "3:06:20"} +{"current_steps": 6170, "total_steps": 10798, "loss": 1.934, "reward": null, "learning_rate": 0.0003892055762103943, "epoch": 1.14, "percentage": 57.14, "elapsed_time": "4:14:30", "remaining_time": "3:10:54"} +{"current_steps": 6170, "total_steps": 10798, "loss": 1.934, "reward": null, "learning_rate": 0.0003892055762103943, "epoch": 1.14, "percentage": 57.14, "elapsed_time": "4:08:29", "remaining_time": "3:06:23"} +{"current_steps": 6170, "total_steps": 10798, "loss": 1.934, "reward": null, "learning_rate": 0.0003892055762103943, "epoch": 1.14, "percentage": 57.14, "elapsed_time": "4:08:27", "remaining_time": "3:06:21"} +{"current_steps": 6180, "total_steps": 10798, "loss": 1.9619, "reward": null, "learning_rate": 0.0003877875005302223, "epoch": 1.14, "percentage": 57.23, "elapsed_time": "4:08:52", "remaining_time": "3:05:58"} +{"current_steps": 6180, "total_steps": 10798, "loss": 1.9619, "reward": null, "learning_rate": 0.0003877875005302223, "epoch": 1.14, "percentage": 57.23, "elapsed_time": "4:14:54", "remaining_time": "3:10:28"} +{"current_steps": 6180, "total_steps": 10798, "loss": 1.9619, "reward": null, "learning_rate": 0.0003877875005302223, "epoch": 1.14, "percentage": 57.23, "elapsed_time": "4:08:51", "remaining_time": "3:05:57"} +{"current_steps": 6180, "total_steps": 10798, "loss": 1.9619, "reward": null, "learning_rate": 0.0003877875005302223, "epoch": 1.14, "percentage": 57.23, "elapsed_time": "4:08:49", "remaining_time": "3:05:56"} +{"current_steps": 6190, "total_steps": 10798, "loss": 1.9085, "reward": null, "learning_rate": 0.00038637037469786727, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "4:15:18", "remaining_time": "3:10:03"} +{"current_steps": 6190, "total_steps": 10798, "loss": 1.9085, "reward": null, "learning_rate": 0.00038637037469786727, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "4:09:13", "remaining_time": "3:05:32"} +{"current_steps": 6190, "total_steps": 10798, "loss": 1.9085, "reward": null, "learning_rate": 0.00038637037469786727, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "4:09:17", "remaining_time": "3:05:34"} +{"current_steps": 6190, "total_steps": 10798, "loss": 1.9085, "reward": null, "learning_rate": 0.00038637037469786727, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "4:09:15", "remaining_time": "3:05:33"} +{"current_steps": 6200, "total_steps": 10798, "loss": 1.9222, "reward": null, "learning_rate": 0.00038495421070890796, "epoch": 1.15, "percentage": 57.42, "elapsed_time": "4:09:38", "remaining_time": "3:05:08"} +{"current_steps": 6200, "total_steps": 10798, "loss": 1.9222, "reward": null, "learning_rate": 0.00038495421070890796, "epoch": 1.15, "percentage": 57.42, "elapsed_time": "4:09:41", "remaining_time": "3:05:10"} +{"current_steps": 6200, "total_steps": 10798, "loss": 1.9222, "reward": null, "learning_rate": 0.00038495421070890796, "epoch": 1.15, "percentage": 57.42, "elapsed_time": "4:09:40", "remaining_time": "3:05:09"} +{"current_steps": 6200, "total_steps": 10798, "loss": 1.9222, "reward": null, "learning_rate": 0.00038495421070890796, "epoch": 1.15, "percentage": 57.42, "elapsed_time": "4:15:43", "remaining_time": "3:09:38"} +{"current_steps": 6210, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.0003835390205507812, "epoch": 1.15, "percentage": 57.51, "elapsed_time": "4:10:03", "remaining_time": "3:04:44"} +{"current_steps": 6210, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.0003835390205507812, "epoch": 1.15, "percentage": 57.51, "elapsed_time": "4:16:06", "remaining_time": "3:09:13"} +{"current_steps": 6210, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.0003835390205507812, "epoch": 1.15, "percentage": 57.51, "elapsed_time": "4:10:05", "remaining_time": "3:04:46"} +{"current_steps": 6210, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.0003835390205507812, "epoch": 1.15, "percentage": 57.51, "elapsed_time": "4:10:02", "remaining_time": "3:04:43"} +{"current_steps": 6220, "total_steps": 10798, "loss": 1.9439, "reward": null, "learning_rate": 0.00038212481620268125, "epoch": 1.15, "percentage": 57.6, "elapsed_time": "4:10:29", "remaining_time": "3:04:22"} +{"current_steps": 6220, "total_steps": 10798, "loss": 1.9439, "reward": null, "learning_rate": 0.00038212481620268125, "epoch": 1.15, "percentage": 57.6, "elapsed_time": "4:10:28", "remaining_time": "3:04:20"} +{"current_steps": 6220, "total_steps": 10798, "loss": 1.9439, "reward": null, "learning_rate": 0.00038212481620268125, "epoch": 1.15, "percentage": 57.6, "elapsed_time": "4:16:31", "remaining_time": "3:08:48"} +{"current_steps": 6220, "total_steps": 10798, "loss": 1.9439, "reward": null, "learning_rate": 0.00038212481620268125, "epoch": 1.15, "percentage": 57.6, "elapsed_time": "4:10:26", "remaining_time": "3:04:19"} +{"current_steps": 6230, "total_steps": 10798, "loss": 1.974, "reward": null, "learning_rate": 0.000380711609635457, "epoch": 1.15, "percentage": 57.7, "elapsed_time": "4:16:54", "remaining_time": "3:08:22"} +{"current_steps": 6230, "total_steps": 10798, "loss": 1.974, "reward": null, "learning_rate": 0.000380711609635457, "epoch": 1.15, "percentage": 57.7, "elapsed_time": "4:10:49", "remaining_time": "3:03:54"} +{"current_steps": 6230, "total_steps": 10798, "loss": 1.974, "reward": null, "learning_rate": 0.000380711609635457, "epoch": 1.15, "percentage": 57.7, "elapsed_time": "4:10:51", "remaining_time": "3:03:55"} +{"current_steps": 6230, "total_steps": 10798, "loss": 1.974, "reward": null, "learning_rate": 0.000380711609635457, "epoch": 1.15, "percentage": 57.7, "elapsed_time": "4:10:52", "remaining_time": "3:03:57"} +{"current_steps": 6240, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 0.000379299412811512, "epoch": 1.16, "percentage": 57.79, "elapsed_time": "4:11:16", "remaining_time": "3:03:32"} +{"current_steps": 6240, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 0.000379299412811512, "epoch": 1.16, "percentage": 57.79, "elapsed_time": "4:11:14", "remaining_time": "3:03:31"} +{"current_steps": 6240, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 0.000379299412811512, "epoch": 1.16, "percentage": 57.79, "elapsed_time": "4:17:18", "remaining_time": "3:07:56"} +{"current_steps": 6240, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 0.000379299412811512, "epoch": 1.16, "percentage": 57.79, "elapsed_time": "4:11:13", "remaining_time": "3:03:30"} +{"current_steps": 6250, "total_steps": 10798, "loss": 1.8982, "reward": null, "learning_rate": 0.00037788823768470227, "epoch": 1.16, "percentage": 57.88, "elapsed_time": "4:17:42", "remaining_time": "3:07:31"} +{"current_steps": 6250, "total_steps": 10798, "loss": 1.8982, "reward": null, "learning_rate": 0.00037788823768470227, "epoch": 1.16, "percentage": 57.88, "elapsed_time": "4:11:37", "remaining_time": "3:03:06"} +{"current_steps": 6250, "total_steps": 10798, "loss": 1.8982, "reward": null, "learning_rate": 0.00037788823768470227, "epoch": 1.16, "percentage": 57.88, "elapsed_time": "4:11:41", "remaining_time": "3:03:08"} +{"current_steps": 6250, "total_steps": 10798, "loss": 1.8982, "reward": null, "learning_rate": 0.00037788823768470227, "epoch": 1.16, "percentage": 57.88, "elapsed_time": "4:11:39", "remaining_time": "3:03:07"} +{"current_steps": 6260, "total_steps": 10798, "loss": 1.9384, "reward": null, "learning_rate": 0.0003764780962002352, "epoch": 1.16, "percentage": 57.97, "elapsed_time": "4:12:01", "remaining_time": "3:02:41"} +{"current_steps": 6260, "total_steps": 10798, "loss": 1.9384, "reward": null, "learning_rate": 0.0003764780962002352, "epoch": 1.16, "percentage": 57.97, "elapsed_time": "4:18:06", "remaining_time": "3:07:06"} +{"current_steps": 6260, "total_steps": 10798, "loss": 1.9384, "reward": null, "learning_rate": 0.0003764780962002352, "epoch": 1.16, "percentage": 57.97, "elapsed_time": "4:12:04", "remaining_time": "3:02:44"} +{"current_steps": 6260, "total_steps": 10798, "loss": 1.9384, "reward": null, "learning_rate": 0.0003764780962002352, "epoch": 1.16, "percentage": 57.97, "elapsed_time": "4:12:02", "remaining_time": "3:02:42"} +{"current_steps": 6270, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 0.0003750690002945695, "epoch": 1.16, "percentage": 58.07, "elapsed_time": "4:12:27", "remaining_time": "3:02:18"} +{"current_steps": 6270, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 0.0003750690002945695, "epoch": 1.16, "percentage": 58.07, "elapsed_time": "4:12:25", "remaining_time": "3:02:17"} +{"current_steps": 6270, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 0.0003750690002945695, "epoch": 1.16, "percentage": 58.07, "elapsed_time": "4:18:30", "remaining_time": "3:06:41"} +{"current_steps": 6270, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 0.0003750690002945695, "epoch": 1.16, "percentage": 58.07, "elapsed_time": "4:12:28", "remaining_time": "3:02:19"} +{"current_steps": 6280, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 0.00037366096189531253, "epoch": 1.16, "percentage": 58.16, "elapsed_time": "4:18:53", "remaining_time": "3:06:15"} +{"current_steps": 6280, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 0.00037366096189531253, "epoch": 1.16, "percentage": 58.16, "elapsed_time": "4:12:52", "remaining_time": "3:01:55"} +{"current_steps": 6280, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 0.00037366096189531253, "epoch": 1.16, "percentage": 58.16, "elapsed_time": "4:12:50", "remaining_time": "3:01:54"} +{"current_steps": 6280, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 0.00037366096189531253, "epoch": 1.16, "percentage": 58.16, "elapsed_time": "4:12:49", "remaining_time": "3:01:53"} +{"current_steps": 6290, "total_steps": 10798, "loss": 1.9449, "reward": null, "learning_rate": 0.0003722539929211205, "epoch": 1.17, "percentage": 58.25, "elapsed_time": "4:13:14", "remaining_time": "3:01:29"} +{"current_steps": 6290, "total_steps": 10798, "loss": 1.9449, "reward": null, "learning_rate": 0.0003722539929211205, "epoch": 1.17, "percentage": 58.25, "elapsed_time": "4:19:19", "remaining_time": "3:05:51"} +{"current_steps": 6290, "total_steps": 10798, "loss": 1.9449, "reward": null, "learning_rate": 0.0003722539929211205, "epoch": 1.17, "percentage": 58.25, "elapsed_time": "4:13:15", "remaining_time": "3:01:30"} +{"current_steps": 6290, "total_steps": 10798, "loss": 1.9449, "reward": null, "learning_rate": 0.0003722539929211205, "epoch": 1.17, "percentage": 58.25, "elapsed_time": "4:13:17", "remaining_time": "3:01:32"} +{"current_steps": 6300, "total_steps": 10798, "loss": 2.008, "reward": null, "learning_rate": 0.0003708481052815973, "epoch": 1.17, "percentage": 58.34, "elapsed_time": "4:19:42", "remaining_time": "3:05:25"} +{"current_steps": 6300, "total_steps": 10798, "loss": 2.008, "reward": null, "learning_rate": 0.0003708481052815973, "epoch": 1.17, "percentage": 58.34, "elapsed_time": "4:13:37", "remaining_time": "3:01:04"} +{"current_steps": 6300, "total_steps": 10798, "loss": 2.008, "reward": null, "learning_rate": 0.0003708481052815973, "epoch": 1.17, "percentage": 58.34, "elapsed_time": "4:13:38", "remaining_time": "3:01:05"} +{"current_steps": 6300, "total_steps": 10798, "loss": 2.008, "reward": null, "learning_rate": 0.0003708481052815973, "epoch": 1.17, "percentage": 58.34, "elapsed_time": "4:13:40", "remaining_time": "3:01:07"} +{"current_steps": 6310, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.0003694433108771933, "epoch": 1.17, "percentage": 58.44, "elapsed_time": "4:14:03", "remaining_time": "3:00:42"} +{"current_steps": 6310, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.0003694433108771933, "epoch": 1.17, "percentage": 58.44, "elapsed_time": "4:14:02", "remaining_time": "3:00:40"} +{"current_steps": 6310, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.0003694433108771933, "epoch": 1.17, "percentage": 58.44, "elapsed_time": "4:20:06", "remaining_time": "3:05:00"} +{"current_steps": 6310, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.0003694433108771933, "epoch": 1.17, "percentage": 58.44, "elapsed_time": "4:14:05", "remaining_time": "3:00:43"} +{"current_steps": 6320, "total_steps": 10798, "loss": 1.8619, "reward": null, "learning_rate": 0.00036803962159910543, "epoch": 1.17, "percentage": 58.53, "elapsed_time": "4:14:29", "remaining_time": "3:00:19"} +{"current_steps": 6320, "total_steps": 10798, "loss": 1.8619, "reward": null, "learning_rate": 0.00036803962159910543, "epoch": 1.17, "percentage": 58.53, "elapsed_time": "4:20:31", "remaining_time": "3:04:35"} +{"current_steps": 6320, "total_steps": 10798, "loss": 1.8619, "reward": null, "learning_rate": 0.00036803962159910543, "epoch": 1.17, "percentage": 58.53, "elapsed_time": "4:14:26", "remaining_time": "3:00:16"} +{"current_steps": 6320, "total_steps": 10798, "loss": 1.8619, "reward": null, "learning_rate": 0.00036803962159910543, "epoch": 1.17, "percentage": 58.53, "elapsed_time": "4:14:28", "remaining_time": "3:00:18"} +{"current_steps": 6330, "total_steps": 10798, "loss": 1.9612, "reward": null, "learning_rate": 0.0003666370493291757, "epoch": 1.17, "percentage": 58.62, "elapsed_time": "4:14:54", "remaining_time": "2:59:55"} +{"current_steps": 6330, "total_steps": 10798, "loss": 1.9612, "reward": null, "learning_rate": 0.0003666370493291757, "epoch": 1.17, "percentage": 58.62, "elapsed_time": "4:14:53", "remaining_time": "2:59:54"} +{"current_steps": 6330, "total_steps": 10798, "loss": 1.9612, "reward": null, "learning_rate": 0.0003666370493291757, "epoch": 1.17, "percentage": 58.62, "elapsed_time": "4:14:51", "remaining_time": "2:59:53"} +{"current_steps": 6330, "total_steps": 10798, "loss": 1.9612, "reward": null, "learning_rate": 0.0003666370493291757, "epoch": 1.17, "percentage": 58.62, "elapsed_time": "4:20:56", "remaining_time": "3:04:10"} +{"current_steps": 6340, "total_steps": 10798, "loss": 1.9371, "reward": null, "learning_rate": 0.0003652356059397909, "epoch": 1.17, "percentage": 58.71, "elapsed_time": "4:15:15", "remaining_time": "2:59:29"} +{"current_steps": 6340, "total_steps": 10798, "loss": 1.9371, "reward": null, "learning_rate": 0.0003652356059397909, "epoch": 1.17, "percentage": 58.71, "elapsed_time": "4:21:20", "remaining_time": "3:03:45"} +{"current_steps": 6340, "total_steps": 10798, "loss": 1.9371, "reward": null, "learning_rate": 0.0003652356059397909, "epoch": 1.17, "percentage": 58.71, "elapsed_time": "4:15:17", "remaining_time": "2:59:30"} +{"current_steps": 6340, "total_steps": 10798, "loss": 1.9371, "reward": null, "learning_rate": 0.0003652356059397909, "epoch": 1.17, "percentage": 58.71, "elapsed_time": "4:15:19", "remaining_time": "2:59:31"} +{"current_steps": 6350, "total_steps": 10798, "loss": 1.9193, "reward": null, "learning_rate": 0.00036383530329378225, "epoch": 1.18, "percentage": 58.81, "elapsed_time": "4:15:41", "remaining_time": "2:59:06"} +{"current_steps": 6350, "total_steps": 10798, "loss": 1.9193, "reward": null, "learning_rate": 0.00036383530329378225, "epoch": 1.18, "percentage": 58.81, "elapsed_time": "4:15:42", "remaining_time": "2:59:07"} +{"current_steps": 6350, "total_steps": 10798, "loss": 1.9193, "reward": null, "learning_rate": 0.00036383530329378225, "epoch": 1.18, "percentage": 58.81, "elapsed_time": "4:15:44", "remaining_time": "2:59:08"} +{"current_steps": 6350, "total_steps": 10798, "loss": 1.9193, "reward": null, "learning_rate": 0.00036383530329378225, "epoch": 1.18, "percentage": 58.81, "elapsed_time": "4:21:46", "remaining_time": "3:03:21"} +{"current_steps": 6360, "total_steps": 10798, "loss": 1.9509, "reward": null, "learning_rate": 0.00036243615324432494, "epoch": 1.18, "percentage": 58.9, "elapsed_time": "4:16:05", "remaining_time": "2:58:41"} +{"current_steps": 6360, "total_steps": 10798, "loss": 1.9509, "reward": null, "learning_rate": 0.00036243615324432494, "epoch": 1.18, "percentage": 58.9, "elapsed_time": "4:16:06", "remaining_time": "2:58:42"} +{"current_steps": 6360, "total_steps": 10798, "loss": 1.9509, "reward": null, "learning_rate": 0.00036243615324432494, "epoch": 1.18, "percentage": 58.9, "elapsed_time": "4:16:08", "remaining_time": "2:58:44"} +{"current_steps": 6360, "total_steps": 10798, "loss": 1.9509, "reward": null, "learning_rate": 0.00036243615324432494, "epoch": 1.18, "percentage": 58.9, "elapsed_time": "4:22:10", "remaining_time": "3:02:56"} +{"current_steps": 6370, "total_steps": 10798, "loss": 1.9517, "reward": null, "learning_rate": 0.00036103816763483775, "epoch": 1.18, "percentage": 58.99, "elapsed_time": "4:16:33", "remaining_time": "2:58:20"} +{"current_steps": 6370, "total_steps": 10798, "loss": 1.9517, "reward": null, "learning_rate": 0.00036103816763483775, "epoch": 1.18, "percentage": 58.99, "elapsed_time": "4:22:34", "remaining_time": "3:02:31"} +{"current_steps": 6370, "total_steps": 10798, "loss": 1.9517, "reward": null, "learning_rate": 0.00036103816763483775, "epoch": 1.18, "percentage": 58.99, "elapsed_time": "4:16:31", "remaining_time": "2:58:19"} +{"current_steps": 6370, "total_steps": 10798, "loss": 1.9517, "reward": null, "learning_rate": 0.00036103816763483775, "epoch": 1.18, "percentage": 58.99, "elapsed_time": "4:16:29", "remaining_time": "2:58:17"} +{"current_steps": 6380, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 0.00035964135829888287, "epoch": 1.18, "percentage": 59.09, "elapsed_time": "4:16:58", "remaining_time": "2:57:56"} +{"current_steps": 6380, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 0.00035964135829888287, "epoch": 1.18, "percentage": 59.09, "elapsed_time": "4:22:59", "remaining_time": "3:02:07"} +{"current_steps": 6380, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 0.00035964135829888287, "epoch": 1.18, "percentage": 59.09, "elapsed_time": "4:16:56", "remaining_time": "2:57:55"} +{"current_steps": 6380, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 0.00035964135829888287, "epoch": 1.18, "percentage": 59.09, "elapsed_time": "4:16:54", "remaining_time": "2:57:54"} +{"current_steps": 6390, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.00035824573706006547, "epoch": 1.18, "percentage": 59.18, "elapsed_time": "4:17:21", "remaining_time": "2:57:32"} +{"current_steps": 6390, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.00035824573706006547, "epoch": 1.18, "percentage": 59.18, "elapsed_time": "4:23:25", "remaining_time": "3:01:42"} +{"current_steps": 6390, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.00035824573706006547, "epoch": 1.18, "percentage": 59.18, "elapsed_time": "4:17:23", "remaining_time": "2:57:33"} +{"current_steps": 6390, "total_steps": 10798, "loss": 1.9985, "reward": null, "learning_rate": 0.00035824573706006547, "epoch": 1.18, "percentage": 59.18, "elapsed_time": "4:17:20", "remaining_time": "2:57:31"} +{"current_steps": 6400, "total_steps": 10798, "loss": 1.9791, "reward": null, "learning_rate": 0.00035685131573193386, "epoch": 1.19, "percentage": 59.27, "elapsed_time": "4:23:49", "remaining_time": "3:01:17"} +{"current_steps": 6400, "total_steps": 10798, "loss": 1.9791, "reward": null, "learning_rate": 0.00035685131573193386, "epoch": 1.19, "percentage": 59.27, "elapsed_time": "4:17:44", "remaining_time": "2:57:06"} +{"current_steps": 6400, "total_steps": 10798, "loss": 1.9791, "reward": null, "learning_rate": 0.00035685131573193386, "epoch": 1.19, "percentage": 59.27, "elapsed_time": "4:17:47", "remaining_time": "2:57:09"} +{"current_steps": 6400, "total_steps": 10798, "loss": 1.9791, "reward": null, "learning_rate": 0.00035685131573193386, "epoch": 1.19, "percentage": 59.27, "elapsed_time": "4:17:45", "remaining_time": "2:57:07"} +{"current_steps": 6410, "total_steps": 10798, "loss": 1.8865, "reward": null, "learning_rate": 0.00035545810611787925, "epoch": 1.19, "percentage": 59.36, "elapsed_time": "4:24:13", "remaining_time": "3:00:52"} +{"current_steps": 6410, "total_steps": 10798, "loss": 1.8865, "reward": null, "learning_rate": 0.00035545810611787925, "epoch": 1.19, "percentage": 59.36, "elapsed_time": "4:18:08", "remaining_time": "2:56:42"} +{"current_steps": 6410, "total_steps": 10798, "loss": 1.8865, "reward": null, "learning_rate": 0.00035545810611787925, "epoch": 1.19, "percentage": 59.36, "elapsed_time": "4:18:09", "remaining_time": "2:56:43"} +{"current_steps": 6410, "total_steps": 10798, "loss": 1.8865, "reward": null, "learning_rate": 0.00035545810611787925, "epoch": 1.19, "percentage": 59.36, "elapsed_time": "4:18:11", "remaining_time": "2:56:44"} +{"current_steps": 6420, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.0003540661200110367, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "4:18:33", "remaining_time": "2:56:19"} +{"current_steps": 6420, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.0003540661200110367, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "4:18:36", "remaining_time": "2:56:21"} +{"current_steps": 6420, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.0003540661200110367, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "4:24:38", "remaining_time": "3:00:27"} +{"current_steps": 6420, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.0003540661200110367, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "4:18:34", "remaining_time": "2:56:20"} +{"current_steps": 6430, "total_steps": 10798, "loss": 1.9928, "reward": null, "learning_rate": 0.00035267536919418395, "epoch": 1.19, "percentage": 59.55, "elapsed_time": "4:18:58", "remaining_time": "2:55:55"} +{"current_steps": 6430, "total_steps": 10798, "loss": 1.9928, "reward": null, "learning_rate": 0.00035267536919418395, "epoch": 1.19, "percentage": 59.55, "elapsed_time": "4:18:56", "remaining_time": "2:55:54"} +{"current_steps": 6430, "total_steps": 10798, "loss": 1.9928, "reward": null, "learning_rate": 0.00035267536919418395, "epoch": 1.19, "percentage": 59.55, "elapsed_time": "4:19:00", "remaining_time": "2:55:56"} +{"current_steps": 6430, "total_steps": 10798, "loss": 1.9928, "reward": null, "learning_rate": 0.00035267536919418395, "epoch": 1.19, "percentage": 59.55, "elapsed_time": "4:25:01", "remaining_time": "3:00:02"} +{"current_steps": 6440, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 0.00035128586543964243, "epoch": 1.19, "percentage": 59.64, "elapsed_time": "4:25:25", "remaining_time": "2:59:36"} +{"current_steps": 6440, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 0.00035128586543964243, "epoch": 1.19, "percentage": 59.64, "elapsed_time": "4:19:23", "remaining_time": "2:55:32"} +{"current_steps": 6440, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 0.00035128586543964243, "epoch": 1.19, "percentage": 59.64, "elapsed_time": "4:19:20", "remaining_time": "2:55:29"} +{"current_steps": 6440, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 0.00035128586543964243, "epoch": 1.19, "percentage": 59.64, "elapsed_time": "4:19:22", "remaining_time": "2:55:30"} +{"current_steps": 6450, "total_steps": 10798, "loss": 1.9837, "reward": null, "learning_rate": 0.00034989762050917784, "epoch": 1.19, "percentage": 59.73, "elapsed_time": "4:19:48", "remaining_time": "2:55:08"} +{"current_steps": 6450, "total_steps": 10798, "loss": 1.9837, "reward": null, "learning_rate": 0.00034989762050917784, "epoch": 1.19, "percentage": 59.73, "elapsed_time": "4:19:44", "remaining_time": "2:55:05"} +{"current_steps": 6450, "total_steps": 10798, "loss": 1.9837, "reward": null, "learning_rate": 0.00034989762050917784, "epoch": 1.19, "percentage": 59.73, "elapsed_time": "4:19:46", "remaining_time": "2:55:06"} +{"current_steps": 6450, "total_steps": 10798, "loss": 1.9837, "reward": null, "learning_rate": 0.00034989762050917784, "epoch": 1.19, "percentage": 59.73, "elapsed_time": "4:25:49", "remaining_time": "2:59:11"} +{"current_steps": 6460, "total_steps": 10798, "loss": 1.9142, "reward": null, "learning_rate": 0.0003485106461538999, "epoch": 1.2, "percentage": 59.83, "elapsed_time": "4:26:15", "remaining_time": "2:58:47"} +{"current_steps": 6460, "total_steps": 10798, "loss": 1.9142, "reward": null, "learning_rate": 0.0003485106461538999, "epoch": 1.2, "percentage": 59.83, "elapsed_time": "4:20:13", "remaining_time": "2:54:44"} +{"current_steps": 6460, "total_steps": 10798, "loss": 1.9142, "reward": null, "learning_rate": 0.0003485106461538999, "epoch": 1.2, "percentage": 59.83, "elapsed_time": "4:20:12", "remaining_time": "2:54:43"} +{"current_steps": 6460, "total_steps": 10798, "loss": 1.9142, "reward": null, "learning_rate": 0.0003485106461538999, "epoch": 1.2, "percentage": 59.83, "elapsed_time": "4:20:10", "remaining_time": "2:54:42"} +{"current_steps": 6470, "total_steps": 10798, "loss": 1.9284, "reward": null, "learning_rate": 0.00034712495411416385, "epoch": 1.2, "percentage": 59.92, "elapsed_time": "4:20:37", "remaining_time": "2:54:20"} +{"current_steps": 6470, "total_steps": 10798, "loss": 1.9284, "reward": null, "learning_rate": 0.00034712495411416385, "epoch": 1.2, "percentage": 59.92, "elapsed_time": "4:26:40", "remaining_time": "2:58:23"} +{"current_steps": 6470, "total_steps": 10798, "loss": 1.9284, "reward": null, "learning_rate": 0.00034712495411416385, "epoch": 1.2, "percentage": 59.92, "elapsed_time": "4:20:38", "remaining_time": "2:54:21"} +{"current_steps": 6470, "total_steps": 10798, "loss": 1.9284, "reward": null, "learning_rate": 0.00034712495411416385, "epoch": 1.2, "percentage": 59.92, "elapsed_time": "4:20:35", "remaining_time": "2:54:19"} +{"current_steps": 6480, "total_steps": 10798, "loss": 1.8848, "reward": null, "learning_rate": 0.00034574055611946984, "epoch": 1.2, "percentage": 60.01, "elapsed_time": "4:27:05", "remaining_time": "2:57:58"} +{"current_steps": 6480, "total_steps": 10798, "loss": 1.8848, "reward": null, "learning_rate": 0.00034574055611946984, "epoch": 1.2, "percentage": 60.01, "elapsed_time": "4:21:00", "remaining_time": "2:53:55"} +{"current_steps": 6480, "total_steps": 10798, "loss": 1.8848, "reward": null, "learning_rate": 0.00034574055611946984, "epoch": 1.2, "percentage": 60.01, "elapsed_time": "4:21:03", "remaining_time": "2:53:57"} +{"current_steps": 6480, "total_steps": 10798, "loss": 1.8848, "reward": null, "learning_rate": 0.00034574055611946984, "epoch": 1.2, "percentage": 60.01, "elapsed_time": "4:21:01", "remaining_time": "2:53:56"} +{"current_steps": 6490, "total_steps": 10798, "loss": 1.9295, "reward": null, "learning_rate": 0.00034435746388836457, "epoch": 1.2, "percentage": 60.1, "elapsed_time": "4:27:29", "remaining_time": "2:57:33"} +{"current_steps": 6490, "total_steps": 10798, "loss": 1.9295, "reward": null, "learning_rate": 0.00034435746388836457, "epoch": 1.2, "percentage": 60.1, "elapsed_time": "4:21:24", "remaining_time": "2:53:31"} +{"current_steps": 6490, "total_steps": 10798, "loss": 1.9295, "reward": null, "learning_rate": 0.00034435746388836457, "epoch": 1.2, "percentage": 60.1, "elapsed_time": "4:21:25", "remaining_time": "2:53:32"} +{"current_steps": 6490, "total_steps": 10798, "loss": 1.9295, "reward": null, "learning_rate": 0.00034435746388836457, "epoch": 1.2, "percentage": 60.1, "elapsed_time": "4:21:27", "remaining_time": "2:53:33"} +{"current_steps": 6500, "total_steps": 10798, "loss": 1.9635, "reward": null, "learning_rate": 0.00034297568912834177, "epoch": 1.2, "percentage": 60.2, "elapsed_time": "4:21:51", "remaining_time": "2:53:09"} +{"current_steps": 6500, "total_steps": 10798, "loss": 1.9635, "reward": null, "learning_rate": 0.00034297568912834177, "epoch": 1.2, "percentage": 60.2, "elapsed_time": "4:21:50", "remaining_time": "2:53:08"} +{"current_steps": 6500, "total_steps": 10798, "loss": 1.9635, "reward": null, "learning_rate": 0.00034297568912834177, "epoch": 1.2, "percentage": 60.2, "elapsed_time": "4:21:48", "remaining_time": "2:53:07"} +{"current_steps": 6500, "total_steps": 10798, "loss": 1.9635, "reward": null, "learning_rate": 0.00034297568912834177, "epoch": 1.2, "percentage": 60.2, "elapsed_time": "4:27:53", "remaining_time": "2:57:08"} +{"current_steps": 6510, "total_steps": 10798, "loss": 1.9794, "reward": null, "learning_rate": 0.0003415952435357431, "epoch": 1.21, "percentage": 60.29, "elapsed_time": "4:28:17", "remaining_time": "2:56:43"} +{"current_steps": 6510, "total_steps": 10798, "loss": 1.9794, "reward": null, "learning_rate": 0.0003415952435357431, "epoch": 1.21, "percentage": 60.29, "elapsed_time": "4:22:13", "remaining_time": "2:52:43"} +{"current_steps": 6510, "total_steps": 10798, "loss": 1.9794, "reward": null, "learning_rate": 0.0003415952435357431, "epoch": 1.21, "percentage": 60.29, "elapsed_time": "4:22:16", "remaining_time": "2:52:45"} +{"current_steps": 6510, "total_steps": 10798, "loss": 1.9794, "reward": null, "learning_rate": 0.0003415952435357431, "epoch": 1.21, "percentage": 60.29, "elapsed_time": "4:22:14", "remaining_time": "2:52:44"} +{"current_steps": 6520, "total_steps": 10798, "loss": 1.9347, "reward": null, "learning_rate": 0.00034021613879565944, "epoch": 1.21, "percentage": 60.38, "elapsed_time": "4:28:41", "remaining_time": "2:56:18"} +{"current_steps": 6520, "total_steps": 10798, "loss": 1.9347, "reward": null, "learning_rate": 0.00034021613879565944, "epoch": 1.21, "percentage": 60.38, "elapsed_time": "4:22:40", "remaining_time": "2:52:21"} +{"current_steps": 6520, "total_steps": 10798, "loss": 1.9347, "reward": null, "learning_rate": 0.00034021613879565944, "epoch": 1.21, "percentage": 60.38, "elapsed_time": "4:22:38", "remaining_time": "2:52:19"} +{"current_steps": 6520, "total_steps": 10798, "loss": 1.9347, "reward": null, "learning_rate": 0.00034021613879565944, "epoch": 1.21, "percentage": 60.38, "elapsed_time": "4:22:37", "remaining_time": "2:52:18"} +{"current_steps": 6530, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 0.00033883838658183154, "epoch": 1.21, "percentage": 60.47, "elapsed_time": "4:29:05", "remaining_time": "2:55:52"} +{"current_steps": 6530, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 0.00033883838658183154, "epoch": 1.21, "percentage": 60.47, "elapsed_time": "4:23:02", "remaining_time": "2:51:55"} +{"current_steps": 6530, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 0.00033883838658183154, "epoch": 1.21, "percentage": 60.47, "elapsed_time": "4:23:04", "remaining_time": "2:51:56"} +{"current_steps": 6530, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 0.00033883838658183154, "epoch": 1.21, "percentage": 60.47, "elapsed_time": "4:23:00", "remaining_time": "2:51:54"} +{"current_steps": 6540, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.00033746199855655125, "epoch": 1.21, "percentage": 60.57, "elapsed_time": "4:23:29", "remaining_time": "2:51:33"} +{"current_steps": 6540, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.00033746199855655125, "epoch": 1.21, "percentage": 60.57, "elapsed_time": "4:23:26", "remaining_time": "2:51:30"} +{"current_steps": 6540, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.00033746199855655125, "epoch": 1.21, "percentage": 60.57, "elapsed_time": "4:29:30", "remaining_time": "2:55:28"} +{"current_steps": 6540, "total_steps": 10798, "loss": 1.9973, "reward": null, "learning_rate": 0.00033746199855655125, "epoch": 1.21, "percentage": 60.57, "elapsed_time": "4:23:27", "remaining_time": "2:51:31"} +{"current_steps": 6550, "total_steps": 10798, "loss": 1.9718, "reward": null, "learning_rate": 0.000336086986370563, "epoch": 1.21, "percentage": 60.66, "elapsed_time": "4:29:55", "remaining_time": "2:55:03"} +{"current_steps": 6550, "total_steps": 10798, "loss": 1.9718, "reward": null, "learning_rate": 0.000336086986370563, "epoch": 1.21, "percentage": 60.66, "elapsed_time": "4:23:50", "remaining_time": "2:51:06"} +{"current_steps": 6550, "total_steps": 10798, "loss": 1.9718, "reward": null, "learning_rate": 0.000336086986370563, "epoch": 1.21, "percentage": 60.66, "elapsed_time": "4:23:51", "remaining_time": "2:51:07"} +{"current_steps": 6550, "total_steps": 10798, "loss": 1.9718, "reward": null, "learning_rate": 0.000336086986370563, "epoch": 1.21, "percentage": 60.66, "elapsed_time": "4:23:53", "remaining_time": "2:51:08"} +{"current_steps": 6560, "total_steps": 10798, "loss": 1.9157, "reward": null, "learning_rate": 0.0003347133616629652, "epoch": 1.22, "percentage": 60.75, "elapsed_time": "4:30:19", "remaining_time": "2:54:38"} +{"current_steps": 6560, "total_steps": 10798, "loss": 1.9157, "reward": null, "learning_rate": 0.0003347133616629652, "epoch": 1.22, "percentage": 60.75, "elapsed_time": "4:24:14", "remaining_time": "2:50:42"} +{"current_steps": 6560, "total_steps": 10798, "loss": 1.9157, "reward": null, "learning_rate": 0.0003347133616629652, "epoch": 1.22, "percentage": 60.75, "elapsed_time": "4:24:16", "remaining_time": "2:50:43"} +{"current_steps": 6560, "total_steps": 10798, "loss": 1.9157, "reward": null, "learning_rate": 0.0003347133616629652, "epoch": 1.22, "percentage": 60.75, "elapsed_time": "4:24:17", "remaining_time": "2:50:44"} +{"current_steps": 6570, "total_steps": 10798, "loss": 1.9528, "reward": null, "learning_rate": 0.00033334113606111194, "epoch": 1.22, "percentage": 60.84, "elapsed_time": "4:30:43", "remaining_time": "2:54:13"} +{"current_steps": 6570, "total_steps": 10798, "loss": 1.9528, "reward": null, "learning_rate": 0.00033334113606111194, "epoch": 1.22, "percentage": 60.84, "elapsed_time": "4:24:38", "remaining_time": "2:50:18"} +{"current_steps": 6570, "total_steps": 10798, "loss": 1.9528, "reward": null, "learning_rate": 0.00033334113606111194, "epoch": 1.22, "percentage": 60.84, "elapsed_time": "4:24:41", "remaining_time": "2:50:20"} +{"current_steps": 6570, "total_steps": 10798, "loss": 1.9528, "reward": null, "learning_rate": 0.00033334113606111194, "epoch": 1.22, "percentage": 60.84, "elapsed_time": "4:24:40", "remaining_time": "2:50:19"} +{"current_steps": 6580, "total_steps": 10798, "loss": 1.9369, "reward": null, "learning_rate": 0.0003319703211805135, "epoch": 1.22, "percentage": 60.94, "elapsed_time": "4:25:03", "remaining_time": "2:49:54"} +{"current_steps": 6580, "total_steps": 10798, "loss": 1.9369, "reward": null, "learning_rate": 0.0003319703211805135, "epoch": 1.22, "percentage": 60.94, "elapsed_time": "4:31:07", "remaining_time": "2:53:47"} +{"current_steps": 6580, "total_steps": 10798, "loss": 1.9369, "reward": null, "learning_rate": 0.0003319703211805135, "epoch": 1.22, "percentage": 60.94, "elapsed_time": "4:25:02", "remaining_time": "2:49:53"} +{"current_steps": 6580, "total_steps": 10798, "loss": 1.9369, "reward": null, "learning_rate": 0.0003319703211805135, "epoch": 1.22, "percentage": 60.94, "elapsed_time": "4:25:05", "remaining_time": "2:49:56"} +{"current_steps": 6590, "total_steps": 10798, "loss": 1.9552, "reward": null, "learning_rate": 0.00033060092862473967, "epoch": 1.22, "percentage": 61.03, "elapsed_time": "4:25:28", "remaining_time": "2:49:31"} +{"current_steps": 6590, "total_steps": 10798, "loss": 1.9552, "reward": null, "learning_rate": 0.00033060092862473967, "epoch": 1.22, "percentage": 61.03, "elapsed_time": "4:25:26", "remaining_time": "2:49:30"} +{"current_steps": 6590, "total_steps": 10798, "loss": 1.9552, "reward": null, "learning_rate": 0.00033060092862473967, "epoch": 1.22, "percentage": 61.03, "elapsed_time": "4:31:31", "remaining_time": "2:53:22"} +{"current_steps": 6590, "total_steps": 10798, "loss": 1.9552, "reward": null, "learning_rate": 0.00033060092862473967, "epoch": 1.22, "percentage": 61.03, "elapsed_time": "4:25:30", "remaining_time": "2:49:32"} +{"current_steps": 6600, "total_steps": 10798, "loss": 1.9581, "reward": null, "learning_rate": 0.00032923296998532003, "epoch": 1.22, "percentage": 61.12, "elapsed_time": "4:31:56", "remaining_time": "2:52:58"} +{"current_steps": 6600, "total_steps": 10798, "loss": 1.9581, "reward": null, "learning_rate": 0.00032923296998532003, "epoch": 1.22, "percentage": 61.12, "elapsed_time": "4:25:53", "remaining_time": "2:49:07"} +{"current_steps": 6600, "total_steps": 10798, "loss": 1.9581, "reward": null, "learning_rate": 0.00032923296998532003, "epoch": 1.22, "percentage": 61.12, "elapsed_time": "4:25:54", "remaining_time": "2:49:08"} +{"current_steps": 6600, "total_steps": 10798, "loss": 1.9581, "reward": null, "learning_rate": 0.00032923296998532003, "epoch": 1.22, "percentage": 61.12, "elapsed_time": "4:25:51", "remaining_time": "2:49:06"} +{"current_steps": 6610, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.0003278664568416465, "epoch": 1.22, "percentage": 61.22, "elapsed_time": "4:32:21", "remaining_time": "2:52:33"} +{"current_steps": 6610, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.0003278664568416465, "epoch": 1.22, "percentage": 61.22, "elapsed_time": "4:26:16", "remaining_time": "2:48:42"} +{"current_steps": 6610, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.0003278664568416465, "epoch": 1.22, "percentage": 61.22, "elapsed_time": "4:26:17", "remaining_time": "2:48:43"} +{"current_steps": 6610, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.0003278664568416465, "epoch": 1.22, "percentage": 61.22, "elapsed_time": "4:26:19", "remaining_time": "2:48:44"} +{"current_steps": 6620, "total_steps": 10798, "loss": 1.9672, "reward": null, "learning_rate": 0.0003265014007608758, "epoch": 1.23, "percentage": 61.31, "elapsed_time": "4:32:46", "remaining_time": "2:52:08"} +{"current_steps": 6620, "total_steps": 10798, "loss": 1.9672, "reward": null, "learning_rate": 0.0003265014007608758, "epoch": 1.23, "percentage": 61.31, "elapsed_time": "4:26:41", "remaining_time": "2:48:18"} +{"current_steps": 6620, "total_steps": 10798, "loss": 1.9672, "reward": null, "learning_rate": 0.0003265014007608758, "epoch": 1.23, "percentage": 61.31, "elapsed_time": "4:26:42", "remaining_time": "2:48:19"} +{"current_steps": 6620, "total_steps": 10798, "loss": 1.9672, "reward": null, "learning_rate": 0.0003265014007608758, "epoch": 1.23, "percentage": 61.31, "elapsed_time": "4:26:44", "remaining_time": "2:48:20"} +{"current_steps": 6630, "total_steps": 10798, "loss": 1.9166, "reward": null, "learning_rate": 0.0003251378132978304, "epoch": 1.23, "percentage": 61.4, "elapsed_time": "4:27:08", "remaining_time": "2:47:56"} +{"current_steps": 6630, "total_steps": 10798, "loss": 1.9166, "reward": null, "learning_rate": 0.0003251378132978304, "epoch": 1.23, "percentage": 61.4, "elapsed_time": "4:27:10", "remaining_time": "2:47:57"} +{"current_steps": 6630, "total_steps": 10798, "loss": 1.9166, "reward": null, "learning_rate": 0.0003251378132978304, "epoch": 1.23, "percentage": 61.4, "elapsed_time": "4:33:12", "remaining_time": "2:51:44"} +{"current_steps": 6630, "total_steps": 10798, "loss": 1.9166, "reward": null, "learning_rate": 0.0003251378132978304, "epoch": 1.23, "percentage": 61.4, "elapsed_time": "4:27:07", "remaining_time": "2:47:55"} +{"current_steps": 6640, "total_steps": 10798, "loss": 1.9356, "reward": null, "learning_rate": 0.00032377570599490164, "epoch": 1.23, "percentage": 61.49, "elapsed_time": "4:33:37", "remaining_time": "2:51:20"} +{"current_steps": 6640, "total_steps": 10798, "loss": 1.9356, "reward": null, "learning_rate": 0.00032377570599490164, "epoch": 1.23, "percentage": 61.49, "elapsed_time": "4:27:35", "remaining_time": "2:47:34"} +{"current_steps": 6640, "total_steps": 10798, "loss": 1.9356, "reward": null, "learning_rate": 0.00032377570599490164, "epoch": 1.23, "percentage": 61.49, "elapsed_time": "4:27:33", "remaining_time": "2:47:32"} +{"current_steps": 6640, "total_steps": 10798, "loss": 1.9356, "reward": null, "learning_rate": 0.00032377570599490164, "epoch": 1.23, "percentage": 61.49, "elapsed_time": "4:27:32", "remaining_time": "2:47:31"} +{"current_steps": 6650, "total_steps": 10798, "loss": 1.9092, "reward": null, "learning_rate": 0.00032241509038195165, "epoch": 1.23, "percentage": 61.59, "elapsed_time": "4:27:58", "remaining_time": "2:47:09"} +{"current_steps": 6650, "total_steps": 10798, "loss": 1.9092, "reward": null, "learning_rate": 0.00032241509038195165, "epoch": 1.23, "percentage": 61.59, "elapsed_time": "4:27:59", "remaining_time": "2:47:10"} +{"current_steps": 6650, "total_steps": 10798, "loss": 1.9092, "reward": null, "learning_rate": 0.00032241509038195165, "epoch": 1.23, "percentage": 61.59, "elapsed_time": "4:28:01", "remaining_time": "2:47:11"} +{"current_steps": 6650, "total_steps": 10798, "loss": 1.9092, "reward": null, "learning_rate": 0.00032241509038195165, "epoch": 1.23, "percentage": 61.59, "elapsed_time": "4:34:03", "remaining_time": "2:50:56"} +{"current_steps": 6660, "total_steps": 10798, "loss": 1.9343, "reward": null, "learning_rate": 0.0003210559779762157, "epoch": 1.23, "percentage": 61.68, "elapsed_time": "4:28:25", "remaining_time": "2:46:46"} +{"current_steps": 6660, "total_steps": 10798, "loss": 1.9343, "reward": null, "learning_rate": 0.0003210559779762157, "epoch": 1.23, "percentage": 61.68, "elapsed_time": "4:28:27", "remaining_time": "2:46:47"} +{"current_steps": 6660, "total_steps": 10798, "loss": 1.9343, "reward": null, "learning_rate": 0.0003210559779762157, "epoch": 1.23, "percentage": 61.68, "elapsed_time": "4:28:23", "remaining_time": "2:46:45"} +{"current_steps": 6660, "total_steps": 10798, "loss": 1.9343, "reward": null, "learning_rate": 0.0003210559779762157, "epoch": 1.23, "percentage": 61.68, "elapsed_time": "4:34:28", "remaining_time": "2:50:32"} +{"current_steps": 6670, "total_steps": 10798, "loss": 1.9796, "reward": null, "learning_rate": 0.00031969838028220513, "epoch": 1.24, "percentage": 61.77, "elapsed_time": "4:34:53", "remaining_time": "2:50:07"} +{"current_steps": 6670, "total_steps": 10798, "loss": 1.9796, "reward": null, "learning_rate": 0.00031969838028220513, "epoch": 1.24, "percentage": 61.77, "elapsed_time": "4:28:51", "remaining_time": "2:46:23"} +{"current_steps": 6670, "total_steps": 10798, "loss": 1.9796, "reward": null, "learning_rate": 0.00031969838028220513, "epoch": 1.24, "percentage": 61.77, "elapsed_time": "4:28:49", "remaining_time": "2:46:22"} +{"current_steps": 6670, "total_steps": 10798, "loss": 1.9796, "reward": null, "learning_rate": 0.00031969838028220513, "epoch": 1.24, "percentage": 61.77, "elapsed_time": "4:28:48", "remaining_time": "2:46:21"} +{"current_steps": 6680, "total_steps": 10798, "loss": 1.8932, "reward": null, "learning_rate": 0.00031834230879160947, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "4:35:16", "remaining_time": "2:49:41"} +{"current_steps": 6680, "total_steps": 10798, "loss": 1.8932, "reward": null, "learning_rate": 0.00031834230879160947, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "4:29:15", "remaining_time": "2:45:59"} +{"current_steps": 6680, "total_steps": 10798, "loss": 1.8932, "reward": null, "learning_rate": 0.00031834230879160947, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "4:29:13", "remaining_time": "2:45:58"} +{"current_steps": 6680, "total_steps": 10798, "loss": 1.8932, "reward": null, "learning_rate": 0.00031834230879160947, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "4:29:11", "remaining_time": "2:45:57"} +{"current_steps": 6690, "total_steps": 10798, "loss": 1.9279, "reward": null, "learning_rate": 0.0003169877749831993, "epoch": 1.24, "percentage": 61.96, "elapsed_time": "4:29:35", "remaining_time": "2:45:32"} +{"current_steps": 6690, "total_steps": 10798, "loss": 1.9279, "reward": null, "learning_rate": 0.0003169877749831993, "epoch": 1.24, "percentage": 61.96, "elapsed_time": "4:29:37", "remaining_time": "2:45:33"} +{"current_steps": 6690, "total_steps": 10798, "loss": 1.9279, "reward": null, "learning_rate": 0.0003169877749831993, "epoch": 1.24, "percentage": 61.96, "elapsed_time": "4:29:39", "remaining_time": "2:45:34"} +{"current_steps": 6690, "total_steps": 10798, "loss": 1.9279, "reward": null, "learning_rate": 0.0003169877749831993, "epoch": 1.24, "percentage": 61.96, "elapsed_time": "4:35:40", "remaining_time": "2:49:16"} +{"current_steps": 6700, "total_steps": 10798, "loss": 1.9444, "reward": null, "learning_rate": 0.000315634790322729, "epoch": 1.24, "percentage": 62.05, "elapsed_time": "4:36:06", "remaining_time": "2:48:52"} +{"current_steps": 6700, "total_steps": 10798, "loss": 1.9444, "reward": null, "learning_rate": 0.000315634790322729, "epoch": 1.24, "percentage": 62.05, "elapsed_time": "4:30:02", "remaining_time": "2:45:10"} +{"current_steps": 6700, "total_steps": 10798, "loss": 1.9444, "reward": null, "learning_rate": 0.000315634790322729, "epoch": 1.24, "percentage": 62.05, "elapsed_time": "4:30:04", "remaining_time": "2:45:11"} +{"current_steps": 6700, "total_steps": 10798, "loss": 1.9444, "reward": null, "learning_rate": 0.000315634790322729, "epoch": 1.24, "percentage": 62.05, "elapsed_time": "4:30:01", "remaining_time": "2:45:09"} +{"current_steps": 6710, "total_steps": 10798, "loss": 1.9296, "reward": null, "learning_rate": 0.00031428336626284037, "epoch": 1.24, "percentage": 62.14, "elapsed_time": "4:30:26", "remaining_time": "2:44:45"} +{"current_steps": 6710, "total_steps": 10798, "loss": 1.9296, "reward": null, "learning_rate": 0.00031428336626284037, "epoch": 1.24, "percentage": 62.14, "elapsed_time": "4:30:27", "remaining_time": "2:44:46"} +{"current_steps": 6710, "total_steps": 10798, "loss": 1.9296, "reward": null, "learning_rate": 0.00031428336626284037, "epoch": 1.24, "percentage": 62.14, "elapsed_time": "4:30:29", "remaining_time": "2:44:47"} +{"current_steps": 6710, "total_steps": 10798, "loss": 1.9296, "reward": null, "learning_rate": 0.00031428336626284037, "epoch": 1.24, "percentage": 62.14, "elapsed_time": "4:36:30", "remaining_time": "2:48:27"} +{"current_steps": 6720, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 0.00031293351424296467, "epoch": 1.24, "percentage": 62.23, "elapsed_time": "4:30:50", "remaining_time": "2:44:21"} +{"current_steps": 6720, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 0.00031293351424296467, "epoch": 1.24, "percentage": 62.23, "elapsed_time": "4:36:55", "remaining_time": "2:48:03"} +{"current_steps": 6720, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 0.00031293351424296467, "epoch": 1.24, "percentage": 62.23, "elapsed_time": "4:30:52", "remaining_time": "2:44:22"} +{"current_steps": 6720, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 0.00031293351424296467, "epoch": 1.24, "percentage": 62.23, "elapsed_time": "4:30:54", "remaining_time": "2:44:23"} +{"current_steps": 6730, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 0.00031158524568922663, "epoch": 1.25, "percentage": 62.33, "elapsed_time": "4:31:18", "remaining_time": "2:43:59"} +{"current_steps": 6730, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 0.00031158524568922663, "epoch": 1.25, "percentage": 62.33, "elapsed_time": "4:37:20", "remaining_time": "2:47:38"} +{"current_steps": 6730, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 0.00031158524568922663, "epoch": 1.25, "percentage": 62.33, "elapsed_time": "4:31:16", "remaining_time": "2:43:58"} +{"current_steps": 6730, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 0.00031158524568922663, "epoch": 1.25, "percentage": 62.33, "elapsed_time": "4:31:15", "remaining_time": "2:43:57"} +{"current_steps": 6740, "total_steps": 10798, "loss": 1.8997, "reward": null, "learning_rate": 0.00031023857201434703, "epoch": 1.25, "percentage": 62.42, "elapsed_time": "4:31:39", "remaining_time": "2:43:33"} +{"current_steps": 6740, "total_steps": 10798, "loss": 1.8997, "reward": null, "learning_rate": 0.00031023857201434703, "epoch": 1.25, "percentage": 62.42, "elapsed_time": "4:37:44", "remaining_time": "2:47:13"} +{"current_steps": 6740, "total_steps": 10798, "loss": 1.8997, "reward": null, "learning_rate": 0.00031023857201434703, "epoch": 1.25, "percentage": 62.42, "elapsed_time": "4:31:43", "remaining_time": "2:43:35"} +{"current_steps": 6740, "total_steps": 10798, "loss": 1.8997, "reward": null, "learning_rate": 0.00031023857201434703, "epoch": 1.25, "percentage": 62.42, "elapsed_time": "4:31:41", "remaining_time": "2:43:34"} +{"current_steps": 6750, "total_steps": 10798, "loss": 1.9417, "reward": null, "learning_rate": 0.0003088935046175466, "epoch": 1.25, "percentage": 62.51, "elapsed_time": "4:38:09", "remaining_time": "2:46:48"} +{"current_steps": 6750, "total_steps": 10798, "loss": 1.9417, "reward": null, "learning_rate": 0.0003088935046175466, "epoch": 1.25, "percentage": 62.51, "elapsed_time": "4:32:06", "remaining_time": "2:43:10"} +{"current_steps": 6750, "total_steps": 10798, "loss": 1.9417, "reward": null, "learning_rate": 0.0003088935046175466, "epoch": 1.25, "percentage": 62.51, "elapsed_time": "4:32:07", "remaining_time": "2:43:11"} +{"current_steps": 6750, "total_steps": 10798, "loss": 1.9417, "reward": null, "learning_rate": 0.0003088935046175466, "epoch": 1.25, "percentage": 62.51, "elapsed_time": "4:32:04", "remaining_time": "2:43:09"} +{"current_steps": 6760, "total_steps": 10798, "loss": 1.9058, "reward": null, "learning_rate": 0.0003075500548844492, "epoch": 1.25, "percentage": 62.6, "elapsed_time": "4:32:32", "remaining_time": "2:42:47"} +{"current_steps": 6760, "total_steps": 10798, "loss": 1.9058, "reward": null, "learning_rate": 0.0003075500548844492, "epoch": 1.25, "percentage": 62.6, "elapsed_time": "4:38:33", "remaining_time": "2:46:23"} +{"current_steps": 6760, "total_steps": 10798, "loss": 1.9058, "reward": null, "learning_rate": 0.0003075500548844492, "epoch": 1.25, "percentage": 62.6, "elapsed_time": "4:32:30", "remaining_time": "2:42:46"} +{"current_steps": 6760, "total_steps": 10798, "loss": 1.9058, "reward": null, "learning_rate": 0.0003075500548844492, "epoch": 1.25, "percentage": 62.6, "elapsed_time": "4:32:28", "remaining_time": "2:42:45"} +{"current_steps": 6770, "total_steps": 10798, "loss": 1.9511, "reward": null, "learning_rate": 0.0003062082341869862, "epoch": 1.25, "percentage": 62.7, "elapsed_time": "4:32:52", "remaining_time": "2:42:21"} +{"current_steps": 6770, "total_steps": 10798, "loss": 1.9511, "reward": null, "learning_rate": 0.0003062082341869862, "epoch": 1.25, "percentage": 62.7, "elapsed_time": "4:32:56", "remaining_time": "2:42:23"} +{"current_steps": 6770, "total_steps": 10798, "loss": 1.9511, "reward": null, "learning_rate": 0.0003062082341869862, "epoch": 1.25, "percentage": 62.7, "elapsed_time": "4:32:54", "remaining_time": "2:42:22"} +{"current_steps": 6770, "total_steps": 10798, "loss": 1.9511, "reward": null, "learning_rate": 0.0003062082341869862, "epoch": 1.25, "percentage": 62.7, "elapsed_time": "4:38:57", "remaining_time": "2:45:58"} +{"current_steps": 6780, "total_steps": 10798, "loss": 1.922, "reward": null, "learning_rate": 0.00030486805388329894, "epoch": 1.26, "percentage": 62.79, "elapsed_time": "4:33:17", "remaining_time": "2:41:57"} +{"current_steps": 6780, "total_steps": 10798, "loss": 1.922, "reward": null, "learning_rate": 0.00030486805388329894, "epoch": 1.26, "percentage": 62.79, "elapsed_time": "4:33:20", "remaining_time": "2:41:59"} +{"current_steps": 6780, "total_steps": 10798, "loss": 1.922, "reward": null, "learning_rate": 0.00030486805388329894, "epoch": 1.26, "percentage": 62.79, "elapsed_time": "4:33:18", "remaining_time": "2:41:58"} +{"current_steps": 6780, "total_steps": 10798, "loss": 1.922, "reward": null, "learning_rate": 0.00030486805388329894, "epoch": 1.26, "percentage": 62.79, "elapsed_time": "4:39:21", "remaining_time": "2:45:33"} +{"current_steps": 6790, "total_steps": 10798, "loss": 1.9634, "reward": null, "learning_rate": 0.00030352952531764363, "epoch": 1.26, "percentage": 62.88, "elapsed_time": "4:33:45", "remaining_time": "2:41:35"} +{"current_steps": 6790, "total_steps": 10798, "loss": 1.9634, "reward": null, "learning_rate": 0.00030352952531764363, "epoch": 1.26, "percentage": 62.88, "elapsed_time": "4:33:44", "remaining_time": "2:41:34"} +{"current_steps": 6790, "total_steps": 10798, "loss": 1.9634, "reward": null, "learning_rate": 0.00030352952531764363, "epoch": 1.26, "percentage": 62.88, "elapsed_time": "4:33:42", "remaining_time": "2:41:33"} +{"current_steps": 6790, "total_steps": 10798, "loss": 1.9634, "reward": null, "learning_rate": 0.00030352952531764363, "epoch": 1.26, "percentage": 62.88, "elapsed_time": "4:39:47", "remaining_time": "2:45:09"} +{"current_steps": 6800, "total_steps": 10798, "loss": 1.9555, "reward": null, "learning_rate": 0.0003021926598202949, "epoch": 1.26, "percentage": 62.97, "elapsed_time": "4:40:12", "remaining_time": "2:44:44"} +{"current_steps": 6800, "total_steps": 10798, "loss": 1.9555, "reward": null, "learning_rate": 0.0003021926598202949, "epoch": 1.26, "percentage": 62.97, "elapsed_time": "4:34:09", "remaining_time": "2:41:11"} +{"current_steps": 6800, "total_steps": 10798, "loss": 1.9555, "reward": null, "learning_rate": 0.0003021926598202949, "epoch": 1.26, "percentage": 62.97, "elapsed_time": "4:34:10", "remaining_time": "2:41:12"} +{"current_steps": 6800, "total_steps": 10798, "loss": 1.9555, "reward": null, "learning_rate": 0.0003021926598202949, "epoch": 1.26, "percentage": 62.97, "elapsed_time": "4:34:07", "remaining_time": "2:41:10"} +{"current_steps": 6810, "total_steps": 10798, "loss": 1.9254, "reward": null, "learning_rate": 0.0003008574687074498, "epoch": 1.26, "percentage": 63.07, "elapsed_time": "4:34:31", "remaining_time": "2:40:46"} +{"current_steps": 6810, "total_steps": 10798, "loss": 1.9254, "reward": null, "learning_rate": 0.0003008574687074498, "epoch": 1.26, "percentage": 63.07, "elapsed_time": "4:34:33", "remaining_time": "2:40:47"} +{"current_steps": 6810, "total_steps": 10798, "loss": 1.9254, "reward": null, "learning_rate": 0.0003008574687074498, "epoch": 1.26, "percentage": 63.07, "elapsed_time": "4:40:36", "remaining_time": "2:44:19"} +{"current_steps": 6810, "total_steps": 10798, "loss": 1.9254, "reward": null, "learning_rate": 0.0003008574687074498, "epoch": 1.26, "percentage": 63.07, "elapsed_time": "4:34:35", "remaining_time": "2:40:48"} +{"current_steps": 6820, "total_steps": 10798, "loss": 1.9211, "reward": null, "learning_rate": 0.00029952396328113265, "epoch": 1.26, "percentage": 63.16, "elapsed_time": "4:34:57", "remaining_time": "2:40:22"} +{"current_steps": 6820, "total_steps": 10798, "loss": 1.9211, "reward": null, "learning_rate": 0.00029952396328113265, "epoch": 1.26, "percentage": 63.16, "elapsed_time": "4:34:58", "remaining_time": "2:40:23"} +{"current_steps": 6820, "total_steps": 10798, "loss": 1.9211, "reward": null, "learning_rate": 0.00029952396328113265, "epoch": 1.26, "percentage": 63.16, "elapsed_time": "4:34:55", "remaining_time": "2:40:21"} +{"current_steps": 6820, "total_steps": 10798, "loss": 1.9211, "reward": null, "learning_rate": 0.00029952396328113265, "epoch": 1.26, "percentage": 63.16, "elapsed_time": "4:41:00", "remaining_time": "2:43:54"} +{"current_steps": 6830, "total_steps": 10798, "loss": 1.9504, "reward": null, "learning_rate": 0.00029819215482909846, "epoch": 1.27, "percentage": 63.25, "elapsed_time": "4:35:23", "remaining_time": "2:39:59"} +{"current_steps": 6830, "total_steps": 10798, "loss": 1.9504, "reward": null, "learning_rate": 0.00029819215482909846, "epoch": 1.27, "percentage": 63.25, "elapsed_time": "4:41:25", "remaining_time": "2:43:29"} +{"current_steps": 6830, "total_steps": 10798, "loss": 1.9504, "reward": null, "learning_rate": 0.00029819215482909846, "epoch": 1.27, "percentage": 63.25, "elapsed_time": "4:35:22", "remaining_time": "2:39:58"} +{"current_steps": 6830, "total_steps": 10798, "loss": 1.9504, "reward": null, "learning_rate": 0.00029819215482909846, "epoch": 1.27, "percentage": 63.25, "elapsed_time": "4:35:20", "remaining_time": "2:39:57"} +{"current_steps": 6840, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 0.00029686205462473784, "epoch": 1.27, "percentage": 63.35, "elapsed_time": "4:35:48", "remaining_time": "2:39:36"} +{"current_steps": 6840, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 0.00029686205462473784, "epoch": 1.27, "percentage": 63.35, "elapsed_time": "4:35:47", "remaining_time": "2:39:35"} +{"current_steps": 6840, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 0.00029686205462473784, "epoch": 1.27, "percentage": 63.35, "elapsed_time": "4:41:50", "remaining_time": "2:43:05"} +{"current_steps": 6840, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 0.00029686205462473784, "epoch": 1.27, "percentage": 63.35, "elapsed_time": "4:35:45", "remaining_time": "2:39:34"} +{"current_steps": 6850, "total_steps": 10798, "loss": 1.9368, "reward": null, "learning_rate": 0.00029553367392698177, "epoch": 1.27, "percentage": 63.44, "elapsed_time": "4:42:15", "remaining_time": "2:42:40"} +{"current_steps": 6850, "total_steps": 10798, "loss": 1.9368, "reward": null, "learning_rate": 0.00029553367392698177, "epoch": 1.27, "percentage": 63.44, "elapsed_time": "4:36:10", "remaining_time": "2:39:10"} +{"current_steps": 6850, "total_steps": 10798, "loss": 1.9368, "reward": null, "learning_rate": 0.00029553367392698177, "epoch": 1.27, "percentage": 63.44, "elapsed_time": "4:36:11", "remaining_time": "2:39:11"} +{"current_steps": 6850, "total_steps": 10798, "loss": 1.9368, "reward": null, "learning_rate": 0.00029553367392698177, "epoch": 1.27, "percentage": 63.44, "elapsed_time": "4:36:13", "remaining_time": "2:39:12"} +{"current_steps": 6860, "total_steps": 10798, "loss": 1.8939, "reward": null, "learning_rate": 0.00029420702398020595, "epoch": 1.27, "percentage": 63.53, "elapsed_time": "4:36:36", "remaining_time": "2:38:47"} +{"current_steps": 6860, "total_steps": 10798, "loss": 1.8939, "reward": null, "learning_rate": 0.00029420702398020595, "epoch": 1.27, "percentage": 63.53, "elapsed_time": "4:42:39", "remaining_time": "2:42:15"} +{"current_steps": 6860, "total_steps": 10798, "loss": 1.8939, "reward": null, "learning_rate": 0.00029420702398020595, "epoch": 1.27, "percentage": 63.53, "elapsed_time": "4:36:34", "remaining_time": "2:38:46"} +{"current_steps": 6860, "total_steps": 10798, "loss": 1.8939, "reward": null, "learning_rate": 0.00029420702398020595, "epoch": 1.27, "percentage": 63.53, "elapsed_time": "4:36:37", "remaining_time": "2:38:48"} +{"current_steps": 6870, "total_steps": 10798, "loss": 1.9097, "reward": null, "learning_rate": 0.00029288211601413586, "epoch": 1.27, "percentage": 63.62, "elapsed_time": "4:43:03", "remaining_time": "2:41:50"} +{"current_steps": 6870, "total_steps": 10798, "loss": 1.9097, "reward": null, "learning_rate": 0.00029288211601413586, "epoch": 1.27, "percentage": 63.62, "elapsed_time": "4:36:58", "remaining_time": "2:38:21"} +{"current_steps": 6870, "total_steps": 10798, "loss": 1.9097, "reward": null, "learning_rate": 0.00029288211601413586, "epoch": 1.27, "percentage": 63.62, "elapsed_time": "4:37:00", "remaining_time": "2:38:22"} +{"current_steps": 6870, "total_steps": 10798, "loss": 1.9097, "reward": null, "learning_rate": 0.00029288211601413586, "epoch": 1.27, "percentage": 63.62, "elapsed_time": "4:37:02", "remaining_time": "2:38:23"} +{"current_steps": 6880, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.00029155896124375156, "epoch": 1.27, "percentage": 63.72, "elapsed_time": "4:37:27", "remaining_time": "2:38:00"} +{"current_steps": 6880, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.00029155896124375156, "epoch": 1.27, "percentage": 63.72, "elapsed_time": "4:37:23", "remaining_time": "2:37:58"} +{"current_steps": 6880, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.00029155896124375156, "epoch": 1.27, "percentage": 63.72, "elapsed_time": "4:43:28", "remaining_time": "2:41:26"} +{"current_steps": 6880, "total_steps": 10798, "loss": 1.9885, "reward": null, "learning_rate": 0.00029155896124375156, "epoch": 1.27, "percentage": 63.72, "elapsed_time": "4:37:25", "remaining_time": "2:37:59"} +{"current_steps": 6890, "total_steps": 10798, "loss": 1.9752, "reward": null, "learning_rate": 0.0002902375708691925, "epoch": 1.28, "percentage": 63.81, "elapsed_time": "4:43:52", "remaining_time": "2:41:00"} +{"current_steps": 6890, "total_steps": 10798, "loss": 1.9752, "reward": null, "learning_rate": 0.0002902375708691925, "epoch": 1.28, "percentage": 63.81, "elapsed_time": "4:37:51", "remaining_time": "2:37:35"} +{"current_steps": 6890, "total_steps": 10798, "loss": 1.9752, "reward": null, "learning_rate": 0.0002902375708691925, "epoch": 1.28, "percentage": 63.81, "elapsed_time": "4:37:47", "remaining_time": "2:37:33"} +{"current_steps": 6890, "total_steps": 10798, "loss": 1.9752, "reward": null, "learning_rate": 0.0002902375708691925, "epoch": 1.28, "percentage": 63.81, "elapsed_time": "4:37:49", "remaining_time": "2:37:34"} +{"current_steps": 6900, "total_steps": 10798, "loss": 1.9321, "reward": null, "learning_rate": 0.0002889179560756634, "epoch": 1.28, "percentage": 63.9, "elapsed_time": "4:38:14", "remaining_time": "2:37:11"} +{"current_steps": 6900, "total_steps": 10798, "loss": 1.9321, "reward": null, "learning_rate": 0.0002889179560756634, "epoch": 1.28, "percentage": 63.9, "elapsed_time": "4:38:12", "remaining_time": "2:37:10"} +{"current_steps": 6900, "total_steps": 10798, "loss": 1.9321, "reward": null, "learning_rate": 0.0002889179560756634, "epoch": 1.28, "percentage": 63.9, "elapsed_time": "4:38:11", "remaining_time": "2:37:09"} +{"current_steps": 6900, "total_steps": 10798, "loss": 1.9321, "reward": null, "learning_rate": 0.0002889179560756634, "epoch": 1.28, "percentage": 63.9, "elapsed_time": "4:44:15", "remaining_time": "2:40:35"} +{"current_steps": 6910, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.0002876001280333391, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "4:38:38", "remaining_time": "2:36:47"} +{"current_steps": 6910, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.0002876001280333391, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "4:44:40", "remaining_time": "2:40:10"} +{"current_steps": 6910, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.0002876001280333391, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "4:38:35", "remaining_time": "2:36:45"} +{"current_steps": 6910, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.0002876001280333391, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "4:38:36", "remaining_time": "2:36:46"} +{"current_steps": 6920, "total_steps": 10798, "loss": 1.9192, "reward": null, "learning_rate": 0.0002862840978972698, "epoch": 1.28, "percentage": 64.09, "elapsed_time": "4:38:59", "remaining_time": "2:36:20"} +{"current_steps": 6920, "total_steps": 10798, "loss": 1.9192, "reward": null, "learning_rate": 0.0002862840978972698, "epoch": 1.28, "percentage": 64.09, "elapsed_time": "4:39:00", "remaining_time": "2:36:21"} +{"current_steps": 6920, "total_steps": 10798, "loss": 1.9192, "reward": null, "learning_rate": 0.0002862840978972698, "epoch": 1.28, "percentage": 64.09, "elapsed_time": "4:45:03", "remaining_time": "2:39:45"} +{"current_steps": 6920, "total_steps": 10798, "loss": 1.9192, "reward": null, "learning_rate": 0.0002862840978972698, "epoch": 1.28, "percentage": 64.09, "elapsed_time": "4:39:02", "remaining_time": "2:36:22"} +{"current_steps": 6930, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0002849698768072877, "epoch": 1.28, "percentage": 64.18, "elapsed_time": "4:45:27", "remaining_time": "2:39:19"} +{"current_steps": 6930, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0002849698768072877, "epoch": 1.28, "percentage": 64.18, "elapsed_time": "4:39:22", "remaining_time": "2:35:56"} +{"current_steps": 6930, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0002849698768072877, "epoch": 1.28, "percentage": 64.18, "elapsed_time": "4:39:24", "remaining_time": "2:35:57"} +{"current_steps": 6930, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0002849698768072877, "epoch": 1.28, "percentage": 64.18, "elapsed_time": "4:39:26", "remaining_time": "2:35:58"} +{"current_steps": 6940, "total_steps": 10798, "loss": 1.9217, "reward": null, "learning_rate": 0.0002836574758879107, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "4:45:53", "remaining_time": "2:38:55"} +{"current_steps": 6940, "total_steps": 10798, "loss": 1.9217, "reward": null, "learning_rate": 0.0002836574758879107, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "4:39:51", "remaining_time": "2:35:34"} +{"current_steps": 6940, "total_steps": 10798, "loss": 1.9217, "reward": null, "learning_rate": 0.0002836574758879107, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "4:39:48", "remaining_time": "2:35:32"} +{"current_steps": 6940, "total_steps": 10798, "loss": 1.9217, "reward": null, "learning_rate": 0.0002836574758879107, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "4:39:50", "remaining_time": "2:35:33"} +{"current_steps": 6950, "total_steps": 10798, "loss": 1.9318, "reward": null, "learning_rate": 0.0002823469062482503, "epoch": 1.29, "percentage": 64.36, "elapsed_time": "4:40:16", "remaining_time": "2:35:10"} +{"current_steps": 6950, "total_steps": 10798, "loss": 1.9318, "reward": null, "learning_rate": 0.0002823469062482503, "epoch": 1.29, "percentage": 64.36, "elapsed_time": "4:40:14", "remaining_time": "2:35:09"} +{"current_steps": 6950, "total_steps": 10798, "loss": 1.9318, "reward": null, "learning_rate": 0.0002823469062482503, "epoch": 1.29, "percentage": 64.36, "elapsed_time": "4:46:17", "remaining_time": "2:38:30"} +{"current_steps": 6950, "total_steps": 10798, "loss": 1.9318, "reward": null, "learning_rate": 0.0002823469062482503, "epoch": 1.29, "percentage": 64.36, "elapsed_time": "4:40:13", "remaining_time": "2:35:08"} +{"current_steps": 6960, "total_steps": 10798, "loss": 1.9422, "reward": null, "learning_rate": 0.0002810381789819167, "epoch": 1.29, "percentage": 64.46, "elapsed_time": "4:40:41", "remaining_time": "2:34:47"} +{"current_steps": 6960, "total_steps": 10798, "loss": 1.9422, "reward": null, "learning_rate": 0.0002810381789819167, "epoch": 1.29, "percentage": 64.46, "elapsed_time": "4:46:43", "remaining_time": "2:38:06"} +{"current_steps": 6960, "total_steps": 10798, "loss": 1.9422, "reward": null, "learning_rate": 0.0002810381789819167, "epoch": 1.29, "percentage": 64.46, "elapsed_time": "4:40:38", "remaining_time": "2:34:45"} +{"current_steps": 6960, "total_steps": 10798, "loss": 1.9422, "reward": null, "learning_rate": 0.0002810381789819167, "epoch": 1.29, "percentage": 64.46, "elapsed_time": "4:40:40", "remaining_time": "2:34:46"} +{"current_steps": 6970, "total_steps": 10798, "loss": 1.9562, "reward": null, "learning_rate": 0.0002797313051669247, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "4:47:07", "remaining_time": "2:37:41"} +{"current_steps": 6970, "total_steps": 10798, "loss": 1.9562, "reward": null, "learning_rate": 0.0002797313051669247, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "4:41:04", "remaining_time": "2:34:22"} +{"current_steps": 6970, "total_steps": 10798, "loss": 1.9562, "reward": null, "learning_rate": 0.0002797313051669247, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "4:41:06", "remaining_time": "2:34:23"} +{"current_steps": 6970, "total_steps": 10798, "loss": 1.9562, "reward": null, "learning_rate": 0.0002797313051669247, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "4:41:02", "remaining_time": "2:34:21"} +{"current_steps": 6980, "total_steps": 10798, "loss": 1.9189, "reward": null, "learning_rate": 0.0002784262958656003, "epoch": 1.29, "percentage": 64.64, "elapsed_time": "4:41:30", "remaining_time": "2:33:59"} +{"current_steps": 6980, "total_steps": 10798, "loss": 1.9189, "reward": null, "learning_rate": 0.0002784262958656003, "epoch": 1.29, "percentage": 64.64, "elapsed_time": "4:41:27", "remaining_time": "2:33:57"} +{"current_steps": 6980, "total_steps": 10798, "loss": 1.9189, "reward": null, "learning_rate": 0.0002784262958656003, "epoch": 1.29, "percentage": 64.64, "elapsed_time": "4:41:28", "remaining_time": "2:33:58"} +{"current_steps": 6980, "total_steps": 10798, "loss": 1.9189, "reward": null, "learning_rate": 0.0002784262958656003, "epoch": 1.29, "percentage": 64.64, "elapsed_time": "4:47:32", "remaining_time": "2:37:16"} +{"current_steps": 6990, "total_steps": 10798, "loss": 1.9453, "reward": null, "learning_rate": 0.00027712316212448663, "epoch": 1.29, "percentage": 64.73, "elapsed_time": "4:41:54", "remaining_time": "2:33:34"} +{"current_steps": 6990, "total_steps": 10798, "loss": 1.9453, "reward": null, "learning_rate": 0.00027712316212448663, "epoch": 1.29, "percentage": 64.73, "elapsed_time": "4:47:56", "remaining_time": "2:36:51"} +{"current_steps": 6990, "total_steps": 10798, "loss": 1.9453, "reward": null, "learning_rate": 0.00027712316212448663, "epoch": 1.29, "percentage": 64.73, "elapsed_time": "4:41:52", "remaining_time": "2:33:33"} +{"current_steps": 6990, "total_steps": 10798, "loss": 1.9453, "reward": null, "learning_rate": 0.00027712316212448663, "epoch": 1.29, "percentage": 64.73, "elapsed_time": "4:41:51", "remaining_time": "2:33:32"} +{"current_steps": 7000, "total_steps": 10798, "loss": 1.9335, "reward": null, "learning_rate": 0.00027582191497425114, "epoch": 1.3, "percentage": 64.83, "elapsed_time": "4:48:20", "remaining_time": "2:36:27"} +{"current_steps": 7000, "total_steps": 10798, "loss": 1.9335, "reward": null, "learning_rate": 0.00027582191497425114, "epoch": 1.3, "percentage": 64.83, "elapsed_time": "4:42:17", "remaining_time": "2:33:09"} +{"current_steps": 7000, "total_steps": 10798, "loss": 1.9335, "reward": null, "learning_rate": 0.00027582191497425114, "epoch": 1.3, "percentage": 64.83, "elapsed_time": "4:42:16", "remaining_time": "2:33:09"} +{"current_steps": 7000, "total_steps": 10798, "loss": 1.9335, "reward": null, "learning_rate": 0.00027582191497425114, "epoch": 1.3, "percentage": 64.83, "elapsed_time": "4:42:19", "remaining_time": "2:33:10"} +{"current_steps": 7010, "total_steps": 10798, "loss": 1.9724, "reward": null, "learning_rate": 0.000274522565429591, "epoch": 1.3, "percentage": 64.92, "elapsed_time": "4:48:45", "remaining_time": "2:36:02"} +{"current_steps": 7010, "total_steps": 10798, "loss": 1.9724, "reward": null, "learning_rate": 0.000274522565429591, "epoch": 1.3, "percentage": 64.92, "elapsed_time": "4:42:41", "remaining_time": "2:32:45"} +{"current_steps": 7010, "total_steps": 10798, "loss": 1.9724, "reward": null, "learning_rate": 0.000274522565429591, "epoch": 1.3, "percentage": 64.92, "elapsed_time": "4:42:42", "remaining_time": "2:32:46"} +{"current_steps": 7010, "total_steps": 10798, "loss": 1.9724, "reward": null, "learning_rate": 0.000274522565429591, "epoch": 1.3, "percentage": 64.92, "elapsed_time": "4:42:44", "remaining_time": "2:32:47"} +{"current_steps": 7020, "total_steps": 10798, "loss": 1.9236, "reward": null, "learning_rate": 0.0002732251244891421, "epoch": 1.3, "percentage": 65.01, "elapsed_time": "4:49:10", "remaining_time": "2:35:37"} +{"current_steps": 7020, "total_steps": 10798, "loss": 1.9236, "reward": null, "learning_rate": 0.0002732251244891421, "epoch": 1.3, "percentage": 65.01, "elapsed_time": "4:43:05", "remaining_time": "2:32:21"} +{"current_steps": 7020, "total_steps": 10798, "loss": 1.9236, "reward": null, "learning_rate": 0.0002732251244891421, "epoch": 1.3, "percentage": 65.01, "elapsed_time": "4:43:09", "remaining_time": "2:32:23"} +{"current_steps": 7020, "total_steps": 10798, "loss": 1.9236, "reward": null, "learning_rate": 0.0002732251244891421, "epoch": 1.3, "percentage": 65.01, "elapsed_time": "4:43:07", "remaining_time": "2:32:22"} +{"current_steps": 7030, "total_steps": 10798, "loss": 1.9407, "reward": null, "learning_rate": 0.00027192960313538307, "epoch": 1.3, "percentage": 65.1, "elapsed_time": "4:43:30", "remaining_time": "2:31:57"} +{"current_steps": 7030, "total_steps": 10798, "loss": 1.9407, "reward": null, "learning_rate": 0.00027192960313538307, "epoch": 1.3, "percentage": 65.1, "elapsed_time": "4:43:31", "remaining_time": "2:31:58"} +{"current_steps": 7030, "total_steps": 10798, "loss": 1.9407, "reward": null, "learning_rate": 0.00027192960313538307, "epoch": 1.3, "percentage": 65.1, "elapsed_time": "4:49:35", "remaining_time": "2:35:12"} +{"current_steps": 7030, "total_steps": 10798, "loss": 1.9407, "reward": null, "learning_rate": 0.00027192960313538307, "epoch": 1.3, "percentage": 65.1, "elapsed_time": "4:43:33", "remaining_time": "2:31:59"} +{"current_steps": 7040, "total_steps": 10798, "loss": 1.8948, "reward": null, "learning_rate": 0.0002706360123345445, "epoch": 1.3, "percentage": 65.2, "elapsed_time": "4:50:00", "remaining_time": "2:34:48"} +{"current_steps": 7040, "total_steps": 10798, "loss": 1.8948, "reward": null, "learning_rate": 0.0002706360123345445, "epoch": 1.3, "percentage": 65.2, "elapsed_time": "4:43:56", "remaining_time": "2:31:34"} +{"current_steps": 7040, "total_steps": 10798, "loss": 1.8948, "reward": null, "learning_rate": 0.0002706360123345445, "epoch": 1.3, "percentage": 65.2, "elapsed_time": "4:43:57", "remaining_time": "2:31:34"} +{"current_steps": 7040, "total_steps": 10798, "loss": 1.8948, "reward": null, "learning_rate": 0.0002706360123345445, "epoch": 1.3, "percentage": 65.2, "elapsed_time": "4:43:59", "remaining_time": "2:31:35"} +{"current_steps": 7050, "total_steps": 10798, "loss": 1.9354, "reward": null, "learning_rate": 0.00026934436303651554, "epoch": 1.31, "percentage": 65.29, "elapsed_time": "4:44:20", "remaining_time": "2:31:09"} +{"current_steps": 7050, "total_steps": 10798, "loss": 1.9354, "reward": null, "learning_rate": 0.00026934436303651554, "epoch": 1.31, "percentage": 65.29, "elapsed_time": "4:44:21", "remaining_time": "2:31:10"} +{"current_steps": 7050, "total_steps": 10798, "loss": 1.9354, "reward": null, "learning_rate": 0.00026934436303651554, "epoch": 1.31, "percentage": 65.29, "elapsed_time": "4:50:25", "remaining_time": "2:34:23"} +{"current_steps": 7050, "total_steps": 10798, "loss": 1.9354, "reward": null, "learning_rate": 0.00026934436303651554, "epoch": 1.31, "percentage": 65.29, "elapsed_time": "4:44:23", "remaining_time": "2:31:11"} +{"current_steps": 7060, "total_steps": 10798, "loss": 1.955, "reward": null, "learning_rate": 0.00026805466617475007, "epoch": 1.31, "percentage": 65.38, "elapsed_time": "4:50:49", "remaining_time": "2:33:59"} +{"current_steps": 7060, "total_steps": 10798, "loss": 1.955, "reward": null, "learning_rate": 0.00026805466617475007, "epoch": 1.31, "percentage": 65.38, "elapsed_time": "4:44:48", "remaining_time": "2:30:47"} +{"current_steps": 7060, "total_steps": 10798, "loss": 1.955, "reward": null, "learning_rate": 0.00026805466617475007, "epoch": 1.31, "percentage": 65.38, "elapsed_time": "4:44:46", "remaining_time": "2:30:46"} +{"current_steps": 7060, "total_steps": 10798, "loss": 1.955, "reward": null, "learning_rate": 0.00026805466617475007, "epoch": 1.31, "percentage": 65.38, "elapsed_time": "4:44:45", "remaining_time": "2:30:45"} +{"current_steps": 7070, "total_steps": 10798, "loss": 1.9595, "reward": null, "learning_rate": 0.0002667669326661767, "epoch": 1.31, "percentage": 65.48, "elapsed_time": "4:51:17", "remaining_time": "2:33:35"} +{"current_steps": 7070, "total_steps": 10798, "loss": 1.9595, "reward": null, "learning_rate": 0.0002667669326661767, "epoch": 1.31, "percentage": 65.48, "elapsed_time": "4:45:15", "remaining_time": "2:30:25"} +{"current_steps": 7070, "total_steps": 10798, "loss": 1.9595, "reward": null, "learning_rate": 0.0002667669326661767, "epoch": 1.31, "percentage": 65.48, "elapsed_time": "4:45:12", "remaining_time": "2:30:23"} +{"current_steps": 7070, "total_steps": 10798, "loss": 1.9595, "reward": null, "learning_rate": 0.0002667669326661767, "epoch": 1.31, "percentage": 65.48, "elapsed_time": "4:45:13", "remaining_time": "2:30:24"} +{"current_steps": 7080, "total_steps": 10798, "loss": 1.9766, "reward": null, "learning_rate": 0.0002654811734111033, "epoch": 1.31, "percentage": 65.57, "elapsed_time": "4:45:40", "remaining_time": "2:30:01"} +{"current_steps": 7080, "total_steps": 10798, "loss": 1.9766, "reward": null, "learning_rate": 0.0002654811734111033, "epoch": 1.31, "percentage": 65.57, "elapsed_time": "4:51:41", "remaining_time": "2:33:10"} +{"current_steps": 7080, "total_steps": 10798, "loss": 1.9766, "reward": null, "learning_rate": 0.0002654811734111033, "epoch": 1.31, "percentage": 65.57, "elapsed_time": "4:45:38", "remaining_time": "2:30:00"} +{"current_steps": 7080, "total_steps": 10798, "loss": 1.9766, "reward": null, "learning_rate": 0.0002654811734111033, "epoch": 1.31, "percentage": 65.57, "elapsed_time": "4:45:36", "remaining_time": "2:29:59"} +{"current_steps": 7090, "total_steps": 10798, "loss": 1.9626, "reward": null, "learning_rate": 0.00026419739929312713, "epoch": 1.31, "percentage": 65.66, "elapsed_time": "4:46:02", "remaining_time": "2:29:35"} +{"current_steps": 7090, "total_steps": 10798, "loss": 1.9626, "reward": null, "learning_rate": 0.00026419739929312713, "epoch": 1.31, "percentage": 65.66, "elapsed_time": "4:46:04", "remaining_time": "2:29:36"} +{"current_steps": 7090, "total_steps": 10798, "loss": 1.9626, "reward": null, "learning_rate": 0.00026419739929312713, "epoch": 1.31, "percentage": 65.66, "elapsed_time": "4:52:07", "remaining_time": "2:32:46"} +{"current_steps": 7090, "total_steps": 10798, "loss": 1.9626, "reward": null, "learning_rate": 0.00026419739929312713, "epoch": 1.31, "percentage": 65.66, "elapsed_time": "4:46:05", "remaining_time": "2:29:37"} +{"current_steps": 7100, "total_steps": 10798, "loss": 1.9096, "reward": null, "learning_rate": 0.0002629156211790417, "epoch": 1.32, "percentage": 65.75, "elapsed_time": "4:52:31", "remaining_time": "2:32:21"} +{"current_steps": 7100, "total_steps": 10798, "loss": 1.9096, "reward": null, "learning_rate": 0.0002629156211790417, "epoch": 1.32, "percentage": 65.75, "elapsed_time": "4:46:28", "remaining_time": "2:29:12"} +{"current_steps": 7100, "total_steps": 10798, "loss": 1.9096, "reward": null, "learning_rate": 0.0002629156211790417, "epoch": 1.32, "percentage": 65.75, "elapsed_time": "4:46:30", "remaining_time": "2:29:13"} +{"current_steps": 7100, "total_steps": 10798, "loss": 1.9096, "reward": null, "learning_rate": 0.0002629156211790417, "epoch": 1.32, "percentage": 65.75, "elapsed_time": "4:46:26", "remaining_time": "2:29:11"} +{"current_steps": 7110, "total_steps": 10798, "loss": 1.9522, "reward": null, "learning_rate": 0.00026163584991874413, "epoch": 1.32, "percentage": 65.85, "elapsed_time": "4:46:50", "remaining_time": "2:28:47"} +{"current_steps": 7110, "total_steps": 10798, "loss": 1.9522, "reward": null, "learning_rate": 0.00026163584991874413, "epoch": 1.32, "percentage": 65.85, "elapsed_time": "4:52:55", "remaining_time": "2:31:56"} +{"current_steps": 7110, "total_steps": 10798, "loss": 1.9522, "reward": null, "learning_rate": 0.00026163584991874413, "epoch": 1.32, "percentage": 65.85, "elapsed_time": "4:46:52", "remaining_time": "2:28:48"} +{"current_steps": 7110, "total_steps": 10798, "loss": 1.9522, "reward": null, "learning_rate": 0.00026163584991874413, "epoch": 1.32, "percentage": 65.85, "elapsed_time": "4:46:54", "remaining_time": "2:28:49"} +{"current_steps": 7120, "total_steps": 10798, "loss": 1.9387, "reward": null, "learning_rate": 0.00026035809634514543, "epoch": 1.32, "percentage": 65.94, "elapsed_time": "4:47:19", "remaining_time": "2:28:25"} +{"current_steps": 7120, "total_steps": 10798, "loss": 1.9387, "reward": null, "learning_rate": 0.00026035809634514543, "epoch": 1.32, "percentage": 65.94, "elapsed_time": "4:53:20", "remaining_time": "2:31:32"} +{"current_steps": 7120, "total_steps": 10798, "loss": 1.9387, "reward": null, "learning_rate": 0.00026035809634514543, "epoch": 1.32, "percentage": 65.94, "elapsed_time": "4:47:16", "remaining_time": "2:28:23"} +{"current_steps": 7120, "total_steps": 10798, "loss": 1.9387, "reward": null, "learning_rate": 0.00026035809634514543, "epoch": 1.32, "percentage": 65.94, "elapsed_time": "4:47:17", "remaining_time": "2:28:24"} +{"current_steps": 7130, "total_steps": 10798, "loss": 1.8788, "reward": null, "learning_rate": 0.00025908237127407626, "epoch": 1.32, "percentage": 66.03, "elapsed_time": "4:47:41", "remaining_time": "2:27:59"} +{"current_steps": 7130, "total_steps": 10798, "loss": 1.8788, "reward": null, "learning_rate": 0.00025908237127407626, "epoch": 1.32, "percentage": 66.03, "elapsed_time": "4:47:39", "remaining_time": "2:27:59"} +{"current_steps": 7130, "total_steps": 10798, "loss": 1.8788, "reward": null, "learning_rate": 0.00025908237127407626, "epoch": 1.32, "percentage": 66.03, "elapsed_time": "4:53:44", "remaining_time": "2:31:06"} +{"current_steps": 7130, "total_steps": 10798, "loss": 1.8788, "reward": null, "learning_rate": 0.00025908237127407626, "epoch": 1.32, "percentage": 66.03, "elapsed_time": "4:47:42", "remaining_time": "2:28:00"} +{"current_steps": 7140, "total_steps": 10798, "loss": 1.9326, "reward": null, "learning_rate": 0.0002578086855041973, "epoch": 1.32, "percentage": 66.12, "elapsed_time": "4:54:09", "remaining_time": "2:30:42"} +{"current_steps": 7140, "total_steps": 10798, "loss": 1.9326, "reward": null, "learning_rate": 0.0002578086855041973, "epoch": 1.32, "percentage": 66.12, "elapsed_time": "4:48:04", "remaining_time": "2:27:35"} +{"current_steps": 7140, "total_steps": 10798, "loss": 1.9326, "reward": null, "learning_rate": 0.0002578086855041973, "epoch": 1.32, "percentage": 66.12, "elapsed_time": "4:48:06", "remaining_time": "2:27:36"} +{"current_steps": 7140, "total_steps": 10798, "loss": 1.9326, "reward": null, "learning_rate": 0.0002578086855041973, "epoch": 1.32, "percentage": 66.12, "elapsed_time": "4:48:07", "remaining_time": "2:27:36"} +{"current_steps": 7150, "total_steps": 10798, "loss": 1.92, "reward": null, "learning_rate": 0.0002565370498169064, "epoch": 1.32, "percentage": 66.22, "elapsed_time": "4:54:33", "remaining_time": "2:30:17"} +{"current_steps": 7150, "total_steps": 10798, "loss": 1.92, "reward": null, "learning_rate": 0.0002565370498169064, "epoch": 1.32, "percentage": 66.22, "elapsed_time": "4:48:32", "remaining_time": "2:27:13"} +{"current_steps": 7150, "total_steps": 10798, "loss": 1.92, "reward": null, "learning_rate": 0.0002565370498169064, "epoch": 1.32, "percentage": 66.22, "elapsed_time": "4:48:29", "remaining_time": "2:27:11"} +{"current_steps": 7150, "total_steps": 10798, "loss": 1.92, "reward": null, "learning_rate": 0.0002565370498169064, "epoch": 1.32, "percentage": 66.22, "elapsed_time": "4:48:30", "remaining_time": "2:27:12"} +{"current_steps": 7160, "total_steps": 10798, "loss": 1.9131, "reward": null, "learning_rate": 0.0002552674749762487, "epoch": 1.33, "percentage": 66.31, "elapsed_time": "4:54:56", "remaining_time": "2:29:51"} +{"current_steps": 7160, "total_steps": 10798, "loss": 1.9131, "reward": null, "learning_rate": 0.0002552674749762487, "epoch": 1.33, "percentage": 66.31, "elapsed_time": "4:48:55", "remaining_time": "2:26:48"} +{"current_steps": 7160, "total_steps": 10798, "loss": 1.9131, "reward": null, "learning_rate": 0.0002552674749762487, "epoch": 1.33, "percentage": 66.31, "elapsed_time": "4:48:53", "remaining_time": "2:26:47"} +{"current_steps": 7160, "total_steps": 10798, "loss": 1.9131, "reward": null, "learning_rate": 0.0002552674749762487, "epoch": 1.33, "percentage": 66.31, "elapsed_time": "4:48:52", "remaining_time": "2:26:46"} +{"current_steps": 7170, "total_steps": 10798, "loss": 1.9263, "reward": null, "learning_rate": 0.0002539999717288246, "epoch": 1.33, "percentage": 66.4, "elapsed_time": "4:55:21", "remaining_time": "2:29:26"} +{"current_steps": 7170, "total_steps": 10798, "loss": 1.9263, "reward": null, "learning_rate": 0.0002539999717288246, "epoch": 1.33, "percentage": 66.4, "elapsed_time": "4:49:18", "remaining_time": "2:26:23"} +{"current_steps": 7170, "total_steps": 10798, "loss": 1.9263, "reward": null, "learning_rate": 0.0002539999717288246, "epoch": 1.33, "percentage": 66.4, "elapsed_time": "4:49:16", "remaining_time": "2:26:22"} +{"current_steps": 7170, "total_steps": 10798, "loss": 1.9263, "reward": null, "learning_rate": 0.0002539999717288246, "epoch": 1.33, "percentage": 66.4, "elapsed_time": "4:49:19", "remaining_time": "2:26:24"} +{"current_steps": 7180, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 0.00025286099888629365, "epoch": 1.33, "percentage": 66.49, "elapsed_time": "4:55:47", "remaining_time": "2:29:02"} +{"current_steps": 7180, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 0.00025286099888629365, "epoch": 1.33, "percentage": 66.49, "elapsed_time": "4:49:43", "remaining_time": "2:25:59"} +{"current_steps": 7180, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 0.00025286099888629365, "epoch": 1.33, "percentage": 66.49, "elapsed_time": "4:49:45", "remaining_time": "2:26:00"} +{"current_steps": 7180, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 0.00025286099888629365, "epoch": 1.33, "percentage": 66.49, "elapsed_time": "4:49:42", "remaining_time": "2:25:58"} +{"current_steps": 7190, "total_steps": 10798, "loss": 1.9281, "reward": null, "learning_rate": 0.000251597461210021, "epoch": 1.33, "percentage": 66.59, "elapsed_time": "4:50:11", "remaining_time": "2:25:37"} +{"current_steps": 7190, "total_steps": 10798, "loss": 1.9281, "reward": null, "learning_rate": 0.000251597461210021, "epoch": 1.33, "percentage": 66.59, "elapsed_time": "4:50:09", "remaining_time": "2:25:36"} +{"current_steps": 7190, "total_steps": 10798, "loss": 1.9281, "reward": null, "learning_rate": 0.000251597461210021, "epoch": 1.33, "percentage": 66.59, "elapsed_time": "4:56:12", "remaining_time": "2:28:38"} +{"current_steps": 7190, "total_steps": 10798, "loss": 1.9281, "reward": null, "learning_rate": 0.000251597461210021, "epoch": 1.33, "percentage": 66.59, "elapsed_time": "4:50:07", "remaining_time": "2:25:35"} +{"current_steps": 7200, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.00025033602619263507, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "4:56:38", "remaining_time": "2:28:14"} +{"current_steps": 7200, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.00025033602619263507, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "4:50:34", "remaining_time": "2:25:12"} +{"current_steps": 7200, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.00025033602619263507, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "4:50:36", "remaining_time": "2:25:13"} +{"current_steps": 7200, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.00025033602619263507, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "4:50:33", "remaining_time": "2:25:11"} +{"current_steps": 7210, "total_steps": 10798, "loss": 1.9535, "reward": null, "learning_rate": 0.00024907670451183454, "epoch": 1.34, "percentage": 66.77, "elapsed_time": "4:50:59", "remaining_time": "2:24:48"} +{"current_steps": 7210, "total_steps": 10798, "loss": 1.9535, "reward": null, "learning_rate": 0.00024907670451183454, "epoch": 1.34, "percentage": 66.77, "elapsed_time": "4:57:04", "remaining_time": "2:27:50"} +{"current_steps": 7210, "total_steps": 10798, "loss": 1.9535, "reward": null, "learning_rate": 0.00024907670451183454, "epoch": 1.34, "percentage": 66.77, "elapsed_time": "4:51:02", "remaining_time": "2:24:50"} +{"current_steps": 7210, "total_steps": 10798, "loss": 1.9535, "reward": null, "learning_rate": 0.00024907670451183454, "epoch": 1.34, "percentage": 66.77, "elapsed_time": "4:51:00", "remaining_time": "2:24:49"} +{"current_steps": 7220, "total_steps": 10798, "loss": 1.8798, "reward": null, "learning_rate": 0.00024781950682742983, "epoch": 1.34, "percentage": 66.86, "elapsed_time": "4:51:27", "remaining_time": "2:24:26"} +{"current_steps": 7220, "total_steps": 10798, "loss": 1.8798, "reward": null, "learning_rate": 0.00024781950682742983, "epoch": 1.34, "percentage": 66.86, "elapsed_time": "4:51:24", "remaining_time": "2:24:24"} +{"current_steps": 7220, "total_steps": 10798, "loss": 1.8798, "reward": null, "learning_rate": 0.00024781950682742983, "epoch": 1.34, "percentage": 66.86, "elapsed_time": "4:51:26", "remaining_time": "2:24:25"} +{"current_steps": 7220, "total_steps": 10798, "loss": 1.8798, "reward": null, "learning_rate": 0.00024781950682742983, "epoch": 1.34, "percentage": 66.86, "elapsed_time": "4:57:29", "remaining_time": "2:27:25"} +{"current_steps": 7230, "total_steps": 10798, "loss": 1.9124, "reward": null, "learning_rate": 0.00024656444378125204, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "4:51:49", "remaining_time": "2:24:01"} +{"current_steps": 7230, "total_steps": 10798, "loss": 1.9124, "reward": null, "learning_rate": 0.00024656444378125204, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "4:57:54", "remaining_time": "2:27:01"} +{"current_steps": 7230, "total_steps": 10798, "loss": 1.9124, "reward": null, "learning_rate": 0.00024656444378125204, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "4:51:51", "remaining_time": "2:24:01"} +{"current_steps": 7230, "total_steps": 10798, "loss": 1.9124, "reward": null, "learning_rate": 0.00024656444378125204, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "4:51:53", "remaining_time": "2:24:02"} +{"current_steps": 7240, "total_steps": 10798, "loss": 1.9472, "reward": null, "learning_rate": 0.00024531152599706346, "epoch": 1.34, "percentage": 67.05, "elapsed_time": "4:52:14", "remaining_time": "2:23:37"} +{"current_steps": 7240, "total_steps": 10798, "loss": 1.9472, "reward": null, "learning_rate": 0.00024531152599706346, "epoch": 1.34, "percentage": 67.05, "elapsed_time": "4:52:16", "remaining_time": "2:23:38"} +{"current_steps": 7240, "total_steps": 10798, "loss": 1.9472, "reward": null, "learning_rate": 0.00024531152599706346, "epoch": 1.34, "percentage": 67.05, "elapsed_time": "4:58:19", "remaining_time": "2:26:36"} +{"current_steps": 7240, "total_steps": 10798, "loss": 1.9472, "reward": null, "learning_rate": 0.00024531152599706346, "epoch": 1.34, "percentage": 67.05, "elapsed_time": "4:52:18", "remaining_time": "2:23:38"} +{"current_steps": 7250, "total_steps": 10798, "loss": 1.9697, "reward": null, "learning_rate": 0.0002440607640804668, "epoch": 1.34, "percentage": 67.14, "elapsed_time": "4:52:41", "remaining_time": "2:23:14"} +{"current_steps": 7250, "total_steps": 10798, "loss": 1.9697, "reward": null, "learning_rate": 0.0002440607640804668, "epoch": 1.34, "percentage": 67.14, "elapsed_time": "4:58:44", "remaining_time": "2:26:12"} +{"current_steps": 7250, "total_steps": 10798, "loss": 1.9697, "reward": null, "learning_rate": 0.0002440607640804668, "epoch": 1.34, "percentage": 67.14, "elapsed_time": "4:52:43", "remaining_time": "2:23:15"} +{"current_steps": 7250, "total_steps": 10798, "loss": 1.9697, "reward": null, "learning_rate": 0.0002440607640804668, "epoch": 1.34, "percentage": 67.14, "elapsed_time": "4:52:40", "remaining_time": "2:23:13"} +{"current_steps": 7260, "total_steps": 10798, "loss": 1.938, "reward": null, "learning_rate": 0.00024281216861881633, "epoch": 1.34, "percentage": 67.23, "elapsed_time": "4:59:11", "remaining_time": "2:25:48"} +{"current_steps": 7260, "total_steps": 10798, "loss": 1.938, "reward": null, "learning_rate": 0.00024281216861881633, "epoch": 1.34, "percentage": 67.23, "elapsed_time": "4:53:10", "remaining_time": "2:22:52"} +{"current_steps": 7260, "total_steps": 10798, "loss": 1.938, "reward": null, "learning_rate": 0.00024281216861881633, "epoch": 1.34, "percentage": 67.23, "elapsed_time": "4:53:06", "remaining_time": "2:22:50"} +{"current_steps": 7260, "total_steps": 10798, "loss": 1.938, "reward": null, "learning_rate": 0.00024281216861881633, "epoch": 1.34, "percentage": 67.23, "elapsed_time": "4:53:08", "remaining_time": "2:22:51"} +{"current_steps": 7270, "total_steps": 10798, "loss": 1.9035, "reward": null, "learning_rate": 0.00024156575018112787, "epoch": 1.35, "percentage": 67.33, "elapsed_time": "4:59:35", "remaining_time": "2:25:23"} +{"current_steps": 7270, "total_steps": 10798, "loss": 1.9035, "reward": null, "learning_rate": 0.00024156575018112787, "epoch": 1.35, "percentage": 67.33, "elapsed_time": "4:53:34", "remaining_time": "2:22:27"} +{"current_steps": 7270, "total_steps": 10798, "loss": 1.9035, "reward": null, "learning_rate": 0.00024156575018112787, "epoch": 1.35, "percentage": 67.33, "elapsed_time": "4:53:30", "remaining_time": "2:22:26"} +{"current_steps": 7270, "total_steps": 10798, "loss": 1.9035, "reward": null, "learning_rate": 0.00024156575018112787, "epoch": 1.35, "percentage": 67.33, "elapsed_time": "4:53:32", "remaining_time": "2:22:26"} +{"current_steps": 7280, "total_steps": 10798, "loss": 1.9379, "reward": null, "learning_rate": 0.00024032151931798918, "epoch": 1.35, "percentage": 67.42, "elapsed_time": "5:00:00", "remaining_time": "2:24:58"} +{"current_steps": 7280, "total_steps": 10798, "loss": 1.9379, "reward": null, "learning_rate": 0.00024032151931798918, "epoch": 1.35, "percentage": 67.42, "elapsed_time": "4:53:59", "remaining_time": "2:22:04"} +{"current_steps": 7280, "total_steps": 10798, "loss": 1.9379, "reward": null, "learning_rate": 0.00024032151931798918, "epoch": 1.35, "percentage": 67.42, "elapsed_time": "4:53:57", "remaining_time": "2:22:03"} +{"current_steps": 7280, "total_steps": 10798, "loss": 1.9379, "reward": null, "learning_rate": 0.00024032151931798918, "epoch": 1.35, "percentage": 67.42, "elapsed_time": "4:53:56", "remaining_time": "2:22:02"} +{"current_steps": 7290, "total_steps": 10798, "loss": 1.9176, "reward": null, "learning_rate": 0.0002390794865614711, "epoch": 1.35, "percentage": 67.51, "elapsed_time": "4:54:20", "remaining_time": "2:21:38"} +{"current_steps": 7290, "total_steps": 10798, "loss": 1.9176, "reward": null, "learning_rate": 0.0002390794865614711, "epoch": 1.35, "percentage": 67.51, "elapsed_time": "4:54:21", "remaining_time": "2:21:39"} +{"current_steps": 7290, "total_steps": 10798, "loss": 1.9176, "reward": null, "learning_rate": 0.0002390794865614711, "epoch": 1.35, "percentage": 67.51, "elapsed_time": "4:54:23", "remaining_time": "2:21:39"} +{"current_steps": 7290, "total_steps": 10798, "loss": 1.9176, "reward": null, "learning_rate": 0.0002390794865614711, "epoch": 1.35, "percentage": 67.51, "elapsed_time": "5:00:25", "remaining_time": "2:24:33"} +{"current_steps": 7300, "total_steps": 10798, "loss": 1.9392, "reward": null, "learning_rate": 0.0002378396624250375, "epoch": 1.35, "percentage": 67.61, "elapsed_time": "4:54:46", "remaining_time": "2:21:15"} +{"current_steps": 7300, "total_steps": 10798, "loss": 1.9392, "reward": null, "learning_rate": 0.0002378396624250375, "epoch": 1.35, "percentage": 67.61, "elapsed_time": "5:00:49", "remaining_time": "2:24:09"} +{"current_steps": 7300, "total_steps": 10798, "loss": 1.9392, "reward": null, "learning_rate": 0.0002378396624250375, "epoch": 1.35, "percentage": 67.61, "elapsed_time": "4:54:48", "remaining_time": "2:21:15"} +{"current_steps": 7300, "total_steps": 10798, "loss": 1.9392, "reward": null, "learning_rate": 0.0002378396624250375, "epoch": 1.35, "percentage": 67.61, "elapsed_time": "4:54:44", "remaining_time": "2:21:14"} +{"current_steps": 7310, "total_steps": 10798, "loss": 1.9235, "reward": null, "learning_rate": 0.0002366020574034576, "epoch": 1.35, "percentage": 67.7, "elapsed_time": "4:55:10", "remaining_time": "2:20:50"} +{"current_steps": 7310, "total_steps": 10798, "loss": 1.9235, "reward": null, "learning_rate": 0.0002366020574034576, "epoch": 1.35, "percentage": 67.7, "elapsed_time": "4:55:12", "remaining_time": "2:20:51"} +{"current_steps": 7310, "total_steps": 10798, "loss": 1.9235, "reward": null, "learning_rate": 0.0002366020574034576, "epoch": 1.35, "percentage": 67.7, "elapsed_time": "4:55:09", "remaining_time": "2:20:50"} +{"current_steps": 7310, "total_steps": 10798, "loss": 1.9235, "reward": null, "learning_rate": 0.0002366020574034576, "epoch": 1.35, "percentage": 67.7, "elapsed_time": "5:01:14", "remaining_time": "2:23:44"} +{"current_steps": 7320, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.00023536668197271588, "epoch": 1.36, "percentage": 67.79, "elapsed_time": "5:01:39", "remaining_time": "2:23:19"} +{"current_steps": 7320, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.00023536668197271588, "epoch": 1.36, "percentage": 67.79, "elapsed_time": "4:55:34", "remaining_time": "2:20:26"} +{"current_steps": 7320, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.00023536668197271588, "epoch": 1.36, "percentage": 67.79, "elapsed_time": "4:55:36", "remaining_time": "2:20:27"} +{"current_steps": 7320, "total_steps": 10798, "loss": 1.939, "reward": null, "learning_rate": 0.00023536668197271588, "epoch": 1.36, "percentage": 67.79, "elapsed_time": "4:55:37", "remaining_time": "2:20:27"} +{"current_steps": 7330, "total_steps": 10798, "loss": 1.889, "reward": null, "learning_rate": 0.0002341335465899243, "epoch": 1.36, "percentage": 67.88, "elapsed_time": "5:02:02", "remaining_time": "2:22:54"} +{"current_steps": 7330, "total_steps": 10798, "loss": 1.889, "reward": null, "learning_rate": 0.0002341335465899243, "epoch": 1.36, "percentage": 67.88, "elapsed_time": "4:55:57", "remaining_time": "2:20:01"} +{"current_steps": 7330, "total_steps": 10798, "loss": 1.889, "reward": null, "learning_rate": 0.0002341335465899243, "epoch": 1.36, "percentage": 67.88, "elapsed_time": "4:55:59", "remaining_time": "2:20:02"} +{"current_steps": 7330, "total_steps": 10798, "loss": 1.889, "reward": null, "learning_rate": 0.0002341335465899243, "epoch": 1.36, "percentage": 67.88, "elapsed_time": "4:56:01", "remaining_time": "2:20:03"} +{"current_steps": 7340, "total_steps": 10798, "loss": 1.9247, "reward": null, "learning_rate": 0.00023290266169323354, "epoch": 1.36, "percentage": 67.98, "elapsed_time": "4:56:22", "remaining_time": "2:19:37"} +{"current_steps": 7340, "total_steps": 10798, "loss": 1.9247, "reward": null, "learning_rate": 0.00023290266169323354, "epoch": 1.36, "percentage": 67.98, "elapsed_time": "4:56:25", "remaining_time": "2:19:39"} +{"current_steps": 7340, "total_steps": 10798, "loss": 1.9247, "reward": null, "learning_rate": 0.00023290266169323354, "epoch": 1.36, "percentage": 67.98, "elapsed_time": "4:56:23", "remaining_time": "2:19:38"} +{"current_steps": 7340, "total_steps": 10798, "loss": 1.9247, "reward": null, "learning_rate": 0.00023290266169323354, "epoch": 1.36, "percentage": 67.98, "elapsed_time": "5:02:26", "remaining_time": "2:22:29"} +{"current_steps": 7350, "total_steps": 10798, "loss": 1.935, "reward": null, "learning_rate": 0.0002316740377017438, "epoch": 1.36, "percentage": 68.07, "elapsed_time": "5:02:52", "remaining_time": "2:22:04"} +{"current_steps": 7350, "total_steps": 10798, "loss": 1.935, "reward": null, "learning_rate": 0.0002316740377017438, "epoch": 1.36, "percentage": 68.07, "elapsed_time": "4:56:48", "remaining_time": "2:19:14"} +{"current_steps": 7350, "total_steps": 10798, "loss": 1.935, "reward": null, "learning_rate": 0.0002316740377017438, "epoch": 1.36, "percentage": 68.07, "elapsed_time": "4:56:50", "remaining_time": "2:19:15"} +{"current_steps": 7350, "total_steps": 10798, "loss": 1.935, "reward": null, "learning_rate": 0.0002316740377017438, "epoch": 1.36, "percentage": 68.07, "elapsed_time": "4:56:47", "remaining_time": "2:19:13"} +{"current_steps": 7360, "total_steps": 10798, "loss": 1.9198, "reward": null, "learning_rate": 0.0002304476850154183, "epoch": 1.36, "percentage": 68.16, "elapsed_time": "4:57:13", "remaining_time": "2:18:50"} +{"current_steps": 7360, "total_steps": 10798, "loss": 1.9198, "reward": null, "learning_rate": 0.0002304476850154183, "epoch": 1.36, "percentage": 68.16, "elapsed_time": "4:57:15", "remaining_time": "2:18:51"} +{"current_steps": 7360, "total_steps": 10798, "loss": 1.9198, "reward": null, "learning_rate": 0.0002304476850154183, "epoch": 1.36, "percentage": 68.16, "elapsed_time": "4:57:11", "remaining_time": "2:18:49"} +{"current_steps": 7360, "total_steps": 10798, "loss": 1.9198, "reward": null, "learning_rate": 0.0002304476850154183, "epoch": 1.36, "percentage": 68.16, "elapsed_time": "5:03:16", "remaining_time": "2:21:39"} +{"current_steps": 7370, "total_steps": 10798, "loss": 1.9068, "reward": null, "learning_rate": 0.00022922361401499325, "epoch": 1.37, "percentage": 68.25, "elapsed_time": "5:03:41", "remaining_time": "2:21:15"} +{"current_steps": 7370, "total_steps": 10798, "loss": 1.9068, "reward": null, "learning_rate": 0.00022922361401499325, "epoch": 1.37, "percentage": 68.25, "elapsed_time": "4:57:37", "remaining_time": "2:18:26"} +{"current_steps": 7370, "total_steps": 10798, "loss": 1.9068, "reward": null, "learning_rate": 0.00022922361401499325, "epoch": 1.37, "percentage": 68.25, "elapsed_time": "4:57:36", "remaining_time": "2:18:25"} +{"current_steps": 7370, "total_steps": 10798, "loss": 1.9068, "reward": null, "learning_rate": 0.00022922361401499325, "epoch": 1.37, "percentage": 68.25, "elapsed_time": "4:57:39", "remaining_time": "2:18:26"} +{"current_steps": 7380, "total_steps": 10798, "loss": 1.9505, "reward": null, "learning_rate": 0.00022800183506189238, "epoch": 1.37, "percentage": 68.35, "elapsed_time": "5:04:06", "remaining_time": "2:20:50"} +{"current_steps": 7380, "total_steps": 10798, "loss": 1.9505, "reward": null, "learning_rate": 0.00022800183506189238, "epoch": 1.37, "percentage": 68.35, "elapsed_time": "4:58:05", "remaining_time": "2:18:03"} +{"current_steps": 7380, "total_steps": 10798, "loss": 1.9505, "reward": null, "learning_rate": 0.00022800183506189238, "epoch": 1.37, "percentage": 68.35, "elapsed_time": "4:58:03", "remaining_time": "2:18:02"} +{"current_steps": 7380, "total_steps": 10798, "loss": 1.9505, "reward": null, "learning_rate": 0.00022800183506189238, "epoch": 1.37, "percentage": 68.35, "elapsed_time": "4:58:01", "remaining_time": "2:18:01"} +{"current_steps": 7390, "total_steps": 10798, "loss": 1.9459, "reward": null, "learning_rate": 0.00022678235849813645, "epoch": 1.37, "percentage": 68.44, "elapsed_time": "5:04:31", "remaining_time": "2:20:25"} +{"current_steps": 7390, "total_steps": 10798, "loss": 1.9459, "reward": null, "learning_rate": 0.00022678235849813645, "epoch": 1.37, "percentage": 68.44, "elapsed_time": "4:58:26", "remaining_time": "2:17:37"} +{"current_steps": 7390, "total_steps": 10798, "loss": 1.9459, "reward": null, "learning_rate": 0.00022678235849813645, "epoch": 1.37, "percentage": 68.44, "elapsed_time": "4:58:27", "remaining_time": "2:17:38"} +{"current_steps": 7390, "total_steps": 10798, "loss": 1.9459, "reward": null, "learning_rate": 0.00022678235849813645, "epoch": 1.37, "percentage": 68.44, "elapsed_time": "4:58:29", "remaining_time": "2:17:39"} +{"current_steps": 7400, "total_steps": 10798, "loss": 1.9302, "reward": null, "learning_rate": 0.00022556519464625807, "epoch": 1.37, "percentage": 68.53, "elapsed_time": "5:04:55", "remaining_time": "2:20:00"} +{"current_steps": 7400, "total_steps": 10798, "loss": 1.9302, "reward": null, "learning_rate": 0.00022556519464625807, "epoch": 1.37, "percentage": 68.53, "elapsed_time": "4:58:52", "remaining_time": "2:17:14"} +{"current_steps": 7400, "total_steps": 10798, "loss": 1.9302, "reward": null, "learning_rate": 0.00022556519464625807, "epoch": 1.37, "percentage": 68.53, "elapsed_time": "4:58:50", "remaining_time": "2:17:13"} +{"current_steps": 7400, "total_steps": 10798, "loss": 1.9302, "reward": null, "learning_rate": 0.00022556519464625807, "epoch": 1.37, "percentage": 68.53, "elapsed_time": "4:58:53", "remaining_time": "2:17:15"} +{"current_steps": 7410, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.00022435035380921321, "epoch": 1.37, "percentage": 68.62, "elapsed_time": "5:05:19", "remaining_time": "2:19:36"} +{"current_steps": 7410, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.00022435035380921321, "epoch": 1.37, "percentage": 68.62, "elapsed_time": "4:59:16", "remaining_time": "2:16:50"} +{"current_steps": 7410, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.00022435035380921321, "epoch": 1.37, "percentage": 68.62, "elapsed_time": "4:59:18", "remaining_time": "2:16:50"} +{"current_steps": 7410, "total_steps": 10798, "loss": 1.9345, "reward": null, "learning_rate": 0.00022435035380921321, "epoch": 1.37, "percentage": 68.62, "elapsed_time": "4:59:14", "remaining_time": "2:16:49"} +{"current_steps": 7420, "total_steps": 10798, "loss": 1.9304, "reward": null, "learning_rate": 0.0002231378462702935, "epoch": 1.37, "percentage": 68.72, "elapsed_time": "5:05:44", "remaining_time": "2:19:11"} +{"current_steps": 7420, "total_steps": 10798, "loss": 1.9304, "reward": null, "learning_rate": 0.0002231378462702935, "epoch": 1.37, "percentage": 68.72, "elapsed_time": "4:59:39", "remaining_time": "2:16:25"} +{"current_steps": 7420, "total_steps": 10798, "loss": 1.9304, "reward": null, "learning_rate": 0.0002231378462702935, "epoch": 1.37, "percentage": 68.72, "elapsed_time": "4:59:41", "remaining_time": "2:16:26"} +{"current_steps": 7420, "total_steps": 10798, "loss": 1.9304, "reward": null, "learning_rate": 0.0002231378462702935, "epoch": 1.37, "percentage": 68.72, "elapsed_time": "4:59:43", "remaining_time": "2:16:26"} +{"current_steps": 7430, "total_steps": 10798, "loss": 1.9457, "reward": null, "learning_rate": 0.00022192768229304107, "epoch": 1.38, "percentage": 68.81, "elapsed_time": "5:00:03", "remaining_time": "2:16:01"} +{"current_steps": 7430, "total_steps": 10798, "loss": 1.9457, "reward": null, "learning_rate": 0.00022192768229304107, "epoch": 1.38, "percentage": 68.81, "elapsed_time": "5:00:06", "remaining_time": "2:16:02"} +{"current_steps": 7430, "total_steps": 10798, "loss": 1.9457, "reward": null, "learning_rate": 0.00022192768229304107, "epoch": 1.38, "percentage": 68.81, "elapsed_time": "5:00:05", "remaining_time": "2:16:01"} +{"current_steps": 7430, "total_steps": 10798, "loss": 1.9457, "reward": null, "learning_rate": 0.00022192768229304107, "epoch": 1.38, "percentage": 68.81, "elapsed_time": "5:06:08", "remaining_time": "2:18:46"} +{"current_steps": 7440, "total_steps": 10798, "loss": 1.9395, "reward": null, "learning_rate": 0.0002207198721211593, "epoch": 1.38, "percentage": 68.9, "elapsed_time": "5:00:28", "remaining_time": "2:15:36"} +{"current_steps": 7440, "total_steps": 10798, "loss": 1.9395, "reward": null, "learning_rate": 0.0002207198721211593, "epoch": 1.38, "percentage": 68.9, "elapsed_time": "5:00:31", "remaining_time": "2:15:38"} +{"current_steps": 7440, "total_steps": 10798, "loss": 1.9395, "reward": null, "learning_rate": 0.0002207198721211593, "epoch": 1.38, "percentage": 68.9, "elapsed_time": "5:06:33", "remaining_time": "2:18:21"} +{"current_steps": 7440, "total_steps": 10798, "loss": 1.9395, "reward": null, "learning_rate": 0.0002207198721211593, "epoch": 1.38, "percentage": 68.9, "elapsed_time": "5:00:29", "remaining_time": "2:15:37"} +{"current_steps": 7450, "total_steps": 10798, "loss": 1.9867, "reward": null, "learning_rate": 0.00021951442597842785, "epoch": 1.38, "percentage": 68.99, "elapsed_time": "5:00:52", "remaining_time": "2:15:12"} +{"current_steps": 7450, "total_steps": 10798, "loss": 1.9867, "reward": null, "learning_rate": 0.00021951442597842785, "epoch": 1.38, "percentage": 68.99, "elapsed_time": "5:06:57", "remaining_time": "2:17:56"} +{"current_steps": 7450, "total_steps": 10798, "loss": 1.9867, "reward": null, "learning_rate": 0.00021951442597842785, "epoch": 1.38, "percentage": 68.99, "elapsed_time": "5:00:54", "remaining_time": "2:15:13"} +{"current_steps": 7450, "total_steps": 10798, "loss": 1.9867, "reward": null, "learning_rate": 0.00021951442597842785, "epoch": 1.38, "percentage": 68.99, "elapsed_time": "5:00:55", "remaining_time": "2:15:14"} +{"current_steps": 7460, "total_steps": 10798, "loss": 1.9217, "reward": null, "learning_rate": 0.00021831135406861558, "epoch": 1.38, "percentage": 69.09, "elapsed_time": "5:07:22", "remaining_time": "2:17:32"} +{"current_steps": 7460, "total_steps": 10798, "loss": 1.9217, "reward": null, "learning_rate": 0.00021831135406861558, "epoch": 1.38, "percentage": 69.09, "elapsed_time": "5:01:18", "remaining_time": "2:14:49"} +{"current_steps": 7460, "total_steps": 10798, "loss": 1.9217, "reward": null, "learning_rate": 0.00021831135406861558, "epoch": 1.38, "percentage": 69.09, "elapsed_time": "5:01:21", "remaining_time": "2:14:50"} +{"current_steps": 7460, "total_steps": 10798, "loss": 1.9217, "reward": null, "learning_rate": 0.00021831135406861558, "epoch": 1.38, "percentage": 69.09, "elapsed_time": "5:01:19", "remaining_time": "2:14:49"} +{"current_steps": 7470, "total_steps": 10798, "loss": 1.991, "reward": null, "learning_rate": 0.00021711066657539342, "epoch": 1.38, "percentage": 69.18, "elapsed_time": "5:07:48", "remaining_time": "2:17:08"} +{"current_steps": 7470, "total_steps": 10798, "loss": 1.991, "reward": null, "learning_rate": 0.00021711066657539342, "epoch": 1.38, "percentage": 69.18, "elapsed_time": "5:01:47", "remaining_time": "2:14:27"} +{"current_steps": 7470, "total_steps": 10798, "loss": 1.991, "reward": null, "learning_rate": 0.00021711066657539342, "epoch": 1.38, "percentage": 69.18, "elapsed_time": "5:01:45", "remaining_time": "2:14:26"} +{"current_steps": 7470, "total_steps": 10798, "loss": 1.991, "reward": null, "learning_rate": 0.00021711066657539342, "epoch": 1.38, "percentage": 69.18, "elapsed_time": "5:01:43", "remaining_time": "2:14:25"} +{"current_steps": 7480, "total_steps": 10798, "loss": 1.9492, "reward": null, "learning_rate": 0.00021591237366225008, "epoch": 1.39, "percentage": 69.27, "elapsed_time": "5:02:09", "remaining_time": "2:14:01"} +{"current_steps": 7480, "total_steps": 10798, "loss": 1.9492, "reward": null, "learning_rate": 0.00021591237366225008, "epoch": 1.39, "percentage": 69.27, "elapsed_time": "5:02:11", "remaining_time": "2:14:02"} +{"current_steps": 7480, "total_steps": 10798, "loss": 1.9492, "reward": null, "learning_rate": 0.00021591237366225008, "epoch": 1.39, "percentage": 69.27, "elapsed_time": "5:02:07", "remaining_time": "2:14:01"} +{"current_steps": 7480, "total_steps": 10798, "loss": 1.9492, "reward": null, "learning_rate": 0.00021591237366225008, "epoch": 1.39, "percentage": 69.27, "elapsed_time": "5:08:12", "remaining_time": "2:16:43"} +{"current_steps": 7490, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 0.00021471648547240365, "epoch": 1.39, "percentage": 69.36, "elapsed_time": "5:08:37", "remaining_time": "2:16:18"} +{"current_steps": 7490, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 0.00021471648547240365, "epoch": 1.39, "percentage": 69.36, "elapsed_time": "5:02:33", "remaining_time": "2:13:37"} +{"current_steps": 7490, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 0.00021471648547240365, "epoch": 1.39, "percentage": 69.36, "elapsed_time": "5:02:35", "remaining_time": "2:13:38"} +{"current_steps": 7490, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 0.00021471648547240365, "epoch": 1.39, "percentage": 69.36, "elapsed_time": "5:02:32", "remaining_time": "2:13:37"} +{"current_steps": 7500, "total_steps": 10798, "loss": 1.9436, "reward": null, "learning_rate": 0.00021352301212871762, "epoch": 1.39, "percentage": 69.46, "elapsed_time": "5:02:57", "remaining_time": "2:13:13"} +{"current_steps": 7500, "total_steps": 10798, "loss": 1.9436, "reward": null, "learning_rate": 0.00021352301212871762, "epoch": 1.39, "percentage": 69.46, "elapsed_time": "5:09:02", "remaining_time": "2:15:53"} +{"current_steps": 7500, "total_steps": 10798, "loss": 1.9436, "reward": null, "learning_rate": 0.00021352301212871762, "epoch": 1.39, "percentage": 69.46, "elapsed_time": "5:02:59", "remaining_time": "2:13:14"} +{"current_steps": 7500, "total_steps": 10798, "loss": 1.9436, "reward": null, "learning_rate": 0.00021352301212871762, "epoch": 1.39, "percentage": 69.46, "elapsed_time": "5:03:01", "remaining_time": "2:13:14"} +{"current_steps": 7510, "total_steps": 10798, "loss": 1.9267, "reward": null, "learning_rate": 0.00021233196373361397, "epoch": 1.39, "percentage": 69.55, "elapsed_time": "5:03:21", "remaining_time": "2:12:49"} +{"current_steps": 7510, "total_steps": 10798, "loss": 1.9267, "reward": null, "learning_rate": 0.00021233196373361397, "epoch": 1.39, "percentage": 69.55, "elapsed_time": "5:09:26", "remaining_time": "2:15:28"} +{"current_steps": 7510, "total_steps": 10798, "loss": 1.9267, "reward": null, "learning_rate": 0.00021233196373361397, "epoch": 1.39, "percentage": 69.55, "elapsed_time": "5:03:25", "remaining_time": "2:12:50"} +{"current_steps": 7510, "total_steps": 10798, "loss": 1.9267, "reward": null, "learning_rate": 0.00021233196373361397, "epoch": 1.39, "percentage": 69.55, "elapsed_time": "5:03:23", "remaining_time": "2:12:49"} +{"current_steps": 7520, "total_steps": 10798, "loss": 1.9483, "reward": null, "learning_rate": 0.00021114335036898852, "epoch": 1.39, "percentage": 69.64, "elapsed_time": "5:03:48", "remaining_time": "2:12:25"} +{"current_steps": 7520, "total_steps": 10798, "loss": 1.9483, "reward": null, "learning_rate": 0.00021114335036898852, "epoch": 1.39, "percentage": 69.64, "elapsed_time": "5:09:51", "remaining_time": "2:15:04"} +{"current_steps": 7520, "total_steps": 10798, "loss": 1.9483, "reward": null, "learning_rate": 0.00021114335036898852, "epoch": 1.39, "percentage": 69.64, "elapsed_time": "5:03:46", "remaining_time": "2:12:25"} +{"current_steps": 7520, "total_steps": 10798, "loss": 1.9483, "reward": null, "learning_rate": 0.00021114335036898852, "epoch": 1.39, "percentage": 69.64, "elapsed_time": "5:03:49", "remaining_time": "2:12:26"} +{"current_steps": 7530, "total_steps": 10798, "loss": 1.9485, "reward": null, "learning_rate": 0.0002099571820961252, "epoch": 1.39, "percentage": 69.74, "elapsed_time": "5:10:15", "remaining_time": "2:14:38"} +{"current_steps": 7530, "total_steps": 10798, "loss": 1.9485, "reward": null, "learning_rate": 0.0002099571820961252, "epoch": 1.39, "percentage": 69.74, "elapsed_time": "5:04:10", "remaining_time": "2:12:00"} +{"current_steps": 7530, "total_steps": 10798, "loss": 1.9485, "reward": null, "learning_rate": 0.0002099571820961252, "epoch": 1.39, "percentage": 69.74, "elapsed_time": "5:04:13", "remaining_time": "2:12:02"} +{"current_steps": 7530, "total_steps": 10798, "loss": 1.9485, "reward": null, "learning_rate": 0.0002099571820961252, "epoch": 1.39, "percentage": 69.74, "elapsed_time": "5:04:12", "remaining_time": "2:12:01"} +{"current_steps": 7540, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.00020877346895561082, "epoch": 1.4, "percentage": 69.83, "elapsed_time": "5:10:39", "remaining_time": "2:14:14"} +{"current_steps": 7540, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.00020877346895561082, "epoch": 1.4, "percentage": 69.83, "elapsed_time": "5:04:36", "remaining_time": "2:11:37"} +{"current_steps": 7540, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.00020877346895561082, "epoch": 1.4, "percentage": 69.83, "elapsed_time": "5:04:34", "remaining_time": "2:11:36"} +{"current_steps": 7540, "total_steps": 10798, "loss": 1.9607, "reward": null, "learning_rate": 0.00020877346895561082, "epoch": 1.4, "percentage": 69.83, "elapsed_time": "5:04:38", "remaining_time": "2:11:37"} +{"current_steps": 7550, "total_steps": 10798, "loss": 1.9665, "reward": null, "learning_rate": 0.00020759222096725034, "epoch": 1.4, "percentage": 69.92, "elapsed_time": "5:11:04", "remaining_time": "2:13:49"} +{"current_steps": 7550, "total_steps": 10798, "loss": 1.9665, "reward": null, "learning_rate": 0.00020759222096725034, "epoch": 1.4, "percentage": 69.92, "elapsed_time": "5:04:59", "remaining_time": "2:11:12"} +{"current_steps": 7550, "total_steps": 10798, "loss": 1.9665, "reward": null, "learning_rate": 0.00020759222096725034, "epoch": 1.4, "percentage": 69.92, "elapsed_time": "5:05:03", "remaining_time": "2:11:14"} +{"current_steps": 7550, "total_steps": 10798, "loss": 1.9665, "reward": null, "learning_rate": 0.00020759222096725034, "epoch": 1.4, "percentage": 69.92, "elapsed_time": "5:05:01", "remaining_time": "2:11:13"} +{"current_steps": 7560, "total_steps": 10798, "loss": 1.9202, "reward": null, "learning_rate": 0.0002064134481299814, "epoch": 1.4, "percentage": 70.01, "elapsed_time": "5:11:27", "remaining_time": "2:13:24"} +{"current_steps": 7560, "total_steps": 10798, "loss": 1.9202, "reward": null, "learning_rate": 0.0002064134481299814, "epoch": 1.4, "percentage": 70.01, "elapsed_time": "5:05:26", "remaining_time": "2:10:49"} +{"current_steps": 7560, "total_steps": 10798, "loss": 1.9202, "reward": null, "learning_rate": 0.0002064134481299814, "epoch": 1.4, "percentage": 70.01, "elapsed_time": "5:05:22", "remaining_time": "2:10:47"} +{"current_steps": 7560, "total_steps": 10798, "loss": 1.9202, "reward": null, "learning_rate": 0.0002064134481299814, "epoch": 1.4, "percentage": 70.01, "elapsed_time": "5:05:24", "remaining_time": "2:10:48"} +{"current_steps": 7570, "total_steps": 10798, "loss": 1.9375, "reward": null, "learning_rate": 0.00020523716042179075, "epoch": 1.4, "percentage": 70.11, "elapsed_time": "5:11:51", "remaining_time": "2:12:59"} +{"current_steps": 7570, "total_steps": 10798, "loss": 1.9375, "reward": null, "learning_rate": 0.00020523716042179075, "epoch": 1.4, "percentage": 70.11, "elapsed_time": "5:05:47", "remaining_time": "2:10:23"} +{"current_steps": 7570, "total_steps": 10798, "loss": 1.9375, "reward": null, "learning_rate": 0.00020523716042179075, "epoch": 1.4, "percentage": 70.11, "elapsed_time": "5:05:50", "remaining_time": "2:10:25"} +{"current_steps": 7570, "total_steps": 10798, "loss": 1.9375, "reward": null, "learning_rate": 0.00020523716042179075, "epoch": 1.4, "percentage": 70.11, "elapsed_time": "5:05:48", "remaining_time": "2:10:24"} +{"current_steps": 7580, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.00020406336779962888, "epoch": 1.4, "percentage": 70.2, "elapsed_time": "5:12:17", "remaining_time": "2:12:34"} +{"current_steps": 7580, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.00020406336779962888, "epoch": 1.4, "percentage": 70.2, "elapsed_time": "5:06:12", "remaining_time": "2:09:59"} +{"current_steps": 7580, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.00020406336779962888, "epoch": 1.4, "percentage": 70.2, "elapsed_time": "5:06:14", "remaining_time": "2:10:00"} +{"current_steps": 7580, "total_steps": 10798, "loss": 1.9406, "reward": null, "learning_rate": 0.00020406336779962888, "epoch": 1.4, "percentage": 70.2, "elapsed_time": "5:06:15", "remaining_time": "2:10:01"} +{"current_steps": 7590, "total_steps": 10798, "loss": 1.9357, "reward": null, "learning_rate": 0.00020289208019932635, "epoch": 1.41, "percentage": 70.29, "elapsed_time": "5:12:43", "remaining_time": "2:12:10"} +{"current_steps": 7590, "total_steps": 10798, "loss": 1.9357, "reward": null, "learning_rate": 0.00020289208019932635, "epoch": 1.41, "percentage": 70.29, "elapsed_time": "5:06:38", "remaining_time": "2:09:36"} +{"current_steps": 7590, "total_steps": 10798, "loss": 1.9357, "reward": null, "learning_rate": 0.00020289208019932635, "epoch": 1.41, "percentage": 70.29, "elapsed_time": "5:06:41", "remaining_time": "2:09:37"} +{"current_steps": 7590, "total_steps": 10798, "loss": 1.9357, "reward": null, "learning_rate": 0.00020289208019932635, "epoch": 1.41, "percentage": 70.29, "elapsed_time": "5:06:39", "remaining_time": "2:09:36"} +{"current_steps": 7600, "total_steps": 10798, "loss": 1.9432, "reward": null, "learning_rate": 0.0002017233075355089, "epoch": 1.41, "percentage": 70.38, "elapsed_time": "5:07:03", "remaining_time": "2:09:12"} +{"current_steps": 7600, "total_steps": 10798, "loss": 1.9432, "reward": null, "learning_rate": 0.0002017233075355089, "epoch": 1.41, "percentage": 70.38, "elapsed_time": "5:13:08", "remaining_time": "2:11:45"} +{"current_steps": 7600, "total_steps": 10798, "loss": 1.9432, "reward": null, "learning_rate": 0.0002017233075355089, "epoch": 1.41, "percentage": 70.38, "elapsed_time": "5:07:06", "remaining_time": "2:09:13"} +{"current_steps": 7600, "total_steps": 10798, "loss": 1.9432, "reward": null, "learning_rate": 0.0002017233075355089, "epoch": 1.41, "percentage": 70.38, "elapsed_time": "5:07:04", "remaining_time": "2:09:13"} +{"current_steps": 7610, "total_steps": 10798, "loss": 1.962, "reward": null, "learning_rate": 0.0002005570597015145, "epoch": 1.41, "percentage": 70.48, "elapsed_time": "5:07:30", "remaining_time": "2:08:49"} +{"current_steps": 7610, "total_steps": 10798, "loss": 1.962, "reward": null, "learning_rate": 0.0002005570597015145, "epoch": 1.41, "percentage": 70.48, "elapsed_time": "5:13:33", "remaining_time": "2:11:21"} +{"current_steps": 7610, "total_steps": 10798, "loss": 1.962, "reward": null, "learning_rate": 0.0002005570597015145, "epoch": 1.41, "percentage": 70.48, "elapsed_time": "5:07:28", "remaining_time": "2:08:48"} +{"current_steps": 7610, "total_steps": 10798, "loss": 1.962, "reward": null, "learning_rate": 0.0002005570597015145, "epoch": 1.41, "percentage": 70.48, "elapsed_time": "5:07:31", "remaining_time": "2:08:49"} +{"current_steps": 7620, "total_steps": 10798, "loss": 1.9237, "reward": null, "learning_rate": 0.00019939334656930892, "epoch": 1.41, "percentage": 70.57, "elapsed_time": "5:13:56", "remaining_time": "2:10:56"} +{"current_steps": 7620, "total_steps": 10798, "loss": 1.9237, "reward": null, "learning_rate": 0.00019939334656930892, "epoch": 1.41, "percentage": 70.57, "elapsed_time": "5:07:55", "remaining_time": "2:08:25"} +{"current_steps": 7620, "total_steps": 10798, "loss": 1.9237, "reward": null, "learning_rate": 0.00019939334656930892, "epoch": 1.41, "percentage": 70.57, "elapsed_time": "5:07:53", "remaining_time": "2:08:24"} +{"current_steps": 7620, "total_steps": 10798, "loss": 1.9237, "reward": null, "learning_rate": 0.00019939334656930892, "epoch": 1.41, "percentage": 70.57, "elapsed_time": "5:07:52", "remaining_time": "2:08:24"} +{"current_steps": 7630, "total_steps": 10798, "loss": 1.9688, "reward": null, "learning_rate": 0.00019823217798940247, "epoch": 1.41, "percentage": 70.66, "elapsed_time": "5:14:22", "remaining_time": "2:10:31"} +{"current_steps": 7630, "total_steps": 10798, "loss": 1.9688, "reward": null, "learning_rate": 0.00019823217798940247, "epoch": 1.41, "percentage": 70.66, "elapsed_time": "5:08:20", "remaining_time": "2:08:01"} +{"current_steps": 7630, "total_steps": 10798, "loss": 1.9688, "reward": null, "learning_rate": 0.00019823217798940247, "epoch": 1.41, "percentage": 70.66, "elapsed_time": "5:08:19", "remaining_time": "2:08:00"} +{"current_steps": 7630, "total_steps": 10798, "loss": 1.9688, "reward": null, "learning_rate": 0.00019823217798940247, "epoch": 1.41, "percentage": 70.66, "elapsed_time": "5:08:17", "remaining_time": "2:08:00"} +{"current_steps": 7640, "total_steps": 10798, "loss": 1.9524, "reward": null, "learning_rate": 0.00019707356379076668, "epoch": 1.42, "percentage": 70.75, "elapsed_time": "5:08:43", "remaining_time": "2:07:36"} +{"current_steps": 7640, "total_steps": 10798, "loss": 1.9524, "reward": null, "learning_rate": 0.00019707356379076668, "epoch": 1.42, "percentage": 70.75, "elapsed_time": "5:08:41", "remaining_time": "2:07:36"} +{"current_steps": 7640, "total_steps": 10798, "loss": 1.9524, "reward": null, "learning_rate": 0.00019707356379076668, "epoch": 1.42, "percentage": 70.75, "elapsed_time": "5:08:45", "remaining_time": "2:07:37"} +{"current_steps": 7640, "total_steps": 10798, "loss": 1.9524, "reward": null, "learning_rate": 0.00019707356379076668, "epoch": 1.42, "percentage": 70.75, "elapsed_time": "5:14:46", "remaining_time": "2:10:06"} +{"current_steps": 7650, "total_steps": 10798, "loss": 1.981, "reward": null, "learning_rate": 0.00019591751378075035, "epoch": 1.42, "percentage": 70.85, "elapsed_time": "5:15:12", "remaining_time": "2:09:42"} +{"current_steps": 7650, "total_steps": 10798, "loss": 1.981, "reward": null, "learning_rate": 0.00019591751378075035, "epoch": 1.42, "percentage": 70.85, "elapsed_time": "5:09:07", "remaining_time": "2:07:12"} +{"current_steps": 7650, "total_steps": 10798, "loss": 1.981, "reward": null, "learning_rate": 0.00019591751378075035, "epoch": 1.42, "percentage": 70.85, "elapsed_time": "5:09:08", "remaining_time": "2:07:12"} +{"current_steps": 7650, "total_steps": 10798, "loss": 1.981, "reward": null, "learning_rate": 0.00019591751378075035, "epoch": 1.42, "percentage": 70.85, "elapsed_time": "5:09:10", "remaining_time": "2:07:13"} +{"current_steps": 7660, "total_steps": 10798, "loss": 1.9405, "reward": null, "learning_rate": 0.00019476403774499774, "epoch": 1.42, "percentage": 70.94, "elapsed_time": "5:15:37", "remaining_time": "2:09:17"} +{"current_steps": 7660, "total_steps": 10798, "loss": 1.9405, "reward": null, "learning_rate": 0.00019476403774499774, "epoch": 1.42, "percentage": 70.94, "elapsed_time": "5:09:32", "remaining_time": "2:06:48"} +{"current_steps": 7660, "total_steps": 10798, "loss": 1.9405, "reward": null, "learning_rate": 0.00019476403774499774, "epoch": 1.42, "percentage": 70.94, "elapsed_time": "5:09:33", "remaining_time": "2:06:48"} +{"current_steps": 7660, "total_steps": 10798, "loss": 1.9405, "reward": null, "learning_rate": 0.00019476403774499774, "epoch": 1.42, "percentage": 70.94, "elapsed_time": "5:09:35", "remaining_time": "2:06:49"} +{"current_steps": 7670, "total_steps": 10798, "loss": 1.9, "reward": null, "learning_rate": 0.0001936131454473649, "epoch": 1.42, "percentage": 71.03, "elapsed_time": "5:16:02", "remaining_time": "2:08:53"} +{"current_steps": 7670, "total_steps": 10798, "loss": 1.9, "reward": null, "learning_rate": 0.0001936131454473649, "epoch": 1.42, "percentage": 71.03, "elapsed_time": "5:10:01", "remaining_time": "2:06:25"} +{"current_steps": 7670, "total_steps": 10798, "loss": 1.9, "reward": null, "learning_rate": 0.0001936131454473649, "epoch": 1.42, "percentage": 71.03, "elapsed_time": "5:09:59", "remaining_time": "2:06:25"} +{"current_steps": 7670, "total_steps": 10798, "loss": 1.9, "reward": null, "learning_rate": 0.0001936131454473649, "epoch": 1.42, "percentage": 71.03, "elapsed_time": "5:09:57", "remaining_time": "2:06:24"} +{"current_steps": 7680, "total_steps": 10798, "loss": 1.8852, "reward": null, "learning_rate": 0.00019246484662983733, "epoch": 1.42, "percentage": 71.12, "elapsed_time": "5:10:22", "remaining_time": "2:06:00"} +{"current_steps": 7680, "total_steps": 10798, "loss": 1.8852, "reward": null, "learning_rate": 0.00019246484662983733, "epoch": 1.42, "percentage": 71.12, "elapsed_time": "5:10:25", "remaining_time": "2:06:01"} +{"current_steps": 7680, "total_steps": 10798, "loss": 1.8852, "reward": null, "learning_rate": 0.00019246484662983733, "epoch": 1.42, "percentage": 71.12, "elapsed_time": "5:10:24", "remaining_time": "2:06:01"} +{"current_steps": 7680, "total_steps": 10798, "loss": 1.8852, "reward": null, "learning_rate": 0.00019246484662983733, "epoch": 1.42, "percentage": 71.12, "elapsed_time": "5:16:27", "remaining_time": "2:08:28"} +{"current_steps": 7690, "total_steps": 10798, "loss": 1.9447, "reward": null, "learning_rate": 0.00019131915101244752, "epoch": 1.42, "percentage": 71.22, "elapsed_time": "5:16:51", "remaining_time": "2:08:03"} +{"current_steps": 7690, "total_steps": 10798, "loss": 1.9447, "reward": null, "learning_rate": 0.00019131915101244752, "epoch": 1.42, "percentage": 71.22, "elapsed_time": "5:10:47", "remaining_time": "2:05:36"} +{"current_steps": 7690, "total_steps": 10798, "loss": 1.9447, "reward": null, "learning_rate": 0.00019131915101244752, "epoch": 1.42, "percentage": 71.22, "elapsed_time": "5:10:50", "remaining_time": "2:05:37"} +{"current_steps": 7690, "total_steps": 10798, "loss": 1.9447, "reward": null, "learning_rate": 0.00019131915101244752, "epoch": 1.42, "percentage": 71.22, "elapsed_time": "5:10:48", "remaining_time": "2:05:37"} +{"current_steps": 7700, "total_steps": 10798, "loss": 1.9221, "reward": null, "learning_rate": 0.00019017606829319205, "epoch": 1.43, "percentage": 71.31, "elapsed_time": "5:11:12", "remaining_time": "2:05:12"} +{"current_steps": 7700, "total_steps": 10798, "loss": 1.9221, "reward": null, "learning_rate": 0.00019017606829319205, "epoch": 1.43, "percentage": 71.31, "elapsed_time": "5:17:16", "remaining_time": "2:07:39"} +{"current_steps": 7700, "total_steps": 10798, "loss": 1.9221, "reward": null, "learning_rate": 0.00019017606829319205, "epoch": 1.43, "percentage": 71.31, "elapsed_time": "5:11:15", "remaining_time": "2:05:13"} +{"current_steps": 7700, "total_steps": 10798, "loss": 1.9221, "reward": null, "learning_rate": 0.00019017606829319205, "epoch": 1.43, "percentage": 71.31, "elapsed_time": "5:11:13", "remaining_time": "2:05:13"} +{"current_steps": 7710, "total_steps": 10798, "loss": 1.9481, "reward": null, "learning_rate": 0.00018903560814795086, "epoch": 1.43, "percentage": 71.4, "elapsed_time": "5:11:41", "remaining_time": "2:04:50"} +{"current_steps": 7710, "total_steps": 10798, "loss": 1.9481, "reward": null, "learning_rate": 0.00018903560814795086, "epoch": 1.43, "percentage": 71.4, "elapsed_time": "5:11:39", "remaining_time": "2:04:49"} +{"current_steps": 7710, "total_steps": 10798, "loss": 1.9481, "reward": null, "learning_rate": 0.00018903560814795086, "epoch": 1.43, "percentage": 71.4, "elapsed_time": "5:17:42", "remaining_time": "2:07:15"} +{"current_steps": 7710, "total_steps": 10798, "loss": 1.9481, "reward": null, "learning_rate": 0.00018903560814795086, "epoch": 1.43, "percentage": 71.4, "elapsed_time": "5:11:38", "remaining_time": "2:04:48"} +{"current_steps": 7720, "total_steps": 10798, "loss": 1.8919, "reward": null, "learning_rate": 0.00018789778023040355, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "5:12:02", "remaining_time": "2:04:24"} +{"current_steps": 7720, "total_steps": 10798, "loss": 1.8919, "reward": null, "learning_rate": 0.00018789778023040355, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "5:12:06", "remaining_time": "2:04:26"} +{"current_steps": 7720, "total_steps": 10798, "loss": 1.8919, "reward": null, "learning_rate": 0.00018789778023040355, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "5:12:04", "remaining_time": "2:04:25"} +{"current_steps": 7720, "total_steps": 10798, "loss": 1.8919, "reward": null, "learning_rate": 0.00018789778023040355, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "5:18:07", "remaining_time": "2:06:50"} +{"current_steps": 7730, "total_steps": 10798, "loss": 1.94, "reward": null, "learning_rate": 0.0001867625941719499, "epoch": 1.43, "percentage": 71.59, "elapsed_time": "5:18:31", "remaining_time": "2:06:25"} +{"current_steps": 7730, "total_steps": 10798, "loss": 1.94, "reward": null, "learning_rate": 0.0001867625941719499, "epoch": 1.43, "percentage": 71.59, "elapsed_time": "5:12:26", "remaining_time": "2:04:00"} +{"current_steps": 7730, "total_steps": 10798, "loss": 1.94, "reward": null, "learning_rate": 0.0001867625941719499, "epoch": 1.43, "percentage": 71.59, "elapsed_time": "5:12:30", "remaining_time": "2:04:01"} +{"current_steps": 7730, "total_steps": 10798, "loss": 1.94, "reward": null, "learning_rate": 0.0001867625941719499, "epoch": 1.43, "percentage": 71.59, "elapsed_time": "5:12:28", "remaining_time": "2:04:01"} +{"current_steps": 7740, "total_steps": 10798, "loss": 1.9089, "reward": null, "learning_rate": 0.00018563005958162587, "epoch": 1.43, "percentage": 71.68, "elapsed_time": "5:12:53", "remaining_time": "2:03:37"} +{"current_steps": 7740, "total_steps": 10798, "loss": 1.9089, "reward": null, "learning_rate": 0.00018563005958162587, "epoch": 1.43, "percentage": 71.68, "elapsed_time": "5:12:51", "remaining_time": "2:03:36"} +{"current_steps": 7740, "total_steps": 10798, "loss": 1.9089, "reward": null, "learning_rate": 0.00018563005958162587, "epoch": 1.43, "percentage": 71.68, "elapsed_time": "5:12:55", "remaining_time": "2:03:37"} +{"current_steps": 7740, "total_steps": 10798, "loss": 1.9089, "reward": null, "learning_rate": 0.00018563005958162587, "epoch": 1.43, "percentage": 71.68, "elapsed_time": "5:18:56", "remaining_time": "2:06:00"} +{"current_steps": 7750, "total_steps": 10798, "loss": 1.9105, "reward": null, "learning_rate": 0.00018450018604602414, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "5:19:21", "remaining_time": "2:05:35"} +{"current_steps": 7750, "total_steps": 10798, "loss": 1.9105, "reward": null, "learning_rate": 0.00018450018604602414, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "5:13:16", "remaining_time": "2:03:12"} +{"current_steps": 7750, "total_steps": 10798, "loss": 1.9105, "reward": null, "learning_rate": 0.00018450018604602414, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "5:13:19", "remaining_time": "2:03:13"} +{"current_steps": 7750, "total_steps": 10798, "loss": 1.9105, "reward": null, "learning_rate": 0.00018450018604602414, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "5:13:17", "remaining_time": "2:03:13"} +{"current_steps": 7760, "total_steps": 10798, "loss": 1.9568, "reward": null, "learning_rate": 0.0001833729831292123, "epoch": 1.44, "percentage": 71.87, "elapsed_time": "5:19:46", "remaining_time": "2:05:11"} +{"current_steps": 7760, "total_steps": 10798, "loss": 1.9568, "reward": null, "learning_rate": 0.0001833729831292123, "epoch": 1.44, "percentage": 71.87, "elapsed_time": "5:13:41", "remaining_time": "2:02:48"} +{"current_steps": 7760, "total_steps": 10798, "loss": 1.9568, "reward": null, "learning_rate": 0.0001833729831292123, "epoch": 1.44, "percentage": 71.87, "elapsed_time": "5:13:45", "remaining_time": "2:02:49"} +{"current_steps": 7760, "total_steps": 10798, "loss": 1.9568, "reward": null, "learning_rate": 0.0001833729831292123, "epoch": 1.44, "percentage": 71.87, "elapsed_time": "5:13:43", "remaining_time": "2:02:49"} +{"current_steps": 7770, "total_steps": 10798, "loss": 1.9156, "reward": null, "learning_rate": 0.00018224846037265125, "epoch": 1.44, "percentage": 71.96, "elapsed_time": "5:14:07", "remaining_time": "2:02:24"} +{"current_steps": 7770, "total_steps": 10798, "loss": 1.9156, "reward": null, "learning_rate": 0.00018224846037265125, "epoch": 1.44, "percentage": 71.96, "elapsed_time": "5:14:09", "remaining_time": "2:02:25"} +{"current_steps": 7770, "total_steps": 10798, "loss": 1.9156, "reward": null, "learning_rate": 0.00018224846037265125, "epoch": 1.44, "percentage": 71.96, "elapsed_time": "5:14:10", "remaining_time": "2:02:26"} +{"current_steps": 7770, "total_steps": 10798, "loss": 1.9156, "reward": null, "learning_rate": 0.00018224846037265125, "epoch": 1.44, "percentage": 71.96, "elapsed_time": "5:20:12", "remaining_time": "2:04:47"} +{"current_steps": 7780, "total_steps": 10798, "loss": 1.9445, "reward": null, "learning_rate": 0.0001811266272951162, "epoch": 1.44, "percentage": 72.05, "elapsed_time": "5:20:36", "remaining_time": "2:04:22"} +{"current_steps": 7780, "total_steps": 10798, "loss": 1.9445, "reward": null, "learning_rate": 0.0001811266272951162, "epoch": 1.44, "percentage": 72.05, "elapsed_time": "5:14:35", "remaining_time": "2:02:02"} +{"current_steps": 7780, "total_steps": 10798, "loss": 1.9445, "reward": null, "learning_rate": 0.0001811266272951162, "epoch": 1.44, "percentage": 72.05, "elapsed_time": "5:14:33", "remaining_time": "2:02:01"} +{"current_steps": 7780, "total_steps": 10798, "loss": 1.9445, "reward": null, "learning_rate": 0.0001811266272951162, "epoch": 1.44, "percentage": 72.05, "elapsed_time": "5:14:32", "remaining_time": "2:02:00"} +{"current_steps": 7790, "total_steps": 10798, "loss": 1.8871, "reward": null, "learning_rate": 0.0001800074933926138, "epoch": 1.44, "percentage": 72.14, "elapsed_time": "5:21:01", "remaining_time": "2:03:57"} +{"current_steps": 7790, "total_steps": 10798, "loss": 1.8871, "reward": null, "learning_rate": 0.0001800074933926138, "epoch": 1.44, "percentage": 72.14, "elapsed_time": "5:14:59", "remaining_time": "2:01:37"} +{"current_steps": 7790, "total_steps": 10798, "loss": 1.8871, "reward": null, "learning_rate": 0.0001800074933926138, "epoch": 1.44, "percentage": 72.14, "elapsed_time": "5:14:56", "remaining_time": "2:01:36"} +{"current_steps": 7790, "total_steps": 10798, "loss": 1.8871, "reward": null, "learning_rate": 0.0001800074933926138, "epoch": 1.44, "percentage": 72.14, "elapsed_time": "5:14:58", "remaining_time": "2:01:37"} +{"current_steps": 7800, "total_steps": 10798, "loss": 1.9684, "reward": null, "learning_rate": 0.00017889106813830363, "epoch": 1.44, "percentage": 72.24, "elapsed_time": "5:21:26", "remaining_time": "2:03:32"} +{"current_steps": 7800, "total_steps": 10798, "loss": 1.9684, "reward": null, "learning_rate": 0.00017889106813830363, "epoch": 1.44, "percentage": 72.24, "elapsed_time": "5:15:21", "remaining_time": "2:01:12"} +{"current_steps": 7800, "total_steps": 10798, "loss": 1.9684, "reward": null, "learning_rate": 0.00017889106813830363, "epoch": 1.44, "percentage": 72.24, "elapsed_time": "5:15:24", "remaining_time": "2:01:13"} +{"current_steps": 7800, "total_steps": 10798, "loss": 1.9684, "reward": null, "learning_rate": 0.00017889106813830363, "epoch": 1.44, "percentage": 72.24, "elapsed_time": "5:15:22", "remaining_time": "2:01:13"} +{"current_steps": 7810, "total_steps": 10798, "loss": 1.9411, "reward": null, "learning_rate": 0.0001777773609824173, "epoch": 1.45, "percentage": 72.33, "elapsed_time": "5:21:50", "remaining_time": "2:03:08"} +{"current_steps": 7810, "total_steps": 10798, "loss": 1.9411, "reward": null, "learning_rate": 0.0001777773609824173, "epoch": 1.45, "percentage": 72.33, "elapsed_time": "5:15:46", "remaining_time": "2:00:48"} +{"current_steps": 7810, "total_steps": 10798, "loss": 1.9411, "reward": null, "learning_rate": 0.0001777773609824173, "epoch": 1.45, "percentage": 72.33, "elapsed_time": "5:15:47", "remaining_time": "2:00:49"} +{"current_steps": 7810, "total_steps": 10798, "loss": 1.9411, "reward": null, "learning_rate": 0.0001777773609824173, "epoch": 1.45, "percentage": 72.33, "elapsed_time": "5:15:49", "remaining_time": "2:00:49"} +{"current_steps": 7820, "total_steps": 10798, "loss": 1.9295, "reward": null, "learning_rate": 0.00017666638135217783, "epoch": 1.45, "percentage": 72.42, "elapsed_time": "5:16:10", "remaining_time": "2:00:24"} +{"current_steps": 7820, "total_steps": 10798, "loss": 1.9295, "reward": null, "learning_rate": 0.00017666638135217783, "epoch": 1.45, "percentage": 72.42, "elapsed_time": "5:16:12", "remaining_time": "2:00:25"} +{"current_steps": 7820, "total_steps": 10798, "loss": 1.9295, "reward": null, "learning_rate": 0.00017666638135217783, "epoch": 1.45, "percentage": 72.42, "elapsed_time": "5:16:14", "remaining_time": "2:00:25"} +{"current_steps": 7820, "total_steps": 10798, "loss": 1.9295, "reward": null, "learning_rate": 0.00017666638135217783, "epoch": 1.45, "percentage": 72.42, "elapsed_time": "5:22:15", "remaining_time": "2:02:43"} +{"current_steps": 7830, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0001755581386517216, "epoch": 1.45, "percentage": 72.51, "elapsed_time": "5:22:39", "remaining_time": "2:02:18"} +{"current_steps": 7830, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0001755581386517216, "epoch": 1.45, "percentage": 72.51, "elapsed_time": "5:16:38", "remaining_time": "2:00:01"} +{"current_steps": 7830, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0001755581386517216, "epoch": 1.45, "percentage": 72.51, "elapsed_time": "5:16:36", "remaining_time": "2:00:00"} +{"current_steps": 7830, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0001755581386517216, "epoch": 1.45, "percentage": 72.51, "elapsed_time": "5:16:34", "remaining_time": "2:00:00"} +{"current_steps": 7840, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0001744526422620165, "epoch": 1.45, "percentage": 72.61, "elapsed_time": "5:23:03", "remaining_time": "2:01:53"} +{"current_steps": 7840, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0001744526422620165, "epoch": 1.45, "percentage": 72.61, "elapsed_time": "5:16:58", "remaining_time": "1:59:35"} +{"current_steps": 7840, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0001744526422620165, "epoch": 1.45, "percentage": 72.61, "elapsed_time": "5:17:00", "remaining_time": "1:59:36"} +{"current_steps": 7840, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 0.0001744526422620165, "epoch": 1.45, "percentage": 72.61, "elapsed_time": "5:17:02", "remaining_time": "1:59:37"} +{"current_steps": 7850, "total_steps": 10798, "loss": 1.9262, "reward": null, "learning_rate": 0.00017334990154078446, "epoch": 1.45, "percentage": 72.7, "elapsed_time": "5:17:24", "remaining_time": "1:59:12"} +{"current_steps": 7850, "total_steps": 10798, "loss": 1.9262, "reward": null, "learning_rate": 0.00017334990154078446, "epoch": 1.45, "percentage": 72.7, "elapsed_time": "5:17:26", "remaining_time": "1:59:12"} +{"current_steps": 7850, "total_steps": 10798, "loss": 1.9262, "reward": null, "learning_rate": 0.00017334990154078446, "epoch": 1.45, "percentage": 72.7, "elapsed_time": "5:17:23", "remaining_time": "1:59:11"} +{"current_steps": 7850, "total_steps": 10798, "loss": 1.9262, "reward": null, "learning_rate": 0.00017334990154078446, "epoch": 1.45, "percentage": 72.7, "elapsed_time": "5:23:27", "remaining_time": "2:01:28"} +{"current_steps": 7860, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.00017224992582242076, "epoch": 1.46, "percentage": 72.79, "elapsed_time": "5:17:47", "remaining_time": "1:58:47"} +{"current_steps": 7860, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.00017224992582242076, "epoch": 1.46, "percentage": 72.79, "elapsed_time": "5:17:48", "remaining_time": "1:58:47"} +{"current_steps": 7860, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.00017224992582242076, "epoch": 1.46, "percentage": 72.79, "elapsed_time": "5:17:50", "remaining_time": "1:58:48"} +{"current_steps": 7860, "total_steps": 10798, "loss": 1.9554, "reward": null, "learning_rate": 0.00017224992582242076, "epoch": 1.46, "percentage": 72.79, "elapsed_time": "5:23:52", "remaining_time": "2:01:03"} +{"current_steps": 7870, "total_steps": 10798, "loss": 1.9685, "reward": null, "learning_rate": 0.00017115272441791635, "epoch": 1.46, "percentage": 72.88, "elapsed_time": "5:24:16", "remaining_time": "2:00:38"} +{"current_steps": 7870, "total_steps": 10798, "loss": 1.9685, "reward": null, "learning_rate": 0.00017115272441791635, "epoch": 1.46, "percentage": 72.88, "elapsed_time": "5:18:13", "remaining_time": "1:58:23"} +{"current_steps": 7870, "total_steps": 10798, "loss": 1.9685, "reward": null, "learning_rate": 0.00017115272441791635, "epoch": 1.46, "percentage": 72.88, "elapsed_time": "5:18:15", "remaining_time": "1:58:24"} +{"current_steps": 7870, "total_steps": 10798, "loss": 1.9685, "reward": null, "learning_rate": 0.00017115272441791635, "epoch": 1.46, "percentage": 72.88, "elapsed_time": "5:18:11", "remaining_time": "1:58:22"} +{"current_steps": 7880, "total_steps": 10798, "loss": 1.9021, "reward": null, "learning_rate": 0.000170058306614778, "epoch": 1.46, "percentage": 72.98, "elapsed_time": "5:24:40", "remaining_time": "2:00:13"} +{"current_steps": 7880, "total_steps": 10798, "loss": 1.9021, "reward": null, "learning_rate": 0.000170058306614778, "epoch": 1.46, "percentage": 72.98, "elapsed_time": "5:18:35", "remaining_time": "1:57:58"} +{"current_steps": 7880, "total_steps": 10798, "loss": 1.9021, "reward": null, "learning_rate": 0.000170058306614778, "epoch": 1.46, "percentage": 72.98, "elapsed_time": "5:18:38", "remaining_time": "1:57:59"} +{"current_steps": 7880, "total_steps": 10798, "loss": 1.9021, "reward": null, "learning_rate": 0.000170058306614778, "epoch": 1.46, "percentage": 72.98, "elapsed_time": "5:18:36", "remaining_time": "1:57:59"} +{"current_steps": 7890, "total_steps": 10798, "loss": 1.8804, "reward": null, "learning_rate": 0.00016896668167695018, "epoch": 1.46, "percentage": 73.07, "elapsed_time": "5:25:04", "remaining_time": "1:59:48"} +{"current_steps": 7890, "total_steps": 10798, "loss": 1.8804, "reward": null, "learning_rate": 0.00016896668167695018, "epoch": 1.46, "percentage": 73.07, "elapsed_time": "5:19:03", "remaining_time": "1:57:35"} +{"current_steps": 7890, "total_steps": 10798, "loss": 1.8804, "reward": null, "learning_rate": 0.00016896668167695018, "epoch": 1.46, "percentage": 73.07, "elapsed_time": "5:19:01", "remaining_time": "1:57:34"} +{"current_steps": 7890, "total_steps": 10798, "loss": 1.8804, "reward": null, "learning_rate": 0.00016896668167695018, "epoch": 1.46, "percentage": 73.07, "elapsed_time": "5:18:59", "remaining_time": "1:57:34"} +{"current_steps": 7900, "total_steps": 10798, "loss": 1.9164, "reward": null, "learning_rate": 0.00016787785884473665, "epoch": 1.46, "percentage": 73.16, "elapsed_time": "5:25:28", "remaining_time": "1:59:23"} +{"current_steps": 7900, "total_steps": 10798, "loss": 1.9164, "reward": null, "learning_rate": 0.00016787785884473665, "epoch": 1.46, "percentage": 73.16, "elapsed_time": "5:19:27", "remaining_time": "1:57:11"} +{"current_steps": 7900, "total_steps": 10798, "loss": 1.9164, "reward": null, "learning_rate": 0.00016787785884473665, "epoch": 1.46, "percentage": 73.16, "elapsed_time": "5:19:23", "remaining_time": "1:57:09"} +{"current_steps": 7900, "total_steps": 10798, "loss": 1.9164, "reward": null, "learning_rate": 0.00016787785884473665, "epoch": 1.46, "percentage": 73.16, "elapsed_time": "5:19:25", "remaining_time": "1:57:10"} +{"current_steps": 7910, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.00016679184733472163, "epoch": 1.47, "percentage": 73.25, "elapsed_time": "5:25:52", "remaining_time": "1:58:58"} +{"current_steps": 7910, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.00016679184733472163, "epoch": 1.47, "percentage": 73.25, "elapsed_time": "5:19:48", "remaining_time": "1:56:45"} +{"current_steps": 7910, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.00016679184733472163, "epoch": 1.47, "percentage": 73.25, "elapsed_time": "5:19:49", "remaining_time": "1:56:46"} +{"current_steps": 7910, "total_steps": 10798, "loss": 1.9409, "reward": null, "learning_rate": 0.00016679184733472163, "epoch": 1.47, "percentage": 73.25, "elapsed_time": "5:19:51", "remaining_time": "1:56:46"} +{"current_steps": 7920, "total_steps": 10798, "loss": 1.9329, "reward": null, "learning_rate": 0.00016570865633969283, "epoch": 1.47, "percentage": 73.35, "elapsed_time": "5:26:17", "remaining_time": "1:58:34"} +{"current_steps": 7920, "total_steps": 10798, "loss": 1.9329, "reward": null, "learning_rate": 0.00016570865633969283, "epoch": 1.47, "percentage": 73.35, "elapsed_time": "5:20:14", "remaining_time": "1:56:22"} +{"current_steps": 7920, "total_steps": 10798, "loss": 1.9329, "reward": null, "learning_rate": 0.00016570865633969283, "epoch": 1.47, "percentage": 73.35, "elapsed_time": "5:20:16", "remaining_time": "1:56:22"} +{"current_steps": 7920, "total_steps": 10798, "loss": 1.9329, "reward": null, "learning_rate": 0.00016570865633969283, "epoch": 1.47, "percentage": 73.35, "elapsed_time": "5:20:12", "remaining_time": "1:56:21"} +{"current_steps": 7930, "total_steps": 10798, "loss": 1.9518, "reward": null, "learning_rate": 0.00016462829502856286, "epoch": 1.47, "percentage": 73.44, "elapsed_time": "5:26:42", "remaining_time": "1:58:09"} +{"current_steps": 7930, "total_steps": 10798, "loss": 1.9518, "reward": null, "learning_rate": 0.00016462829502856286, "epoch": 1.47, "percentage": 73.44, "elapsed_time": "5:20:38", "remaining_time": "1:55:57"} +{"current_steps": 7930, "total_steps": 10798, "loss": 1.9518, "reward": null, "learning_rate": 0.00016462829502856286, "epoch": 1.47, "percentage": 73.44, "elapsed_time": "5:20:41", "remaining_time": "1:55:58"} +{"current_steps": 7930, "total_steps": 10798, "loss": 1.9518, "reward": null, "learning_rate": 0.00016462829502856286, "epoch": 1.47, "percentage": 73.44, "elapsed_time": "5:20:39", "remaining_time": "1:55:58"} +{"current_steps": 7940, "total_steps": 10798, "loss": 1.9494, "reward": null, "learning_rate": 0.00016355077254629196, "epoch": 1.47, "percentage": 73.53, "elapsed_time": "5:27:06", "remaining_time": "1:57:44"} +{"current_steps": 7940, "total_steps": 10798, "loss": 1.9494, "reward": null, "learning_rate": 0.00016355077254629196, "epoch": 1.47, "percentage": 73.53, "elapsed_time": "5:21:04", "remaining_time": "1:55:34"} +{"current_steps": 7940, "total_steps": 10798, "loss": 1.9494, "reward": null, "learning_rate": 0.00016355077254629196, "epoch": 1.47, "percentage": 73.53, "elapsed_time": "5:21:03", "remaining_time": "1:55:33"} +{"current_steps": 7940, "total_steps": 10798, "loss": 1.9494, "reward": null, "learning_rate": 0.00016355077254629196, "epoch": 1.47, "percentage": 73.53, "elapsed_time": "5:21:01", "remaining_time": "1:55:33"} +{"current_steps": 7950, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 0.00016247609801381003, "epoch": 1.47, "percentage": 73.62, "elapsed_time": "5:21:26", "remaining_time": "1:55:09"} +{"current_steps": 7950, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 0.00016247609801381003, "epoch": 1.47, "percentage": 73.62, "elapsed_time": "5:21:29", "remaining_time": "1:55:10"} +{"current_steps": 7950, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 0.00016247609801381003, "epoch": 1.47, "percentage": 73.62, "elapsed_time": "5:21:28", "remaining_time": "1:55:09"} +{"current_steps": 7950, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 0.00016247609801381003, "epoch": 1.47, "percentage": 73.62, "elapsed_time": "5:27:31", "remaining_time": "1:57:19"} +{"current_steps": 7960, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 0.00016140428052794042, "epoch": 1.47, "percentage": 73.72, "elapsed_time": "5:21:51", "remaining_time": "1:54:45"} +{"current_steps": 7960, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 0.00016140428052794042, "epoch": 1.47, "percentage": 73.72, "elapsed_time": "5:21:53", "remaining_time": "1:54:45"} +{"current_steps": 7960, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 0.00016140428052794042, "epoch": 1.47, "percentage": 73.72, "elapsed_time": "5:21:55", "remaining_time": "1:54:46"} +{"current_steps": 7960, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 0.00016140428052794042, "epoch": 1.47, "percentage": 73.72, "elapsed_time": "5:27:56", "remaining_time": "1:56:55"} +{"current_steps": 7970, "total_steps": 10798, "loss": 1.9528, "reward": null, "learning_rate": 0.00016033532916132203, "epoch": 1.48, "percentage": 73.81, "elapsed_time": "5:22:16", "remaining_time": "1:54:21"} +{"current_steps": 7970, "total_steps": 10798, "loss": 1.9528, "reward": null, "learning_rate": 0.00016033532916132203, "epoch": 1.48, "percentage": 73.81, "elapsed_time": "5:22:18", "remaining_time": "1:54:21"} +{"current_steps": 7970, "total_steps": 10798, "loss": 1.9528, "reward": null, "learning_rate": 0.00016033532916132203, "epoch": 1.48, "percentage": 73.81, "elapsed_time": "5:28:21", "remaining_time": "1:56:30"} +{"current_steps": 7970, "total_steps": 10798, "loss": 1.9528, "reward": null, "learning_rate": 0.00016033532916132203, "epoch": 1.48, "percentage": 73.81, "elapsed_time": "5:22:20", "remaining_time": "1:54:22"} +{"current_steps": 7980, "total_steps": 10798, "loss": 1.9698, "reward": null, "learning_rate": 0.00015926925296233296, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "5:28:45", "remaining_time": "1:56:05"} +{"current_steps": 7980, "total_steps": 10798, "loss": 1.9698, "reward": null, "learning_rate": 0.00015926925296233296, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "5:22:44", "remaining_time": "1:53:58"} +{"current_steps": 7980, "total_steps": 10798, "loss": 1.9698, "reward": null, "learning_rate": 0.00015926925296233296, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "5:22:42", "remaining_time": "1:53:57"} +{"current_steps": 7980, "total_steps": 10798, "loss": 1.9698, "reward": null, "learning_rate": 0.00015926925296233296, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "5:22:40", "remaining_time": "1:53:56"} +{"current_steps": 7990, "total_steps": 10798, "loss": 1.936, "reward": null, "learning_rate": 0.00015820606095501405, "epoch": 1.48, "percentage": 74.0, "elapsed_time": "5:29:11", "remaining_time": "1:55:41"} +{"current_steps": 7990, "total_steps": 10798, "loss": 1.936, "reward": null, "learning_rate": 0.00015820606095501405, "epoch": 1.48, "percentage": 74.0, "elapsed_time": "5:23:06", "remaining_time": "1:53:33"} +{"current_steps": 7990, "total_steps": 10798, "loss": 1.936, "reward": null, "learning_rate": 0.00015820606095501405, "epoch": 1.48, "percentage": 74.0, "elapsed_time": "5:23:07", "remaining_time": "1:53:33"} +{"current_steps": 7990, "total_steps": 10798, "loss": 1.936, "reward": null, "learning_rate": 0.00015820606095501405, "epoch": 1.48, "percentage": 74.0, "elapsed_time": "5:23:09", "remaining_time": "1:53:34"} +{"current_steps": 8000, "total_steps": 10798, "loss": 1.962, "reward": null, "learning_rate": 0.00015714576213899167, "epoch": 1.48, "percentage": 74.09, "elapsed_time": "5:29:36", "remaining_time": "1:55:16"} +{"current_steps": 8000, "total_steps": 10798, "loss": 1.962, "reward": null, "learning_rate": 0.00015714576213899167, "epoch": 1.48, "percentage": 74.09, "elapsed_time": "5:23:33", "remaining_time": "1:53:09"} +{"current_steps": 8000, "total_steps": 10798, "loss": 1.962, "reward": null, "learning_rate": 0.00015714576213899167, "epoch": 1.48, "percentage": 74.09, "elapsed_time": "5:23:31", "remaining_time": "1:53:09"} +{"current_steps": 8000, "total_steps": 10798, "loss": 1.962, "reward": null, "learning_rate": 0.00015714576213899167, "epoch": 1.48, "percentage": 74.09, "elapsed_time": "5:23:34", "remaining_time": "1:53:10"} +{"current_steps": 8010, "total_steps": 10798, "loss": 1.9439, "reward": null, "learning_rate": 0.00015608836548940252, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "5:30:00", "remaining_time": "1:54:51"} +{"current_steps": 8010, "total_steps": 10798, "loss": 1.9439, "reward": null, "learning_rate": 0.00015608836548940252, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "5:23:57", "remaining_time": "1:52:45"} +{"current_steps": 8010, "total_steps": 10798, "loss": 1.9439, "reward": null, "learning_rate": 0.00015608836548940252, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "5:23:55", "remaining_time": "1:52:44"} +{"current_steps": 8010, "total_steps": 10798, "loss": 1.9439, "reward": null, "learning_rate": 0.00015608836548940252, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "5:23:59", "remaining_time": "1:52:46"} +{"current_steps": 8020, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 0.00015503387995681732, "epoch": 1.49, "percentage": 74.27, "elapsed_time": "5:30:25", "remaining_time": "1:54:27"} +{"current_steps": 8020, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 0.00015503387995681732, "epoch": 1.49, "percentage": 74.27, "elapsed_time": "5:24:22", "remaining_time": "1:52:21"} +{"current_steps": 8020, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 0.00015503387995681732, "epoch": 1.49, "percentage": 74.27, "elapsed_time": "5:24:21", "remaining_time": "1:52:20"} +{"current_steps": 8020, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 0.00015503387995681732, "epoch": 1.49, "percentage": 74.27, "elapsed_time": "5:24:24", "remaining_time": "1:52:22"} +{"current_steps": 8030, "total_steps": 10798, "loss": 1.9029, "reward": null, "learning_rate": 0.0001539823144671648, "epoch": 1.49, "percentage": 74.37, "elapsed_time": "5:30:50", "remaining_time": "1:54:02"} +{"current_steps": 8030, "total_steps": 10798, "loss": 1.9029, "reward": null, "learning_rate": 0.0001539823144671648, "epoch": 1.49, "percentage": 74.37, "elapsed_time": "5:24:45", "remaining_time": "1:51:56"} +{"current_steps": 8030, "total_steps": 10798, "loss": 1.9029, "reward": null, "learning_rate": 0.0001539823144671648, "epoch": 1.49, "percentage": 74.37, "elapsed_time": "5:24:47", "remaining_time": "1:51:57"} +{"current_steps": 8030, "total_steps": 10798, "loss": 1.9029, "reward": null, "learning_rate": 0.0001539823144671648, "epoch": 1.49, "percentage": 74.37, "elapsed_time": "5:24:49", "remaining_time": "1:51:58"} +{"current_steps": 8040, "total_steps": 10798, "loss": 1.928, "reward": null, "learning_rate": 0.00015293367792165664, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "5:31:15", "remaining_time": "1:53:38"} +{"current_steps": 8040, "total_steps": 10798, "loss": 1.928, "reward": null, "learning_rate": 0.00015293367792165664, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "5:25:11", "remaining_time": "1:51:32"} +{"current_steps": 8040, "total_steps": 10798, "loss": 1.928, "reward": null, "learning_rate": 0.00015293367792165664, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "5:25:12", "remaining_time": "1:51:33"} +{"current_steps": 8040, "total_steps": 10798, "loss": 1.928, "reward": null, "learning_rate": 0.00015293367792165664, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "5:25:14", "remaining_time": "1:51:34"} +{"current_steps": 8050, "total_steps": 10798, "loss": 1.9405, "reward": null, "learning_rate": 0.00015188797919671115, "epoch": 1.49, "percentage": 74.55, "elapsed_time": "5:25:38", "remaining_time": "1:51:09"} +{"current_steps": 8050, "total_steps": 10798, "loss": 1.9405, "reward": null, "learning_rate": 0.00015188797919671115, "epoch": 1.49, "percentage": 74.55, "elapsed_time": "5:25:36", "remaining_time": "1:51:09"} +{"current_steps": 8050, "total_steps": 10798, "loss": 1.9405, "reward": null, "learning_rate": 0.00015188797919671115, "epoch": 1.49, "percentage": 74.55, "elapsed_time": "5:25:39", "remaining_time": "1:51:10"} +{"current_steps": 8050, "total_steps": 10798, "loss": 1.9405, "reward": null, "learning_rate": 0.00015188797919671115, "epoch": 1.49, "percentage": 74.55, "elapsed_time": "5:31:41", "remaining_time": "1:53:13"} +{"current_steps": 8060, "total_steps": 10798, "loss": 1.909, "reward": null, "learning_rate": 0.00015084522714387967, "epoch": 1.49, "percentage": 74.64, "elapsed_time": "5:32:06", "remaining_time": "1:52:49"} +{"current_steps": 8060, "total_steps": 10798, "loss": 1.909, "reward": null, "learning_rate": 0.00015084522714387967, "epoch": 1.49, "percentage": 74.64, "elapsed_time": "5:26:03", "remaining_time": "1:50:45"} +{"current_steps": 8060, "total_steps": 10798, "loss": 1.909, "reward": null, "learning_rate": 0.00015084522714387967, "epoch": 1.49, "percentage": 74.64, "elapsed_time": "5:26:05", "remaining_time": "1:50:46"} +{"current_steps": 8060, "total_steps": 10798, "loss": 1.909, "reward": null, "learning_rate": 0.00015084522714387967, "epoch": 1.49, "percentage": 74.64, "elapsed_time": "5:26:01", "remaining_time": "1:50:45"} +{"current_steps": 8070, "total_steps": 10798, "loss": 1.9286, "reward": null, "learning_rate": 0.00014980543058976977, "epoch": 1.49, "percentage": 74.74, "elapsed_time": "5:32:30", "remaining_time": "1:52:24"} +{"current_steps": 8070, "total_steps": 10798, "loss": 1.9286, "reward": null, "learning_rate": 0.00014980543058976977, "epoch": 1.49, "percentage": 74.74, "elapsed_time": "5:26:29", "remaining_time": "1:50:21"} +{"current_steps": 8070, "total_steps": 10798, "loss": 1.9286, "reward": null, "learning_rate": 0.00014980543058976977, "epoch": 1.49, "percentage": 74.74, "elapsed_time": "5:26:27", "remaining_time": "1:50:21"} +{"current_steps": 8070, "total_steps": 10798, "loss": 1.9286, "reward": null, "learning_rate": 0.00014980543058976977, "epoch": 1.49, "percentage": 74.74, "elapsed_time": "5:26:25", "remaining_time": "1:50:20"} +{"current_steps": 8080, "total_steps": 10798, "loss": 1.9358, "reward": null, "learning_rate": 0.00014876859833597278, "epoch": 1.5, "percentage": 74.83, "elapsed_time": "5:32:55", "remaining_time": "1:51:59"} +{"current_steps": 8080, "total_steps": 10798, "loss": 1.9358, "reward": null, "learning_rate": 0.00014876859833597278, "epoch": 1.5, "percentage": 74.83, "elapsed_time": "5:26:54", "remaining_time": "1:49:57"} +{"current_steps": 8080, "total_steps": 10798, "loss": 1.9358, "reward": null, "learning_rate": 0.00014876859833597278, "epoch": 1.5, "percentage": 74.83, "elapsed_time": "5:26:52", "remaining_time": "1:49:57"} +{"current_steps": 8080, "total_steps": 10798, "loss": 1.9358, "reward": null, "learning_rate": 0.00014876859833597278, "epoch": 1.5, "percentage": 74.83, "elapsed_time": "5:26:50", "remaining_time": "1:49:56"} +{"current_steps": 8090, "total_steps": 10798, "loss": 1.9073, "reward": null, "learning_rate": 0.00014773473915898695, "epoch": 1.5, "percentage": 74.92, "elapsed_time": "5:27:14", "remaining_time": "1:49:32"} +{"current_steps": 8090, "total_steps": 10798, "loss": 1.9073, "reward": null, "learning_rate": 0.00014773473915898695, "epoch": 1.5, "percentage": 74.92, "elapsed_time": "5:27:16", "remaining_time": "1:49:32"} +{"current_steps": 8090, "total_steps": 10798, "loss": 1.9073, "reward": null, "learning_rate": 0.00014773473915898695, "epoch": 1.5, "percentage": 74.92, "elapsed_time": "5:27:18", "remaining_time": "1:49:33"} +{"current_steps": 8090, "total_steps": 10798, "loss": 1.9073, "reward": null, "learning_rate": 0.00014773473915898695, "epoch": 1.5, "percentage": 74.92, "elapsed_time": "5:33:19", "remaining_time": "1:51:34"} +{"current_steps": 8100, "total_steps": 10798, "loss": 1.9044, "reward": null, "learning_rate": 0.00014670386181014477, "epoch": 1.5, "percentage": 75.01, "elapsed_time": "5:27:39", "remaining_time": "1:49:08"} +{"current_steps": 8100, "total_steps": 10798, "loss": 1.9044, "reward": null, "learning_rate": 0.00014670386181014477, "epoch": 1.5, "percentage": 75.01, "elapsed_time": "5:27:41", "remaining_time": "1:49:08"} +{"current_steps": 8100, "total_steps": 10798, "loss": 1.9044, "reward": null, "learning_rate": 0.00014670386181014477, "epoch": 1.5, "percentage": 75.01, "elapsed_time": "5:27:43", "remaining_time": "1:49:09"} +{"current_steps": 8100, "total_steps": 10798, "loss": 1.9044, "reward": null, "learning_rate": 0.00014670386181014477, "epoch": 1.5, "percentage": 75.01, "elapsed_time": "5:33:44", "remaining_time": "1:51:09"} +{"current_steps": 8110, "total_steps": 10798, "loss": 1.9133, "reward": null, "learning_rate": 0.00014567597501553847, "epoch": 1.5, "percentage": 75.11, "elapsed_time": "5:28:04", "remaining_time": "1:48:44"} +{"current_steps": 8110, "total_steps": 10798, "loss": 1.9133, "reward": null, "learning_rate": 0.00014567597501553847, "epoch": 1.5, "percentage": 75.11, "elapsed_time": "5:28:06", "remaining_time": "1:48:44"} +{"current_steps": 8110, "total_steps": 10798, "loss": 1.9133, "reward": null, "learning_rate": 0.00014567597501553847, "epoch": 1.5, "percentage": 75.11, "elapsed_time": "5:28:08", "remaining_time": "1:48:45"} +{"current_steps": 8110, "total_steps": 10798, "loss": 1.9133, "reward": null, "learning_rate": 0.00014567597501553847, "epoch": 1.5, "percentage": 75.11, "elapsed_time": "5:34:09", "remaining_time": "1:50:45"} +{"current_steps": 8120, "total_steps": 10798, "loss": 1.9583, "reward": null, "learning_rate": 0.0001446510874759454, "epoch": 1.5, "percentage": 75.2, "elapsed_time": "5:34:34", "remaining_time": "1:50:20"} +{"current_steps": 8120, "total_steps": 10798, "loss": 1.9583, "reward": null, "learning_rate": 0.0001446510874759454, "epoch": 1.5, "percentage": 75.2, "elapsed_time": "5:28:29", "remaining_time": "1:48:20"} +{"current_steps": 8120, "total_steps": 10798, "loss": 1.9583, "reward": null, "learning_rate": 0.0001446510874759454, "epoch": 1.5, "percentage": 75.2, "elapsed_time": "5:28:33", "remaining_time": "1:48:21"} +{"current_steps": 8120, "total_steps": 10798, "loss": 1.9583, "reward": null, "learning_rate": 0.0001446510874759454, "epoch": 1.5, "percentage": 75.2, "elapsed_time": "5:28:31", "remaining_time": "1:48:20"} +{"current_steps": 8130, "total_steps": 10798, "loss": 1.9381, "reward": null, "learning_rate": 0.00014362920786675616, "epoch": 1.51, "percentage": 75.29, "elapsed_time": "5:34:59", "remaining_time": "1:49:56"} +{"current_steps": 8130, "total_steps": 10798, "loss": 1.9381, "reward": null, "learning_rate": 0.00014362920786675616, "epoch": 1.51, "percentage": 75.29, "elapsed_time": "5:28:54", "remaining_time": "1:47:56"} +{"current_steps": 8130, "total_steps": 10798, "loss": 1.9381, "reward": null, "learning_rate": 0.00014362920786675616, "epoch": 1.51, "percentage": 75.29, "elapsed_time": "5:28:56", "remaining_time": "1:47:56"} +{"current_steps": 8130, "total_steps": 10798, "loss": 1.9381, "reward": null, "learning_rate": 0.00014362920786675616, "epoch": 1.51, "percentage": 75.29, "elapsed_time": "5:28:58", "remaining_time": "1:47:57"} +{"current_steps": 8140, "total_steps": 10798, "loss": 1.951, "reward": null, "learning_rate": 0.00014261034483789892, "epoch": 1.51, "percentage": 75.38, "elapsed_time": "5:29:20", "remaining_time": "1:47:32"} +{"current_steps": 8140, "total_steps": 10798, "loss": 1.951, "reward": null, "learning_rate": 0.00014261034483789892, "epoch": 1.51, "percentage": 75.38, "elapsed_time": "5:29:24", "remaining_time": "1:47:33"} +{"current_steps": 8140, "total_steps": 10798, "loss": 1.951, "reward": null, "learning_rate": 0.00014261034483789892, "epoch": 1.51, "percentage": 75.38, "elapsed_time": "5:29:22", "remaining_time": "1:47:33"} +{"current_steps": 8140, "total_steps": 10798, "loss": 1.951, "reward": null, "learning_rate": 0.00014261034483789892, "epoch": 1.51, "percentage": 75.38, "elapsed_time": "5:35:25", "remaining_time": "1:49:31"} +{"current_steps": 8150, "total_steps": 10798, "loss": 1.9806, "reward": null, "learning_rate": 0.00014159450701376803, "epoch": 1.51, "percentage": 75.48, "elapsed_time": "5:35:50", "remaining_time": "1:49:07"} +{"current_steps": 8150, "total_steps": 10798, "loss": 1.9806, "reward": null, "learning_rate": 0.00014159450701376803, "epoch": 1.51, "percentage": 75.48, "elapsed_time": "5:29:47", "remaining_time": "1:47:09"} +{"current_steps": 8150, "total_steps": 10798, "loss": 1.9806, "reward": null, "learning_rate": 0.00014159450701376803, "epoch": 1.51, "percentage": 75.48, "elapsed_time": "5:29:49", "remaining_time": "1:47:09"} +{"current_steps": 8150, "total_steps": 10798, "loss": 1.9806, "reward": null, "learning_rate": 0.00014159450701376803, "epoch": 1.51, "percentage": 75.48, "elapsed_time": "5:29:45", "remaining_time": "1:47:08"} +{"current_steps": 8160, "total_steps": 10798, "loss": 1.9101, "reward": null, "learning_rate": 0.00014058170299315027, "epoch": 1.51, "percentage": 75.57, "elapsed_time": "5:30:11", "remaining_time": "1:46:44"} +{"current_steps": 8160, "total_steps": 10798, "loss": 1.9101, "reward": null, "learning_rate": 0.00014058170299315027, "epoch": 1.51, "percentage": 75.57, "elapsed_time": "5:30:09", "remaining_time": "1:46:44"} +{"current_steps": 8160, "total_steps": 10798, "loss": 1.9101, "reward": null, "learning_rate": 0.00014058170299315027, "epoch": 1.51, "percentage": 75.57, "elapsed_time": "5:36:14", "remaining_time": "1:48:42"} +{"current_steps": 8160, "total_steps": 10798, "loss": 1.9101, "reward": null, "learning_rate": 0.00014058170299315027, "epoch": 1.51, "percentage": 75.57, "elapsed_time": "5:30:12", "remaining_time": "1:46:45"} +{"current_steps": 8170, "total_steps": 10798, "loss": 1.9122, "reward": null, "learning_rate": 0.00013957194134915147, "epoch": 1.51, "percentage": 75.66, "elapsed_time": "5:30:33", "remaining_time": "1:46:19"} +{"current_steps": 8170, "total_steps": 10798, "loss": 1.9122, "reward": null, "learning_rate": 0.00013957194134915147, "epoch": 1.51, "percentage": 75.66, "elapsed_time": "5:36:38", "remaining_time": "1:48:17"} +{"current_steps": 8170, "total_steps": 10798, "loss": 1.9122, "reward": null, "learning_rate": 0.00013957194134915147, "epoch": 1.51, "percentage": 75.66, "elapsed_time": "5:30:35", "remaining_time": "1:46:20"} +{"current_steps": 8170, "total_steps": 10798, "loss": 1.9122, "reward": null, "learning_rate": 0.00013957194134915147, "epoch": 1.51, "percentage": 75.66, "elapsed_time": "5:30:36", "remaining_time": "1:46:20"} +{"current_steps": 8180, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 0.00013856523062912569, "epoch": 1.52, "percentage": 75.75, "elapsed_time": "5:37:02", "remaining_time": "1:47:52"} +{"current_steps": 8180, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 0.00013856523062912569, "epoch": 1.52, "percentage": 75.75, "elapsed_time": "5:30:57", "remaining_time": "1:45:55"} +{"current_steps": 8180, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 0.00013856523062912569, "epoch": 1.52, "percentage": 75.75, "elapsed_time": "5:30:59", "remaining_time": "1:45:56"} +{"current_steps": 8180, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 0.00013856523062912569, "epoch": 1.52, "percentage": 75.75, "elapsed_time": "5:31:01", "remaining_time": "1:45:56"} +{"current_steps": 8190, "total_steps": 10798, "loss": 1.9182, "reward": null, "learning_rate": 0.0001375615793546006, "epoch": 1.52, "percentage": 75.85, "elapsed_time": "5:37:27", "remaining_time": "1:47:27"} +{"current_steps": 8190, "total_steps": 10798, "loss": 1.9182, "reward": null, "learning_rate": 0.0001375615793546006, "epoch": 1.52, "percentage": 75.85, "elapsed_time": "5:31:22", "remaining_time": "1:45:31"} +{"current_steps": 8190, "total_steps": 10798, "loss": 1.9182, "reward": null, "learning_rate": 0.0001375615793546006, "epoch": 1.52, "percentage": 75.85, "elapsed_time": "5:31:23", "remaining_time": "1:45:31"} +{"current_steps": 8190, "total_steps": 10798, "loss": 1.9182, "reward": null, "learning_rate": 0.0001375615793546006, "epoch": 1.52, "percentage": 75.85, "elapsed_time": "5:31:25", "remaining_time": "1:45:32"} +{"current_steps": 8200, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 0.00013656099602120752, "epoch": 1.52, "percentage": 75.94, "elapsed_time": "5:37:53", "remaining_time": "1:47:03"} +{"current_steps": 8200, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 0.00013656099602120752, "epoch": 1.52, "percentage": 75.94, "elapsed_time": "5:31:51", "remaining_time": "1:45:08"} +{"current_steps": 8200, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 0.00013656099602120752, "epoch": 1.52, "percentage": 75.94, "elapsed_time": "5:31:48", "remaining_time": "1:45:07"} +{"current_steps": 8200, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 0.00013656099602120752, "epoch": 1.52, "percentage": 75.94, "elapsed_time": "5:31:49", "remaining_time": "1:45:08"} +{"current_steps": 8210, "total_steps": 10798, "loss": 1.9327, "reward": null, "learning_rate": 0.00013556348909860762, "epoch": 1.52, "percentage": 76.03, "elapsed_time": "5:38:17", "remaining_time": "1:46:38"} +{"current_steps": 8210, "total_steps": 10798, "loss": 1.9327, "reward": null, "learning_rate": 0.00013556348909860762, "epoch": 1.52, "percentage": 76.03, "elapsed_time": "5:32:14", "remaining_time": "1:44:43"} +{"current_steps": 8210, "total_steps": 10798, "loss": 1.9327, "reward": null, "learning_rate": 0.00013556348909860762, "epoch": 1.52, "percentage": 76.03, "elapsed_time": "5:32:16", "remaining_time": "1:44:44"} +{"current_steps": 8210, "total_steps": 10798, "loss": 1.9327, "reward": null, "learning_rate": 0.00013556348909860762, "epoch": 1.52, "percentage": 76.03, "elapsed_time": "5:32:12", "remaining_time": "1:44:43"} +{"current_steps": 8220, "total_steps": 10798, "loss": 1.9184, "reward": null, "learning_rate": 0.00013456906703042165, "epoch": 1.52, "percentage": 76.13, "elapsed_time": "5:32:39", "remaining_time": "1:44:19"} +{"current_steps": 8220, "total_steps": 10798, "loss": 1.9184, "reward": null, "learning_rate": 0.00013456906703042165, "epoch": 1.52, "percentage": 76.13, "elapsed_time": "5:32:37", "remaining_time": "1:44:19"} +{"current_steps": 8220, "total_steps": 10798, "loss": 1.9184, "reward": null, "learning_rate": 0.00013456906703042165, "epoch": 1.52, "percentage": 76.13, "elapsed_time": "5:32:40", "remaining_time": "1:44:20"} +{"current_steps": 8220, "total_steps": 10798, "loss": 1.9184, "reward": null, "learning_rate": 0.00013456906703042165, "epoch": 1.52, "percentage": 76.13, "elapsed_time": "5:38:42", "remaining_time": "1:46:13"} +{"current_steps": 8230, "total_steps": 10798, "loss": 1.8876, "reward": null, "learning_rate": 0.00013357773823415782, "epoch": 1.52, "percentage": 76.22, "elapsed_time": "5:39:06", "remaining_time": "1:45:48"} +{"current_steps": 8230, "total_steps": 10798, "loss": 1.8876, "reward": null, "learning_rate": 0.00013357773823415782, "epoch": 1.52, "percentage": 76.22, "elapsed_time": "5:33:04", "remaining_time": "1:43:55"} +{"current_steps": 8230, "total_steps": 10798, "loss": 1.8876, "reward": null, "learning_rate": 0.00013357773823415782, "epoch": 1.52, "percentage": 76.22, "elapsed_time": "5:33:02", "remaining_time": "1:43:55"} +{"current_steps": 8230, "total_steps": 10798, "loss": 1.8876, "reward": null, "learning_rate": 0.00013357773823415782, "epoch": 1.52, "percentage": 76.22, "elapsed_time": "5:33:01", "remaining_time": "1:43:54"} +{"current_steps": 8240, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 0.00013258951110114054, "epoch": 1.53, "percentage": 76.31, "elapsed_time": "5:39:29", "remaining_time": "1:45:23"} +{"current_steps": 8240, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 0.00013258951110114054, "epoch": 1.53, "percentage": 76.31, "elapsed_time": "5:33:26", "remaining_time": "1:43:30"} +{"current_steps": 8240, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 0.00013258951110114054, "epoch": 1.53, "percentage": 76.31, "elapsed_time": "5:33:28", "remaining_time": "1:43:31"} +{"current_steps": 8240, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 0.00013258951110114054, "epoch": 1.53, "percentage": 76.31, "elapsed_time": "5:33:24", "remaining_time": "1:43:30"} +{"current_steps": 8250, "total_steps": 10798, "loss": 1.9525, "reward": null, "learning_rate": 0.0001316043939964398, "epoch": 1.53, "percentage": 76.4, "elapsed_time": "5:33:49", "remaining_time": "1:43:06"} +{"current_steps": 8250, "total_steps": 10798, "loss": 1.9525, "reward": null, "learning_rate": 0.0001316043939964398, "epoch": 1.53, "percentage": 76.4, "elapsed_time": "5:33:52", "remaining_time": "1:43:07"} +{"current_steps": 8250, "total_steps": 10798, "loss": 1.9525, "reward": null, "learning_rate": 0.0001316043939964398, "epoch": 1.53, "percentage": 76.4, "elapsed_time": "5:33:50", "remaining_time": "1:43:06"} +{"current_steps": 8250, "total_steps": 10798, "loss": 1.9525, "reward": null, "learning_rate": 0.0001316043939964398, "epoch": 1.53, "percentage": 76.4, "elapsed_time": "5:39:54", "remaining_time": "1:44:58"} +{"current_steps": 8260, "total_steps": 10798, "loss": 1.8933, "reward": null, "learning_rate": 0.00013062239525879943, "epoch": 1.53, "percentage": 76.5, "elapsed_time": "5:40:18", "remaining_time": "1:44:33"} +{"current_steps": 8260, "total_steps": 10798, "loss": 1.8933, "reward": null, "learning_rate": 0.00013062239525879943, "epoch": 1.53, "percentage": 76.5, "elapsed_time": "5:34:16", "remaining_time": "1:42:42"} +{"current_steps": 8260, "total_steps": 10798, "loss": 1.8933, "reward": null, "learning_rate": 0.00013062239525879943, "epoch": 1.53, "percentage": 76.5, "elapsed_time": "5:34:15", "remaining_time": "1:42:42"} +{"current_steps": 8260, "total_steps": 10798, "loss": 1.8933, "reward": null, "learning_rate": 0.00013062239525879943, "epoch": 1.53, "percentage": 76.5, "elapsed_time": "5:34:13", "remaining_time": "1:42:41"} +{"current_steps": 8270, "total_steps": 10798, "loss": 1.9433, "reward": null, "learning_rate": 0.0001296435232005677, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "5:40:43", "remaining_time": "1:44:09"} +{"current_steps": 8270, "total_steps": 10798, "loss": 1.9433, "reward": null, "learning_rate": 0.0001296435232005677, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "5:34:38", "remaining_time": "1:42:17"} +{"current_steps": 8270, "total_steps": 10798, "loss": 1.9433, "reward": null, "learning_rate": 0.0001296435232005677, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "5:34:40", "remaining_time": "1:42:18"} +{"current_steps": 8270, "total_steps": 10798, "loss": 1.9433, "reward": null, "learning_rate": 0.0001296435232005677, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "5:34:41", "remaining_time": "1:42:18"} +{"current_steps": 8280, "total_steps": 10798, "loss": 1.9306, "reward": null, "learning_rate": 0.0001286677861076263, "epoch": 1.53, "percentage": 76.68, "elapsed_time": "5:35:06", "remaining_time": "1:41:54"} +{"current_steps": 8280, "total_steps": 10798, "loss": 1.9306, "reward": null, "learning_rate": 0.0001286677861076263, "epoch": 1.53, "percentage": 76.68, "elapsed_time": "5:35:08", "remaining_time": "1:41:55"} +{"current_steps": 8280, "total_steps": 10798, "loss": 1.9306, "reward": null, "learning_rate": 0.0001286677861076263, "epoch": 1.53, "percentage": 76.68, "elapsed_time": "5:35:04", "remaining_time": "1:41:54"} +{"current_steps": 8280, "total_steps": 10798, "loss": 1.9306, "reward": null, "learning_rate": 0.0001286677861076263, "epoch": 1.53, "percentage": 76.68, "elapsed_time": "5:41:09", "remaining_time": "1:43:44"} +{"current_steps": 8290, "total_steps": 10798, "loss": 1.8962, "reward": null, "learning_rate": 0.00012769519223932034, "epoch": 1.54, "percentage": 76.77, "elapsed_time": "5:35:31", "remaining_time": "1:41:30"} +{"current_steps": 8290, "total_steps": 10798, "loss": 1.8962, "reward": null, "learning_rate": 0.00012769519223932034, "epoch": 1.54, "percentage": 76.77, "elapsed_time": "5:41:34", "remaining_time": "1:43:20"} +{"current_steps": 8290, "total_steps": 10798, "loss": 1.8962, "reward": null, "learning_rate": 0.00012769519223932034, "epoch": 1.54, "percentage": 76.77, "elapsed_time": "5:35:29", "remaining_time": "1:41:29"} +{"current_steps": 8290, "total_steps": 10798, "loss": 1.8962, "reward": null, "learning_rate": 0.00012769519223932034, "epoch": 1.54, "percentage": 76.77, "elapsed_time": "5:35:33", "remaining_time": "1:41:30"} +{"current_steps": 8300, "total_steps": 10798, "loss": 1.9322, "reward": null, "learning_rate": 0.00012672574982838802, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "5:41:59", "remaining_time": "1:42:55"} +{"current_steps": 8300, "total_steps": 10798, "loss": 1.9322, "reward": null, "learning_rate": 0.00012672574982838802, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "5:35:54", "remaining_time": "1:41:05"} +{"current_steps": 8300, "total_steps": 10798, "loss": 1.9322, "reward": null, "learning_rate": 0.00012672574982838802, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "5:35:55", "remaining_time": "1:41:06"} +{"current_steps": 8300, "total_steps": 10798, "loss": 1.9322, "reward": null, "learning_rate": 0.00012672574982838802, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "5:35:57", "remaining_time": "1:41:06"} +{"current_steps": 8310, "total_steps": 10798, "loss": 1.9191, "reward": null, "learning_rate": 0.00012575946708089176, "epoch": 1.54, "percentage": 76.96, "elapsed_time": "5:42:23", "remaining_time": "1:42:30"} +{"current_steps": 8310, "total_steps": 10798, "loss": 1.9191, "reward": null, "learning_rate": 0.00012575946708089176, "epoch": 1.54, "percentage": 76.96, "elapsed_time": "5:36:18", "remaining_time": "1:40:41"} +{"current_steps": 8310, "total_steps": 10798, "loss": 1.9191, "reward": null, "learning_rate": 0.00012575946708089176, "epoch": 1.54, "percentage": 76.96, "elapsed_time": "5:36:21", "remaining_time": "1:40:42"} +{"current_steps": 8310, "total_steps": 10798, "loss": 1.9191, "reward": null, "learning_rate": 0.00012575946708089176, "epoch": 1.54, "percentage": 76.96, "elapsed_time": "5:36:20", "remaining_time": "1:40:41"} +{"current_steps": 8320, "total_steps": 10798, "loss": 1.9308, "reward": null, "learning_rate": 0.0001247963521761481, "epoch": 1.54, "percentage": 77.05, "elapsed_time": "5:42:48", "remaining_time": "1:42:06"} +{"current_steps": 8320, "total_steps": 10798, "loss": 1.9308, "reward": null, "learning_rate": 0.0001247963521761481, "epoch": 1.54, "percentage": 77.05, "elapsed_time": "5:36:43", "remaining_time": "1:40:17"} +{"current_steps": 8320, "total_steps": 10798, "loss": 1.9308, "reward": null, "learning_rate": 0.0001247963521761481, "epoch": 1.54, "percentage": 77.05, "elapsed_time": "5:36:46", "remaining_time": "1:40:18"} +{"current_steps": 8320, "total_steps": 10798, "loss": 1.9308, "reward": null, "learning_rate": 0.0001247963521761481, "epoch": 1.54, "percentage": 77.05, "elapsed_time": "5:36:45", "remaining_time": "1:40:17"} +{"current_steps": 8330, "total_steps": 10798, "loss": 1.8876, "reward": null, "learning_rate": 0.00012383641326665874, "epoch": 1.54, "percentage": 77.14, "elapsed_time": "5:43:12", "remaining_time": "1:41:41"} +{"current_steps": 8330, "total_steps": 10798, "loss": 1.8876, "reward": null, "learning_rate": 0.00012383641326665874, "epoch": 1.54, "percentage": 77.14, "elapsed_time": "5:37:11", "remaining_time": "1:39:54"} +{"current_steps": 8330, "total_steps": 10798, "loss": 1.8876, "reward": null, "learning_rate": 0.00012383641326665874, "epoch": 1.54, "percentage": 77.14, "elapsed_time": "5:37:09", "remaining_time": "1:39:53"} +{"current_steps": 8330, "total_steps": 10798, "loss": 1.8876, "reward": null, "learning_rate": 0.00012383641326665874, "epoch": 1.54, "percentage": 77.14, "elapsed_time": "5:37:08", "remaining_time": "1:39:53"} +{"current_steps": 8340, "total_steps": 10798, "loss": 1.9103, "reward": null, "learning_rate": 0.00012287965847804162, "epoch": 1.54, "percentage": 77.24, "elapsed_time": "5:37:35", "remaining_time": "1:39:29"} +{"current_steps": 8340, "total_steps": 10798, "loss": 1.9103, "reward": null, "learning_rate": 0.00012287965847804162, "epoch": 1.54, "percentage": 77.24, "elapsed_time": "5:43:38", "remaining_time": "1:41:16"} +{"current_steps": 8340, "total_steps": 10798, "loss": 1.9103, "reward": null, "learning_rate": 0.00012287965847804162, "epoch": 1.54, "percentage": 77.24, "elapsed_time": "5:37:36", "remaining_time": "1:39:30"} +{"current_steps": 8340, "total_steps": 10798, "loss": 1.9103, "reward": null, "learning_rate": 0.00012287965847804162, "epoch": 1.54, "percentage": 77.24, "elapsed_time": "5:37:33", "remaining_time": "1:39:29"} +{"current_steps": 8350, "total_steps": 10798, "loss": 1.8804, "reward": null, "learning_rate": 0.00012192609590896142, "epoch": 1.55, "percentage": 77.33, "elapsed_time": "5:38:01", "remaining_time": "1:39:06"} +{"current_steps": 8350, "total_steps": 10798, "loss": 1.8804, "reward": null, "learning_rate": 0.00012192609590896142, "epoch": 1.55, "percentage": 77.33, "elapsed_time": "5:37:58", "remaining_time": "1:39:05"} +{"current_steps": 8350, "total_steps": 10798, "loss": 1.8804, "reward": null, "learning_rate": 0.00012192609590896142, "epoch": 1.55, "percentage": 77.33, "elapsed_time": "5:44:03", "remaining_time": "1:40:52"} +{"current_steps": 8350, "total_steps": 10798, "loss": 1.8804, "reward": null, "learning_rate": 0.00012192609590896142, "epoch": 1.55, "percentage": 77.33, "elapsed_time": "5:38:00", "remaining_time": "1:39:05"} +{"current_steps": 8360, "total_steps": 10798, "loss": 1.944, "reward": null, "learning_rate": 0.00012097573363106218, "epoch": 1.55, "percentage": 77.42, "elapsed_time": "5:44:29", "remaining_time": "1:40:27"} +{"current_steps": 8360, "total_steps": 10798, "loss": 1.944, "reward": null, "learning_rate": 0.00012097573363106218, "epoch": 1.55, "percentage": 77.42, "elapsed_time": "5:38:24", "remaining_time": "1:38:41"} +{"current_steps": 8360, "total_steps": 10798, "loss": 1.944, "reward": null, "learning_rate": 0.00012097573363106218, "epoch": 1.55, "percentage": 77.42, "elapsed_time": "5:38:28", "remaining_time": "1:38:42"} +{"current_steps": 8360, "total_steps": 10798, "loss": 1.944, "reward": null, "learning_rate": 0.00012097573363106218, "epoch": 1.55, "percentage": 77.42, "elapsed_time": "5:38:26", "remaining_time": "1:38:41"} +{"current_steps": 8370, "total_steps": 10798, "loss": 1.9259, "reward": null, "learning_rate": 0.00012002857968889797, "epoch": 1.55, "percentage": 77.51, "elapsed_time": "5:44:54", "remaining_time": "1:40:03"} +{"current_steps": 8370, "total_steps": 10798, "loss": 1.9259, "reward": null, "learning_rate": 0.00012002857968889797, "epoch": 1.55, "percentage": 77.51, "elapsed_time": "5:38:53", "remaining_time": "1:38:18"} +{"current_steps": 8370, "total_steps": 10798, "loss": 1.9259, "reward": null, "learning_rate": 0.00012002857968889797, "epoch": 1.55, "percentage": 77.51, "elapsed_time": "5:38:51", "remaining_time": "1:38:17"} +{"current_steps": 8370, "total_steps": 10798, "loss": 1.9259, "reward": null, "learning_rate": 0.00012002857968889797, "epoch": 1.55, "percentage": 77.51, "elapsed_time": "5:38:49", "remaining_time": "1:38:17"} +{"current_steps": 8380, "total_steps": 10798, "loss": 1.9421, "reward": null, "learning_rate": 0.00011908464209986541, "epoch": 1.55, "percentage": 77.61, "elapsed_time": "5:45:19", "remaining_time": "1:39:38"} +{"current_steps": 8380, "total_steps": 10798, "loss": 1.9421, "reward": null, "learning_rate": 0.00011908464209986541, "epoch": 1.55, "percentage": 77.61, "elapsed_time": "5:39:14", "remaining_time": "1:37:53"} +{"current_steps": 8380, "total_steps": 10798, "loss": 1.9421, "reward": null, "learning_rate": 0.00011908464209986541, "epoch": 1.55, "percentage": 77.61, "elapsed_time": "5:39:16", "remaining_time": "1:37:53"} +{"current_steps": 8380, "total_steps": 10798, "loss": 1.9421, "reward": null, "learning_rate": 0.00011908464209986541, "epoch": 1.55, "percentage": 77.61, "elapsed_time": "5:39:17", "remaining_time": "1:37:54"} +{"current_steps": 8390, "total_steps": 10798, "loss": 1.9251, "reward": null, "learning_rate": 0.00011814392885413567, "epoch": 1.55, "percentage": 77.7, "elapsed_time": "5:39:39", "remaining_time": "1:37:29"} +{"current_steps": 8390, "total_steps": 10798, "loss": 1.9251, "reward": null, "learning_rate": 0.00011814392885413567, "epoch": 1.55, "percentage": 77.7, "elapsed_time": "5:39:41", "remaining_time": "1:37:29"} +{"current_steps": 8390, "total_steps": 10798, "loss": 1.9251, "reward": null, "learning_rate": 0.00011814392885413567, "epoch": 1.55, "percentage": 77.7, "elapsed_time": "5:39:38", "remaining_time": "1:37:28"} +{"current_steps": 8390, "total_steps": 10798, "loss": 1.9251, "reward": null, "learning_rate": 0.00011814392885413567, "epoch": 1.55, "percentage": 77.7, "elapsed_time": "5:45:43", "remaining_time": "1:39:13"} +{"current_steps": 8400, "total_steps": 10798, "loss": 1.9106, "reward": null, "learning_rate": 0.00011720644791458623, "epoch": 1.56, "percentage": 77.79, "elapsed_time": "5:46:07", "remaining_time": "1:38:48"} +{"current_steps": 8400, "total_steps": 10798, "loss": 1.9106, "reward": null, "learning_rate": 0.00011720644791458623, "epoch": 1.56, "percentage": 77.79, "elapsed_time": "5:40:03", "remaining_time": "1:37:04"} +{"current_steps": 8400, "total_steps": 10798, "loss": 1.9106, "reward": null, "learning_rate": 0.00011720644791458623, "epoch": 1.56, "percentage": 77.79, "elapsed_time": "5:40:06", "remaining_time": "1:37:05"} +{"current_steps": 8400, "total_steps": 10798, "loss": 1.9106, "reward": null, "learning_rate": 0.00011720644791458623, "epoch": 1.56, "percentage": 77.79, "elapsed_time": "5:40:04", "remaining_time": "1:37:05"} +{"current_steps": 8410, "total_steps": 10798, "loss": 1.8928, "reward": null, "learning_rate": 0.00011627220721673459, "epoch": 1.56, "percentage": 77.88, "elapsed_time": "5:46:33", "remaining_time": "1:38:24"} +{"current_steps": 8410, "total_steps": 10798, "loss": 1.8928, "reward": null, "learning_rate": 0.00011627220721673459, "epoch": 1.56, "percentage": 77.88, "elapsed_time": "5:40:30", "remaining_time": "1:36:41"} +{"current_steps": 8410, "total_steps": 10798, "loss": 1.8928, "reward": null, "learning_rate": 0.00011627220721673459, "epoch": 1.56, "percentage": 77.88, "elapsed_time": "5:40:31", "remaining_time": "1:36:41"} +{"current_steps": 8410, "total_steps": 10798, "loss": 1.8928, "reward": null, "learning_rate": 0.00011627220721673459, "epoch": 1.56, "percentage": 77.88, "elapsed_time": "5:40:28", "remaining_time": "1:36:40"} +{"current_steps": 8420, "total_steps": 10798, "loss": 1.9323, "reward": null, "learning_rate": 0.00011534121466866986, "epoch": 1.56, "percentage": 77.98, "elapsed_time": "5:40:52", "remaining_time": "1:36:16"} +{"current_steps": 8420, "total_steps": 10798, "loss": 1.9323, "reward": null, "learning_rate": 0.00011534121466866986, "epoch": 1.56, "percentage": 77.98, "elapsed_time": "5:40:56", "remaining_time": "1:36:17"} +{"current_steps": 8420, "total_steps": 10798, "loss": 1.9323, "reward": null, "learning_rate": 0.00011534121466866986, "epoch": 1.56, "percentage": 77.98, "elapsed_time": "5:40:54", "remaining_time": "1:36:16"} +{"current_steps": 8420, "total_steps": 10798, "loss": 1.9323, "reward": null, "learning_rate": 0.00011534121466866986, "epoch": 1.56, "percentage": 77.98, "elapsed_time": "5:46:57", "remaining_time": "1:37:59"} +{"current_steps": 8430, "total_steps": 10798, "loss": 1.9238, "reward": null, "learning_rate": 0.00011441347815098735, "epoch": 1.56, "percentage": 78.07, "elapsed_time": "5:47:22", "remaining_time": "1:37:34"} +{"current_steps": 8430, "total_steps": 10798, "loss": 1.9238, "reward": null, "learning_rate": 0.00011441347815098735, "epoch": 1.56, "percentage": 78.07, "elapsed_time": "5:41:21", "remaining_time": "1:35:53"} +{"current_steps": 8430, "total_steps": 10798, "loss": 1.9238, "reward": null, "learning_rate": 0.00011441347815098735, "epoch": 1.56, "percentage": 78.07, "elapsed_time": "5:41:17", "remaining_time": "1:35:52"} +{"current_steps": 8430, "total_steps": 10798, "loss": 1.9238, "reward": null, "learning_rate": 0.00011441347815098735, "epoch": 1.56, "percentage": 78.07, "elapsed_time": "5:41:19", "remaining_time": "1:35:52"} +{"current_steps": 8440, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.0001134890055167201, "epoch": 1.56, "percentage": 78.16, "elapsed_time": "5:41:42", "remaining_time": "1:35:28"} +{"current_steps": 8440, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.0001134890055167201, "epoch": 1.56, "percentage": 78.16, "elapsed_time": "5:41:45", "remaining_time": "1:35:29"} +{"current_steps": 8440, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.0001134890055167201, "epoch": 1.56, "percentage": 78.16, "elapsed_time": "5:41:44", "remaining_time": "1:35:28"} +{"current_steps": 8440, "total_steps": 10798, "loss": 1.9831, "reward": null, "learning_rate": 0.0001134890055167201, "epoch": 1.56, "percentage": 78.16, "elapsed_time": "5:47:47", "remaining_time": "1:37:10"} +{"current_steps": 8450, "total_steps": 10798, "loss": 1.85, "reward": null, "learning_rate": 0.00011256780459127374, "epoch": 1.57, "percentage": 78.26, "elapsed_time": "5:48:12", "remaining_time": "1:36:45"} +{"current_steps": 8450, "total_steps": 10798, "loss": 1.85, "reward": null, "learning_rate": 0.00011256780459127374, "epoch": 1.57, "percentage": 78.26, "elapsed_time": "5:42:10", "remaining_time": "1:35:04"} +{"current_steps": 8450, "total_steps": 10798, "loss": 1.85, "reward": null, "learning_rate": 0.00011256780459127374, "epoch": 1.57, "percentage": 78.26, "elapsed_time": "5:42:08", "remaining_time": "1:35:04"} +{"current_steps": 8450, "total_steps": 10798, "loss": 1.85, "reward": null, "learning_rate": 0.00011256780459127374, "epoch": 1.57, "percentage": 78.26, "elapsed_time": "5:42:07", "remaining_time": "1:35:03"} +{"current_steps": 8460, "total_steps": 10798, "loss": 1.9391, "reward": null, "learning_rate": 0.0001116498831723598, "epoch": 1.57, "percentage": 78.35, "elapsed_time": "5:42:31", "remaining_time": "1:34:39"} +{"current_steps": 8460, "total_steps": 10798, "loss": 1.9391, "reward": null, "learning_rate": 0.0001116498831723598, "epoch": 1.57, "percentage": 78.35, "elapsed_time": "5:42:33", "remaining_time": "1:34:40"} +{"current_steps": 8460, "total_steps": 10798, "loss": 1.9391, "reward": null, "learning_rate": 0.0001116498831723598, "epoch": 1.57, "percentage": 78.35, "elapsed_time": "5:42:34", "remaining_time": "1:34:40"} +{"current_steps": 8460, "total_steps": 10798, "loss": 1.9391, "reward": null, "learning_rate": 0.0001116498831723598, "epoch": 1.57, "percentage": 78.35, "elapsed_time": "5:48:36", "remaining_time": "1:36:20"} +{"current_steps": 8470, "total_steps": 10798, "loss": 1.9071, "reward": null, "learning_rate": 0.00011073524902992921, "epoch": 1.57, "percentage": 78.44, "elapsed_time": "5:49:01", "remaining_time": "1:35:55"} +{"current_steps": 8470, "total_steps": 10798, "loss": 1.9071, "reward": null, "learning_rate": 0.00011073524902992921, "epoch": 1.57, "percentage": 78.44, "elapsed_time": "5:42:58", "remaining_time": "1:34:16"} +{"current_steps": 8470, "total_steps": 10798, "loss": 1.9071, "reward": null, "learning_rate": 0.00011073524902992921, "epoch": 1.57, "percentage": 78.44, "elapsed_time": "5:43:00", "remaining_time": "1:34:16"} +{"current_steps": 8470, "total_steps": 10798, "loss": 1.9071, "reward": null, "learning_rate": 0.00011073524902992921, "epoch": 1.57, "percentage": 78.44, "elapsed_time": "5:42:56", "remaining_time": "1:34:15"} +{"current_steps": 8480, "total_steps": 10798, "loss": 1.9538, "reward": null, "learning_rate": 0.00010982390990610791, "epoch": 1.57, "percentage": 78.53, "elapsed_time": "5:49:27", "remaining_time": "1:35:31"} +{"current_steps": 8480, "total_steps": 10798, "loss": 1.9538, "reward": null, "learning_rate": 0.00010982390990610791, "epoch": 1.57, "percentage": 78.53, "elapsed_time": "5:43:22", "remaining_time": "1:33:51"} +{"current_steps": 8480, "total_steps": 10798, "loss": 1.9538, "reward": null, "learning_rate": 0.00010982390990610791, "epoch": 1.57, "percentage": 78.53, "elapsed_time": "5:43:26", "remaining_time": "1:33:52"} +{"current_steps": 8480, "total_steps": 10798, "loss": 1.9538, "reward": null, "learning_rate": 0.00010982390990610791, "epoch": 1.57, "percentage": 78.53, "elapsed_time": "5:43:24", "remaining_time": "1:33:52"} +{"current_steps": 8490, "total_steps": 10798, "loss": 1.8972, "reward": null, "learning_rate": 0.00010891587351512949, "epoch": 1.57, "percentage": 78.63, "elapsed_time": "5:49:53", "remaining_time": "1:35:07"} +{"current_steps": 8490, "total_steps": 10798, "loss": 1.8972, "reward": null, "learning_rate": 0.00010891587351512949, "epoch": 1.57, "percentage": 78.63, "elapsed_time": "5:43:50", "remaining_time": "1:33:28"} +{"current_steps": 8490, "total_steps": 10798, "loss": 1.8972, "reward": null, "learning_rate": 0.00010891587351512949, "epoch": 1.57, "percentage": 78.63, "elapsed_time": "5:43:48", "remaining_time": "1:33:27"} +{"current_steps": 8490, "total_steps": 10798, "loss": 1.8972, "reward": null, "learning_rate": 0.00010891587351512949, "epoch": 1.57, "percentage": 78.63, "elapsed_time": "5:43:52", "remaining_time": "1:33:28"} +{"current_steps": 8500, "total_steps": 10798, "loss": 1.9184, "reward": null, "learning_rate": 0.00010801114754327135, "epoch": 1.57, "percentage": 78.72, "elapsed_time": "5:50:17", "remaining_time": "1:34:42"} +{"current_steps": 8500, "total_steps": 10798, "loss": 1.9184, "reward": null, "learning_rate": 0.00010801114754327135, "epoch": 1.57, "percentage": 78.72, "elapsed_time": "5:44:12", "remaining_time": "1:33:03"} +{"current_steps": 8500, "total_steps": 10798, "loss": 1.9184, "reward": null, "learning_rate": 0.00010801114754327135, "epoch": 1.57, "percentage": 78.72, "elapsed_time": "5:44:13", "remaining_time": "1:33:03"} +{"current_steps": 8500, "total_steps": 10798, "loss": 1.9184, "reward": null, "learning_rate": 0.00010801114754327135, "epoch": 1.57, "percentage": 78.72, "elapsed_time": "5:44:15", "remaining_time": "1:33:04"} +{"current_steps": 8510, "total_steps": 10798, "loss": 1.9567, "reward": null, "learning_rate": 0.00010710973964878906, "epoch": 1.58, "percentage": 78.81, "elapsed_time": "5:50:42", "remaining_time": "1:34:17"} +{"current_steps": 8510, "total_steps": 10798, "loss": 1.9567, "reward": null, "learning_rate": 0.00010710973964878906, "epoch": 1.58, "percentage": 78.81, "elapsed_time": "5:44:37", "remaining_time": "1:32:39"} +{"current_steps": 8510, "total_steps": 10798, "loss": 1.9567, "reward": null, "learning_rate": 0.00010710973964878906, "epoch": 1.58, "percentage": 78.81, "elapsed_time": "5:44:39", "remaining_time": "1:32:39"} +{"current_steps": 8510, "total_steps": 10798, "loss": 1.9567, "reward": null, "learning_rate": 0.00010710973964878906, "epoch": 1.58, "percentage": 78.81, "elapsed_time": "5:44:40", "remaining_time": "1:32:40"} +{"current_steps": 8520, "total_steps": 10798, "loss": 1.9755, "reward": null, "learning_rate": 0.00010621165746185113, "epoch": 1.58, "percentage": 78.9, "elapsed_time": "5:51:07", "remaining_time": "1:33:52"} +{"current_steps": 8520, "total_steps": 10798, "loss": 1.9755, "reward": null, "learning_rate": 0.00010621165746185113, "epoch": 1.58, "percentage": 78.9, "elapsed_time": "5:45:02", "remaining_time": "1:32:15"} +{"current_steps": 8520, "total_steps": 10798, "loss": 1.9755, "reward": null, "learning_rate": 0.00010621165746185113, "epoch": 1.58, "percentage": 78.9, "elapsed_time": "5:45:04", "remaining_time": "1:32:15"} +{"current_steps": 8520, "total_steps": 10798, "loss": 1.9755, "reward": null, "learning_rate": 0.00010621165746185113, "epoch": 1.58, "percentage": 78.9, "elapsed_time": "5:45:05", "remaining_time": "1:32:16"} +{"current_steps": 8530, "total_steps": 10798, "loss": 1.9256, "reward": null, "learning_rate": 0.0001053169085844758, "epoch": 1.58, "percentage": 79.0, "elapsed_time": "5:51:32", "remaining_time": "1:33:28"} +{"current_steps": 8530, "total_steps": 10798, "loss": 1.9256, "reward": null, "learning_rate": 0.0001053169085844758, "epoch": 1.58, "percentage": 79.0, "elapsed_time": "5:45:30", "remaining_time": "1:31:51"} +{"current_steps": 8530, "total_steps": 10798, "loss": 1.9256, "reward": null, "learning_rate": 0.0001053169085844758, "epoch": 1.58, "percentage": 79.0, "elapsed_time": "5:45:28", "remaining_time": "1:31:51"} +{"current_steps": 8530, "total_steps": 10798, "loss": 1.9256, "reward": null, "learning_rate": 0.0001053169085844758, "epoch": 1.58, "percentage": 79.0, "elapsed_time": "5:45:27", "remaining_time": "1:31:51"} +{"current_steps": 8540, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0001044255005904648, "epoch": 1.58, "percentage": 79.09, "elapsed_time": "5:45:54", "remaining_time": "1:31:27"} +{"current_steps": 8540, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0001044255005904648, "epoch": 1.58, "percentage": 79.09, "elapsed_time": "5:45:52", "remaining_time": "1:31:27"} +{"current_steps": 8540, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0001044255005904648, "epoch": 1.58, "percentage": 79.09, "elapsed_time": "5:51:57", "remaining_time": "1:33:03"} +{"current_steps": 8540, "total_steps": 10798, "loss": 1.9742, "reward": null, "learning_rate": 0.0001044255005904648, "epoch": 1.58, "percentage": 79.09, "elapsed_time": "5:45:55", "remaining_time": "1:31:27"} +{"current_steps": 8550, "total_steps": 10798, "loss": 1.9562, "reward": null, "learning_rate": 0.0001035374410253408, "epoch": 1.58, "percentage": 79.18, "elapsed_time": "5:52:22", "remaining_time": "1:32:38"} +{"current_steps": 8550, "total_steps": 10798, "loss": 1.9562, "reward": null, "learning_rate": 0.0001035374410253408, "epoch": 1.58, "percentage": 79.18, "elapsed_time": "5:46:19", "remaining_time": "1:31:03"} +{"current_steps": 8550, "total_steps": 10798, "loss": 1.9562, "reward": null, "learning_rate": 0.0001035374410253408, "epoch": 1.58, "percentage": 79.18, "elapsed_time": "5:46:21", "remaining_time": "1:31:03"} +{"current_steps": 8550, "total_steps": 10798, "loss": 1.9562, "reward": null, "learning_rate": 0.0001035374410253408, "epoch": 1.58, "percentage": 79.18, "elapsed_time": "5:46:18", "remaining_time": "1:31:03"} +{"current_steps": 8560, "total_steps": 10798, "loss": 1.9432, "reward": null, "learning_rate": 0.0001026527374062825, "epoch": 1.59, "percentage": 79.27, "elapsed_time": "5:52:47", "remaining_time": "1:32:14"} +{"current_steps": 8560, "total_steps": 10798, "loss": 1.9432, "reward": null, "learning_rate": 0.0001026527374062825, "epoch": 1.59, "percentage": 79.27, "elapsed_time": "5:46:46", "remaining_time": "1:30:39"} +{"current_steps": 8560, "total_steps": 10798, "loss": 1.9432, "reward": null, "learning_rate": 0.0001026527374062825, "epoch": 1.59, "percentage": 79.27, "elapsed_time": "5:46:43", "remaining_time": "1:30:38"} +{"current_steps": 8560, "total_steps": 10798, "loss": 1.9432, "reward": null, "learning_rate": 0.0001026527374062825, "epoch": 1.59, "percentage": 79.27, "elapsed_time": "5:46:44", "remaining_time": "1:30:39"} +{"current_steps": 8570, "total_steps": 10798, "loss": 1.9007, "reward": null, "learning_rate": 0.00010177139722206191, "epoch": 1.59, "percentage": 79.37, "elapsed_time": "5:47:08", "remaining_time": "1:30:15"} +{"current_steps": 8570, "total_steps": 10798, "loss": 1.9007, "reward": null, "learning_rate": 0.00010177139722206191, "epoch": 1.59, "percentage": 79.37, "elapsed_time": "5:53:13", "remaining_time": "1:31:49"} +{"current_steps": 8570, "total_steps": 10798, "loss": 1.9007, "reward": null, "learning_rate": 0.00010177139722206191, "epoch": 1.59, "percentage": 79.37, "elapsed_time": "5:47:12", "remaining_time": "1:30:15"} +{"current_steps": 8570, "total_steps": 10798, "loss": 1.9007, "reward": null, "learning_rate": 0.00010177139722206191, "epoch": 1.59, "percentage": 79.37, "elapsed_time": "5:47:10", "remaining_time": "1:30:15"} +{"current_steps": 8580, "total_steps": 10798, "loss": 1.9834, "reward": null, "learning_rate": 0.00010089342793298028, "epoch": 1.59, "percentage": 79.46, "elapsed_time": "5:53:39", "remaining_time": "1:31:25"} +{"current_steps": 8580, "total_steps": 10798, "loss": 1.9834, "reward": null, "learning_rate": 0.00010089342793298028, "epoch": 1.59, "percentage": 79.46, "elapsed_time": "5:47:34", "remaining_time": "1:29:51"} +{"current_steps": 8580, "total_steps": 10798, "loss": 1.9834, "reward": null, "learning_rate": 0.00010089342793298028, "epoch": 1.59, "percentage": 79.46, "elapsed_time": "5:47:36", "remaining_time": "1:29:51"} +{"current_steps": 8580, "total_steps": 10798, "loss": 1.9834, "reward": null, "learning_rate": 0.00010089342793298028, "epoch": 1.59, "percentage": 79.46, "elapsed_time": "5:47:38", "remaining_time": "1:29:52"} +{"current_steps": 8590, "total_steps": 10798, "loss": 1.9063, "reward": null, "learning_rate": 0.00010001883697080504, "epoch": 1.59, "percentage": 79.55, "elapsed_time": "5:54:03", "remaining_time": "1:31:00"} +{"current_steps": 8590, "total_steps": 10798, "loss": 1.9063, "reward": null, "learning_rate": 0.00010001883697080504, "epoch": 1.59, "percentage": 79.55, "elapsed_time": "5:48:00", "remaining_time": "1:29:27"} +{"current_steps": 8590, "total_steps": 10798, "loss": 1.9063, "reward": null, "learning_rate": 0.00010001883697080504, "epoch": 1.59, "percentage": 79.55, "elapsed_time": "5:47:59", "remaining_time": "1:29:26"} +{"current_steps": 8590, "total_steps": 10798, "loss": 1.9063, "reward": null, "learning_rate": 0.00010001883697080504, "epoch": 1.59, "percentage": 79.55, "elapsed_time": "5:48:02", "remaining_time": "1:29:27"} +{"current_steps": 8600, "total_steps": 10798, "loss": 1.9063, "reward": null, "learning_rate": 9.914763173870738e-05, "epoch": 1.59, "percentage": 79.64, "elapsed_time": "5:54:28", "remaining_time": "1:30:35"} +{"current_steps": 8600, "total_steps": 10798, "loss": 1.9063, "reward": null, "learning_rate": 9.914763173870738e-05, "epoch": 1.59, "percentage": 79.64, "elapsed_time": "5:48:25", "remaining_time": "1:29:03"} +{"current_steps": 8600, "total_steps": 10798, "loss": 1.9063, "reward": null, "learning_rate": 9.914763173870738e-05, "epoch": 1.59, "percentage": 79.64, "elapsed_time": "5:48:24", "remaining_time": "1:29:02"} +{"current_steps": 8600, "total_steps": 10798, "loss": 1.9063, "reward": null, "learning_rate": 9.914763173870738e-05, "epoch": 1.59, "percentage": 79.64, "elapsed_time": "5:48:27", "remaining_time": "1:29:03"} +{"current_steps": 8610, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 9.827981961119869e-05, "epoch": 1.59, "percentage": 79.74, "elapsed_time": "5:54:52", "remaining_time": "1:30:11"} +{"current_steps": 8610, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 9.827981961119869e-05, "epoch": 1.59, "percentage": 79.74, "elapsed_time": "5:48:48", "remaining_time": "1:28:38"} +{"current_steps": 8610, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 9.827981961119869e-05, "epoch": 1.59, "percentage": 79.74, "elapsed_time": "5:48:49", "remaining_time": "1:28:38"} +{"current_steps": 8610, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 9.827981961119869e-05, "epoch": 1.59, "percentage": 79.74, "elapsed_time": "5:48:51", "remaining_time": "1:28:39"} +{"current_steps": 8620, "total_steps": 10798, "loss": 1.9096, "reward": null, "learning_rate": 9.741540793406911e-05, "epoch": 1.6, "percentage": 79.83, "elapsed_time": "5:55:17", "remaining_time": "1:29:46"} +{"current_steps": 8620, "total_steps": 10798, "loss": 1.9096, "reward": null, "learning_rate": 9.741540793406911e-05, "epoch": 1.6, "percentage": 79.83, "elapsed_time": "5:49:12", "remaining_time": "1:28:14"} +{"current_steps": 8620, "total_steps": 10798, "loss": 1.9096, "reward": null, "learning_rate": 9.741540793406911e-05, "epoch": 1.6, "percentage": 79.83, "elapsed_time": "5:49:14", "remaining_time": "1:28:14"} +{"current_steps": 8620, "total_steps": 10798, "loss": 1.9096, "reward": null, "learning_rate": 9.741540793406911e-05, "epoch": 1.6, "percentage": 79.83, "elapsed_time": "5:49:15", "remaining_time": "1:28:14"} +{"current_steps": 8630, "total_steps": 10798, "loss": 1.8657, "reward": null, "learning_rate": 9.655440402432464e-05, "epoch": 1.6, "percentage": 79.92, "elapsed_time": "5:55:42", "remaining_time": "1:29:21"} +{"current_steps": 8630, "total_steps": 10798, "loss": 1.8657, "reward": null, "learning_rate": 9.655440402432464e-05, "epoch": 1.6, "percentage": 79.92, "elapsed_time": "5:49:40", "remaining_time": "1:27:50"} +{"current_steps": 8630, "total_steps": 10798, "loss": 1.8657, "reward": null, "learning_rate": 9.655440402432464e-05, "epoch": 1.6, "percentage": 79.92, "elapsed_time": "5:49:38", "remaining_time": "1:27:50"} +{"current_steps": 8630, "total_steps": 10798, "loss": 1.8657, "reward": null, "learning_rate": 9.655440402432464e-05, "epoch": 1.6, "percentage": 79.92, "elapsed_time": "5:49:37", "remaining_time": "1:27:49"} +{"current_steps": 8640, "total_steps": 10798, "loss": 1.9237, "reward": null, "learning_rate": 9.569681517012585e-05, "epoch": 1.6, "percentage": 80.01, "elapsed_time": "5:56:06", "remaining_time": "1:28:56"} +{"current_steps": 8640, "total_steps": 10798, "loss": 1.9237, "reward": null, "learning_rate": 9.569681517012585e-05, "epoch": 1.6, "percentage": 80.01, "elapsed_time": "5:50:01", "remaining_time": "1:27:25"} +{"current_steps": 8640, "total_steps": 10798, "loss": 1.9237, "reward": null, "learning_rate": 9.569681517012585e-05, "epoch": 1.6, "percentage": 80.01, "elapsed_time": "5:50:05", "remaining_time": "1:27:26"} +{"current_steps": 8640, "total_steps": 10798, "loss": 1.9237, "reward": null, "learning_rate": 9.569681517012585e-05, "epoch": 1.6, "percentage": 80.01, "elapsed_time": "5:50:03", "remaining_time": "1:27:26"} +{"current_steps": 8650, "total_steps": 10798, "loss": 1.9739, "reward": null, "learning_rate": 9.484264863072523e-05, "epoch": 1.6, "percentage": 80.11, "elapsed_time": "5:56:32", "remaining_time": "1:28:32"} +{"current_steps": 8650, "total_steps": 10798, "loss": 1.9739, "reward": null, "learning_rate": 9.484264863072523e-05, "epoch": 1.6, "percentage": 80.11, "elapsed_time": "5:50:28", "remaining_time": "1:27:01"} +{"current_steps": 8650, "total_steps": 10798, "loss": 1.9739, "reward": null, "learning_rate": 9.484264863072523e-05, "epoch": 1.6, "percentage": 80.11, "elapsed_time": "5:50:30", "remaining_time": "1:27:02"} +{"current_steps": 8650, "total_steps": 10798, "loss": 1.9739, "reward": null, "learning_rate": 9.484264863072523e-05, "epoch": 1.6, "percentage": 80.11, "elapsed_time": "5:50:27", "remaining_time": "1:27:01"} +{"current_steps": 8660, "total_steps": 10798, "loss": 1.9199, "reward": null, "learning_rate": 9.399191163640675e-05, "epoch": 1.6, "percentage": 80.2, "elapsed_time": "5:56:56", "remaining_time": "1:28:07"} +{"current_steps": 8660, "total_steps": 10798, "loss": 1.9199, "reward": null, "learning_rate": 9.399191163640675e-05, "epoch": 1.6, "percentage": 80.2, "elapsed_time": "5:50:51", "remaining_time": "1:26:37"} +{"current_steps": 8660, "total_steps": 10798, "loss": 1.9199, "reward": null, "learning_rate": 9.399191163640675e-05, "epoch": 1.6, "percentage": 80.2, "elapsed_time": "5:50:55", "remaining_time": "1:26:38"} +{"current_steps": 8660, "total_steps": 10798, "loss": 1.9199, "reward": null, "learning_rate": 9.399191163640675e-05, "epoch": 1.6, "percentage": 80.2, "elapsed_time": "5:50:53", "remaining_time": "1:26:37"} +{"current_steps": 8670, "total_steps": 10798, "loss": 1.9639, "reward": null, "learning_rate": 9.314461138842406e-05, "epoch": 1.61, "percentage": 80.29, "elapsed_time": "5:57:21", "remaining_time": "1:27:42"} +{"current_steps": 8670, "total_steps": 10798, "loss": 1.9639, "reward": null, "learning_rate": 9.314461138842406e-05, "epoch": 1.61, "percentage": 80.29, "elapsed_time": "5:51:20", "remaining_time": "1:26:13"} +{"current_steps": 8670, "total_steps": 10798, "loss": 1.9639, "reward": null, "learning_rate": 9.314461138842406e-05, "epoch": 1.61, "percentage": 80.29, "elapsed_time": "5:51:16", "remaining_time": "1:26:13"} +{"current_steps": 8670, "total_steps": 10798, "loss": 1.9639, "reward": null, "learning_rate": 9.314461138842406e-05, "epoch": 1.61, "percentage": 80.29, "elapsed_time": "5:51:18", "remaining_time": "1:26:13"} +{"current_steps": 8680, "total_steps": 10798, "loss": 1.9391, "reward": null, "learning_rate": 9.230075505893987e-05, "epoch": 1.61, "percentage": 80.39, "elapsed_time": "5:57:45", "remaining_time": "1:27:17"} +{"current_steps": 8680, "total_steps": 10798, "loss": 1.9391, "reward": null, "learning_rate": 9.230075505893987e-05, "epoch": 1.61, "percentage": 80.39, "elapsed_time": "5:51:40", "remaining_time": "1:25:48"} +{"current_steps": 8680, "total_steps": 10798, "loss": 1.9391, "reward": null, "learning_rate": 9.230075505893987e-05, "epoch": 1.61, "percentage": 80.39, "elapsed_time": "5:51:42", "remaining_time": "1:25:49"} +{"current_steps": 8680, "total_steps": 10798, "loss": 1.9391, "reward": null, "learning_rate": 9.230075505893987e-05, "epoch": 1.61, "percentage": 80.39, "elapsed_time": "5:51:44", "remaining_time": "1:25:49"} +{"current_steps": 8690, "total_steps": 10798, "loss": 1.9326, "reward": null, "learning_rate": 9.146034979096496e-05, "epoch": 1.61, "percentage": 80.48, "elapsed_time": "5:58:10", "remaining_time": "1:26:53"} +{"current_steps": 8690, "total_steps": 10798, "loss": 1.9326, "reward": null, "learning_rate": 9.146034979096496e-05, "epoch": 1.61, "percentage": 80.48, "elapsed_time": "5:52:08", "remaining_time": "1:25:25"} +{"current_steps": 8690, "total_steps": 10798, "loss": 1.9326, "reward": null, "learning_rate": 9.146034979096496e-05, "epoch": 1.61, "percentage": 80.48, "elapsed_time": "5:52:05", "remaining_time": "1:25:24"} +{"current_steps": 8690, "total_steps": 10798, "loss": 1.9326, "reward": null, "learning_rate": 9.146034979096496e-05, "epoch": 1.61, "percentage": 80.48, "elapsed_time": "5:52:07", "remaining_time": "1:25:24"} +{"current_steps": 8700, "total_steps": 10798, "loss": 1.9501, "reward": null, "learning_rate": 9.06234026982976e-05, "epoch": 1.61, "percentage": 80.57, "elapsed_time": "5:52:33", "remaining_time": "1:25:01"} +{"current_steps": 8700, "total_steps": 10798, "loss": 1.9501, "reward": null, "learning_rate": 9.06234026982976e-05, "epoch": 1.61, "percentage": 80.57, "elapsed_time": "5:58:34", "remaining_time": "1:26:28"} +{"current_steps": 8700, "total_steps": 10798, "loss": 1.9501, "reward": null, "learning_rate": 9.06234026982976e-05, "epoch": 1.61, "percentage": 80.57, "elapsed_time": "5:52:30", "remaining_time": "1:25:00"} +{"current_steps": 8700, "total_steps": 10798, "loss": 1.9501, "reward": null, "learning_rate": 9.06234026982976e-05, "epoch": 1.61, "percentage": 80.57, "elapsed_time": "5:52:31", "remaining_time": "1:25:00"} +{"current_steps": 8710, "total_steps": 10798, "loss": 1.9041, "reward": null, "learning_rate": 8.9789920865464e-05, "epoch": 1.61, "percentage": 80.66, "elapsed_time": "5:52:54", "remaining_time": "1:24:35"} +{"current_steps": 8710, "total_steps": 10798, "loss": 1.9041, "reward": null, "learning_rate": 8.9789920865464e-05, "epoch": 1.61, "percentage": 80.66, "elapsed_time": "5:52:57", "remaining_time": "1:24:36"} +{"current_steps": 8710, "total_steps": 10798, "loss": 1.9041, "reward": null, "learning_rate": 8.9789920865464e-05, "epoch": 1.61, "percentage": 80.66, "elapsed_time": "5:52:55", "remaining_time": "1:24:36"} +{"current_steps": 8710, "total_steps": 10798, "loss": 1.9041, "reward": null, "learning_rate": 8.9789920865464e-05, "epoch": 1.61, "percentage": 80.66, "elapsed_time": "5:58:59", "remaining_time": "1:26:03"} +{"current_steps": 8720, "total_steps": 10798, "loss": 1.931, "reward": null, "learning_rate": 8.895991134765758e-05, "epoch": 1.62, "percentage": 80.76, "elapsed_time": "5:53:21", "remaining_time": "1:24:12"} +{"current_steps": 8720, "total_steps": 10798, "loss": 1.931, "reward": null, "learning_rate": 8.895991134765758e-05, "epoch": 1.62, "percentage": 80.76, "elapsed_time": "5:59:23", "remaining_time": "1:25:38"} +{"current_steps": 8720, "total_steps": 10798, "loss": 1.931, "reward": null, "learning_rate": 8.895991134765758e-05, "epoch": 1.62, "percentage": 80.76, "elapsed_time": "5:53:18", "remaining_time": "1:24:11"} +{"current_steps": 8720, "total_steps": 10798, "loss": 1.931, "reward": null, "learning_rate": 8.895991134765758e-05, "epoch": 1.62, "percentage": 80.76, "elapsed_time": "5:53:19", "remaining_time": "1:24:12"} +{"current_steps": 8730, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 8.813338117067965e-05, "epoch": 1.62, "percentage": 80.85, "elapsed_time": "5:59:47", "remaining_time": "1:25:13"} +{"current_steps": 8730, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 8.813338117067965e-05, "epoch": 1.62, "percentage": 80.85, "elapsed_time": "5:53:44", "remaining_time": "1:23:47"} +{"current_steps": 8730, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 8.813338117067965e-05, "epoch": 1.62, "percentage": 80.85, "elapsed_time": "5:53:46", "remaining_time": "1:23:48"} +{"current_steps": 8730, "total_steps": 10798, "loss": 1.9589, "reward": null, "learning_rate": 8.813338117067965e-05, "epoch": 1.62, "percentage": 80.85, "elapsed_time": "5:53:42", "remaining_time": "1:23:47"} +{"current_steps": 8740, "total_steps": 10798, "loss": 1.9226, "reward": null, "learning_rate": 8.731033733088012e-05, "epoch": 1.62, "percentage": 80.94, "elapsed_time": "6:00:12", "remaining_time": "1:24:49"} +{"current_steps": 8740, "total_steps": 10798, "loss": 1.9226, "reward": null, "learning_rate": 8.731033733088012e-05, "epoch": 1.62, "percentage": 80.94, "elapsed_time": "5:54:07", "remaining_time": "1:23:23"} +{"current_steps": 8740, "total_steps": 10798, "loss": 1.9226, "reward": null, "learning_rate": 8.731033733088012e-05, "epoch": 1.62, "percentage": 80.94, "elapsed_time": "5:54:10", "remaining_time": "1:23:23"} +{"current_steps": 8740, "total_steps": 10798, "loss": 1.9226, "reward": null, "learning_rate": 8.731033733088012e-05, "epoch": 1.62, "percentage": 80.94, "elapsed_time": "5:54:09", "remaining_time": "1:23:23"} +{"current_steps": 8750, "total_steps": 10798, "loss": 1.911, "reward": null, "learning_rate": 8.649078679509742e-05, "epoch": 1.62, "percentage": 81.03, "elapsed_time": "6:00:37", "remaining_time": "1:24:24"} +{"current_steps": 8750, "total_steps": 10798, "loss": 1.911, "reward": null, "learning_rate": 8.649078679509742e-05, "epoch": 1.62, "percentage": 81.03, "elapsed_time": "5:54:35", "remaining_time": "1:22:59"} +{"current_steps": 8750, "total_steps": 10798, "loss": 1.911, "reward": null, "learning_rate": 8.649078679509742e-05, "epoch": 1.62, "percentage": 81.03, "elapsed_time": "5:54:34", "remaining_time": "1:22:59"} +{"current_steps": 8750, "total_steps": 10798, "loss": 1.911, "reward": null, "learning_rate": 8.649078679509742e-05, "epoch": 1.62, "percentage": 81.03, "elapsed_time": "5:54:32", "remaining_time": "1:22:59"} +{"current_steps": 8760, "total_steps": 10798, "loss": 1.9641, "reward": null, "learning_rate": 8.567473650060082e-05, "epoch": 1.62, "percentage": 81.13, "elapsed_time": "6:01:02", "remaining_time": "1:23:59"} +{"current_steps": 8760, "total_steps": 10798, "loss": 1.9641, "reward": null, "learning_rate": 8.567473650060082e-05, "epoch": 1.62, "percentage": 81.13, "elapsed_time": "5:54:57", "remaining_time": "1:22:34"} +{"current_steps": 8760, "total_steps": 10798, "loss": 1.9641, "reward": null, "learning_rate": 8.567473650060082e-05, "epoch": 1.62, "percentage": 81.13, "elapsed_time": "5:55:00", "remaining_time": "1:22:35"} +{"current_steps": 8760, "total_steps": 10798, "loss": 1.9641, "reward": null, "learning_rate": 8.567473650060082e-05, "epoch": 1.62, "percentage": 81.13, "elapsed_time": "5:54:58", "remaining_time": "1:22:35"} +{"current_steps": 8770, "total_steps": 10798, "loss": 1.8924, "reward": null, "learning_rate": 8.486219335503026e-05, "epoch": 1.62, "percentage": 81.22, "elapsed_time": "6:01:26", "remaining_time": "1:23:34"} +{"current_steps": 8770, "total_steps": 10798, "loss": 1.8924, "reward": null, "learning_rate": 8.486219335503026e-05, "epoch": 1.62, "percentage": 81.22, "elapsed_time": "5:55:22", "remaining_time": "1:22:10"} +{"current_steps": 8770, "total_steps": 10798, "loss": 1.8924, "reward": null, "learning_rate": 8.486219335503026e-05, "epoch": 1.62, "percentage": 81.22, "elapsed_time": "5:55:24", "remaining_time": "1:22:11"} +{"current_steps": 8770, "total_steps": 10798, "loss": 1.8924, "reward": null, "learning_rate": 8.486219335503026e-05, "epoch": 1.62, "percentage": 81.22, "elapsed_time": "5:55:21", "remaining_time": "1:22:10"} +{"current_steps": 8780, "total_steps": 10798, "loss": 1.9583, "reward": null, "learning_rate": 8.405316423633958e-05, "epoch": 1.63, "percentage": 81.31, "elapsed_time": "6:01:51", "remaining_time": "1:23:10"} +{"current_steps": 8780, "total_steps": 10798, "loss": 1.9583, "reward": null, "learning_rate": 8.405316423633958e-05, "epoch": 1.63, "percentage": 81.31, "elapsed_time": "5:55:50", "remaining_time": "1:21:47"} +{"current_steps": 8780, "total_steps": 10798, "loss": 1.9583, "reward": null, "learning_rate": 8.405316423633958e-05, "epoch": 1.63, "percentage": 81.31, "elapsed_time": "5:55:48", "remaining_time": "1:21:46"} +{"current_steps": 8780, "total_steps": 10798, "loss": 1.9583, "reward": null, "learning_rate": 8.405316423633958e-05, "epoch": 1.63, "percentage": 81.31, "elapsed_time": "5:55:47", "remaining_time": "1:21:46"} +{"current_steps": 8790, "total_steps": 10798, "loss": 1.9399, "reward": null, "learning_rate": 8.324765599273649e-05, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "5:56:12", "remaining_time": "1:21:22"} +{"current_steps": 8790, "total_steps": 10798, "loss": 1.9399, "reward": null, "learning_rate": 8.324765599273649e-05, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "5:56:13", "remaining_time": "1:21:22"} +{"current_steps": 8790, "total_steps": 10798, "loss": 1.9399, "reward": null, "learning_rate": 8.324765599273649e-05, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "5:56:15", "remaining_time": "1:21:23"} +{"current_steps": 8790, "total_steps": 10798, "loss": 1.9399, "reward": null, "learning_rate": 8.324765599273649e-05, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "6:02:17", "remaining_time": "1:22:45"} +{"current_steps": 8800, "total_steps": 10798, "loss": 1.9362, "reward": null, "learning_rate": 8.244567544262588e-05, "epoch": 1.63, "percentage": 81.5, "elapsed_time": "6:02:42", "remaining_time": "1:22:21"} +{"current_steps": 8800, "total_steps": 10798, "loss": 1.9362, "reward": null, "learning_rate": 8.244567544262588e-05, "epoch": 1.63, "percentage": 81.5, "elapsed_time": "5:56:37", "remaining_time": "1:20:58"} +{"current_steps": 8800, "total_steps": 10798, "loss": 1.9362, "reward": null, "learning_rate": 8.244567544262588e-05, "epoch": 1.63, "percentage": 81.5, "elapsed_time": "5:56:40", "remaining_time": "1:20:58"} +{"current_steps": 8800, "total_steps": 10798, "loss": 1.9362, "reward": null, "learning_rate": 8.244567544262588e-05, "epoch": 1.63, "percentage": 81.5, "elapsed_time": "5:56:39", "remaining_time": "1:20:58"} +{"current_steps": 8810, "total_steps": 10798, "loss": 1.9283, "reward": null, "learning_rate": 8.164722937455177e-05, "epoch": 1.63, "percentage": 81.59, "elapsed_time": "6:03:07", "remaining_time": "1:21:56"} +{"current_steps": 8810, "total_steps": 10798, "loss": 1.9283, "reward": null, "learning_rate": 8.164722937455177e-05, "epoch": 1.63, "percentage": 81.59, "elapsed_time": "5:57:02", "remaining_time": "1:20:34"} +{"current_steps": 8810, "total_steps": 10798, "loss": 1.9283, "reward": null, "learning_rate": 8.164722937455177e-05, "epoch": 1.63, "percentage": 81.59, "elapsed_time": "5:57:05", "remaining_time": "1:20:34"} +{"current_steps": 8810, "total_steps": 10798, "loss": 1.9283, "reward": null, "learning_rate": 8.164722937455177e-05, "epoch": 1.63, "percentage": 81.59, "elapsed_time": "5:57:04", "remaining_time": "1:20:34"} +{"current_steps": 8820, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 8.08523245471392e-05, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "6:03:32", "remaining_time": "1:21:31"} +{"current_steps": 8820, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 8.08523245471392e-05, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "5:57:27", "remaining_time": "1:20:09"} +{"current_steps": 8820, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 8.08523245471392e-05, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "5:57:28", "remaining_time": "1:20:10"} +{"current_steps": 8820, "total_steps": 10798, "loss": 1.9588, "reward": null, "learning_rate": 8.08523245471392e-05, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "5:57:30", "remaining_time": "1:20:10"} +{"current_steps": 8830, "total_steps": 10798, "loss": 1.9126, "reward": null, "learning_rate": 8.006096768903848e-05, "epoch": 1.64, "percentage": 81.77, "elapsed_time": "5:57:53", "remaining_time": "1:19:45"} +{"current_steps": 8830, "total_steps": 10798, "loss": 1.9126, "reward": null, "learning_rate": 8.006096768903848e-05, "epoch": 1.64, "percentage": 81.77, "elapsed_time": "5:57:55", "remaining_time": "1:19:46"} +{"current_steps": 8830, "total_steps": 10798, "loss": 1.9126, "reward": null, "learning_rate": 8.006096768903848e-05, "epoch": 1.64, "percentage": 81.77, "elapsed_time": "5:57:56", "remaining_time": "1:19:46"} +{"current_steps": 8830, "total_steps": 10798, "loss": 1.9126, "reward": null, "learning_rate": 8.006096768903848e-05, "epoch": 1.64, "percentage": 81.77, "elapsed_time": "6:03:58", "remaining_time": "1:21:07"} +{"current_steps": 8840, "total_steps": 10798, "loss": 1.9331, "reward": null, "learning_rate": 7.927316549886659e-05, "epoch": 1.64, "percentage": 81.87, "elapsed_time": "5:58:18", "remaining_time": "1:19:21"} +{"current_steps": 8840, "total_steps": 10798, "loss": 1.9331, "reward": null, "learning_rate": 7.927316549886659e-05, "epoch": 1.64, "percentage": 81.87, "elapsed_time": "5:58:20", "remaining_time": "1:19:22"} +{"current_steps": 8840, "total_steps": 10798, "loss": 1.9331, "reward": null, "learning_rate": 7.927316549886659e-05, "epoch": 1.64, "percentage": 81.87, "elapsed_time": "5:58:22", "remaining_time": "1:19:22"} +{"current_steps": 8840, "total_steps": 10798, "loss": 1.9331, "reward": null, "learning_rate": 7.927316549886659e-05, "epoch": 1.64, "percentage": 81.87, "elapsed_time": "6:04:23", "remaining_time": "1:20:42"} +{"current_steps": 8850, "total_steps": 10798, "loss": 1.8967, "reward": null, "learning_rate": 7.84889246451515e-05, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "6:04:47", "remaining_time": "1:20:17"} +{"current_steps": 8850, "total_steps": 10798, "loss": 1.8967, "reward": null, "learning_rate": 7.84889246451515e-05, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "5:58:42", "remaining_time": "1:18:57"} +{"current_steps": 8850, "total_steps": 10798, "loss": 1.8967, "reward": null, "learning_rate": 7.84889246451515e-05, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "5:58:46", "remaining_time": "1:18:58"} +{"current_steps": 8850, "total_steps": 10798, "loss": 1.8967, "reward": null, "learning_rate": 7.84889246451515e-05, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "5:58:44", "remaining_time": "1:18:57"} +{"current_steps": 8860, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 7.77082517662756e-05, "epoch": 1.64, "percentage": 82.05, "elapsed_time": "5:59:07", "remaining_time": "1:18:33"} +{"current_steps": 8860, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 7.77082517662756e-05, "epoch": 1.64, "percentage": 82.05, "elapsed_time": "5:59:10", "remaining_time": "1:18:33"} +{"current_steps": 8860, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 7.77082517662756e-05, "epoch": 1.64, "percentage": 82.05, "elapsed_time": "5:59:08", "remaining_time": "1:18:33"} +{"current_steps": 8860, "total_steps": 10798, "loss": 1.927, "reward": null, "learning_rate": 7.77082517662756e-05, "epoch": 1.64, "percentage": 82.05, "elapsed_time": "6:05:12", "remaining_time": "1:19:52"} +{"current_steps": 8870, "total_steps": 10798, "loss": 1.8978, "reward": null, "learning_rate": 7.693115347041884e-05, "epoch": 1.64, "percentage": 82.14, "elapsed_time": "6:05:37", "remaining_time": "1:19:28"} +{"current_steps": 8870, "total_steps": 10798, "loss": 1.8978, "reward": null, "learning_rate": 7.693115347041884e-05, "epoch": 1.64, "percentage": 82.14, "elapsed_time": "5:59:32", "remaining_time": "1:18:09"} +{"current_steps": 8870, "total_steps": 10798, "loss": 1.8978, "reward": null, "learning_rate": 7.693115347041884e-05, "epoch": 1.64, "percentage": 82.14, "elapsed_time": "5:59:36", "remaining_time": "1:18:09"} +{"current_steps": 8870, "total_steps": 10798, "loss": 1.8978, "reward": null, "learning_rate": 7.693115347041884e-05, "epoch": 1.64, "percentage": 82.14, "elapsed_time": "5:59:34", "remaining_time": "1:18:09"} +{"current_steps": 8880, "total_steps": 10798, "loss": 1.9142, "reward": null, "learning_rate": 7.615763633550421e-05, "epoch": 1.64, "percentage": 82.24, "elapsed_time": "5:59:57", "remaining_time": "1:17:44"} +{"current_steps": 8880, "total_steps": 10798, "loss": 1.9142, "reward": null, "learning_rate": 7.615763633550421e-05, "epoch": 1.64, "percentage": 82.24, "elapsed_time": "5:59:58", "remaining_time": "1:17:45"} +{"current_steps": 8880, "total_steps": 10798, "loss": 1.9142, "reward": null, "learning_rate": 7.615763633550421e-05, "epoch": 1.64, "percentage": 82.24, "elapsed_time": "6:00:00", "remaining_time": "1:17:45"} +{"current_steps": 8880, "total_steps": 10798, "loss": 1.9142, "reward": null, "learning_rate": 7.615763633550421e-05, "epoch": 1.64, "percentage": 82.24, "elapsed_time": "6:06:02", "remaining_time": "1:19:03"} +{"current_steps": 8890, "total_steps": 10798, "loss": 1.9001, "reward": null, "learning_rate": 7.538770690914015e-05, "epoch": 1.65, "percentage": 82.33, "elapsed_time": "6:06:26", "remaining_time": "1:18:38"} +{"current_steps": 8890, "total_steps": 10798, "loss": 1.9001, "reward": null, "learning_rate": 7.538770690914015e-05, "epoch": 1.65, "percentage": 82.33, "elapsed_time": "6:00:21", "remaining_time": "1:17:20"} +{"current_steps": 8890, "total_steps": 10798, "loss": 1.9001, "reward": null, "learning_rate": 7.538770690914015e-05, "epoch": 1.65, "percentage": 82.33, "elapsed_time": "6:00:24", "remaining_time": "1:17:21"} +{"current_steps": 8890, "total_steps": 10798, "loss": 1.9001, "reward": null, "learning_rate": 7.538770690914015e-05, "epoch": 1.65, "percentage": 82.33, "elapsed_time": "6:00:23", "remaining_time": "1:17:20"} +{"current_steps": 8900, "total_steps": 10798, "loss": 1.8979, "reward": null, "learning_rate": 7.462137170856698e-05, "epoch": 1.65, "percentage": 82.42, "elapsed_time": "6:06:51", "remaining_time": "1:18:14"} +{"current_steps": 8900, "total_steps": 10798, "loss": 1.8979, "reward": null, "learning_rate": 7.462137170856698e-05, "epoch": 1.65, "percentage": 82.42, "elapsed_time": "6:00:49", "remaining_time": "1:16:57"} +{"current_steps": 8900, "total_steps": 10798, "loss": 1.8979, "reward": null, "learning_rate": 7.462137170856698e-05, "epoch": 1.65, "percentage": 82.42, "elapsed_time": "6:00:48", "remaining_time": "1:16:56"} +{"current_steps": 8900, "total_steps": 10798, "loss": 1.8979, "reward": null, "learning_rate": 7.462137170856698e-05, "epoch": 1.65, "percentage": 82.42, "elapsed_time": "6:00:46", "remaining_time": "1:16:56"} +{"current_steps": 8910, "total_steps": 10798, "loss": 1.892, "reward": null, "learning_rate": 7.385863722060022e-05, "epoch": 1.65, "percentage": 82.52, "elapsed_time": "6:07:15", "remaining_time": "1:17:49"} +{"current_steps": 8910, "total_steps": 10798, "loss": 1.892, "reward": null, "learning_rate": 7.385863722060022e-05, "epoch": 1.65, "percentage": 82.52, "elapsed_time": "6:01:13", "remaining_time": "1:16:32"} +{"current_steps": 8910, "total_steps": 10798, "loss": 1.892, "reward": null, "learning_rate": 7.385863722060022e-05, "epoch": 1.65, "percentage": 82.52, "elapsed_time": "6:01:11", "remaining_time": "1:16:32"} +{"current_steps": 8910, "total_steps": 10798, "loss": 1.892, "reward": null, "learning_rate": 7.385863722060022e-05, "epoch": 1.65, "percentage": 82.52, "elapsed_time": "6:01:10", "remaining_time": "1:16:31"} +{"current_steps": 8920, "total_steps": 10798, "loss": 1.9496, "reward": null, "learning_rate": 7.309950990157677e-05, "epoch": 1.65, "percentage": 82.61, "elapsed_time": "6:07:40", "remaining_time": "1:17:24"} +{"current_steps": 8920, "total_steps": 10798, "loss": 1.9496, "reward": null, "learning_rate": 7.309950990157677e-05, "epoch": 1.65, "percentage": 82.61, "elapsed_time": "6:01:37", "remaining_time": "1:16:08"} +{"current_steps": 8920, "total_steps": 10798, "loss": 1.9496, "reward": null, "learning_rate": 7.309950990157677e-05, "epoch": 1.65, "percentage": 82.61, "elapsed_time": "6:01:35", "remaining_time": "1:16:07"} +{"current_steps": 8920, "total_steps": 10798, "loss": 1.9496, "reward": null, "learning_rate": 7.309950990157677e-05, "epoch": 1.65, "percentage": 82.61, "elapsed_time": "6:01:38", "remaining_time": "1:16:08"} +{"current_steps": 8930, "total_steps": 10798, "loss": 1.8879, "reward": null, "learning_rate": 7.234399617729976e-05, "epoch": 1.65, "percentage": 82.7, "elapsed_time": "6:08:06", "remaining_time": "1:17:00"} +{"current_steps": 8930, "total_steps": 10798, "loss": 1.8879, "reward": null, "learning_rate": 7.234399617729976e-05, "epoch": 1.65, "percentage": 82.7, "elapsed_time": "6:02:04", "remaining_time": "1:15:44"} +{"current_steps": 8930, "total_steps": 10798, "loss": 1.8879, "reward": null, "learning_rate": 7.234399617729976e-05, "epoch": 1.65, "percentage": 82.7, "elapsed_time": "6:02:03", "remaining_time": "1:15:44"} +{"current_steps": 8930, "total_steps": 10798, "loss": 1.8879, "reward": null, "learning_rate": 7.234399617729976e-05, "epoch": 1.65, "percentage": 82.7, "elapsed_time": "6:02:01", "remaining_time": "1:15:43"} +{"current_steps": 8940, "total_steps": 10798, "loss": 1.921, "reward": null, "learning_rate": 7.159210244298414e-05, "epoch": 1.66, "percentage": 82.79, "elapsed_time": "6:02:26", "remaining_time": "1:15:19"} +{"current_steps": 8940, "total_steps": 10798, "loss": 1.921, "reward": null, "learning_rate": 7.159210244298414e-05, "epoch": 1.66, "percentage": 82.79, "elapsed_time": "6:08:31", "remaining_time": "1:16:35"} +{"current_steps": 8940, "total_steps": 10798, "loss": 1.921, "reward": null, "learning_rate": 7.159210244298414e-05, "epoch": 1.66, "percentage": 82.79, "elapsed_time": "6:02:29", "remaining_time": "1:15:20"} +{"current_steps": 8940, "total_steps": 10798, "loss": 1.921, "reward": null, "learning_rate": 7.159210244298414e-05, "epoch": 1.66, "percentage": 82.79, "elapsed_time": "6:02:28", "remaining_time": "1:15:19"} +{"current_steps": 8950, "total_steps": 10798, "loss": 1.9408, "reward": null, "learning_rate": 7.084383506320291e-05, "epoch": 1.66, "percentage": 82.89, "elapsed_time": "6:08:56", "remaining_time": "1:16:10"} +{"current_steps": 8950, "total_steps": 10798, "loss": 1.9408, "reward": null, "learning_rate": 7.084383506320291e-05, "epoch": 1.66, "percentage": 82.89, "elapsed_time": "6:02:54", "remaining_time": "1:14:56"} +{"current_steps": 8950, "total_steps": 10798, "loss": 1.9408, "reward": null, "learning_rate": 7.084383506320291e-05, "epoch": 1.66, "percentage": 82.89, "elapsed_time": "6:02:51", "remaining_time": "1:14:55"} +{"current_steps": 8950, "total_steps": 10798, "loss": 1.9408, "reward": null, "learning_rate": 7.084383506320291e-05, "epoch": 1.66, "percentage": 82.89, "elapsed_time": "6:02:53", "remaining_time": "1:14:55"} +{"current_steps": 8960, "total_steps": 10798, "loss": 1.9258, "reward": null, "learning_rate": 7.009920037183248e-05, "epoch": 1.66, "percentage": 82.98, "elapsed_time": "6:09:20", "remaining_time": "1:15:45"} +{"current_steps": 8960, "total_steps": 10798, "loss": 1.9258, "reward": null, "learning_rate": 7.009920037183248e-05, "epoch": 1.66, "percentage": 82.98, "elapsed_time": "6:03:15", "remaining_time": "1:14:31"} +{"current_steps": 8960, "total_steps": 10798, "loss": 1.9258, "reward": null, "learning_rate": 7.009920037183248e-05, "epoch": 1.66, "percentage": 82.98, "elapsed_time": "6:03:17", "remaining_time": "1:14:31"} +{"current_steps": 8960, "total_steps": 10798, "loss": 1.9258, "reward": null, "learning_rate": 7.009920037183248e-05, "epoch": 1.66, "percentage": 82.98, "elapsed_time": "6:03:19", "remaining_time": "1:14:31"} +{"current_steps": 8970, "total_steps": 10798, "loss": 1.9182, "reward": null, "learning_rate": 6.935820467200005e-05, "epoch": 1.66, "percentage": 83.07, "elapsed_time": "6:09:44", "remaining_time": "1:15:20"} +{"current_steps": 8970, "total_steps": 10798, "loss": 1.9182, "reward": null, "learning_rate": 6.935820467200005e-05, "epoch": 1.66, "percentage": 83.07, "elapsed_time": "6:03:41", "remaining_time": "1:14:06"} +{"current_steps": 8970, "total_steps": 10798, "loss": 1.9182, "reward": null, "learning_rate": 6.935820467200005e-05, "epoch": 1.66, "percentage": 83.07, "elapsed_time": "6:03:42", "remaining_time": "1:14:07"} +{"current_steps": 8970, "total_steps": 10798, "loss": 1.9182, "reward": null, "learning_rate": 6.935820467200005e-05, "epoch": 1.66, "percentage": 83.07, "elapsed_time": "6:03:39", "remaining_time": "1:14:06"} +{"current_steps": 8980, "total_steps": 10798, "loss": 1.9668, "reward": null, "learning_rate": 6.862085423602955e-05, "epoch": 1.66, "percentage": 83.16, "elapsed_time": "6:04:03", "remaining_time": "1:13:42"} +{"current_steps": 8980, "total_steps": 10798, "loss": 1.9668, "reward": null, "learning_rate": 6.862085423602955e-05, "epoch": 1.66, "percentage": 83.16, "elapsed_time": "6:04:07", "remaining_time": "1:13:42"} +{"current_steps": 8980, "total_steps": 10798, "loss": 1.9668, "reward": null, "learning_rate": 6.862085423602955e-05, "epoch": 1.66, "percentage": 83.16, "elapsed_time": "6:04:05", "remaining_time": "1:13:42"} +{"current_steps": 8980, "total_steps": 10798, "loss": 1.9668, "reward": null, "learning_rate": 6.862085423602955e-05, "epoch": 1.66, "percentage": 83.16, "elapsed_time": "6:10:08", "remaining_time": "1:14:56"} +{"current_steps": 8990, "total_steps": 10798, "loss": 1.898, "reward": null, "learning_rate": 6.78871553053888e-05, "epoch": 1.67, "percentage": 83.26, "elapsed_time": "6:10:33", "remaining_time": "1:14:31"} +{"current_steps": 8990, "total_steps": 10798, "loss": 1.898, "reward": null, "learning_rate": 6.78871553053888e-05, "epoch": 1.67, "percentage": 83.26, "elapsed_time": "6:04:28", "remaining_time": "1:13:18"} +{"current_steps": 8990, "total_steps": 10798, "loss": 1.898, "reward": null, "learning_rate": 6.78871553053888e-05, "epoch": 1.67, "percentage": 83.26, "elapsed_time": "6:04:30", "remaining_time": "1:13:18"} +{"current_steps": 8990, "total_steps": 10798, "loss": 1.898, "reward": null, "learning_rate": 6.78871553053888e-05, "epoch": 1.67, "percentage": 83.26, "elapsed_time": "6:04:32", "remaining_time": "1:13:18"} +{"current_steps": 9000, "total_steps": 10798, "loss": 1.9261, "reward": null, "learning_rate": 6.715711409063652e-05, "epoch": 1.67, "percentage": 83.35, "elapsed_time": "6:10:58", "remaining_time": "1:14:06"} +{"current_steps": 9000, "total_steps": 10798, "loss": 1.9261, "reward": null, "learning_rate": 6.715711409063652e-05, "epoch": 1.67, "percentage": 83.35, "elapsed_time": "6:04:54", "remaining_time": "1:12:54"} +{"current_steps": 9000, "total_steps": 10798, "loss": 1.9261, "reward": null, "learning_rate": 6.715711409063652e-05, "epoch": 1.67, "percentage": 83.35, "elapsed_time": "6:04:56", "remaining_time": "1:12:54"} +{"current_steps": 9000, "total_steps": 10798, "loss": 1.9261, "reward": null, "learning_rate": 6.715711409063652e-05, "epoch": 1.67, "percentage": 83.35, "elapsed_time": "6:04:53", "remaining_time": "1:12:53"} +{"current_steps": 9010, "total_steps": 10798, "loss": 1.9167, "reward": null, "learning_rate": 6.643073677136996e-05, "epoch": 1.67, "percentage": 83.44, "elapsed_time": "6:05:16", "remaining_time": "1:12:29"} +{"current_steps": 9010, "total_steps": 10798, "loss": 1.9167, "reward": null, "learning_rate": 6.643073677136996e-05, "epoch": 1.67, "percentage": 83.44, "elapsed_time": "6:05:20", "remaining_time": "1:12:29"} +{"current_steps": 9010, "total_steps": 10798, "loss": 1.9167, "reward": null, "learning_rate": 6.643073677136996e-05, "epoch": 1.67, "percentage": 83.44, "elapsed_time": "6:05:18", "remaining_time": "1:12:29"} +{"current_steps": 9010, "total_steps": 10798, "loss": 1.9167, "reward": null, "learning_rate": 6.643073677136996e-05, "epoch": 1.67, "percentage": 83.44, "elapsed_time": "6:11:21", "remaining_time": "1:13:41"} +{"current_steps": 9020, "total_steps": 10798, "loss": 1.9066, "reward": null, "learning_rate": 6.570802949617261e-05, "epoch": 1.67, "percentage": 83.53, "elapsed_time": "6:11:45", "remaining_time": "1:13:16"} +{"current_steps": 9020, "total_steps": 10798, "loss": 1.9066, "reward": null, "learning_rate": 6.570802949617261e-05, "epoch": 1.67, "percentage": 83.53, "elapsed_time": "6:05:40", "remaining_time": "1:12:04"} +{"current_steps": 9020, "total_steps": 10798, "loss": 1.9066, "reward": null, "learning_rate": 6.570802949617261e-05, "epoch": 1.67, "percentage": 83.53, "elapsed_time": "6:05:44", "remaining_time": "1:12:05"} +{"current_steps": 9020, "total_steps": 10798, "loss": 1.9066, "reward": null, "learning_rate": 6.570802949617261e-05, "epoch": 1.67, "percentage": 83.53, "elapsed_time": "6:05:42", "remaining_time": "1:12:05"} +{"current_steps": 9030, "total_steps": 10798, "loss": 1.9091, "reward": null, "learning_rate": 6.49889983825619e-05, "epoch": 1.67, "percentage": 83.63, "elapsed_time": "6:12:10", "remaining_time": "1:12:52"} +{"current_steps": 9030, "total_steps": 10798, "loss": 1.9091, "reward": null, "learning_rate": 6.49889983825619e-05, "epoch": 1.67, "percentage": 83.63, "elapsed_time": "6:06:05", "remaining_time": "1:11:40"} +{"current_steps": 9030, "total_steps": 10798, "loss": 1.9091, "reward": null, "learning_rate": 6.49889983825619e-05, "epoch": 1.67, "percentage": 83.63, "elapsed_time": "6:06:09", "remaining_time": "1:11:41"} +{"current_steps": 9030, "total_steps": 10798, "loss": 1.9091, "reward": null, "learning_rate": 6.49889983825619e-05, "epoch": 1.67, "percentage": 83.63, "elapsed_time": "6:06:07", "remaining_time": "1:11:41"} +{"current_steps": 9040, "total_steps": 10798, "loss": 1.8853, "reward": null, "learning_rate": 6.427364951693776e-05, "epoch": 1.67, "percentage": 83.72, "elapsed_time": "6:12:36", "remaining_time": "1:12:27"} +{"current_steps": 9040, "total_steps": 10798, "loss": 1.8853, "reward": null, "learning_rate": 6.427364951693776e-05, "epoch": 1.67, "percentage": 83.72, "elapsed_time": "6:06:32", "remaining_time": "1:11:16"} +{"current_steps": 9040, "total_steps": 10798, "loss": 1.8853, "reward": null, "learning_rate": 6.427364951693776e-05, "epoch": 1.67, "percentage": 83.72, "elapsed_time": "6:06:31", "remaining_time": "1:11:16"} +{"current_steps": 9040, "total_steps": 10798, "loss": 1.8853, "reward": null, "learning_rate": 6.427364951693776e-05, "epoch": 1.67, "percentage": 83.72, "elapsed_time": "6:06:34", "remaining_time": "1:11:17"} +{"current_steps": 9050, "total_steps": 10798, "loss": 1.9459, "reward": null, "learning_rate": 6.356198895453053e-05, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "6:07:00", "remaining_time": "1:10:53"} +{"current_steps": 9050, "total_steps": 10798, "loss": 1.9459, "reward": null, "learning_rate": 6.356198895453053e-05, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "6:06:58", "remaining_time": "1:10:52"} +{"current_steps": 9050, "total_steps": 10798, "loss": 1.9459, "reward": null, "learning_rate": 6.356198895453053e-05, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "6:06:56", "remaining_time": "1:10:52"} +{"current_steps": 9050, "total_steps": 10798, "loss": 1.9459, "reward": null, "learning_rate": 6.356198895453053e-05, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "6:13:01", "remaining_time": "1:12:03"} +{"current_steps": 9060, "total_steps": 10798, "loss": 1.9073, "reward": null, "learning_rate": 6.285402271935048e-05, "epoch": 1.68, "percentage": 83.9, "elapsed_time": "6:13:26", "remaining_time": "1:11:38"} +{"current_steps": 9060, "total_steps": 10798, "loss": 1.9073, "reward": null, "learning_rate": 6.285402271935048e-05, "epoch": 1.68, "percentage": 83.9, "elapsed_time": "6:07:23", "remaining_time": "1:10:28"} +{"current_steps": 9060, "total_steps": 10798, "loss": 1.9073, "reward": null, "learning_rate": 6.285402271935048e-05, "epoch": 1.68, "percentage": 83.9, "elapsed_time": "6:07:25", "remaining_time": "1:10:29"} +{"current_steps": 9060, "total_steps": 10798, "loss": 1.9073, "reward": null, "learning_rate": 6.285402271935048e-05, "epoch": 1.68, "percentage": 83.9, "elapsed_time": "6:07:22", "remaining_time": "1:10:28"} +{"current_steps": 9070, "total_steps": 10798, "loss": 1.902, "reward": null, "learning_rate": 6.214975680413621e-05, "epoch": 1.68, "percentage": 84.0, "elapsed_time": "6:13:51", "remaining_time": "1:11:13"} +{"current_steps": 9070, "total_steps": 10798, "loss": 1.902, "reward": null, "learning_rate": 6.214975680413621e-05, "epoch": 1.68, "percentage": 84.0, "elapsed_time": "6:07:47", "remaining_time": "1:10:04"} +{"current_steps": 9070, "total_steps": 10798, "loss": 1.902, "reward": null, "learning_rate": 6.214975680413621e-05, "epoch": 1.68, "percentage": 84.0, "elapsed_time": "6:07:48", "remaining_time": "1:10:04"} +{"current_steps": 9070, "total_steps": 10798, "loss": 1.902, "reward": null, "learning_rate": 6.214975680413621e-05, "epoch": 1.68, "percentage": 84.0, "elapsed_time": "6:07:50", "remaining_time": "1:10:04"} +{"current_steps": 9080, "total_steps": 10798, "loss": 1.8812, "reward": null, "learning_rate": 6.144919717030417e-05, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "6:14:16", "remaining_time": "1:10:48"} +{"current_steps": 9080, "total_steps": 10798, "loss": 1.8812, "reward": null, "learning_rate": 6.144919717030417e-05, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "6:08:11", "remaining_time": "1:09:39"} +{"current_steps": 9080, "total_steps": 10798, "loss": 1.8812, "reward": null, "learning_rate": 6.144919717030417e-05, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "6:08:12", "remaining_time": "1:09:40"} +{"current_steps": 9080, "total_steps": 10798, "loss": 1.8812, "reward": null, "learning_rate": 6.144919717030417e-05, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "6:08:14", "remaining_time": "1:09:40"} +{"current_steps": 9090, "total_steps": 10798, "loss": 1.8672, "reward": null, "learning_rate": 6.075234974789839e-05, "epoch": 1.68, "percentage": 84.18, "elapsed_time": "6:08:35", "remaining_time": "1:09:15"} +{"current_steps": 9090, "total_steps": 10798, "loss": 1.8672, "reward": null, "learning_rate": 6.075234974789839e-05, "epoch": 1.68, "percentage": 84.18, "elapsed_time": "6:08:36", "remaining_time": "1:09:15"} +{"current_steps": 9090, "total_steps": 10798, "loss": 1.8672, "reward": null, "learning_rate": 6.075234974789839e-05, "epoch": 1.68, "percentage": 84.18, "elapsed_time": "6:08:38", "remaining_time": "1:09:16"} +{"current_steps": 9090, "total_steps": 10798, "loss": 1.8672, "reward": null, "learning_rate": 6.075234974789839e-05, "epoch": 1.68, "percentage": 84.18, "elapsed_time": "6:14:39", "remaining_time": "1:10:23"} +{"current_steps": 9100, "total_steps": 10798, "loss": 1.9297, "reward": null, "learning_rate": 6.005922043553952e-05, "epoch": 1.69, "percentage": 84.27, "elapsed_time": "6:15:03", "remaining_time": "1:09:59"} +{"current_steps": 9100, "total_steps": 10798, "loss": 1.9297, "reward": null, "learning_rate": 6.005922043553952e-05, "epoch": 1.69, "percentage": 84.27, "elapsed_time": "6:09:00", "remaining_time": "1:08:51"} +{"current_steps": 9100, "total_steps": 10798, "loss": 1.9297, "reward": null, "learning_rate": 6.005922043553952e-05, "epoch": 1.69, "percentage": 84.27, "elapsed_time": "6:09:02", "remaining_time": "1:08:51"} +{"current_steps": 9100, "total_steps": 10798, "loss": 1.9297, "reward": null, "learning_rate": 6.005922043553952e-05, "epoch": 1.69, "percentage": 84.27, "elapsed_time": "6:08:58", "remaining_time": "1:08:50"} +{"current_steps": 9110, "total_steps": 10798, "loss": 1.8775, "reward": null, "learning_rate": 5.9369815100376037e-05, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "6:15:28", "remaining_time": "1:09:34"} +{"current_steps": 9110, "total_steps": 10798, "loss": 1.8775, "reward": null, "learning_rate": 5.9369815100376037e-05, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "6:09:27", "remaining_time": "1:08:27"} +{"current_steps": 9110, "total_steps": 10798, "loss": 1.8775, "reward": null, "learning_rate": 5.9369815100376037e-05, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "6:09:25", "remaining_time": "1:08:27"} +{"current_steps": 9110, "total_steps": 10798, "loss": 1.8775, "reward": null, "learning_rate": 5.9369815100376037e-05, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "6:09:24", "remaining_time": "1:08:26"} +{"current_steps": 9120, "total_steps": 10798, "loss": 1.8831, "reward": null, "learning_rate": 5.868413957803331e-05, "epoch": 1.69, "percentage": 84.46, "elapsed_time": "6:15:53", "remaining_time": "1:09:09"} +{"current_steps": 9120, "total_steps": 10798, "loss": 1.8831, "reward": null, "learning_rate": 5.868413957803331e-05, "epoch": 1.69, "percentage": 84.46, "elapsed_time": "6:09:48", "remaining_time": "1:08:02"} +{"current_steps": 9120, "total_steps": 10798, "loss": 1.8831, "reward": null, "learning_rate": 5.868413957803331e-05, "epoch": 1.69, "percentage": 84.46, "elapsed_time": "6:09:52", "remaining_time": "1:08:03"} +{"current_steps": 9120, "total_steps": 10798, "loss": 1.8831, "reward": null, "learning_rate": 5.868413957803331e-05, "epoch": 1.69, "percentage": 84.46, "elapsed_time": "6:09:50", "remaining_time": "1:08:02"} +{"current_steps": 9130, "total_steps": 10798, "loss": 1.9026, "reward": null, "learning_rate": 5.800219967256576e-05, "epoch": 1.69, "percentage": 84.55, "elapsed_time": "6:16:18", "remaining_time": "1:08:44"} +{"current_steps": 9130, "total_steps": 10798, "loss": 1.9026, "reward": null, "learning_rate": 5.800219967256576e-05, "epoch": 1.69, "percentage": 84.55, "elapsed_time": "6:10:17", "remaining_time": "1:07:38"} +{"current_steps": 9130, "total_steps": 10798, "loss": 1.9026, "reward": null, "learning_rate": 5.800219967256576e-05, "epoch": 1.69, "percentage": 84.55, "elapsed_time": "6:10:15", "remaining_time": "1:07:38"} +{"current_steps": 9130, "total_steps": 10798, "loss": 1.9026, "reward": null, "learning_rate": 5.800219967256576e-05, "epoch": 1.69, "percentage": 84.55, "elapsed_time": "6:10:13", "remaining_time": "1:07:38"} +{"current_steps": 9140, "total_steps": 10798, "loss": 1.8944, "reward": null, "learning_rate": 5.7324001156406014e-05, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "6:16:44", "remaining_time": "1:08:20"} +{"current_steps": 9140, "total_steps": 10798, "loss": 1.8944, "reward": null, "learning_rate": 5.7324001156406014e-05, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "6:10:40", "remaining_time": "1:07:14"} +{"current_steps": 9140, "total_steps": 10798, "loss": 1.8944, "reward": null, "learning_rate": 5.7324001156406014e-05, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "6:10:42", "remaining_time": "1:07:14"} +{"current_steps": 9140, "total_steps": 10798, "loss": 1.8944, "reward": null, "learning_rate": 5.7324001156406014e-05, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "6:10:39", "remaining_time": "1:07:14"} +{"current_steps": 9150, "total_steps": 10798, "loss": 1.9154, "reward": null, "learning_rate": 5.664954977031733e-05, "epoch": 1.69, "percentage": 84.74, "elapsed_time": "6:17:09", "remaining_time": "1:07:55"} +{"current_steps": 9150, "total_steps": 10798, "loss": 1.9154, "reward": null, "learning_rate": 5.664954977031733e-05, "epoch": 1.69, "percentage": 84.74, "elapsed_time": "6:11:04", "remaining_time": "1:06:50"} +{"current_steps": 9150, "total_steps": 10798, "loss": 1.9154, "reward": null, "learning_rate": 5.664954977031733e-05, "epoch": 1.69, "percentage": 84.74, "elapsed_time": "6:11:05", "remaining_time": "1:06:50"} +{"current_steps": 9150, "total_steps": 10798, "loss": 1.9154, "reward": null, "learning_rate": 5.664954977031733e-05, "epoch": 1.69, "percentage": 84.74, "elapsed_time": "6:11:07", "remaining_time": "1:06:50"} +{"current_steps": 9160, "total_steps": 10798, "loss": 1.8994, "reward": null, "learning_rate": 5.5978851223344455e-05, "epoch": 1.7, "percentage": 84.83, "elapsed_time": "6:11:29", "remaining_time": "1:06:25"} +{"current_steps": 9160, "total_steps": 10798, "loss": 1.8994, "reward": null, "learning_rate": 5.5978851223344455e-05, "epoch": 1.7, "percentage": 84.83, "elapsed_time": "6:11:31", "remaining_time": "1:06:26"} +{"current_steps": 9160, "total_steps": 10798, "loss": 1.8994, "reward": null, "learning_rate": 5.5978851223344455e-05, "epoch": 1.7, "percentage": 84.83, "elapsed_time": "6:11:33", "remaining_time": "1:06:26"} +{"current_steps": 9160, "total_steps": 10798, "loss": 1.8994, "reward": null, "learning_rate": 5.5978851223344455e-05, "epoch": 1.7, "percentage": 84.83, "elapsed_time": "6:17:34", "remaining_time": "1:07:31"} +{"current_steps": 9170, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 5.531191119276513e-05, "epoch": 1.7, "percentage": 84.92, "elapsed_time": "6:11:54", "remaining_time": "1:06:01"} +{"current_steps": 9170, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 5.531191119276513e-05, "epoch": 1.7, "percentage": 84.92, "elapsed_time": "6:11:56", "remaining_time": "1:06:01"} +{"current_steps": 9170, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 5.531191119276513e-05, "epoch": 1.7, "percentage": 84.92, "elapsed_time": "6:11:58", "remaining_time": "1:06:02"} +{"current_steps": 9170, "total_steps": 10798, "loss": 1.9397, "reward": null, "learning_rate": 5.531191119276513e-05, "epoch": 1.7, "percentage": 84.92, "elapsed_time": "6:17:59", "remaining_time": "1:07:06"} +{"current_steps": 9180, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 5.4648735324042855e-05, "epoch": 1.7, "percentage": 85.02, "elapsed_time": "6:12:19", "remaining_time": "1:05:37"} +{"current_steps": 9180, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 5.4648735324042855e-05, "epoch": 1.7, "percentage": 85.02, "elapsed_time": "6:12:22", "remaining_time": "1:05:37"} +{"current_steps": 9180, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 5.4648735324042855e-05, "epoch": 1.7, "percentage": 85.02, "elapsed_time": "6:18:24", "remaining_time": "1:06:41"} +{"current_steps": 9180, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 5.4648735324042855e-05, "epoch": 1.7, "percentage": 85.02, "elapsed_time": "6:12:20", "remaining_time": "1:05:37"} +{"current_steps": 9190, "total_steps": 10798, "loss": 1.9207, "reward": null, "learning_rate": 5.398932923077793e-05, "epoch": 1.7, "percentage": 85.11, "elapsed_time": "6:18:48", "remaining_time": "1:06:16"} +{"current_steps": 9190, "total_steps": 10798, "loss": 1.9207, "reward": null, "learning_rate": 5.398932923077793e-05, "epoch": 1.7, "percentage": 85.11, "elapsed_time": "6:12:46", "remaining_time": "1:05:13"} +{"current_steps": 9190, "total_steps": 10798, "loss": 1.9207, "reward": null, "learning_rate": 5.398932923077793e-05, "epoch": 1.7, "percentage": 85.11, "elapsed_time": "6:12:45", "remaining_time": "1:05:13"} +{"current_steps": 9190, "total_steps": 10798, "loss": 1.9207, "reward": null, "learning_rate": 5.398932923077793e-05, "epoch": 1.7, "percentage": 85.11, "elapsed_time": "6:12:43", "remaining_time": "1:05:13"} +{"current_steps": 9200, "total_steps": 10798, "loss": 1.9061, "reward": null, "learning_rate": 5.333369849466091e-05, "epoch": 1.7, "percentage": 85.2, "elapsed_time": "6:19:13", "remaining_time": "1:05:52"} +{"current_steps": 9200, "total_steps": 10798, "loss": 1.9061, "reward": null, "learning_rate": 5.333369849466091e-05, "epoch": 1.7, "percentage": 85.2, "elapsed_time": "6:13:08", "remaining_time": "1:04:48"} +{"current_steps": 9200, "total_steps": 10798, "loss": 1.9061, "reward": null, "learning_rate": 5.333369849466091e-05, "epoch": 1.7, "percentage": 85.2, "elapsed_time": "6:13:10", "remaining_time": "1:04:49"} +{"current_steps": 9200, "total_steps": 10798, "loss": 1.9061, "reward": null, "learning_rate": 5.333369849466091e-05, "epoch": 1.7, "percentage": 85.2, "elapsed_time": "6:13:11", "remaining_time": "1:04:49"} +{"current_steps": 9210, "total_steps": 10798, "loss": 1.8861, "reward": null, "learning_rate": 5.268184866542502e-05, "epoch": 1.71, "percentage": 85.29, "elapsed_time": "6:19:38", "remaining_time": "1:05:27"} +{"current_steps": 9210, "total_steps": 10798, "loss": 1.8861, "reward": null, "learning_rate": 5.268184866542502e-05, "epoch": 1.71, "percentage": 85.29, "elapsed_time": "6:13:33", "remaining_time": "1:04:24"} +{"current_steps": 9210, "total_steps": 10798, "loss": 1.8861, "reward": null, "learning_rate": 5.268184866542502e-05, "epoch": 1.71, "percentage": 85.29, "elapsed_time": "6:13:37", "remaining_time": "1:04:25"} +{"current_steps": 9210, "total_steps": 10798, "loss": 1.8861, "reward": null, "learning_rate": 5.268184866542502e-05, "epoch": 1.71, "percentage": 85.29, "elapsed_time": "6:13:35", "remaining_time": "1:04:24"} +{"current_steps": 9220, "total_steps": 10798, "loss": 1.9433, "reward": null, "learning_rate": 5.2033785260798716e-05, "epoch": 1.71, "percentage": 85.39, "elapsed_time": "6:20:03", "remaining_time": "1:05:02"} +{"current_steps": 9220, "total_steps": 10798, "loss": 1.9433, "reward": null, "learning_rate": 5.2033785260798716e-05, "epoch": 1.71, "percentage": 85.39, "elapsed_time": "6:13:59", "remaining_time": "1:04:00"} +{"current_steps": 9220, "total_steps": 10798, "loss": 1.9433, "reward": null, "learning_rate": 5.2033785260798716e-05, "epoch": 1.71, "percentage": 85.39, "elapsed_time": "6:13:58", "remaining_time": "1:04:00"} +{"current_steps": 9220, "total_steps": 10798, "loss": 1.9433, "reward": null, "learning_rate": 5.2033785260798716e-05, "epoch": 1.71, "percentage": 85.39, "elapsed_time": "6:14:01", "remaining_time": "1:04:00"} +{"current_steps": 9230, "total_steps": 10798, "loss": 1.9158, "reward": null, "learning_rate": 5.138951376646012e-05, "epoch": 1.71, "percentage": 85.48, "elapsed_time": "6:20:28", "remaining_time": "1:04:38"} +{"current_steps": 9230, "total_steps": 10798, "loss": 1.9158, "reward": null, "learning_rate": 5.138951376646012e-05, "epoch": 1.71, "percentage": 85.48, "elapsed_time": "6:14:25", "remaining_time": "1:03:36"} +{"current_steps": 9230, "total_steps": 10798, "loss": 1.9158, "reward": null, "learning_rate": 5.138951376646012e-05, "epoch": 1.71, "percentage": 85.48, "elapsed_time": "6:14:26", "remaining_time": "1:03:36"} +{"current_steps": 9230, "total_steps": 10798, "loss": 1.9158, "reward": null, "learning_rate": 5.138951376646012e-05, "epoch": 1.71, "percentage": 85.48, "elapsed_time": "6:14:23", "remaining_time": "1:03:36"} +{"current_steps": 9240, "total_steps": 10798, "loss": 1.8898, "reward": null, "learning_rate": 5.074903963598926e-05, "epoch": 1.71, "percentage": 85.57, "elapsed_time": "6:20:53", "remaining_time": "1:04:13"} +{"current_steps": 9240, "total_steps": 10798, "loss": 1.8898, "reward": null, "learning_rate": 5.074903963598926e-05, "epoch": 1.71, "percentage": 85.57, "elapsed_time": "6:14:52", "remaining_time": "1:03:12"} +{"current_steps": 9240, "total_steps": 10798, "loss": 1.8898, "reward": null, "learning_rate": 5.074903963598926e-05, "epoch": 1.71, "percentage": 85.57, "elapsed_time": "6:14:50", "remaining_time": "1:03:12"} +{"current_steps": 9240, "total_steps": 10798, "loss": 1.8898, "reward": null, "learning_rate": 5.074903963598926e-05, "epoch": 1.71, "percentage": 85.57, "elapsed_time": "6:14:49", "remaining_time": "1:03:11"} +{"current_steps": 9250, "total_steps": 10798, "loss": 1.9041, "reward": null, "learning_rate": 5.0112368290822885e-05, "epoch": 1.71, "percentage": 85.66, "elapsed_time": "6:21:17", "remaining_time": "1:03:48"} +{"current_steps": 9250, "total_steps": 10798, "loss": 1.9041, "reward": null, "learning_rate": 5.0112368290822885e-05, "epoch": 1.71, "percentage": 85.66, "elapsed_time": "6:15:12", "remaining_time": "1:02:47"} +{"current_steps": 9250, "total_steps": 10798, "loss": 1.9041, "reward": null, "learning_rate": 5.0112368290822885e-05, "epoch": 1.71, "percentage": 85.66, "elapsed_time": "6:15:14", "remaining_time": "1:02:47"} +{"current_steps": 9250, "total_steps": 10798, "loss": 1.9041, "reward": null, "learning_rate": 5.0112368290822885e-05, "epoch": 1.71, "percentage": 85.66, "elapsed_time": "6:15:16", "remaining_time": "1:02:48"} +{"current_steps": 9260, "total_steps": 10798, "loss": 1.9605, "reward": null, "learning_rate": 4.9479505120207934e-05, "epoch": 1.72, "percentage": 85.76, "elapsed_time": "6:21:42", "remaining_time": "1:03:23"} +{"current_steps": 9260, "total_steps": 10798, "loss": 1.9605, "reward": null, "learning_rate": 4.9479505120207934e-05, "epoch": 1.72, "percentage": 85.76, "elapsed_time": "6:15:39", "remaining_time": "1:02:23"} +{"current_steps": 9260, "total_steps": 10798, "loss": 1.9605, "reward": null, "learning_rate": 4.9479505120207934e-05, "epoch": 1.72, "percentage": 85.76, "elapsed_time": "6:15:40", "remaining_time": "1:02:23"} +{"current_steps": 9260, "total_steps": 10798, "loss": 1.9605, "reward": null, "learning_rate": 4.9479505120207934e-05, "epoch": 1.72, "percentage": 85.76, "elapsed_time": "6:15:37", "remaining_time": "1:02:23"} +{"current_steps": 9270, "total_steps": 10798, "loss": 1.8975, "reward": null, "learning_rate": 4.885045548115646e-05, "epoch": 1.72, "percentage": 85.85, "elapsed_time": "6:22:07", "remaining_time": "1:02:59"} +{"current_steps": 9270, "total_steps": 10798, "loss": 1.8975, "reward": null, "learning_rate": 4.885045548115646e-05, "epoch": 1.72, "percentage": 85.85, "elapsed_time": "6:16:04", "remaining_time": "1:01:59"} +{"current_steps": 9270, "total_steps": 10798, "loss": 1.8975, "reward": null, "learning_rate": 4.885045548115646e-05, "epoch": 1.72, "percentage": 85.85, "elapsed_time": "6:16:03", "remaining_time": "1:01:59"} +{"current_steps": 9270, "total_steps": 10798, "loss": 1.8975, "reward": null, "learning_rate": 4.885045548115646e-05, "epoch": 1.72, "percentage": 85.85, "elapsed_time": "6:16:06", "remaining_time": "1:01:59"} +{"current_steps": 9280, "total_steps": 10798, "loss": 1.9396, "reward": null, "learning_rate": 4.822522469839996e-05, "epoch": 1.72, "percentage": 85.94, "elapsed_time": "6:16:28", "remaining_time": "1:01:35"} +{"current_steps": 9280, "total_steps": 10798, "loss": 1.9396, "reward": null, "learning_rate": 4.822522469839996e-05, "epoch": 1.72, "percentage": 85.94, "elapsed_time": "6:16:27", "remaining_time": "1:01:34"} +{"current_steps": 9280, "total_steps": 10798, "loss": 1.9396, "reward": null, "learning_rate": 4.822522469839996e-05, "epoch": 1.72, "percentage": 85.94, "elapsed_time": "6:16:30", "remaining_time": "1:01:35"} +{"current_steps": 9280, "total_steps": 10798, "loss": 1.9396, "reward": null, "learning_rate": 4.822522469839996e-05, "epoch": 1.72, "percentage": 85.94, "elapsed_time": "6:22:32", "remaining_time": "1:02:34"} +{"current_steps": 9290, "total_steps": 10798, "loss": 1.9263, "reward": null, "learning_rate": 4.760381806434427e-05, "epoch": 1.72, "percentage": 86.03, "elapsed_time": "6:22:57", "remaining_time": "1:02:09"} +{"current_steps": 9290, "total_steps": 10798, "loss": 1.9263, "reward": null, "learning_rate": 4.760381806434427e-05, "epoch": 1.72, "percentage": 86.03, "elapsed_time": "6:16:56", "remaining_time": "1:01:11"} +{"current_steps": 9290, "total_steps": 10798, "loss": 1.9263, "reward": null, "learning_rate": 4.760381806434427e-05, "epoch": 1.72, "percentage": 86.03, "elapsed_time": "6:16:54", "remaining_time": "1:01:10"} +{"current_steps": 9290, "total_steps": 10798, "loss": 1.9263, "reward": null, "learning_rate": 4.760381806434427e-05, "epoch": 1.72, "percentage": 86.03, "elapsed_time": "6:16:52", "remaining_time": "1:01:10"} +{"current_steps": 9300, "total_steps": 10798, "loss": 1.948, "reward": null, "learning_rate": 4.698624083902503e-05, "epoch": 1.72, "percentage": 86.13, "elapsed_time": "6:23:22", "remaining_time": "1:01:45"} +{"current_steps": 9300, "total_steps": 10798, "loss": 1.948, "reward": null, "learning_rate": 4.698624083902503e-05, "epoch": 1.72, "percentage": 86.13, "elapsed_time": "6:17:18", "remaining_time": "1:00:46"} +{"current_steps": 9300, "total_steps": 10798, "loss": 1.948, "reward": null, "learning_rate": 4.698624083902503e-05, "epoch": 1.72, "percentage": 86.13, "elapsed_time": "6:17:19", "remaining_time": "1:00:46"} +{"current_steps": 9300, "total_steps": 10798, "loss": 1.948, "reward": null, "learning_rate": 4.698624083902503e-05, "epoch": 1.72, "percentage": 86.13, "elapsed_time": "6:17:21", "remaining_time": "1:00:46"} +{"current_steps": 9310, "total_steps": 10798, "loss": 1.9206, "reward": null, "learning_rate": 4.637249825006273e-05, "epoch": 1.72, "percentage": 86.22, "elapsed_time": "6:23:48", "remaining_time": "1:01:20"} +{"current_steps": 9310, "total_steps": 10798, "loss": 1.9206, "reward": null, "learning_rate": 4.637249825006273e-05, "epoch": 1.72, "percentage": 86.22, "elapsed_time": "6:17:46", "remaining_time": "1:00:22"} +{"current_steps": 9310, "total_steps": 10798, "loss": 1.9206, "reward": null, "learning_rate": 4.637249825006273e-05, "epoch": 1.72, "percentage": 86.22, "elapsed_time": "6:17:44", "remaining_time": "1:00:22"} +{"current_steps": 9310, "total_steps": 10798, "loss": 1.9206, "reward": null, "learning_rate": 4.637249825006273e-05, "epoch": 1.72, "percentage": 86.22, "elapsed_time": "6:17:43", "remaining_time": "1:00:22"} +{"current_steps": 9320, "total_steps": 10798, "loss": 1.9129, "reward": null, "learning_rate": 4.5762595492618906e-05, "epoch": 1.73, "percentage": 86.31, "elapsed_time": "6:24:13", "remaining_time": "1:00:55"} +{"current_steps": 9320, "total_steps": 10798, "loss": 1.9129, "reward": null, "learning_rate": 4.5762595492618906e-05, "epoch": 1.73, "percentage": 86.31, "elapsed_time": "6:18:08", "remaining_time": "0:59:58"} +{"current_steps": 9320, "total_steps": 10798, "loss": 1.9129, "reward": null, "learning_rate": 4.5762595492618906e-05, "epoch": 1.73, "percentage": 86.31, "elapsed_time": "6:18:09", "remaining_time": "0:59:58"} +{"current_steps": 9320, "total_steps": 10798, "loss": 1.9129, "reward": null, "learning_rate": 4.5762595492618906e-05, "epoch": 1.73, "percentage": 86.31, "elapsed_time": "6:18:11", "remaining_time": "0:59:58"} +{"current_steps": 9330, "total_steps": 10798, "loss": 1.9036, "reward": null, "learning_rate": 4.515653772935207e-05, "epoch": 1.73, "percentage": 86.4, "elapsed_time": "6:18:34", "remaining_time": "0:59:33"} +{"current_steps": 9330, "total_steps": 10798, "loss": 1.9036, "reward": null, "learning_rate": 4.515653772935207e-05, "epoch": 1.73, "percentage": 86.4, "elapsed_time": "6:18:36", "remaining_time": "0:59:34"} +{"current_steps": 9330, "total_steps": 10798, "loss": 1.9036, "reward": null, "learning_rate": 4.515653772935207e-05, "epoch": 1.73, "percentage": 86.4, "elapsed_time": "6:18:32", "remaining_time": "0:59:33"} +{"current_steps": 9330, "total_steps": 10798, "loss": 1.9036, "reward": null, "learning_rate": 4.515653772935207e-05, "epoch": 1.73, "percentage": 86.4, "elapsed_time": "6:24:37", "remaining_time": "1:00:31"} +{"current_steps": 9340, "total_steps": 10798, "loss": 1.928, "reward": null, "learning_rate": 4.455433009037385e-05, "epoch": 1.73, "percentage": 86.5, "elapsed_time": "6:25:02", "remaining_time": "1:00:06"} +{"current_steps": 9340, "total_steps": 10798, "loss": 1.928, "reward": null, "learning_rate": 4.455433009037385e-05, "epoch": 1.73, "percentage": 86.5, "elapsed_time": "6:18:59", "remaining_time": "0:59:09"} +{"current_steps": 9340, "total_steps": 10798, "loss": 1.928, "reward": null, "learning_rate": 4.455433009037385e-05, "epoch": 1.73, "percentage": 86.5, "elapsed_time": "6:19:01", "remaining_time": "0:59:10"} +{"current_steps": 9340, "total_steps": 10798, "loss": 1.928, "reward": null, "learning_rate": 4.455433009037385e-05, "epoch": 1.73, "percentage": 86.5, "elapsed_time": "6:18:58", "remaining_time": "0:59:09"} +{"current_steps": 9350, "total_steps": 10798, "loss": 1.9427, "reward": null, "learning_rate": 4.395597767320536e-05, "epoch": 1.73, "percentage": 86.59, "elapsed_time": "6:25:27", "remaining_time": "0:59:41"} +{"current_steps": 9350, "total_steps": 10798, "loss": 1.9427, "reward": null, "learning_rate": 4.395597767320536e-05, "epoch": 1.73, "percentage": 86.59, "elapsed_time": "6:19:26", "remaining_time": "0:58:45"} +{"current_steps": 9350, "total_steps": 10798, "loss": 1.9427, "reward": null, "learning_rate": 4.395597767320536e-05, "epoch": 1.73, "percentage": 86.59, "elapsed_time": "6:19:24", "remaining_time": "0:58:45"} +{"current_steps": 9350, "total_steps": 10798, "loss": 1.9427, "reward": null, "learning_rate": 4.395597767320536e-05, "epoch": 1.73, "percentage": 86.59, "elapsed_time": "6:19:22", "remaining_time": "0:58:45"} +{"current_steps": 9360, "total_steps": 10798, "loss": 1.8882, "reward": null, "learning_rate": 4.336148554273467e-05, "epoch": 1.73, "percentage": 86.68, "elapsed_time": "6:25:52", "remaining_time": "0:59:16"} +{"current_steps": 9360, "total_steps": 10798, "loss": 1.8882, "reward": null, "learning_rate": 4.336148554273467e-05, "epoch": 1.73, "percentage": 86.68, "elapsed_time": "6:19:49", "remaining_time": "0:58:21"} +{"current_steps": 9360, "total_steps": 10798, "loss": 1.8882, "reward": null, "learning_rate": 4.336148554273467e-05, "epoch": 1.73, "percentage": 86.68, "elapsed_time": "6:19:47", "remaining_time": "0:58:20"} +{"current_steps": 9360, "total_steps": 10798, "loss": 1.8882, "reward": null, "learning_rate": 4.336148554273467e-05, "epoch": 1.73, "percentage": 86.68, "elapsed_time": "6:19:50", "remaining_time": "0:58:21"} +{"current_steps": 9370, "total_steps": 10798, "loss": 1.9412, "reward": null, "learning_rate": 4.277085873117354e-05, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "6:26:17", "remaining_time": "0:58:52"} +{"current_steps": 9370, "total_steps": 10798, "loss": 1.9412, "reward": null, "learning_rate": 4.277085873117354e-05, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "6:20:14", "remaining_time": "0:57:56"} +{"current_steps": 9370, "total_steps": 10798, "loss": 1.9412, "reward": null, "learning_rate": 4.277085873117354e-05, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "6:20:15", "remaining_time": "0:57:57"} +{"current_steps": 9370, "total_steps": 10798, "loss": 1.9412, "reward": null, "learning_rate": 4.277085873117354e-05, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "6:20:12", "remaining_time": "0:57:56"} +{"current_steps": 9380, "total_steps": 10798, "loss": 1.9014, "reward": null, "learning_rate": 4.218410223801472e-05, "epoch": 1.74, "percentage": 86.87, "elapsed_time": "6:26:41", "remaining_time": "0:58:27"} +{"current_steps": 9380, "total_steps": 10798, "loss": 1.9014, "reward": null, "learning_rate": 4.218410223801472e-05, "epoch": 1.74, "percentage": 86.87, "elapsed_time": "6:20:36", "remaining_time": "0:57:32"} +{"current_steps": 9380, "total_steps": 10798, "loss": 1.9014, "reward": null, "learning_rate": 4.218410223801472e-05, "epoch": 1.74, "percentage": 86.87, "elapsed_time": "6:20:38", "remaining_time": "0:57:32"} +{"current_steps": 9380, "total_steps": 10798, "loss": 1.9014, "reward": null, "learning_rate": 4.218410223801472e-05, "epoch": 1.74, "percentage": 86.87, "elapsed_time": "6:20:40", "remaining_time": "0:57:32"} +{"current_steps": 9390, "total_steps": 10798, "loss": 1.9056, "reward": null, "learning_rate": 4.1601221029989976e-05, "epoch": 1.74, "percentage": 86.96, "elapsed_time": "6:21:04", "remaining_time": "0:57:08"} +{"current_steps": 9390, "total_steps": 10798, "loss": 1.9056, "reward": null, "learning_rate": 4.1601221029989976e-05, "epoch": 1.74, "percentage": 86.96, "elapsed_time": "6:21:03", "remaining_time": "0:57:08"} +{"current_steps": 9390, "total_steps": 10798, "loss": 1.9056, "reward": null, "learning_rate": 4.1601221029989976e-05, "epoch": 1.74, "percentage": 86.96, "elapsed_time": "6:27:06", "remaining_time": "0:58:02"} +{"current_steps": 9390, "total_steps": 10798, "loss": 1.9056, "reward": null, "learning_rate": 4.1601221029989976e-05, "epoch": 1.74, "percentage": 86.96, "elapsed_time": "6:21:01", "remaining_time": "0:57:08"} +{"current_steps": 9400, "total_steps": 10798, "loss": 1.9665, "reward": null, "learning_rate": 4.102222004102768e-05, "epoch": 1.74, "percentage": 87.05, "elapsed_time": "6:27:31", "remaining_time": "0:57:37"} +{"current_steps": 9400, "total_steps": 10798, "loss": 1.9665, "reward": null, "learning_rate": 4.102222004102768e-05, "epoch": 1.74, "percentage": 87.05, "elapsed_time": "6:21:26", "remaining_time": "0:56:43"} +{"current_steps": 9400, "total_steps": 10798, "loss": 1.9665, "reward": null, "learning_rate": 4.102222004102768e-05, "epoch": 1.74, "percentage": 87.05, "elapsed_time": "6:21:27", "remaining_time": "0:56:43"} +{"current_steps": 9400, "total_steps": 10798, "loss": 1.9665, "reward": null, "learning_rate": 4.102222004102768e-05, "epoch": 1.74, "percentage": 87.05, "elapsed_time": "6:21:29", "remaining_time": "0:56:44"} +{"current_steps": 9410, "total_steps": 10798, "loss": 1.8911, "reward": null, "learning_rate": 4.04471041722112e-05, "epoch": 1.74, "percentage": 87.15, "elapsed_time": "6:21:51", "remaining_time": "0:56:19"} +{"current_steps": 9410, "total_steps": 10798, "loss": 1.8911, "reward": null, "learning_rate": 4.04471041722112e-05, "epoch": 1.74, "percentage": 87.15, "elapsed_time": "6:27:54", "remaining_time": "0:57:13"} +{"current_steps": 9410, "total_steps": 10798, "loss": 1.8911, "reward": null, "learning_rate": 4.04471041722112e-05, "epoch": 1.74, "percentage": 87.15, "elapsed_time": "6:21:53", "remaining_time": "0:56:19"} +{"current_steps": 9410, "total_steps": 10798, "loss": 1.8911, "reward": null, "learning_rate": 4.04471041722112e-05, "epoch": 1.74, "percentage": 87.15, "elapsed_time": "6:21:50", "remaining_time": "0:56:19"} +{"current_steps": 9420, "total_steps": 10798, "loss": 1.885, "reward": null, "learning_rate": 3.987587829173772e-05, "epoch": 1.74, "percentage": 87.24, "elapsed_time": "6:28:19", "remaining_time": "0:56:48"} +{"current_steps": 9420, "total_steps": 10798, "loss": 1.885, "reward": null, "learning_rate": 3.987587829173772e-05, "epoch": 1.74, "percentage": 87.24, "elapsed_time": "6:22:18", "remaining_time": "0:55:55"} +{"current_steps": 9420, "total_steps": 10798, "loss": 1.885, "reward": null, "learning_rate": 3.987587829173772e-05, "epoch": 1.74, "percentage": 87.24, "elapsed_time": "6:22:14", "remaining_time": "0:55:55"} +{"current_steps": 9420, "total_steps": 10798, "loss": 1.885, "reward": null, "learning_rate": 3.987587829173772e-05, "epoch": 1.74, "percentage": 87.24, "elapsed_time": "6:22:16", "remaining_time": "0:55:55"} +{"current_steps": 9430, "total_steps": 10798, "loss": 1.8958, "reward": null, "learning_rate": 3.930854723487642e-05, "epoch": 1.75, "percentage": 87.33, "elapsed_time": "6:28:45", "remaining_time": "0:56:23"} +{"current_steps": 9430, "total_steps": 10798, "loss": 1.8958, "reward": null, "learning_rate": 3.930854723487642e-05, "epoch": 1.75, "percentage": 87.33, "elapsed_time": "6:22:43", "remaining_time": "0:55:31"} +{"current_steps": 9430, "total_steps": 10798, "loss": 1.8958, "reward": null, "learning_rate": 3.930854723487642e-05, "epoch": 1.75, "percentage": 87.33, "elapsed_time": "6:22:40", "remaining_time": "0:55:30"} +{"current_steps": 9430, "total_steps": 10798, "loss": 1.8958, "reward": null, "learning_rate": 3.930854723487642e-05, "epoch": 1.75, "percentage": 87.33, "elapsed_time": "6:22:41", "remaining_time": "0:55:31"} +{"current_steps": 9440, "total_steps": 10798, "loss": 1.9197, "reward": null, "learning_rate": 3.874511580392814e-05, "epoch": 1.75, "percentage": 87.42, "elapsed_time": "6:29:09", "remaining_time": "0:55:58"} +{"current_steps": 9440, "total_steps": 10798, "loss": 1.9197, "reward": null, "learning_rate": 3.874511580392814e-05, "epoch": 1.75, "percentage": 87.42, "elapsed_time": "6:23:06", "remaining_time": "0:55:06"} +{"current_steps": 9440, "total_steps": 10798, "loss": 1.9197, "reward": null, "learning_rate": 3.874511580392814e-05, "epoch": 1.75, "percentage": 87.42, "elapsed_time": "6:23:04", "remaining_time": "0:55:06"} +{"current_steps": 9440, "total_steps": 10798, "loss": 1.9197, "reward": null, "learning_rate": 3.874511580392814e-05, "epoch": 1.75, "percentage": 87.42, "elapsed_time": "6:23:08", "remaining_time": "0:55:06"} +{"current_steps": 9450, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 3.818558876818418e-05, "epoch": 1.75, "percentage": 87.52, "elapsed_time": "6:29:33", "remaining_time": "0:55:34"} +{"current_steps": 9450, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 3.818558876818418e-05, "epoch": 1.75, "percentage": 87.52, "elapsed_time": "6:23:29", "remaining_time": "0:54:42"} +{"current_steps": 9450, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 3.818558876818418e-05, "epoch": 1.75, "percentage": 87.52, "elapsed_time": "6:23:32", "remaining_time": "0:54:42"} +{"current_steps": 9450, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 3.818558876818418e-05, "epoch": 1.75, "percentage": 87.52, "elapsed_time": "6:23:30", "remaining_time": "0:54:42"} +{"current_steps": 9460, "total_steps": 10798, "loss": 1.9321, "reward": null, "learning_rate": 3.762997086388653e-05, "epoch": 1.75, "percentage": 87.61, "elapsed_time": "6:29:59", "remaining_time": "0:55:09"} +{"current_steps": 9460, "total_steps": 10798, "loss": 1.9321, "reward": null, "learning_rate": 3.762997086388653e-05, "epoch": 1.75, "percentage": 87.61, "elapsed_time": "6:23:58", "remaining_time": "0:54:18"} +{"current_steps": 9460, "total_steps": 10798, "loss": 1.9321, "reward": null, "learning_rate": 3.762997086388653e-05, "epoch": 1.75, "percentage": 87.61, "elapsed_time": "6:23:56", "remaining_time": "0:54:18"} +{"current_steps": 9460, "total_steps": 10798, "loss": 1.9321, "reward": null, "learning_rate": 3.762997086388653e-05, "epoch": 1.75, "percentage": 87.61, "elapsed_time": "6:23:55", "remaining_time": "0:54:18"} +{"current_steps": 9470, "total_steps": 10798, "loss": 1.8835, "reward": null, "learning_rate": 3.707826679418702e-05, "epoch": 1.75, "percentage": 87.7, "elapsed_time": "6:30:23", "remaining_time": "0:54:44"} +{"current_steps": 9470, "total_steps": 10798, "loss": 1.8835, "reward": null, "learning_rate": 3.707826679418702e-05, "epoch": 1.75, "percentage": 87.7, "elapsed_time": "6:24:20", "remaining_time": "0:53:53"} +{"current_steps": 9470, "total_steps": 10798, "loss": 1.8835, "reward": null, "learning_rate": 3.707826679418702e-05, "epoch": 1.75, "percentage": 87.7, "elapsed_time": "6:24:19", "remaining_time": "0:53:53"} +{"current_steps": 9470, "total_steps": 10798, "loss": 1.8835, "reward": null, "learning_rate": 3.707826679418702e-05, "epoch": 1.75, "percentage": 87.7, "elapsed_time": "6:24:22", "remaining_time": "0:53:54"} +{"current_steps": 9480, "total_steps": 10798, "loss": 1.9083, "reward": null, "learning_rate": 3.653048122910862e-05, "epoch": 1.76, "percentage": 87.79, "elapsed_time": "6:24:44", "remaining_time": "0:53:29"} +{"current_steps": 9480, "total_steps": 10798, "loss": 1.9083, "reward": null, "learning_rate": 3.653048122910862e-05, "epoch": 1.76, "percentage": 87.79, "elapsed_time": "6:24:45", "remaining_time": "0:53:29"} +{"current_steps": 9480, "total_steps": 10798, "loss": 1.9083, "reward": null, "learning_rate": 3.653048122910862e-05, "epoch": 1.76, "percentage": 87.79, "elapsed_time": "6:24:47", "remaining_time": "0:53:29"} +{"current_steps": 9480, "total_steps": 10798, "loss": 1.9083, "reward": null, "learning_rate": 3.653048122910862e-05, "epoch": 1.76, "percentage": 87.79, "elapsed_time": "6:30:48", "remaining_time": "0:54:20"} +{"current_steps": 9490, "total_steps": 10798, "loss": 1.9082, "reward": null, "learning_rate": 3.598661880550452e-05, "epoch": 1.76, "percentage": 87.89, "elapsed_time": "6:31:12", "remaining_time": "0:53:55"} +{"current_steps": 9490, "total_steps": 10798, "loss": 1.9082, "reward": null, "learning_rate": 3.598661880550452e-05, "epoch": 1.76, "percentage": 87.89, "elapsed_time": "6:25:08", "remaining_time": "0:53:04"} +{"current_steps": 9490, "total_steps": 10798, "loss": 1.9082, "reward": null, "learning_rate": 3.598661880550452e-05, "epoch": 1.76, "percentage": 87.89, "elapsed_time": "6:25:09", "remaining_time": "0:53:05"} +{"current_steps": 9490, "total_steps": 10798, "loss": 1.9082, "reward": null, "learning_rate": 3.598661880550452e-05, "epoch": 1.76, "percentage": 87.89, "elapsed_time": "6:25:11", "remaining_time": "0:53:05"} +{"current_steps": 9500, "total_steps": 10798, "loss": 1.9696, "reward": null, "learning_rate": 3.544668412702007e-05, "epoch": 1.76, "percentage": 87.98, "elapsed_time": "6:31:38", "remaining_time": "0:53:30"} +{"current_steps": 9500, "total_steps": 10798, "loss": 1.9696, "reward": null, "learning_rate": 3.544668412702007e-05, "epoch": 1.76, "percentage": 87.98, "elapsed_time": "6:25:37", "remaining_time": "0:52:41"} +{"current_steps": 9500, "total_steps": 10798, "loss": 1.9696, "reward": null, "learning_rate": 3.544668412702007e-05, "epoch": 1.76, "percentage": 87.98, "elapsed_time": "6:25:33", "remaining_time": "0:52:40"} +{"current_steps": 9500, "total_steps": 10798, "loss": 1.9696, "reward": null, "learning_rate": 3.544668412702007e-05, "epoch": 1.76, "percentage": 87.98, "elapsed_time": "6:25:35", "remaining_time": "0:52:41"} +{"current_steps": 9510, "total_steps": 10798, "loss": 1.9232, "reward": null, "learning_rate": 3.491068176405326e-05, "epoch": 1.76, "percentage": 88.07, "elapsed_time": "6:32:03", "remaining_time": "0:53:05"} +{"current_steps": 9510, "total_steps": 10798, "loss": 1.9232, "reward": null, "learning_rate": 3.491068176405326e-05, "epoch": 1.76, "percentage": 88.07, "elapsed_time": "6:25:58", "remaining_time": "0:52:16"} +{"current_steps": 9510, "total_steps": 10798, "loss": 1.9232, "reward": null, "learning_rate": 3.491068176405326e-05, "epoch": 1.76, "percentage": 88.07, "elapsed_time": "6:26:01", "remaining_time": "0:52:16"} +{"current_steps": 9510, "total_steps": 10798, "loss": 1.9232, "reward": null, "learning_rate": 3.491068176405326e-05, "epoch": 1.76, "percentage": 88.07, "elapsed_time": "6:25:59", "remaining_time": "0:52:16"} +{"current_steps": 9520, "total_steps": 10798, "loss": 1.8944, "reward": null, "learning_rate": 3.43786162537158e-05, "epoch": 1.76, "percentage": 88.16, "elapsed_time": "6:32:27", "remaining_time": "0:52:41"} +{"current_steps": 9520, "total_steps": 10798, "loss": 1.8944, "reward": null, "learning_rate": 3.43786162537158e-05, "epoch": 1.76, "percentage": 88.16, "elapsed_time": "6:26:22", "remaining_time": "0:51:52"} +{"current_steps": 9520, "total_steps": 10798, "loss": 1.8944, "reward": null, "learning_rate": 3.43786162537158e-05, "epoch": 1.76, "percentage": 88.16, "elapsed_time": "6:26:26", "remaining_time": "0:51:52"} +{"current_steps": 9520, "total_steps": 10798, "loss": 1.8944, "reward": null, "learning_rate": 3.43786162537158e-05, "epoch": 1.76, "percentage": 88.16, "elapsed_time": "6:26:24", "remaining_time": "0:51:52"} +{"current_steps": 9530, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 3.385049209979568e-05, "epoch": 1.77, "percentage": 88.26, "elapsed_time": "6:32:53", "remaining_time": "0:52:16"} +{"current_steps": 9530, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 3.385049209979568e-05, "epoch": 1.77, "percentage": 88.26, "elapsed_time": "6:26:49", "remaining_time": "0:51:28"} +{"current_steps": 9530, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 3.385049209979568e-05, "epoch": 1.77, "percentage": 88.26, "elapsed_time": "6:26:48", "remaining_time": "0:51:27"} +{"current_steps": 9530, "total_steps": 10798, "loss": 1.9341, "reward": null, "learning_rate": 3.385049209979568e-05, "epoch": 1.77, "percentage": 88.26, "elapsed_time": "6:26:51", "remaining_time": "0:51:28"} +{"current_steps": 9540, "total_steps": 10798, "loss": 1.9, "reward": null, "learning_rate": 3.3326313772717667e-05, "epoch": 1.77, "percentage": 88.35, "elapsed_time": "6:33:16", "remaining_time": "0:51:51"} +{"current_steps": 9540, "total_steps": 10798, "loss": 1.9, "reward": null, "learning_rate": 3.3326313772717667e-05, "epoch": 1.77, "percentage": 88.35, "elapsed_time": "6:27:15", "remaining_time": "0:51:03"} +{"current_steps": 9540, "total_steps": 10798, "loss": 1.9, "reward": null, "learning_rate": 3.3326313772717667e-05, "epoch": 1.77, "percentage": 88.35, "elapsed_time": "6:27:13", "remaining_time": "0:51:03"} +{"current_steps": 9540, "total_steps": 10798, "loss": 1.9, "reward": null, "learning_rate": 3.3326313772717667e-05, "epoch": 1.77, "percentage": 88.35, "elapsed_time": "6:27:11", "remaining_time": "0:51:03"} +{"current_steps": 9550, "total_steps": 10798, "loss": 1.9157, "reward": null, "learning_rate": 3.2806085709506716e-05, "epoch": 1.77, "percentage": 88.44, "elapsed_time": "6:27:40", "remaining_time": "0:50:39"} +{"current_steps": 9550, "total_steps": 10798, "loss": 1.9157, "reward": null, "learning_rate": 3.2806085709506716e-05, "epoch": 1.77, "percentage": 88.44, "elapsed_time": "6:27:37", "remaining_time": "0:50:39"} +{"current_steps": 9550, "total_steps": 10798, "loss": 1.9157, "reward": null, "learning_rate": 3.2806085709506716e-05, "epoch": 1.77, "percentage": 88.44, "elapsed_time": "6:27:38", "remaining_time": "0:50:39"} +{"current_steps": 9550, "total_steps": 10798, "loss": 1.9157, "reward": null, "learning_rate": 3.2806085709506716e-05, "epoch": 1.77, "percentage": 88.44, "elapsed_time": "6:33:42", "remaining_time": "0:51:26"} +{"current_steps": 9560, "total_steps": 10798, "loss": 1.9287, "reward": null, "learning_rate": 3.228981231374972e-05, "epoch": 1.77, "percentage": 88.53, "elapsed_time": "6:28:02", "remaining_time": "0:50:14"} +{"current_steps": 9560, "total_steps": 10798, "loss": 1.9287, "reward": null, "learning_rate": 3.228981231374972e-05, "epoch": 1.77, "percentage": 88.53, "elapsed_time": "6:28:05", "remaining_time": "0:50:15"} +{"current_steps": 9560, "total_steps": 10798, "loss": 1.9287, "reward": null, "learning_rate": 3.228981231374972e-05, "epoch": 1.77, "percentage": 88.53, "elapsed_time": "6:28:03", "remaining_time": "0:50:15"} +{"current_steps": 9560, "total_steps": 10798, "loss": 1.9287, "reward": null, "learning_rate": 3.228981231374972e-05, "epoch": 1.77, "percentage": 88.53, "elapsed_time": "6:34:06", "remaining_time": "0:51:02"} +{"current_steps": 9570, "total_steps": 10798, "loss": 1.9375, "reward": null, "learning_rate": 3.177749795555812e-05, "epoch": 1.77, "percentage": 88.63, "elapsed_time": "6:28:25", "remaining_time": "0:49:50"} +{"current_steps": 9570, "total_steps": 10798, "loss": 1.9375, "reward": null, "learning_rate": 3.177749795555812e-05, "epoch": 1.77, "percentage": 88.63, "elapsed_time": "6:28:26", "remaining_time": "0:49:50"} +{"current_steps": 9570, "total_steps": 10798, "loss": 1.9375, "reward": null, "learning_rate": 3.177749795555812e-05, "epoch": 1.77, "percentage": 88.63, "elapsed_time": "6:28:28", "remaining_time": "0:49:50"} +{"current_steps": 9570, "total_steps": 10798, "loss": 1.9375, "reward": null, "learning_rate": 3.177749795555812e-05, "epoch": 1.77, "percentage": 88.63, "elapsed_time": "6:34:30", "remaining_time": "0:50:37"} +{"current_steps": 9580, "total_steps": 10798, "loss": 1.9171, "reward": null, "learning_rate": 3.126914697153182e-05, "epoch": 1.77, "percentage": 88.72, "elapsed_time": "6:34:53", "remaining_time": "0:50:12"} +{"current_steps": 9580, "total_steps": 10798, "loss": 1.9171, "reward": null, "learning_rate": 3.126914697153182e-05, "epoch": 1.77, "percentage": 88.72, "elapsed_time": "6:28:49", "remaining_time": "0:49:26"} +{"current_steps": 9580, "total_steps": 10798, "loss": 1.9171, "reward": null, "learning_rate": 3.126914697153182e-05, "epoch": 1.77, "percentage": 88.72, "elapsed_time": "6:28:52", "remaining_time": "0:49:26"} +{"current_steps": 9580, "total_steps": 10798, "loss": 1.9171, "reward": null, "learning_rate": 3.126914697153182e-05, "epoch": 1.77, "percentage": 88.72, "elapsed_time": "6:28:50", "remaining_time": "0:49:26"} +{"current_steps": 9590, "total_steps": 10798, "loss": 1.8778, "reward": null, "learning_rate": 3.076476366472131e-05, "epoch": 1.78, "percentage": 88.81, "elapsed_time": "6:35:18", "remaining_time": "0:49:47"} +{"current_steps": 9590, "total_steps": 10798, "loss": 1.8778, "reward": null, "learning_rate": 3.076476366472131e-05, "epoch": 1.78, "percentage": 88.81, "elapsed_time": "6:29:17", "remaining_time": "0:49:02"} +{"current_steps": 9590, "total_steps": 10798, "loss": 1.8778, "reward": null, "learning_rate": 3.076476366472131e-05, "epoch": 1.78, "percentage": 88.81, "elapsed_time": "6:29:15", "remaining_time": "0:49:01"} +{"current_steps": 9590, "total_steps": 10798, "loss": 1.8778, "reward": null, "learning_rate": 3.076476366472131e-05, "epoch": 1.78, "percentage": 88.81, "elapsed_time": "6:29:14", "remaining_time": "0:49:01"} +{"current_steps": 9600, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 3.0264352304592123e-05, "epoch": 1.78, "percentage": 88.91, "elapsed_time": "6:35:44", "remaining_time": "0:49:23"} +{"current_steps": 9600, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 3.0264352304592123e-05, "epoch": 1.78, "percentage": 88.91, "elapsed_time": "6:29:39", "remaining_time": "0:48:37"} +{"current_steps": 9600, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 3.0264352304592123e-05, "epoch": 1.78, "percentage": 88.91, "elapsed_time": "6:29:43", "remaining_time": "0:48:38"} +{"current_steps": 9600, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 3.0264352304592123e-05, "epoch": 1.78, "percentage": 88.91, "elapsed_time": "6:29:41", "remaining_time": "0:48:37"} +{"current_steps": 9610, "total_steps": 10798, "loss": 1.891, "reward": null, "learning_rate": 2.9767917126987952e-05, "epoch": 1.78, "percentage": 89.0, "elapsed_time": "6:36:09", "remaining_time": "0:48:58"} +{"current_steps": 9610, "total_steps": 10798, "loss": 1.891, "reward": null, "learning_rate": 2.9767917126987952e-05, "epoch": 1.78, "percentage": 89.0, "elapsed_time": "6:30:07", "remaining_time": "0:48:13"} +{"current_steps": 9610, "total_steps": 10798, "loss": 1.891, "reward": null, "learning_rate": 2.9767917126987952e-05, "epoch": 1.78, "percentage": 89.0, "elapsed_time": "6:30:05", "remaining_time": "0:48:13"} +{"current_steps": 9610, "total_steps": 10798, "loss": 1.891, "reward": null, "learning_rate": 2.9767917126987952e-05, "epoch": 1.78, "percentage": 89.0, "elapsed_time": "6:30:04", "remaining_time": "0:48:13"} +{"current_steps": 9620, "total_steps": 10798, "loss": 1.921, "reward": null, "learning_rate": 2.927546233409567e-05, "epoch": 1.78, "percentage": 89.09, "elapsed_time": "6:36:33", "remaining_time": "0:48:33"} +{"current_steps": 9620, "total_steps": 10798, "loss": 1.921, "reward": null, "learning_rate": 2.927546233409567e-05, "epoch": 1.78, "percentage": 89.09, "elapsed_time": "6:30:32", "remaining_time": "0:47:49"} +{"current_steps": 9620, "total_steps": 10798, "loss": 1.921, "reward": null, "learning_rate": 2.927546233409567e-05, "epoch": 1.78, "percentage": 89.09, "elapsed_time": "6:30:30", "remaining_time": "0:47:49"} +{"current_steps": 9620, "total_steps": 10798, "loss": 1.921, "reward": null, "learning_rate": 2.927546233409567e-05, "epoch": 1.78, "percentage": 89.09, "elapsed_time": "6:30:28", "remaining_time": "0:47:48"} +{"current_steps": 9630, "total_steps": 10798, "loss": 1.9178, "reward": null, "learning_rate": 2.8786992094409102e-05, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "6:36:58", "remaining_time": "0:48:08"} +{"current_steps": 9630, "total_steps": 10798, "loss": 1.9178, "reward": null, "learning_rate": 2.8786992094409102e-05, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "6:30:57", "remaining_time": "0:47:25"} +{"current_steps": 9630, "total_steps": 10798, "loss": 1.9178, "reward": null, "learning_rate": 2.8786992094409102e-05, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "6:30:54", "remaining_time": "0:47:24"} +{"current_steps": 9630, "total_steps": 10798, "loss": 1.9178, "reward": null, "learning_rate": 2.8786992094409102e-05, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "6:30:55", "remaining_time": "0:47:24"} +{"current_steps": 9640, "total_steps": 10798, "loss": 1.8917, "reward": null, "learning_rate": 2.8302510542693782e-05, "epoch": 1.79, "percentage": 89.28, "elapsed_time": "6:37:23", "remaining_time": "0:47:44"} +{"current_steps": 9640, "total_steps": 10798, "loss": 1.8917, "reward": null, "learning_rate": 2.8302510542693782e-05, "epoch": 1.79, "percentage": 89.28, "elapsed_time": "6:31:22", "remaining_time": "0:47:00"} +{"current_steps": 9640, "total_steps": 10798, "loss": 1.8917, "reward": null, "learning_rate": 2.8302510542693782e-05, "epoch": 1.79, "percentage": 89.28, "elapsed_time": "6:31:20", "remaining_time": "0:47:00"} +{"current_steps": 9640, "total_steps": 10798, "loss": 1.8917, "reward": null, "learning_rate": 2.8302510542693782e-05, "epoch": 1.79, "percentage": 89.28, "elapsed_time": "6:31:19", "remaining_time": "0:47:00"} +{"current_steps": 9650, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 2.7822021779952467e-05, "epoch": 1.79, "percentage": 89.37, "elapsed_time": "6:37:49", "remaining_time": "0:47:19"} +{"current_steps": 9650, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 2.7822021779952467e-05, "epoch": 1.79, "percentage": 89.37, "elapsed_time": "6:31:44", "remaining_time": "0:46:36"} +{"current_steps": 9650, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 2.7822021779952467e-05, "epoch": 1.79, "percentage": 89.37, "elapsed_time": "6:31:46", "remaining_time": "0:46:36"} +{"current_steps": 9650, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 2.7822021779952467e-05, "epoch": 1.79, "percentage": 89.37, "elapsed_time": "6:31:48", "remaining_time": "0:46:36"} +{"current_steps": 9660, "total_steps": 10798, "loss": 1.8737, "reward": null, "learning_rate": 2.7345529873389618e-05, "epoch": 1.79, "percentage": 89.46, "elapsed_time": "6:38:15", "remaining_time": "0:46:54"} +{"current_steps": 9660, "total_steps": 10798, "loss": 1.8737, "reward": null, "learning_rate": 2.7345529873389618e-05, "epoch": 1.79, "percentage": 89.46, "elapsed_time": "6:32:10", "remaining_time": "0:46:12"} +{"current_steps": 9660, "total_steps": 10798, "loss": 1.8737, "reward": null, "learning_rate": 2.7345529873389618e-05, "epoch": 1.79, "percentage": 89.46, "elapsed_time": "6:32:13", "remaining_time": "0:46:12"} +{"current_steps": 9660, "total_steps": 10798, "loss": 1.8737, "reward": null, "learning_rate": 2.7345529873389618e-05, "epoch": 1.79, "percentage": 89.46, "elapsed_time": "6:32:11", "remaining_time": "0:46:12"} +{"current_steps": 9670, "total_steps": 10798, "loss": 1.9349, "reward": null, "learning_rate": 2.687303885637765e-05, "epoch": 1.79, "percentage": 89.55, "elapsed_time": "6:38:40", "remaining_time": "0:46:30"} +{"current_steps": 9670, "total_steps": 10798, "loss": 1.9349, "reward": null, "learning_rate": 2.687303885637765e-05, "epoch": 1.79, "percentage": 89.55, "elapsed_time": "6:32:39", "remaining_time": "0:45:48"} +{"current_steps": 9670, "total_steps": 10798, "loss": 1.9349, "reward": null, "learning_rate": 2.687303885637765e-05, "epoch": 1.79, "percentage": 89.55, "elapsed_time": "6:32:37", "remaining_time": "0:45:47"} +{"current_steps": 9670, "total_steps": 10798, "loss": 1.9349, "reward": null, "learning_rate": 2.687303885637765e-05, "epoch": 1.79, "percentage": 89.55, "elapsed_time": "6:32:36", "remaining_time": "0:45:47"} +{"current_steps": 9680, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 2.6404552728422625e-05, "epoch": 1.79, "percentage": 89.65, "elapsed_time": "6:39:04", "remaining_time": "0:46:05"} +{"current_steps": 9680, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 2.6404552728422625e-05, "epoch": 1.79, "percentage": 89.65, "elapsed_time": "6:33:03", "remaining_time": "0:45:23"} +{"current_steps": 9680, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 2.6404552728422625e-05, "epoch": 1.79, "percentage": 89.65, "elapsed_time": "6:32:59", "remaining_time": "0:45:23"} +{"current_steps": 9680, "total_steps": 10798, "loss": 1.919, "reward": null, "learning_rate": 2.6404552728422625e-05, "epoch": 1.79, "percentage": 89.65, "elapsed_time": "6:33:01", "remaining_time": "0:45:23"} +{"current_steps": 9690, "total_steps": 10798, "loss": 1.9411, "reward": null, "learning_rate": 2.5940075455130217e-05, "epoch": 1.79, "percentage": 89.74, "elapsed_time": "6:39:28", "remaining_time": "0:45:40"} +{"current_steps": 9690, "total_steps": 10798, "loss": 1.9411, "reward": null, "learning_rate": 2.5940075455130217e-05, "epoch": 1.79, "percentage": 89.74, "elapsed_time": "6:33:27", "remaining_time": "0:44:59"} +{"current_steps": 9690, "total_steps": 10798, "loss": 1.9411, "reward": null, "learning_rate": 2.5940075455130217e-05, "epoch": 1.79, "percentage": 89.74, "elapsed_time": "6:33:23", "remaining_time": "0:44:58"} +{"current_steps": 9690, "total_steps": 10798, "loss": 1.9411, "reward": null, "learning_rate": 2.5940075455130217e-05, "epoch": 1.79, "percentage": 89.74, "elapsed_time": "6:33:25", "remaining_time": "0:44:59"} +{"current_steps": 9700, "total_steps": 10798, "loss": 1.9616, "reward": null, "learning_rate": 2.547961096817214e-05, "epoch": 1.8, "percentage": 89.83, "elapsed_time": "6:39:54", "remaining_time": "0:45:16"} +{"current_steps": 9700, "total_steps": 10798, "loss": 1.9616, "reward": null, "learning_rate": 2.547961096817214e-05, "epoch": 1.8, "percentage": 89.83, "elapsed_time": "6:33:50", "remaining_time": "0:44:34"} +{"current_steps": 9700, "total_steps": 10798, "loss": 1.9616, "reward": null, "learning_rate": 2.547961096817214e-05, "epoch": 1.8, "percentage": 89.83, "elapsed_time": "6:33:53", "remaining_time": "0:44:35"} +{"current_steps": 9700, "total_steps": 10798, "loss": 1.9616, "reward": null, "learning_rate": 2.547961096817214e-05, "epoch": 1.8, "percentage": 89.83, "elapsed_time": "6:33:51", "remaining_time": "0:44:35"} +{"current_steps": 9710, "total_steps": 10798, "loss": 1.9431, "reward": null, "learning_rate": 2.5023163165253272e-05, "epoch": 1.8, "percentage": 89.92, "elapsed_time": "6:40:20", "remaining_time": "0:44:51"} +{"current_steps": 9710, "total_steps": 10798, "loss": 1.9431, "reward": null, "learning_rate": 2.5023163165253272e-05, "epoch": 1.8, "percentage": 89.92, "elapsed_time": "6:34:15", "remaining_time": "0:44:10"} +{"current_steps": 9710, "total_steps": 10798, "loss": 1.9431, "reward": null, "learning_rate": 2.5023163165253272e-05, "epoch": 1.8, "percentage": 89.92, "elapsed_time": "6:34:16", "remaining_time": "0:44:10"} +{"current_steps": 9710, "total_steps": 10798, "loss": 1.9431, "reward": null, "learning_rate": 2.5023163165253272e-05, "epoch": 1.8, "percentage": 89.92, "elapsed_time": "6:34:18", "remaining_time": "0:44:10"} +{"current_steps": 9720, "total_steps": 10798, "loss": 1.9488, "reward": null, "learning_rate": 2.4570735910078078e-05, "epoch": 1.8, "percentage": 90.02, "elapsed_time": "6:40:44", "remaining_time": "0:44:26"} +{"current_steps": 9720, "total_steps": 10798, "loss": 1.9488, "reward": null, "learning_rate": 2.4570735910078078e-05, "epoch": 1.8, "percentage": 90.02, "elapsed_time": "6:34:43", "remaining_time": "0:43:46"} +{"current_steps": 9720, "total_steps": 10798, "loss": 1.9488, "reward": null, "learning_rate": 2.4570735910078078e-05, "epoch": 1.8, "percentage": 90.02, "elapsed_time": "6:34:41", "remaining_time": "0:43:46"} +{"current_steps": 9720, "total_steps": 10798, "loss": 1.9488, "reward": null, "learning_rate": 2.4570735910078078e-05, "epoch": 1.8, "percentage": 90.02, "elapsed_time": "6:34:39", "remaining_time": "0:43:46"} +{"current_steps": 9730, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 2.4122333032318367e-05, "epoch": 1.8, "percentage": 90.11, "elapsed_time": "6:41:08", "remaining_time": "0:44:01"} +{"current_steps": 9730, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 2.4122333032318367e-05, "epoch": 1.8, "percentage": 90.11, "elapsed_time": "6:35:05", "remaining_time": "0:43:22"} +{"current_steps": 9730, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 2.4122333032318367e-05, "epoch": 1.8, "percentage": 90.11, "elapsed_time": "6:35:04", "remaining_time": "0:43:21"} +{"current_steps": 9730, "total_steps": 10798, "loss": 1.9376, "reward": null, "learning_rate": 2.4122333032318367e-05, "epoch": 1.8, "percentage": 90.11, "elapsed_time": "6:35:07", "remaining_time": "0:43:22"} +{"current_steps": 9740, "total_steps": 10798, "loss": 1.9038, "reward": null, "learning_rate": 2.3677958327580683e-05, "epoch": 1.8, "percentage": 90.2, "elapsed_time": "6:41:33", "remaining_time": "0:43:37"} +{"current_steps": 9740, "total_steps": 10798, "loss": 1.9038, "reward": null, "learning_rate": 2.3677958327580683e-05, "epoch": 1.8, "percentage": 90.2, "elapsed_time": "6:35:28", "remaining_time": "0:42:57"} +{"current_steps": 9740, "total_steps": 10798, "loss": 1.9038, "reward": null, "learning_rate": 2.3677958327580683e-05, "epoch": 1.8, "percentage": 90.2, "elapsed_time": "6:35:31", "remaining_time": "0:42:57"} +{"current_steps": 9740, "total_steps": 10798, "loss": 1.9038, "reward": null, "learning_rate": 2.3677958327580683e-05, "epoch": 1.8, "percentage": 90.2, "elapsed_time": "6:35:29", "remaining_time": "0:42:57"} +{"current_steps": 9750, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 2.3237615557374137e-05, "epoch": 1.81, "percentage": 90.29, "elapsed_time": "6:35:52", "remaining_time": "0:42:33"} +{"current_steps": 9750, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 2.3237615557374137e-05, "epoch": 1.81, "percentage": 90.29, "elapsed_time": "6:35:54", "remaining_time": "0:42:33"} +{"current_steps": 9750, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 2.3237615557374137e-05, "epoch": 1.81, "percentage": 90.29, "elapsed_time": "6:35:55", "remaining_time": "0:42:33"} +{"current_steps": 9750, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 2.3237615557374137e-05, "epoch": 1.81, "percentage": 90.29, "elapsed_time": "6:41:57", "remaining_time": "0:43:12"} +{"current_steps": 9760, "total_steps": 10798, "loss": 1.9058, "reward": null, "learning_rate": 2.2801308449078684e-05, "epoch": 1.81, "percentage": 90.39, "elapsed_time": "6:36:18", "remaining_time": "0:42:08"} +{"current_steps": 9760, "total_steps": 10798, "loss": 1.9058, "reward": null, "learning_rate": 2.2801308449078684e-05, "epoch": 1.81, "percentage": 90.39, "elapsed_time": "6:42:21", "remaining_time": "0:42:47"} +{"current_steps": 9760, "total_steps": 10798, "loss": 1.9058, "reward": null, "learning_rate": 2.2801308449078684e-05, "epoch": 1.81, "percentage": 90.39, "elapsed_time": "6:36:19", "remaining_time": "0:42:09"} +{"current_steps": 9760, "total_steps": 10798, "loss": 1.9058, "reward": null, "learning_rate": 2.2801308449078684e-05, "epoch": 1.81, "percentage": 90.39, "elapsed_time": "6:36:16", "remaining_time": "0:42:08"} +{"current_steps": 9770, "total_steps": 10798, "loss": 1.9275, "reward": null, "learning_rate": 2.2369040695913445e-05, "epoch": 1.81, "percentage": 90.48, "elapsed_time": "6:42:45", "remaining_time": "0:42:22"} +{"current_steps": 9770, "total_steps": 10798, "loss": 1.9275, "reward": null, "learning_rate": 2.2369040695913445e-05, "epoch": 1.81, "percentage": 90.48, "elapsed_time": "6:36:40", "remaining_time": "0:41:44"} +{"current_steps": 9770, "total_steps": 10798, "loss": 1.9275, "reward": null, "learning_rate": 2.2369040695913445e-05, "epoch": 1.81, "percentage": 90.48, "elapsed_time": "6:36:42", "remaining_time": "0:41:44"} +{"current_steps": 9770, "total_steps": 10798, "loss": 1.9275, "reward": null, "learning_rate": 2.2369040695913445e-05, "epoch": 1.81, "percentage": 90.48, "elapsed_time": "6:36:44", "remaining_time": "0:41:44"} +{"current_steps": 9780, "total_steps": 10798, "loss": 1.9646, "reward": null, "learning_rate": 2.1940815956905612e-05, "epoch": 1.81, "percentage": 90.57, "elapsed_time": "6:43:10", "remaining_time": "0:41:57"} +{"current_steps": 9780, "total_steps": 10798, "loss": 1.9646, "reward": null, "learning_rate": 2.1940815956905612e-05, "epoch": 1.81, "percentage": 90.57, "elapsed_time": "6:37:09", "remaining_time": "0:41:20"} +{"current_steps": 9780, "total_steps": 10798, "loss": 1.9646, "reward": null, "learning_rate": 2.1940815956905612e-05, "epoch": 1.81, "percentage": 90.57, "elapsed_time": "6:37:05", "remaining_time": "0:41:20"} +{"current_steps": 9780, "total_steps": 10798, "loss": 1.9646, "reward": null, "learning_rate": 2.1940815956905612e-05, "epoch": 1.81, "percentage": 90.57, "elapsed_time": "6:37:07", "remaining_time": "0:41:20"} +{"current_steps": 9790, "total_steps": 10798, "loss": 1.9127, "reward": null, "learning_rate": 2.1516637856859422e-05, "epoch": 1.81, "percentage": 90.66, "elapsed_time": "6:43:34", "remaining_time": "0:41:33"} +{"current_steps": 9790, "total_steps": 10798, "loss": 1.9127, "reward": null, "learning_rate": 2.1516637856859422e-05, "epoch": 1.81, "percentage": 90.66, "elapsed_time": "6:37:31", "remaining_time": "0:40:55"} +{"current_steps": 9790, "total_steps": 10798, "loss": 1.9127, "reward": null, "learning_rate": 2.1516637856859422e-05, "epoch": 1.81, "percentage": 90.66, "elapsed_time": "6:37:33", "remaining_time": "0:40:56"} +{"current_steps": 9790, "total_steps": 10798, "loss": 1.9127, "reward": null, "learning_rate": 2.1516637856859422e-05, "epoch": 1.81, "percentage": 90.66, "elapsed_time": "6:37:30", "remaining_time": "0:40:55"} +{"current_steps": 9800, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 2.109650998632512e-05, "epoch": 1.82, "percentage": 90.76, "elapsed_time": "6:43:59", "remaining_time": "0:41:08"} +{"current_steps": 9800, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 2.109650998632512e-05, "epoch": 1.82, "percentage": 90.76, "elapsed_time": "6:37:54", "remaining_time": "0:40:31"} +{"current_steps": 9800, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 2.109650998632512e-05, "epoch": 1.82, "percentage": 90.76, "elapsed_time": "6:37:56", "remaining_time": "0:40:31"} +{"current_steps": 9800, "total_steps": 10798, "loss": 1.9564, "reward": null, "learning_rate": 2.109650998632512e-05, "epoch": 1.82, "percentage": 90.76, "elapsed_time": "6:37:57", "remaining_time": "0:40:31"} +{"current_steps": 9810, "total_steps": 10798, "loss": 1.929, "reward": null, "learning_rate": 2.068043590156926e-05, "epoch": 1.82, "percentage": 90.85, "elapsed_time": "6:44:24", "remaining_time": "0:40:43"} +{"current_steps": 9810, "total_steps": 10798, "loss": 1.929, "reward": null, "learning_rate": 2.068043590156926e-05, "epoch": 1.82, "percentage": 90.85, "elapsed_time": "6:38:23", "remaining_time": "0:40:07"} +{"current_steps": 9810, "total_steps": 10798, "loss": 1.929, "reward": null, "learning_rate": 2.068043590156926e-05, "epoch": 1.82, "percentage": 90.85, "elapsed_time": "6:38:19", "remaining_time": "0:40:07"} +{"current_steps": 9810, "total_steps": 10798, "loss": 1.929, "reward": null, "learning_rate": 2.068043590156926e-05, "epoch": 1.82, "percentage": 90.85, "elapsed_time": "6:38:21", "remaining_time": "0:40:07"} +{"current_steps": 9820, "total_steps": 10798, "loss": 1.9185, "reward": null, "learning_rate": 2.0268419124544078e-05, "epoch": 1.82, "percentage": 90.94, "elapsed_time": "6:44:49", "remaining_time": "0:40:19"} +{"current_steps": 9820, "total_steps": 10798, "loss": 1.9185, "reward": null, "learning_rate": 2.0268419124544078e-05, "epoch": 1.82, "percentage": 90.94, "elapsed_time": "6:38:46", "remaining_time": "0:39:42"} +{"current_steps": 9820, "total_steps": 10798, "loss": 1.9185, "reward": null, "learning_rate": 2.0268419124544078e-05, "epoch": 1.82, "percentage": 90.94, "elapsed_time": "6:38:44", "remaining_time": "0:39:42"} +{"current_steps": 9820, "total_steps": 10798, "loss": 1.9185, "reward": null, "learning_rate": 2.0268419124544078e-05, "epoch": 1.82, "percentage": 90.94, "elapsed_time": "6:38:47", "remaining_time": "0:39:43"} +{"current_steps": 9830, "total_steps": 10798, "loss": 1.8714, "reward": null, "learning_rate": 1.986046314285772e-05, "epoch": 1.82, "percentage": 91.04, "elapsed_time": "6:45:13", "remaining_time": "0:39:54"} +{"current_steps": 9830, "total_steps": 10798, "loss": 1.8714, "reward": null, "learning_rate": 1.986046314285772e-05, "epoch": 1.82, "percentage": 91.04, "elapsed_time": "6:39:08", "remaining_time": "0:39:18"} +{"current_steps": 9830, "total_steps": 10798, "loss": 1.8714, "reward": null, "learning_rate": 1.986046314285772e-05, "epoch": 1.82, "percentage": 91.04, "elapsed_time": "6:39:11", "remaining_time": "0:39:18"} +{"current_steps": 9830, "total_steps": 10798, "loss": 1.8714, "reward": null, "learning_rate": 1.986046314285772e-05, "epoch": 1.82, "percentage": 91.04, "elapsed_time": "6:39:09", "remaining_time": "0:39:18"} +{"current_steps": 9840, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 1.9456571409744938e-05, "epoch": 1.82, "percentage": 91.13, "elapsed_time": "6:45:38", "remaining_time": "0:39:29"} +{"current_steps": 9840, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 1.9456571409744938e-05, "epoch": 1.82, "percentage": 91.13, "elapsed_time": "6:39:36", "remaining_time": "0:38:54"} +{"current_steps": 9840, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 1.9456571409744938e-05, "epoch": 1.82, "percentage": 91.13, "elapsed_time": "6:39:33", "remaining_time": "0:38:53"} +{"current_steps": 9840, "total_steps": 10798, "loss": 1.9149, "reward": null, "learning_rate": 1.9456571409744938e-05, "epoch": 1.82, "percentage": 91.13, "elapsed_time": "6:39:34", "remaining_time": "0:38:54"} +{"current_steps": 9850, "total_steps": 10798, "loss": 1.8945, "reward": null, "learning_rate": 1.9056747344037616e-05, "epoch": 1.82, "percentage": 91.22, "elapsed_time": "6:46:01", "remaining_time": "0:39:04"} +{"current_steps": 9850, "total_steps": 10798, "loss": 1.8945, "reward": null, "learning_rate": 1.9056747344037616e-05, "epoch": 1.82, "percentage": 91.22, "elapsed_time": "6:39:57", "remaining_time": "0:38:29"} +{"current_steps": 9850, "total_steps": 10798, "loss": 1.8945, "reward": null, "learning_rate": 1.9056747344037616e-05, "epoch": 1.82, "percentage": 91.22, "elapsed_time": "6:40:00", "remaining_time": "0:38:29"} +{"current_steps": 9850, "total_steps": 10798, "loss": 1.8945, "reward": null, "learning_rate": 1.9056747344037616e-05, "epoch": 1.82, "percentage": 91.22, "elapsed_time": "6:39:58", "remaining_time": "0:38:29"} +{"current_steps": 9860, "total_steps": 10798, "loss": 1.9634, "reward": null, "learning_rate": 1.8660994330136184e-05, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "6:40:22", "remaining_time": "0:38:05"} +{"current_steps": 9860, "total_steps": 10798, "loss": 1.9634, "reward": null, "learning_rate": 1.8660994330136184e-05, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "6:40:24", "remaining_time": "0:38:05"} +{"current_steps": 9860, "total_steps": 10798, "loss": 1.9634, "reward": null, "learning_rate": 1.8660994330136184e-05, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "6:40:21", "remaining_time": "0:38:05"} +{"current_steps": 9860, "total_steps": 10798, "loss": 1.9634, "reward": null, "learning_rate": 1.8660994330136184e-05, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "6:46:26", "remaining_time": "0:38:39"} +{"current_steps": 9870, "total_steps": 10798, "loss": 1.9449, "reward": null, "learning_rate": 1.8269315717980518e-05, "epoch": 1.83, "percentage": 91.41, "elapsed_time": "6:46:51", "remaining_time": "0:38:15"} +{"current_steps": 9870, "total_steps": 10798, "loss": 1.9449, "reward": null, "learning_rate": 1.8269315717980518e-05, "epoch": 1.83, "percentage": 91.41, "elapsed_time": "6:40:46", "remaining_time": "0:37:40"} +{"current_steps": 9870, "total_steps": 10798, "loss": 1.9449, "reward": null, "learning_rate": 1.8269315717980518e-05, "epoch": 1.83, "percentage": 91.41, "elapsed_time": "6:40:49", "remaining_time": "0:37:41"} +{"current_steps": 9870, "total_steps": 10798, "loss": 1.9449, "reward": null, "learning_rate": 1.8269315717980518e-05, "epoch": 1.83, "percentage": 91.41, "elapsed_time": "6:40:47", "remaining_time": "0:37:41"} +{"current_steps": 9880, "total_steps": 10798, "loss": 1.8911, "reward": null, "learning_rate": 1.7881714823021976e-05, "epoch": 1.83, "percentage": 91.5, "elapsed_time": "6:47:16", "remaining_time": "0:37:50"} +{"current_steps": 9880, "total_steps": 10798, "loss": 1.8911, "reward": null, "learning_rate": 1.7881714823021976e-05, "epoch": 1.83, "percentage": 91.5, "elapsed_time": "6:41:11", "remaining_time": "0:37:16"} +{"current_steps": 9880, "total_steps": 10798, "loss": 1.8911, "reward": null, "learning_rate": 1.7881714823021976e-05, "epoch": 1.83, "percentage": 91.5, "elapsed_time": "6:41:13", "remaining_time": "0:37:16"} +{"current_steps": 9880, "total_steps": 10798, "loss": 1.8911, "reward": null, "learning_rate": 1.7881714823021976e-05, "epoch": 1.83, "percentage": 91.5, "elapsed_time": "6:41:15", "remaining_time": "0:37:16"} +{"current_steps": 9890, "total_steps": 10798, "loss": 1.9169, "reward": null, "learning_rate": 1.7498194926194978e-05, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "6:47:40", "remaining_time": "0:37:25"} +{"current_steps": 9890, "total_steps": 10798, "loss": 1.9169, "reward": null, "learning_rate": 1.7498194926194978e-05, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "6:41:35", "remaining_time": "0:36:52"} +{"current_steps": 9890, "total_steps": 10798, "loss": 1.9169, "reward": null, "learning_rate": 1.7498194926194978e-05, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "6:41:38", "remaining_time": "0:36:52"} +{"current_steps": 9890, "total_steps": 10798, "loss": 1.9169, "reward": null, "learning_rate": 1.7498194926194978e-05, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "6:41:37", "remaining_time": "0:36:52"} +{"current_steps": 9900, "total_steps": 10798, "loss": 1.8699, "reward": null, "learning_rate": 1.7118759273889615e-05, "epoch": 1.83, "percentage": 91.68, "elapsed_time": "6:48:04", "remaining_time": "0:37:00"} +{"current_steps": 9900, "total_steps": 10798, "loss": 1.8699, "reward": null, "learning_rate": 1.7118759273889615e-05, "epoch": 1.83, "percentage": 91.68, "elapsed_time": "6:42:02", "remaining_time": "0:36:28"} +{"current_steps": 9900, "total_steps": 10798, "loss": 1.8699, "reward": null, "learning_rate": 1.7118759273889615e-05, "epoch": 1.83, "percentage": 91.68, "elapsed_time": "6:42:01", "remaining_time": "0:36:27"} +{"current_steps": 9900, "total_steps": 10798, "loss": 1.8699, "reward": null, "learning_rate": 1.7118759273889615e-05, "epoch": 1.83, "percentage": 91.68, "elapsed_time": "6:41:59", "remaining_time": "0:36:27"} +{"current_steps": 9910, "total_steps": 10798, "loss": 1.9187, "reward": null, "learning_rate": 1.674341107792382e-05, "epoch": 1.84, "percentage": 91.78, "elapsed_time": "6:48:29", "remaining_time": "0:36:36"} +{"current_steps": 9910, "total_steps": 10798, "loss": 1.9187, "reward": null, "learning_rate": 1.674341107792382e-05, "epoch": 1.84, "percentage": 91.78, "elapsed_time": "6:42:24", "remaining_time": "0:36:03"} +{"current_steps": 9910, "total_steps": 10798, "loss": 1.9187, "reward": null, "learning_rate": 1.674341107792382e-05, "epoch": 1.84, "percentage": 91.78, "elapsed_time": "6:42:26", "remaining_time": "0:36:03"} +{"current_steps": 9910, "total_steps": 10798, "loss": 1.9187, "reward": null, "learning_rate": 1.674341107792382e-05, "epoch": 1.84, "percentage": 91.78, "elapsed_time": "6:42:27", "remaining_time": "0:36:03"} +{"current_steps": 9920, "total_steps": 10798, "loss": 1.8754, "reward": null, "learning_rate": 1.6372153515516463e-05, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "6:42:51", "remaining_time": "0:35:39"} +{"current_steps": 9920, "total_steps": 10798, "loss": 1.8754, "reward": null, "learning_rate": 1.6372153515516463e-05, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "6:42:53", "remaining_time": "0:35:39"} +{"current_steps": 9920, "total_steps": 10798, "loss": 1.8754, "reward": null, "learning_rate": 1.6372153515516463e-05, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "6:48:54", "remaining_time": "0:36:11"} +{"current_steps": 9920, "total_steps": 10798, "loss": 1.8754, "reward": null, "learning_rate": 1.6372153515516463e-05, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "6:42:50", "remaining_time": "0:35:39"} +{"current_steps": 9930, "total_steps": 10798, "loss": 1.9913, "reward": null, "learning_rate": 1.600498972926029e-05, "epoch": 1.84, "percentage": 91.96, "elapsed_time": "6:43:16", "remaining_time": "0:35:15"} +{"current_steps": 9930, "total_steps": 10798, "loss": 1.9913, "reward": null, "learning_rate": 1.600498972926029e-05, "epoch": 1.84, "percentage": 91.96, "elapsed_time": "6:49:21", "remaining_time": "0:35:46"} +{"current_steps": 9930, "total_steps": 10798, "loss": 1.9913, "reward": null, "learning_rate": 1.600498972926029e-05, "epoch": 1.84, "percentage": 91.96, "elapsed_time": "6:43:17", "remaining_time": "0:35:15"} +{"current_steps": 9930, "total_steps": 10798, "loss": 1.9913, "reward": null, "learning_rate": 1.600498972926029e-05, "epoch": 1.84, "percentage": 91.96, "elapsed_time": "6:43:19", "remaining_time": "0:35:15"} +{"current_steps": 9940, "total_steps": 10798, "loss": 1.9162, "reward": null, "learning_rate": 1.5641922827095256e-05, "epoch": 1.84, "percentage": 92.05, "elapsed_time": "6:49:45", "remaining_time": "0:35:22"} +{"current_steps": 9940, "total_steps": 10798, "loss": 1.9162, "reward": null, "learning_rate": 1.5641922827095256e-05, "epoch": 1.84, "percentage": 92.05, "elapsed_time": "6:43:42", "remaining_time": "0:34:50"} +{"current_steps": 9940, "total_steps": 10798, "loss": 1.9162, "reward": null, "learning_rate": 1.5641922827095256e-05, "epoch": 1.84, "percentage": 92.05, "elapsed_time": "6:43:40", "remaining_time": "0:34:50"} +{"current_steps": 9940, "total_steps": 10798, "loss": 1.9162, "reward": null, "learning_rate": 1.5641922827095256e-05, "epoch": 1.84, "percentage": 92.05, "elapsed_time": "6:43:44", "remaining_time": "0:34:50"} +{"current_steps": 9950, "total_steps": 10798, "loss": 1.9475, "reward": null, "learning_rate": 1.528295588228251e-05, "epoch": 1.84, "percentage": 92.15, "elapsed_time": "6:50:11", "remaining_time": "0:34:57"} +{"current_steps": 9950, "total_steps": 10798, "loss": 1.9475, "reward": null, "learning_rate": 1.528295588228251e-05, "epoch": 1.84, "percentage": 92.15, "elapsed_time": "6:44:09", "remaining_time": "0:34:26"} +{"current_steps": 9950, "total_steps": 10798, "loss": 1.9475, "reward": null, "learning_rate": 1.528295588228251e-05, "epoch": 1.84, "percentage": 92.15, "elapsed_time": "6:44:06", "remaining_time": "0:34:26"} +{"current_steps": 9950, "total_steps": 10798, "loss": 1.9475, "reward": null, "learning_rate": 1.528295588228251e-05, "epoch": 1.84, "percentage": 92.15, "elapsed_time": "6:44:08", "remaining_time": "0:34:26"} +{"current_steps": 9960, "total_steps": 10798, "loss": 1.8907, "reward": null, "learning_rate": 1.4928091933378018e-05, "epoch": 1.84, "percentage": 92.24, "elapsed_time": "6:50:36", "remaining_time": "0:34:32"} +{"current_steps": 9960, "total_steps": 10798, "loss": 1.8907, "reward": null, "learning_rate": 1.4928091933378018e-05, "epoch": 1.84, "percentage": 92.24, "elapsed_time": "6:44:31", "remaining_time": "0:34:02"} +{"current_steps": 9960, "total_steps": 10798, "loss": 1.8907, "reward": null, "learning_rate": 1.4928091933378018e-05, "epoch": 1.84, "percentage": 92.24, "elapsed_time": "6:44:34", "remaining_time": "0:34:02"} +{"current_steps": 9960, "total_steps": 10798, "loss": 1.8907, "reward": null, "learning_rate": 1.4928091933378018e-05, "epoch": 1.84, "percentage": 92.24, "elapsed_time": "6:44:33", "remaining_time": "0:34:02"} +{"current_steps": 9970, "total_steps": 10798, "loss": 1.9031, "reward": null, "learning_rate": 1.4577333984207186e-05, "epoch": 1.85, "percentage": 92.33, "elapsed_time": "6:44:57", "remaining_time": "0:33:37"} +{"current_steps": 9970, "total_steps": 10798, "loss": 1.9031, "reward": null, "learning_rate": 1.4577333984207186e-05, "epoch": 1.85, "percentage": 92.33, "elapsed_time": "6:44:56", "remaining_time": "0:33:37"} +{"current_steps": 9970, "total_steps": 10798, "loss": 1.9031, "reward": null, "learning_rate": 1.4577333984207186e-05, "epoch": 1.85, "percentage": 92.33, "elapsed_time": "6:44:59", "remaining_time": "0:33:38"} +{"current_steps": 9970, "total_steps": 10798, "loss": 1.9031, "reward": null, "learning_rate": 1.4577333984207186e-05, "epoch": 1.85, "percentage": 92.33, "elapsed_time": "6:51:00", "remaining_time": "0:34:08"} +{"current_steps": 9980, "total_steps": 10798, "loss": 1.8969, "reward": null, "learning_rate": 1.4230685003839117e-05, "epoch": 1.85, "percentage": 92.42, "elapsed_time": "6:51:24", "remaining_time": "0:33:43"} +{"current_steps": 9980, "total_steps": 10798, "loss": 1.8969, "reward": null, "learning_rate": 1.4230685003839117e-05, "epoch": 1.85, "percentage": 92.42, "elapsed_time": "6:45:21", "remaining_time": "0:33:13"} +{"current_steps": 9980, "total_steps": 10798, "loss": 1.8969, "reward": null, "learning_rate": 1.4230685003839117e-05, "epoch": 1.85, "percentage": 92.42, "elapsed_time": "6:45:22", "remaining_time": "0:33:13"} +{"current_steps": 9980, "total_steps": 10798, "loss": 1.8969, "reward": null, "learning_rate": 1.4230685003839117e-05, "epoch": 1.85, "percentage": 92.42, "elapsed_time": "6:45:19", "remaining_time": "0:33:13"} +{"current_steps": 9990, "total_steps": 10798, "loss": 1.9272, "reward": null, "learning_rate": 1.3888147926561733e-05, "epoch": 1.85, "percentage": 92.52, "elapsed_time": "6:51:49", "remaining_time": "0:33:18"} +{"current_steps": 9990, "total_steps": 10798, "loss": 1.9272, "reward": null, "learning_rate": 1.3888147926561733e-05, "epoch": 1.85, "percentage": 92.52, "elapsed_time": "6:45:47", "remaining_time": "0:32:49"} +{"current_steps": 9990, "total_steps": 10798, "loss": 1.9272, "reward": null, "learning_rate": 1.3888147926561733e-05, "epoch": 1.85, "percentage": 92.52, "elapsed_time": "6:45:46", "remaining_time": "0:32:49"} +{"current_steps": 9990, "total_steps": 10798, "loss": 1.9272, "reward": null, "learning_rate": 1.3888147926561733e-05, "epoch": 1.85, "percentage": 92.52, "elapsed_time": "6:45:44", "remaining_time": "0:32:49"} +{"current_steps": 10000, "total_steps": 10798, "loss": 1.9313, "reward": null, "learning_rate": 1.3549725651856804e-05, "epoch": 1.85, "percentage": 92.61, "elapsed_time": "6:52:13", "remaining_time": "0:32:53"} +{"current_steps": 10000, "total_steps": 10798, "loss": 1.9313, "reward": null, "learning_rate": 1.3549725651856804e-05, "epoch": 1.85, "percentage": 92.61, "elapsed_time": "6:46:11", "remaining_time": "0:32:24"} +{"current_steps": 10000, "total_steps": 10798, "loss": 1.9313, "reward": null, "learning_rate": 1.3549725651856804e-05, "epoch": 1.85, "percentage": 92.61, "elapsed_time": "6:46:10", "remaining_time": "0:32:24"} +{"current_steps": 10000, "total_steps": 10798, "loss": 1.9313, "reward": null, "learning_rate": 1.3549725651856804e-05, "epoch": 1.85, "percentage": 92.61, "elapsed_time": "6:46:08", "remaining_time": "0:32:24"} +{"current_steps": 10010, "total_steps": 10798, "loss": 1.8596, "reward": null, "learning_rate": 1.3215421044375287e-05, "epoch": 1.85, "percentage": 92.7, "elapsed_time": "6:46:36", "remaining_time": "0:32:00"} +{"current_steps": 10010, "total_steps": 10798, "loss": 1.8596, "reward": null, "learning_rate": 1.3215421044375287e-05, "epoch": 1.85, "percentage": 92.7, "elapsed_time": "6:46:33", "remaining_time": "0:32:00"} +{"current_steps": 10010, "total_steps": 10798, "loss": 1.8596, "reward": null, "learning_rate": 1.3215421044375287e-05, "epoch": 1.85, "percentage": 92.7, "elapsed_time": "6:46:35", "remaining_time": "0:32:00"} +{"current_steps": 10010, "total_steps": 10798, "loss": 1.8596, "reward": null, "learning_rate": 1.3215421044375287e-05, "epoch": 1.85, "percentage": 92.7, "elapsed_time": "6:52:38", "remaining_time": "0:32:29"} +{"current_steps": 10020, "total_steps": 10798, "loss": 1.9298, "reward": null, "learning_rate": 1.288523693391358e-05, "epoch": 1.86, "percentage": 92.79, "elapsed_time": "6:46:58", "remaining_time": "0:31:35"} +{"current_steps": 10020, "total_steps": 10798, "loss": 1.9298, "reward": null, "learning_rate": 1.288523693391358e-05, "epoch": 1.86, "percentage": 92.79, "elapsed_time": "6:47:00", "remaining_time": "0:31:36"} +{"current_steps": 10020, "total_steps": 10798, "loss": 1.9298, "reward": null, "learning_rate": 1.288523693391358e-05, "epoch": 1.86, "percentage": 92.79, "elapsed_time": "6:47:02", "remaining_time": "0:31:36"} +{"current_steps": 10020, "total_steps": 10798, "loss": 1.9298, "reward": null, "learning_rate": 1.288523693391358e-05, "epoch": 1.86, "percentage": 92.79, "elapsed_time": "6:53:03", "remaining_time": "0:32:04"} +{"current_steps": 10030, "total_steps": 10798, "loss": 1.9298, "reward": null, "learning_rate": 1.255917611538876e-05, "epoch": 1.86, "percentage": 92.89, "elapsed_time": "6:53:28", "remaining_time": "0:31:39"} +{"current_steps": 10030, "total_steps": 10798, "loss": 1.9298, "reward": null, "learning_rate": 1.255917611538876e-05, "epoch": 1.86, "percentage": 92.89, "elapsed_time": "6:47:24", "remaining_time": "0:31:11"} +{"current_steps": 10030, "total_steps": 10798, "loss": 1.9298, "reward": null, "learning_rate": 1.255917611538876e-05, "epoch": 1.86, "percentage": 92.89, "elapsed_time": "6:47:23", "remaining_time": "0:31:11"} +{"current_steps": 10030, "total_steps": 10798, "loss": 1.9298, "reward": null, "learning_rate": 1.255917611538876e-05, "epoch": 1.86, "percentage": 92.89, "elapsed_time": "6:47:26", "remaining_time": "0:31:11"} +{"current_steps": 10040, "total_steps": 10798, "loss": 1.9296, "reward": null, "learning_rate": 1.2237241348815765e-05, "epoch": 1.86, "percentage": 92.98, "elapsed_time": "6:47:47", "remaining_time": "0:30:47"} +{"current_steps": 10040, "total_steps": 10798, "loss": 1.9296, "reward": null, "learning_rate": 1.2237241348815765e-05, "epoch": 1.86, "percentage": 92.98, "elapsed_time": "6:47:49", "remaining_time": "0:30:47"} +{"current_steps": 10040, "total_steps": 10798, "loss": 1.9296, "reward": null, "learning_rate": 1.2237241348815765e-05, "epoch": 1.86, "percentage": 92.98, "elapsed_time": "6:47:51", "remaining_time": "0:30:47"} +{"current_steps": 10040, "total_steps": 10798, "loss": 1.9296, "reward": null, "learning_rate": 1.2237241348815765e-05, "epoch": 1.86, "percentage": 92.98, "elapsed_time": "6:53:52", "remaining_time": "0:31:14"} +{"current_steps": 10050, "total_steps": 10798, "loss": 1.876, "reward": null, "learning_rate": 1.1919435359283414e-05, "epoch": 1.86, "percentage": 93.07, "elapsed_time": "6:48:17", "remaining_time": "0:30:23"} +{"current_steps": 10050, "total_steps": 10798, "loss": 1.876, "reward": null, "learning_rate": 1.1919435359283414e-05, "epoch": 1.86, "percentage": 93.07, "elapsed_time": "6:48:13", "remaining_time": "0:30:23"} +{"current_steps": 10050, "total_steps": 10798, "loss": 1.876, "reward": null, "learning_rate": 1.1919435359283414e-05, "epoch": 1.86, "percentage": 93.07, "elapsed_time": "6:54:18", "remaining_time": "0:30:50"} +{"current_steps": 10050, "total_steps": 10798, "loss": 1.876, "reward": null, "learning_rate": 1.1919435359283414e-05, "epoch": 1.86, "percentage": 93.07, "elapsed_time": "6:48:15", "remaining_time": "0:30:23"} +{"current_steps": 10060, "total_steps": 10798, "loss": 1.9207, "reward": null, "learning_rate": 1.16057608369316e-05, "epoch": 1.86, "percentage": 93.17, "elapsed_time": "6:54:44", "remaining_time": "0:30:25"} +{"current_steps": 10060, "total_steps": 10798, "loss": 1.9207, "reward": null, "learning_rate": 1.16057608369316e-05, "epoch": 1.86, "percentage": 93.17, "elapsed_time": "6:48:42", "remaining_time": "0:29:58"} +{"current_steps": 10060, "total_steps": 10798, "loss": 1.9207, "reward": null, "learning_rate": 1.16057608369316e-05, "epoch": 1.86, "percentage": 93.17, "elapsed_time": "6:48:40", "remaining_time": "0:29:58"} +{"current_steps": 10060, "total_steps": 10798, "loss": 1.9207, "reward": null, "learning_rate": 1.16057608369316e-05, "epoch": 1.86, "percentage": 93.17, "elapsed_time": "6:48:39", "remaining_time": "0:29:58"} +{"current_steps": 10070, "total_steps": 10798, "loss": 1.9311, "reward": null, "learning_rate": 1.1296220436928629e-05, "epoch": 1.87, "percentage": 93.26, "elapsed_time": "6:55:09", "remaining_time": "0:30:00"} +{"current_steps": 10070, "total_steps": 10798, "loss": 1.9311, "reward": null, "learning_rate": 1.1296220436928629e-05, "epoch": 1.87, "percentage": 93.26, "elapsed_time": "6:49:04", "remaining_time": "0:29:34"} +{"current_steps": 10070, "total_steps": 10798, "loss": 1.9311, "reward": null, "learning_rate": 1.1296220436928629e-05, "epoch": 1.87, "percentage": 93.26, "elapsed_time": "6:49:06", "remaining_time": "0:29:34"} +{"current_steps": 10070, "total_steps": 10798, "loss": 1.9311, "reward": null, "learning_rate": 1.1296220436928629e-05, "epoch": 1.87, "percentage": 93.26, "elapsed_time": "6:49:08", "remaining_time": "0:29:34"} +{"current_steps": 10080, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 1.0990816779448353e-05, "epoch": 1.87, "percentage": 93.35, "elapsed_time": "6:49:33", "remaining_time": "0:29:10"} +{"current_steps": 10080, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 1.0990816779448353e-05, "epoch": 1.87, "percentage": 93.35, "elapsed_time": "6:55:34", "remaining_time": "0:29:36"} +{"current_steps": 10080, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 1.0990816779448353e-05, "epoch": 1.87, "percentage": 93.35, "elapsed_time": "6:49:29", "remaining_time": "0:29:10"} +{"current_steps": 10080, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 1.0990816779448353e-05, "epoch": 1.87, "percentage": 93.35, "elapsed_time": "6:49:31", "remaining_time": "0:29:10"} +{"current_steps": 10090, "total_steps": 10798, "loss": 1.9191, "reward": null, "learning_rate": 1.0689552449648587e-05, "epoch": 1.87, "percentage": 93.44, "elapsed_time": "6:56:00", "remaining_time": "0:29:11"} +{"current_steps": 10090, "total_steps": 10798, "loss": 1.9191, "reward": null, "learning_rate": 1.0689552449648587e-05, "epoch": 1.87, "percentage": 93.44, "elapsed_time": "6:49:57", "remaining_time": "0:28:45"} +{"current_steps": 10090, "total_steps": 10798, "loss": 1.9191, "reward": null, "learning_rate": 1.0689552449648587e-05, "epoch": 1.87, "percentage": 93.44, "elapsed_time": "6:49:59", "remaining_time": "0:28:46"} +{"current_steps": 10090, "total_steps": 10798, "loss": 1.9191, "reward": null, "learning_rate": 1.0689552449648587e-05, "epoch": 1.87, "percentage": 93.44, "elapsed_time": "6:49:55", "remaining_time": "0:28:45"} +{"current_steps": 10100, "total_steps": 10798, "loss": 1.915, "reward": null, "learning_rate": 1.03924299976485e-05, "epoch": 1.87, "percentage": 93.54, "elapsed_time": "6:50:24", "remaining_time": "0:28:21"} +{"current_steps": 10100, "total_steps": 10798, "loss": 1.915, "reward": null, "learning_rate": 1.03924299976485e-05, "epoch": 1.87, "percentage": 93.54, "elapsed_time": "6:50:20", "remaining_time": "0:28:21"} +{"current_steps": 10100, "total_steps": 10798, "loss": 1.915, "reward": null, "learning_rate": 1.03924299976485e-05, "epoch": 1.87, "percentage": 93.54, "elapsed_time": "6:50:22", "remaining_time": "0:28:21"} +{"current_steps": 10100, "total_steps": 10798, "loss": 1.915, "reward": null, "learning_rate": 1.03924299976485e-05, "epoch": 1.87, "percentage": 93.54, "elapsed_time": "6:56:25", "remaining_time": "0:28:46"} +{"current_steps": 10110, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 1.0099451938507642e-05, "epoch": 1.87, "percentage": 93.63, "elapsed_time": "6:56:49", "remaining_time": "0:28:21"} +{"current_steps": 10110, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 1.0099451938507642e-05, "epoch": 1.87, "percentage": 93.63, "elapsed_time": "6:50:44", "remaining_time": "0:27:57"} +{"current_steps": 10110, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 1.0099451938507642e-05, "epoch": 1.87, "percentage": 93.63, "elapsed_time": "6:50:46", "remaining_time": "0:27:57"} +{"current_steps": 10110, "total_steps": 10798, "loss": 1.9141, "reward": null, "learning_rate": 1.0099451938507642e-05, "epoch": 1.87, "percentage": 93.63, "elapsed_time": "6:50:47", "remaining_time": "0:27:57"} +{"current_steps": 10120, "total_steps": 10798, "loss": 1.9291, "reward": null, "learning_rate": 9.810620752204346e-06, "epoch": 1.87, "percentage": 93.72, "elapsed_time": "6:57:14", "remaining_time": "0:27:57"} +{"current_steps": 10120, "total_steps": 10798, "loss": 1.9291, "reward": null, "learning_rate": 9.810620752204346e-06, "epoch": 1.87, "percentage": 93.72, "elapsed_time": "6:51:09", "remaining_time": "0:27:32"} +{"current_steps": 10120, "total_steps": 10798, "loss": 1.9291, "reward": null, "learning_rate": 9.810620752204346e-06, "epoch": 1.87, "percentage": 93.72, "elapsed_time": "6:51:12", "remaining_time": "0:27:32"} +{"current_steps": 10120, "total_steps": 10798, "loss": 1.9291, "reward": null, "learning_rate": 9.810620752204346e-06, "epoch": 1.87, "percentage": 93.72, "elapsed_time": "6:51:10", "remaining_time": "0:27:32"} +{"current_steps": 10130, "total_steps": 10798, "loss": 1.9239, "reward": null, "learning_rate": 9.525938883614915e-06, "epoch": 1.88, "percentage": 93.81, "elapsed_time": "6:57:38", "remaining_time": "0:27:32"} +{"current_steps": 10130, "total_steps": 10798, "loss": 1.9239, "reward": null, "learning_rate": 9.525938883614915e-06, "epoch": 1.88, "percentage": 93.81, "elapsed_time": "6:51:33", "remaining_time": "0:27:08"} +{"current_steps": 10130, "total_steps": 10798, "loss": 1.9239, "reward": null, "learning_rate": 9.525938883614915e-06, "epoch": 1.88, "percentage": 93.81, "elapsed_time": "6:51:37", "remaining_time": "0:27:08"} +{"current_steps": 10130, "total_steps": 10798, "loss": 1.9239, "reward": null, "learning_rate": 9.525938883614915e-06, "epoch": 1.88, "percentage": 93.81, "elapsed_time": "6:51:35", "remaining_time": "0:27:08"} +{"current_steps": 10140, "total_steps": 10798, "loss": 1.9016, "reward": null, "learning_rate": 9.24540874249269e-06, "epoch": 1.88, "percentage": 93.91, "elapsed_time": "6:58:02", "remaining_time": "0:27:07"} +{"current_steps": 10140, "total_steps": 10798, "loss": 1.9016, "reward": null, "learning_rate": 9.24540874249269e-06, "epoch": 1.88, "percentage": 93.91, "elapsed_time": "6:52:01", "remaining_time": "0:26:44"} +{"current_steps": 10140, "total_steps": 10798, "loss": 1.9016, "reward": null, "learning_rate": 9.24540874249269e-06, "epoch": 1.88, "percentage": 93.91, "elapsed_time": "6:51:57", "remaining_time": "0:26:43"} +{"current_steps": 10140, "total_steps": 10798, "loss": 1.9016, "reward": null, "learning_rate": 9.24540874249269e-06, "epoch": 1.88, "percentage": 93.91, "elapsed_time": "6:51:59", "remaining_time": "0:26:44"} +{"current_steps": 10150, "total_steps": 10798, "loss": 1.9208, "reward": null, "learning_rate": 8.969032703447843e-06, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "6:58:26", "remaining_time": "0:26:42"} +{"current_steps": 10150, "total_steps": 10798, "loss": 1.9208, "reward": null, "learning_rate": 8.969032703447843e-06, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "6:52:23", "remaining_time": "0:26:19"} +{"current_steps": 10150, "total_steps": 10798, "loss": 1.9208, "reward": null, "learning_rate": 8.969032703447843e-06, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "6:52:25", "remaining_time": "0:26:19"} +{"current_steps": 10150, "total_steps": 10798, "loss": 1.9208, "reward": null, "learning_rate": 8.969032703447843e-06, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "6:52:22", "remaining_time": "0:26:19"} +{"current_steps": 10160, "total_steps": 10798, "loss": 1.9126, "reward": null, "learning_rate": 8.69681310592718e-06, "epoch": 1.88, "percentage": 94.09, "elapsed_time": "6:58:51", "remaining_time": "0:26:18"} +{"current_steps": 10160, "total_steps": 10798, "loss": 1.9126, "reward": null, "learning_rate": 8.69681310592718e-06, "epoch": 1.88, "percentage": 94.09, "elapsed_time": "6:52:46", "remaining_time": "0:25:55"} +{"current_steps": 10160, "total_steps": 10798, "loss": 1.9126, "reward": null, "learning_rate": 8.69681310592718e-06, "epoch": 1.88, "percentage": 94.09, "elapsed_time": "6:52:48", "remaining_time": "0:25:55"} +{"current_steps": 10160, "total_steps": 10798, "loss": 1.9126, "reward": null, "learning_rate": 8.69681310592718e-06, "epoch": 1.88, "percentage": 94.09, "elapsed_time": "6:52:50", "remaining_time": "0:25:55"} +{"current_steps": 10170, "total_steps": 10798, "loss": 1.9194, "reward": null, "learning_rate": 8.428752254194427e-06, "epoch": 1.88, "percentage": 94.18, "elapsed_time": "6:53:11", "remaining_time": "0:25:30"} +{"current_steps": 10170, "total_steps": 10798, "loss": 1.9194, "reward": null, "learning_rate": 8.428752254194427e-06, "epoch": 1.88, "percentage": 94.18, "elapsed_time": "6:53:15", "remaining_time": "0:25:31"} +{"current_steps": 10170, "total_steps": 10798, "loss": 1.9194, "reward": null, "learning_rate": 8.428752254194427e-06, "epoch": 1.88, "percentage": 94.18, "elapsed_time": "6:53:13", "remaining_time": "0:25:30"} +{"current_steps": 10170, "total_steps": 10798, "loss": 1.9194, "reward": null, "learning_rate": 8.428752254194427e-06, "epoch": 1.88, "percentage": 94.18, "elapsed_time": "6:59:16", "remaining_time": "0:25:53"} +{"current_steps": 10180, "total_steps": 10798, "loss": 1.9257, "reward": null, "learning_rate": 8.164852417310742e-06, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "6:59:43", "remaining_time": "0:25:28"} +{"current_steps": 10180, "total_steps": 10798, "loss": 1.9257, "reward": null, "learning_rate": 8.164852417310742e-06, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "6:53:41", "remaining_time": "0:25:06"} +{"current_steps": 10180, "total_steps": 10798, "loss": 1.9257, "reward": null, "learning_rate": 8.164852417310742e-06, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "6:53:39", "remaining_time": "0:25:06"} +{"current_steps": 10180, "total_steps": 10798, "loss": 1.9257, "reward": null, "learning_rate": 8.164852417310742e-06, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "6:53:38", "remaining_time": "0:25:06"} +{"current_steps": 10190, "total_steps": 10798, "loss": 1.8922, "reward": null, "learning_rate": 7.905115829115238e-06, "epoch": 1.89, "percentage": 94.37, "elapsed_time": "7:00:07", "remaining_time": "0:25:04"} +{"current_steps": 10190, "total_steps": 10798, "loss": 1.8922, "reward": null, "learning_rate": 7.905115829115238e-06, "epoch": 1.89, "percentage": 94.37, "elapsed_time": "6:54:04", "remaining_time": "0:24:42"} +{"current_steps": 10190, "total_steps": 10798, "loss": 1.8922, "reward": null, "learning_rate": 7.905115829115238e-06, "epoch": 1.89, "percentage": 94.37, "elapsed_time": "6:54:06", "remaining_time": "0:24:42"} +{"current_steps": 10190, "total_steps": 10798, "loss": 1.8922, "reward": null, "learning_rate": 7.905115829115238e-06, "epoch": 1.89, "percentage": 94.37, "elapsed_time": "6:54:02", "remaining_time": "0:24:42"} +{"current_steps": 10200, "total_steps": 10798, "loss": 1.8865, "reward": null, "learning_rate": 7.6495446882065e-06, "epoch": 1.89, "percentage": 94.46, "elapsed_time": "7:00:33", "remaining_time": "0:24:39"} +{"current_steps": 10200, "total_steps": 10798, "loss": 1.8865, "reward": null, "learning_rate": 7.6495446882065e-06, "epoch": 1.89, "percentage": 94.46, "elapsed_time": "6:54:30", "remaining_time": "0:24:18"} +{"current_steps": 10200, "total_steps": 10798, "loss": 1.8865, "reward": null, "learning_rate": 7.6495446882065e-06, "epoch": 1.89, "percentage": 94.46, "elapsed_time": "6:54:32", "remaining_time": "0:24:18"} +{"current_steps": 10200, "total_steps": 10798, "loss": 1.8865, "reward": null, "learning_rate": 7.6495446882065e-06, "epoch": 1.89, "percentage": 94.46, "elapsed_time": "6:54:28", "remaining_time": "0:24:17"} +{"current_steps": 10210, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 7.398141157923588e-06, "epoch": 1.89, "percentage": 94.55, "elapsed_time": "7:00:56", "remaining_time": "0:24:14"} +{"current_steps": 10210, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 7.398141157923588e-06, "epoch": 1.89, "percentage": 94.55, "elapsed_time": "6:54:55", "remaining_time": "0:23:53"} +{"current_steps": 10210, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 7.398141157923588e-06, "epoch": 1.89, "percentage": 94.55, "elapsed_time": "6:54:51", "remaining_time": "0:23:53"} +{"current_steps": 10210, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 7.398141157923588e-06, "epoch": 1.89, "percentage": 94.55, "elapsed_time": "6:54:53", "remaining_time": "0:23:53"} +{"current_steps": 10220, "total_steps": 10798, "loss": 1.9036, "reward": null, "learning_rate": 7.150907366327952e-06, "epoch": 1.89, "percentage": 94.65, "elapsed_time": "7:01:21", "remaining_time": "0:23:49"} +{"current_steps": 10220, "total_steps": 10798, "loss": 1.9036, "reward": null, "learning_rate": 7.150907366327952e-06, "epoch": 1.89, "percentage": 94.65, "elapsed_time": "6:55:18", "remaining_time": "0:23:29"} +{"current_steps": 10220, "total_steps": 10798, "loss": 1.9036, "reward": null, "learning_rate": 7.150907366327952e-06, "epoch": 1.89, "percentage": 94.65, "elapsed_time": "6:55:17", "remaining_time": "0:23:29"} +{"current_steps": 10220, "total_steps": 10798, "loss": 1.9036, "reward": null, "learning_rate": 7.150907366327952e-06, "epoch": 1.89, "percentage": 94.65, "elapsed_time": "6:55:20", "remaining_time": "0:23:29"} +{"current_steps": 10230, "total_steps": 10798, "loss": 1.9347, "reward": null, "learning_rate": 6.907845406185387e-06, "epoch": 1.89, "percentage": 94.74, "elapsed_time": "7:01:46", "remaining_time": "0:23:25"} +{"current_steps": 10230, "total_steps": 10798, "loss": 1.9347, "reward": null, "learning_rate": 6.907845406185387e-06, "epoch": 1.89, "percentage": 94.74, "elapsed_time": "6:55:41", "remaining_time": "0:23:04"} +{"current_steps": 10230, "total_steps": 10798, "loss": 1.9347, "reward": null, "learning_rate": 6.907845406185387e-06, "epoch": 1.89, "percentage": 94.74, "elapsed_time": "6:55:45", "remaining_time": "0:23:05"} +{"current_steps": 10230, "total_steps": 10798, "loss": 1.9347, "reward": null, "learning_rate": 6.907845406185387e-06, "epoch": 1.89, "percentage": 94.74, "elapsed_time": "6:55:43", "remaining_time": "0:23:04"} +{"current_steps": 10240, "total_steps": 10798, "loss": 1.9144, "reward": null, "learning_rate": 6.6689573349482666e-06, "epoch": 1.9, "percentage": 94.83, "elapsed_time": "7:02:11", "remaining_time": "0:23:00"} +{"current_steps": 10240, "total_steps": 10798, "loss": 1.9144, "reward": null, "learning_rate": 6.6689573349482666e-06, "epoch": 1.9, "percentage": 94.83, "elapsed_time": "6:56:06", "remaining_time": "0:22:40"} +{"current_steps": 10240, "total_steps": 10798, "loss": 1.9144, "reward": null, "learning_rate": 6.6689573349482666e-06, "epoch": 1.9, "percentage": 94.83, "elapsed_time": "6:56:08", "remaining_time": "0:22:40"} +{"current_steps": 10240, "total_steps": 10798, "loss": 1.9144, "reward": null, "learning_rate": 6.6689573349482666e-06, "epoch": 1.9, "percentage": 94.83, "elapsed_time": "6:56:10", "remaining_time": "0:22:40"} +{"current_steps": 10250, "total_steps": 10798, "loss": 1.9082, "reward": null, "learning_rate": 6.434245174738063e-06, "epoch": 1.9, "percentage": 94.92, "elapsed_time": "6:56:32", "remaining_time": "0:22:16"} +{"current_steps": 10250, "total_steps": 10798, "loss": 1.9082, "reward": null, "learning_rate": 6.434245174738063e-06, "epoch": 1.9, "percentage": 94.92, "elapsed_time": "7:02:35", "remaining_time": "0:22:35"} +{"current_steps": 10250, "total_steps": 10798, "loss": 1.9082, "reward": null, "learning_rate": 6.434245174738063e-06, "epoch": 1.9, "percentage": 94.92, "elapsed_time": "6:56:31", "remaining_time": "0:22:16"} +{"current_steps": 10250, "total_steps": 10798, "loss": 1.9082, "reward": null, "learning_rate": 6.434245174738063e-06, "epoch": 1.9, "percentage": 94.92, "elapsed_time": "6:56:34", "remaining_time": "0:22:16"} +{"current_steps": 10260, "total_steps": 10798, "loss": 1.8831, "reward": null, "learning_rate": 6.203710912328464e-06, "epoch": 1.9, "percentage": 95.02, "elapsed_time": "6:56:58", "remaining_time": "0:21:51"} +{"current_steps": 10260, "total_steps": 10798, "loss": 1.8831, "reward": null, "learning_rate": 6.203710912328464e-06, "epoch": 1.9, "percentage": 95.02, "elapsed_time": "6:56:55", "remaining_time": "0:21:51"} +{"current_steps": 10260, "total_steps": 10798, "loss": 1.8831, "reward": null, "learning_rate": 6.203710912328464e-06, "epoch": 1.9, "percentage": 95.02, "elapsed_time": "7:03:00", "remaining_time": "0:22:10"} +{"current_steps": 10260, "total_steps": 10798, "loss": 1.8831, "reward": null, "learning_rate": 6.203710912328464e-06, "epoch": 1.9, "percentage": 95.02, "elapsed_time": "6:56:57", "remaining_time": "0:21:51"} +{"current_steps": 10270, "total_steps": 10798, "loss": 1.9163, "reward": null, "learning_rate": 5.9773564991283395e-06, "epoch": 1.9, "percentage": 95.11, "elapsed_time": "7:03:25", "remaining_time": "0:21:46"} +{"current_steps": 10270, "total_steps": 10798, "loss": 1.9163, "reward": null, "learning_rate": 5.9773564991283395e-06, "epoch": 1.9, "percentage": 95.11, "elapsed_time": "6:57:24", "remaining_time": "0:21:27"} +{"current_steps": 10270, "total_steps": 10798, "loss": 1.9163, "reward": null, "learning_rate": 5.9773564991283395e-06, "epoch": 1.9, "percentage": 95.11, "elapsed_time": "6:57:22", "remaining_time": "0:21:27"} +{"current_steps": 10270, "total_steps": 10798, "loss": 1.9163, "reward": null, "learning_rate": 5.9773564991283395e-06, "epoch": 1.9, "percentage": 95.11, "elapsed_time": "6:57:20", "remaining_time": "0:21:27"} +{"current_steps": 10280, "total_steps": 10798, "loss": 1.8726, "reward": null, "learning_rate": 5.755183851165246e-06, "epoch": 1.9, "percentage": 95.2, "elapsed_time": "7:03:50", "remaining_time": "0:21:21"} +{"current_steps": 10280, "total_steps": 10798, "loss": 1.8726, "reward": null, "learning_rate": 5.755183851165246e-06, "epoch": 1.9, "percentage": 95.2, "elapsed_time": "6:57:49", "remaining_time": "0:21:03"} +{"current_steps": 10280, "total_steps": 10798, "loss": 1.8726, "reward": null, "learning_rate": 5.755183851165246e-06, "epoch": 1.9, "percentage": 95.2, "elapsed_time": "6:57:47", "remaining_time": "0:21:03"} +{"current_steps": 10280, "total_steps": 10798, "loss": 1.8726, "reward": null, "learning_rate": 5.755183851165246e-06, "epoch": 1.9, "percentage": 95.2, "elapsed_time": "6:57:45", "remaining_time": "0:21:03"} +{"current_steps": 10290, "total_steps": 10798, "loss": 1.9452, "reward": null, "learning_rate": 5.537194849069283e-06, "epoch": 1.91, "percentage": 95.3, "elapsed_time": "6:58:10", "remaining_time": "0:20:38"} +{"current_steps": 10290, "total_steps": 10798, "loss": 1.9452, "reward": null, "learning_rate": 5.537194849069283e-06, "epoch": 1.91, "percentage": 95.3, "elapsed_time": "6:58:11", "remaining_time": "0:20:38"} +{"current_steps": 10290, "total_steps": 10798, "loss": 1.9452, "reward": null, "learning_rate": 5.537194849069283e-06, "epoch": 1.91, "percentage": 95.3, "elapsed_time": "6:58:13", "remaining_time": "0:20:38"} +{"current_steps": 10290, "total_steps": 10798, "loss": 1.9452, "reward": null, "learning_rate": 5.537194849069283e-06, "epoch": 1.91, "percentage": 95.3, "elapsed_time": "7:04:15", "remaining_time": "0:20:56"} +{"current_steps": 10300, "total_steps": 10798, "loss": 1.9356, "reward": null, "learning_rate": 5.323391338057204e-06, "epoch": 1.91, "percentage": 95.39, "elapsed_time": "7:04:40", "remaining_time": "0:20:31"} +{"current_steps": 10300, "total_steps": 10798, "loss": 1.9356, "reward": null, "learning_rate": 5.323391338057204e-06, "epoch": 1.91, "percentage": 95.39, "elapsed_time": "6:58:37", "remaining_time": "0:20:14"} +{"current_steps": 10300, "total_steps": 10798, "loss": 1.9356, "reward": null, "learning_rate": 5.323391338057204e-06, "epoch": 1.91, "percentage": 95.39, "elapsed_time": "6:58:39", "remaining_time": "0:20:14"} +{"current_steps": 10300, "total_steps": 10798, "loss": 1.9356, "reward": null, "learning_rate": 5.323391338057204e-06, "epoch": 1.91, "percentage": 95.39, "elapsed_time": "6:58:35", "remaining_time": "0:20:14"} +{"current_steps": 10310, "total_steps": 10798, "loss": 1.8665, "reward": null, "learning_rate": 5.113775127916553e-06, "epoch": 1.91, "percentage": 95.48, "elapsed_time": "7:05:04", "remaining_time": "0:20:07"} +{"current_steps": 10310, "total_steps": 10798, "loss": 1.8665, "reward": null, "learning_rate": 5.113775127916553e-06, "epoch": 1.91, "percentage": 95.48, "elapsed_time": "6:59:00", "remaining_time": "0:19:49"} +{"current_steps": 10310, "total_steps": 10798, "loss": 1.8665, "reward": null, "learning_rate": 5.113775127916553e-06, "epoch": 1.91, "percentage": 95.48, "elapsed_time": "6:59:01", "remaining_time": "0:19:50"} +{"current_steps": 10310, "total_steps": 10798, "loss": 1.8665, "reward": null, "learning_rate": 5.113775127916553e-06, "epoch": 1.91, "percentage": 95.48, "elapsed_time": "6:59:03", "remaining_time": "0:19:50"} +{"current_steps": 10320, "total_steps": 10798, "loss": 1.9132, "reward": null, "learning_rate": 4.908347992990836e-06, "epoch": 1.91, "percentage": 95.57, "elapsed_time": "7:05:30", "remaining_time": "0:19:42"} +{"current_steps": 10320, "total_steps": 10798, "loss": 1.9132, "reward": null, "learning_rate": 4.908347992990836e-06, "epoch": 1.91, "percentage": 95.57, "elapsed_time": "6:59:29", "remaining_time": "0:19:25"} +{"current_steps": 10320, "total_steps": 10798, "loss": 1.9132, "reward": null, "learning_rate": 4.908347992990836e-06, "epoch": 1.91, "percentage": 95.57, "elapsed_time": "6:59:25", "remaining_time": "0:19:25"} +{"current_steps": 10320, "total_steps": 10798, "loss": 1.9132, "reward": null, "learning_rate": 4.908347992990836e-06, "epoch": 1.91, "percentage": 95.57, "elapsed_time": "6:59:27", "remaining_time": "0:19:25"} +{"current_steps": 10330, "total_steps": 10798, "loss": 1.912, "reward": null, "learning_rate": 4.7071116721638104e-06, "epoch": 1.91, "percentage": 95.67, "elapsed_time": "7:05:55", "remaining_time": "0:19:17"} +{"current_steps": 10330, "total_steps": 10798, "loss": 1.912, "reward": null, "learning_rate": 4.7071116721638104e-06, "epoch": 1.91, "percentage": 95.67, "elapsed_time": "6:59:50", "remaining_time": "0:19:01"} +{"current_steps": 10330, "total_steps": 10798, "loss": 1.912, "reward": null, "learning_rate": 4.7071116721638104e-06, "epoch": 1.91, "percentage": 95.67, "elapsed_time": "6:59:52", "remaining_time": "0:19:01"} +{"current_steps": 10330, "total_steps": 10798, "loss": 1.912, "reward": null, "learning_rate": 4.7071116721638104e-06, "epoch": 1.91, "percentage": 95.67, "elapsed_time": "6:59:54", "remaining_time": "0:19:01"} +{"current_steps": 10340, "total_steps": 10798, "loss": 1.9069, "reward": null, "learning_rate": 4.5100678688455576e-06, "epoch": 1.92, "percentage": 95.76, "elapsed_time": "7:06:19", "remaining_time": "0:18:53"} +{"current_steps": 10340, "total_steps": 10798, "loss": 1.9069, "reward": null, "learning_rate": 4.5100678688455576e-06, "epoch": 1.92, "percentage": 95.76, "elapsed_time": "7:00:16", "remaining_time": "0:18:36"} +{"current_steps": 10340, "total_steps": 10798, "loss": 1.9069, "reward": null, "learning_rate": 4.5100678688455576e-06, "epoch": 1.92, "percentage": 95.76, "elapsed_time": "7:00:14", "remaining_time": "0:18:36"} +{"current_steps": 10340, "total_steps": 10798, "loss": 1.9069, "reward": null, "learning_rate": 4.5100678688455576e-06, "epoch": 1.92, "percentage": 95.76, "elapsed_time": "7:00:18", "remaining_time": "0:18:37"} +{"current_steps": 10350, "total_steps": 10798, "loss": 1.9197, "reward": null, "learning_rate": 4.317218250957322e-06, "epoch": 1.92, "percentage": 95.85, "elapsed_time": "7:06:43", "remaining_time": "0:18:28"} +{"current_steps": 10350, "total_steps": 10798, "loss": 1.9197, "reward": null, "learning_rate": 4.317218250957322e-06, "epoch": 1.92, "percentage": 95.85, "elapsed_time": "7:00:39", "remaining_time": "0:18:12"} +{"current_steps": 10350, "total_steps": 10798, "loss": 1.9197, "reward": null, "learning_rate": 4.317218250957322e-06, "epoch": 1.92, "percentage": 95.85, "elapsed_time": "7:00:40", "remaining_time": "0:18:12"} +{"current_steps": 10350, "total_steps": 10798, "loss": 1.9197, "reward": null, "learning_rate": 4.317218250957322e-06, "epoch": 1.92, "percentage": 95.85, "elapsed_time": "7:00:42", "remaining_time": "0:18:12"} +{"current_steps": 10360, "total_steps": 10798, "loss": 1.8681, "reward": null, "learning_rate": 4.12856445091786e-06, "epoch": 1.92, "percentage": 95.94, "elapsed_time": "7:01:04", "remaining_time": "0:17:48"} +{"current_steps": 10360, "total_steps": 10798, "loss": 1.8681, "reward": null, "learning_rate": 4.12856445091786e-06, "epoch": 1.92, "percentage": 95.94, "elapsed_time": "7:01:06", "remaining_time": "0:17:48"} +{"current_steps": 10360, "total_steps": 10798, "loss": 1.8681, "reward": null, "learning_rate": 4.12856445091786e-06, "epoch": 1.92, "percentage": 95.94, "elapsed_time": "7:01:07", "remaining_time": "0:17:48"} +{"current_steps": 10360, "total_steps": 10798, "loss": 1.8681, "reward": null, "learning_rate": 4.12856445091786e-06, "epoch": 1.92, "percentage": 95.94, "elapsed_time": "7:07:09", "remaining_time": "0:18:03"} +{"current_steps": 10370, "total_steps": 10798, "loss": 1.9463, "reward": null, "learning_rate": 3.944108065629559e-06, "epoch": 1.92, "percentage": 96.04, "elapsed_time": "7:07:34", "remaining_time": "0:17:38"} +{"current_steps": 10370, "total_steps": 10798, "loss": 1.9463, "reward": null, "learning_rate": 3.944108065629559e-06, "epoch": 1.92, "percentage": 96.04, "elapsed_time": "7:01:29", "remaining_time": "0:17:23"} +{"current_steps": 10370, "total_steps": 10798, "loss": 1.9463, "reward": null, "learning_rate": 3.944108065629559e-06, "epoch": 1.92, "percentage": 96.04, "elapsed_time": "7:01:31", "remaining_time": "0:17:23"} +{"current_steps": 10370, "total_steps": 10798, "loss": 1.9463, "reward": null, "learning_rate": 3.944108065629559e-06, "epoch": 1.92, "percentage": 96.04, "elapsed_time": "7:01:32", "remaining_time": "0:17:23"} +{"current_steps": 10380, "total_steps": 10798, "loss": 1.8796, "reward": null, "learning_rate": 3.763850656464729e-06, "epoch": 1.92, "percentage": 96.13, "elapsed_time": "7:07:57", "remaining_time": "0:17:14"} +{"current_steps": 10380, "total_steps": 10798, "loss": 1.8796, "reward": null, "learning_rate": 3.763850656464729e-06, "epoch": 1.92, "percentage": 96.13, "elapsed_time": "7:01:53", "remaining_time": "0:16:59"} +{"current_steps": 10380, "total_steps": 10798, "loss": 1.8796, "reward": null, "learning_rate": 3.763850656464729e-06, "epoch": 1.92, "percentage": 96.13, "elapsed_time": "7:01:54", "remaining_time": "0:16:59"} +{"current_steps": 10380, "total_steps": 10798, "loss": 1.8796, "reward": null, "learning_rate": 3.763850656464729e-06, "epoch": 1.92, "percentage": 96.13, "elapsed_time": "7:01:56", "remaining_time": "0:16:59"} +{"current_steps": 10390, "total_steps": 10798, "loss": 1.8699, "reward": null, "learning_rate": 3.58779374925261e-06, "epoch": 1.92, "percentage": 96.22, "elapsed_time": "7:08:21", "remaining_time": "0:16:49"} +{"current_steps": 10390, "total_steps": 10798, "loss": 1.8699, "reward": null, "learning_rate": 3.58779374925261e-06, "epoch": 1.92, "percentage": 96.22, "elapsed_time": "7:02:16", "remaining_time": "0:16:34"} +{"current_steps": 10390, "total_steps": 10798, "loss": 1.8699, "reward": null, "learning_rate": 3.58779374925261e-06, "epoch": 1.92, "percentage": 96.22, "elapsed_time": "7:02:20", "remaining_time": "0:16:35"} +{"current_steps": 10390, "total_steps": 10798, "loss": 1.8699, "reward": null, "learning_rate": 3.58779374925261e-06, "epoch": 1.92, "percentage": 96.22, "elapsed_time": "7:02:18", "remaining_time": "0:16:35"} +{"current_steps": 10400, "total_steps": 10798, "loss": 1.951, "reward": null, "learning_rate": 3.415938834266219e-06, "epoch": 1.93, "percentage": 96.31, "elapsed_time": "7:08:47", "remaining_time": "0:16:24"} +{"current_steps": 10400, "total_steps": 10798, "loss": 1.951, "reward": null, "learning_rate": 3.415938834266219e-06, "epoch": 1.93, "percentage": 96.31, "elapsed_time": "7:02:42", "remaining_time": "0:16:10"} +{"current_steps": 10400, "total_steps": 10798, "loss": 1.951, "reward": null, "learning_rate": 3.415938834266219e-06, "epoch": 1.93, "percentage": 96.31, "elapsed_time": "7:02:45", "remaining_time": "0:16:10"} +{"current_steps": 10400, "total_steps": 10798, "loss": 1.951, "reward": null, "learning_rate": 3.415938834266219e-06, "epoch": 1.93, "percentage": 96.31, "elapsed_time": "7:02:43", "remaining_time": "0:16:10"} +{"current_steps": 10410, "total_steps": 10798, "loss": 1.9231, "reward": null, "learning_rate": 3.248287366209912e-06, "epoch": 1.93, "percentage": 96.41, "elapsed_time": "7:09:11", "remaining_time": "0:15:59"} +{"current_steps": 10410, "total_steps": 10798, "loss": 1.9231, "reward": null, "learning_rate": 3.248287366209912e-06, "epoch": 1.93, "percentage": 96.41, "elapsed_time": "7:03:07", "remaining_time": "0:15:46"} +{"current_steps": 10410, "total_steps": 10798, "loss": 1.9231, "reward": null, "learning_rate": 3.248287366209912e-06, "epoch": 1.93, "percentage": 96.41, "elapsed_time": "7:03:10", "remaining_time": "0:15:46"} +{"current_steps": 10410, "total_steps": 10798, "loss": 1.9231, "reward": null, "learning_rate": 3.248287366209912e-06, "epoch": 1.93, "percentage": 96.41, "elapsed_time": "7:03:08", "remaining_time": "0:15:46"} +{"current_steps": 10420, "total_steps": 10798, "loss": 1.9204, "reward": null, "learning_rate": 3.0848407642072306e-06, "epoch": 1.93, "percentage": 96.5, "elapsed_time": "7:09:36", "remaining_time": "0:15:35"} +{"current_steps": 10420, "total_steps": 10798, "loss": 1.9204, "reward": null, "learning_rate": 3.0848407642072306e-06, "epoch": 1.93, "percentage": 96.5, "elapsed_time": "7:03:31", "remaining_time": "0:15:21"} +{"current_steps": 10420, "total_steps": 10798, "loss": 1.9204, "reward": null, "learning_rate": 3.0848407642072306e-06, "epoch": 1.93, "percentage": 96.5, "elapsed_time": "7:03:35", "remaining_time": "0:15:21"} +{"current_steps": 10420, "total_steps": 10798, "loss": 1.9204, "reward": null, "learning_rate": 3.0848407642072306e-06, "epoch": 1.93, "percentage": 96.5, "elapsed_time": "7:03:33", "remaining_time": "0:15:21"} +{"current_steps": 10430, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 2.9256004117883538e-06, "epoch": 1.93, "percentage": 96.59, "elapsed_time": "7:10:00", "remaining_time": "0:15:10"} +{"current_steps": 10430, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 2.9256004117883538e-06, "epoch": 1.93, "percentage": 96.59, "elapsed_time": "7:03:55", "remaining_time": "0:14:57"} +{"current_steps": 10430, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 2.9256004117883538e-06, "epoch": 1.93, "percentage": 96.59, "elapsed_time": "7:03:57", "remaining_time": "0:14:57"} +{"current_steps": 10430, "total_steps": 10798, "loss": 1.9499, "reward": null, "learning_rate": 2.9256004117883538e-06, "epoch": 1.93, "percentage": 96.59, "elapsed_time": "7:03:58", "remaining_time": "0:14:57"} +{"current_steps": 10440, "total_steps": 10798, "loss": 1.9403, "reward": null, "learning_rate": 2.770567656878997e-06, "epoch": 1.93, "percentage": 96.68, "elapsed_time": "7:10:26", "remaining_time": "0:14:45"} +{"current_steps": 10440, "total_steps": 10798, "loss": 1.9403, "reward": null, "learning_rate": 2.770567656878997e-06, "epoch": 1.93, "percentage": 96.68, "elapsed_time": "7:04:25", "remaining_time": "0:14:33"} +{"current_steps": 10440, "total_steps": 10798, "loss": 1.9403, "reward": null, "learning_rate": 2.770567656878997e-06, "epoch": 1.93, "percentage": 96.68, "elapsed_time": "7:04:23", "remaining_time": "0:14:33"} +{"current_steps": 10440, "total_steps": 10798, "loss": 1.9403, "reward": null, "learning_rate": 2.770567656878997e-06, "epoch": 1.93, "percentage": 96.68, "elapsed_time": "7:04:22", "remaining_time": "0:14:33"} +{"current_steps": 10450, "total_steps": 10798, "loss": 1.9381, "reward": null, "learning_rate": 2.6197438117885884e-06, "epoch": 1.94, "percentage": 96.78, "elapsed_time": "7:04:47", "remaining_time": "0:14:08"} +{"current_steps": 10450, "total_steps": 10798, "loss": 1.9381, "reward": null, "learning_rate": 2.6197438117885884e-06, "epoch": 1.94, "percentage": 96.78, "elapsed_time": "7:10:52", "remaining_time": "0:14:20"} +{"current_steps": 10450, "total_steps": 10798, "loss": 1.9381, "reward": null, "learning_rate": 2.6197438117885884e-06, "epoch": 1.94, "percentage": 96.78, "elapsed_time": "7:04:48", "remaining_time": "0:14:08"} +{"current_steps": 10450, "total_steps": 10798, "loss": 1.9381, "reward": null, "learning_rate": 2.6197438117885884e-06, "epoch": 1.94, "percentage": 96.78, "elapsed_time": "7:04:50", "remaining_time": "0:14:08"} +{"current_steps": 10460, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 2.4731301531992214e-06, "epoch": 1.94, "percentage": 96.87, "elapsed_time": "7:11:16", "remaining_time": "0:13:56"} +{"current_steps": 10460, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 2.4731301531992214e-06, "epoch": 1.94, "percentage": 96.87, "elapsed_time": "7:05:15", "remaining_time": "0:13:44"} +{"current_steps": 10460, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 2.4731301531992214e-06, "epoch": 1.94, "percentage": 96.87, "elapsed_time": "7:05:13", "remaining_time": "0:13:44"} +{"current_steps": 10460, "total_steps": 10798, "loss": 1.9282, "reward": null, "learning_rate": 2.4731301531992214e-06, "epoch": 1.94, "percentage": 96.87, "elapsed_time": "7:05:12", "remaining_time": "0:13:44"} +{"current_steps": 10470, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 2.3307279221551623e-06, "epoch": 1.94, "percentage": 96.96, "elapsed_time": "7:05:36", "remaining_time": "0:13:20"} +{"current_steps": 10470, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 2.3307279221551623e-06, "epoch": 1.94, "percentage": 96.96, "elapsed_time": "7:05:40", "remaining_time": "0:13:20"} +{"current_steps": 10470, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 2.3307279221551623e-06, "epoch": 1.94, "percentage": 96.96, "elapsed_time": "7:05:38", "remaining_time": "0:13:20"} +{"current_steps": 10470, "total_steps": 10798, "loss": 1.9598, "reward": null, "learning_rate": 2.3307279221551623e-06, "epoch": 1.94, "percentage": 96.96, "elapsed_time": "7:11:41", "remaining_time": "0:13:31"} +{"current_steps": 10480, "total_steps": 10798, "loss": 1.8994, "reward": null, "learning_rate": 2.192538324051918e-06, "epoch": 1.94, "percentage": 97.06, "elapsed_time": "7:06:04", "remaining_time": "0:12:55"} +{"current_steps": 10480, "total_steps": 10798, "loss": 1.8994, "reward": null, "learning_rate": 2.192538324051918e-06, "epoch": 1.94, "percentage": 97.06, "elapsed_time": "7:06:01", "remaining_time": "0:12:55"} +{"current_steps": 10480, "total_steps": 10798, "loss": 1.8994, "reward": null, "learning_rate": 2.192538324051918e-06, "epoch": 1.94, "percentage": 97.06, "elapsed_time": "7:06:02", "remaining_time": "0:12:55"} +{"current_steps": 10480, "total_steps": 10798, "loss": 1.8994, "reward": null, "learning_rate": 2.192538324051918e-06, "epoch": 1.94, "percentage": 97.06, "elapsed_time": "7:12:05", "remaining_time": "0:13:06"} +{"current_steps": 10490, "total_steps": 10798, "loss": 1.8849, "reward": null, "learning_rate": 2.05856252862624e-06, "epoch": 1.94, "percentage": 97.15, "elapsed_time": "7:06:24", "remaining_time": "0:12:31"} +{"current_steps": 10490, "total_steps": 10798, "loss": 1.8849, "reward": null, "learning_rate": 2.05856252862624e-06, "epoch": 1.94, "percentage": 97.15, "elapsed_time": "7:06:28", "remaining_time": "0:12:31"} +{"current_steps": 10490, "total_steps": 10798, "loss": 1.8849, "reward": null, "learning_rate": 2.05856252862624e-06, "epoch": 1.94, "percentage": 97.15, "elapsed_time": "7:06:26", "remaining_time": "0:12:31"} +{"current_steps": 10490, "total_steps": 10798, "loss": 1.8849, "reward": null, "learning_rate": 2.05856252862624e-06, "epoch": 1.94, "percentage": 97.15, "elapsed_time": "7:12:29", "remaining_time": "0:12:41"} +{"current_steps": 10500, "total_steps": 10798, "loss": 1.9451, "reward": null, "learning_rate": 1.9288016699463006e-06, "epoch": 1.94, "percentage": 97.24, "elapsed_time": "7:12:52", "remaining_time": "0:12:17"} +{"current_steps": 10500, "total_steps": 10798, "loss": 1.9451, "reward": null, "learning_rate": 1.9288016699463006e-06, "epoch": 1.94, "percentage": 97.24, "elapsed_time": "7:06:48", "remaining_time": "0:12:06"} +{"current_steps": 10500, "total_steps": 10798, "loss": 1.9451, "reward": null, "learning_rate": 1.9288016699463006e-06, "epoch": 1.94, "percentage": 97.24, "elapsed_time": "7:06:51", "remaining_time": "0:12:06"} +{"current_steps": 10500, "total_steps": 10798, "loss": 1.9451, "reward": null, "learning_rate": 1.9288016699463006e-06, "epoch": 1.94, "percentage": 97.24, "elapsed_time": "7:06:49", "remaining_time": "0:12:06"} +{"current_steps": 10510, "total_steps": 10798, "loss": 1.8973, "reward": null, "learning_rate": 1.8032568464018129e-06, "epoch": 1.95, "percentage": 97.33, "elapsed_time": "7:07:12", "remaining_time": "0:11:42"} +{"current_steps": 10510, "total_steps": 10798, "loss": 1.8973, "reward": null, "learning_rate": 1.8032568464018129e-06, "epoch": 1.95, "percentage": 97.33, "elapsed_time": "7:07:15", "remaining_time": "0:11:42"} +{"current_steps": 10510, "total_steps": 10798, "loss": 1.8973, "reward": null, "learning_rate": 1.8032568464018129e-06, "epoch": 1.95, "percentage": 97.33, "elapsed_time": "7:07:14", "remaining_time": "0:11:42"} +{"current_steps": 10510, "total_steps": 10798, "loss": 1.8973, "reward": null, "learning_rate": 1.8032568464018129e-06, "epoch": 1.95, "percentage": 97.33, "elapsed_time": "7:13:17", "remaining_time": "0:11:52"} +{"current_steps": 10520, "total_steps": 10798, "loss": 1.9224, "reward": null, "learning_rate": 1.681929120695147e-06, "epoch": 1.95, "percentage": 97.43, "elapsed_time": "7:13:42", "remaining_time": "0:11:27"} +{"current_steps": 10520, "total_steps": 10798, "loss": 1.9224, "reward": null, "learning_rate": 1.681929120695147e-06, "epoch": 1.95, "percentage": 97.43, "elapsed_time": "7:07:37", "remaining_time": "0:11:18"} +{"current_steps": 10520, "total_steps": 10798, "loss": 1.9224, "reward": null, "learning_rate": 1.681929120695147e-06, "epoch": 1.95, "percentage": 97.43, "elapsed_time": "7:07:39", "remaining_time": "0:11:18"} +{"current_steps": 10520, "total_steps": 10798, "loss": 1.9224, "reward": null, "learning_rate": 1.681929120695147e-06, "epoch": 1.95, "percentage": 97.43, "elapsed_time": "7:07:40", "remaining_time": "0:11:18"} +{"current_steps": 10530, "total_steps": 10798, "loss": 1.9441, "reward": null, "learning_rate": 1.564819519832006e-06, "epoch": 1.95, "percentage": 97.52, "elapsed_time": "7:14:08", "remaining_time": "0:11:02"} +{"current_steps": 10530, "total_steps": 10798, "loss": 1.9441, "reward": null, "learning_rate": 1.564819519832006e-06, "epoch": 1.95, "percentage": 97.52, "elapsed_time": "7:08:03", "remaining_time": "0:10:53"} +{"current_steps": 10530, "total_steps": 10798, "loss": 1.9441, "reward": null, "learning_rate": 1.564819519832006e-06, "epoch": 1.95, "percentage": 97.52, "elapsed_time": "7:08:04", "remaining_time": "0:10:53"} +{"current_steps": 10530, "total_steps": 10798, "loss": 1.9441, "reward": null, "learning_rate": 1.564819519832006e-06, "epoch": 1.95, "percentage": 97.52, "elapsed_time": "7:08:06", "remaining_time": "0:10:53"} +{"current_steps": 10540, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 1.451929035112709e-06, "epoch": 1.95, "percentage": 97.61, "elapsed_time": "7:14:33", "remaining_time": "0:10:38"} +{"current_steps": 10540, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 1.451929035112709e-06, "epoch": 1.95, "percentage": 97.61, "elapsed_time": "7:08:28", "remaining_time": "0:10:29"} +{"current_steps": 10540, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 1.451929035112709e-06, "epoch": 1.95, "percentage": 97.61, "elapsed_time": "7:08:29", "remaining_time": "0:10:29"} +{"current_steps": 10540, "total_steps": 10798, "loss": 1.9274, "reward": null, "learning_rate": 1.451929035112709e-06, "epoch": 1.95, "percentage": 97.61, "elapsed_time": "7:08:31", "remaining_time": "0:10:29"} +{"current_steps": 10550, "total_steps": 10798, "loss": 1.9057, "reward": null, "learning_rate": 1.3432586221240884e-06, "epoch": 1.95, "percentage": 97.7, "elapsed_time": "7:14:58", "remaining_time": "0:10:13"} +{"current_steps": 10550, "total_steps": 10798, "loss": 1.9057, "reward": null, "learning_rate": 1.3432586221240884e-06, "epoch": 1.95, "percentage": 97.7, "elapsed_time": "7:08:54", "remaining_time": "0:10:04"} +{"current_steps": 10550, "total_steps": 10798, "loss": 1.9057, "reward": null, "learning_rate": 1.3432586221240884e-06, "epoch": 1.95, "percentage": 97.7, "elapsed_time": "7:08:55", "remaining_time": "0:10:04"} +{"current_steps": 10550, "total_steps": 10798, "loss": 1.9057, "reward": null, "learning_rate": 1.3432586221240884e-06, "epoch": 1.95, "percentage": 97.7, "elapsed_time": "7:08:57", "remaining_time": "0:10:05"} +{"current_steps": 10560, "total_steps": 10798, "loss": 1.9153, "reward": null, "learning_rate": 1.2388092007312169e-06, "epoch": 1.96, "percentage": 97.8, "elapsed_time": "7:15:23", "remaining_time": "0:09:48"} +{"current_steps": 10560, "total_steps": 10798, "loss": 1.9153, "reward": null, "learning_rate": 1.2388092007312169e-06, "epoch": 1.96, "percentage": 97.8, "elapsed_time": "7:09:21", "remaining_time": "0:09:40"} +{"current_steps": 10560, "total_steps": 10798, "loss": 1.9153, "reward": null, "learning_rate": 1.2388092007312169e-06, "epoch": 1.96, "percentage": 97.8, "elapsed_time": "7:09:20", "remaining_time": "0:09:40"} +{"current_steps": 10560, "total_steps": 10798, "loss": 1.9153, "reward": null, "learning_rate": 1.2388092007312169e-06, "epoch": 1.96, "percentage": 97.8, "elapsed_time": "7:09:18", "remaining_time": "0:09:40"} +{"current_steps": 10570, "total_steps": 10798, "loss": 1.878, "reward": null, "learning_rate": 1.138581655069526e-06, "epoch": 1.96, "percentage": 97.89, "elapsed_time": "7:15:47", "remaining_time": "0:09:24"} +{"current_steps": 10570, "total_steps": 10798, "loss": 1.878, "reward": null, "learning_rate": 1.138581655069526e-06, "epoch": 1.96, "percentage": 97.89, "elapsed_time": "7:09:46", "remaining_time": "0:09:16"} +{"current_steps": 10570, "total_steps": 10798, "loss": 1.878, "reward": null, "learning_rate": 1.138581655069526e-06, "epoch": 1.96, "percentage": 97.89, "elapsed_time": "7:09:44", "remaining_time": "0:09:16"} +{"current_steps": 10570, "total_steps": 10798, "loss": 1.878, "reward": null, "learning_rate": 1.138581655069526e-06, "epoch": 1.96, "percentage": 97.89, "elapsed_time": "7:09:42", "remaining_time": "0:09:16"} +{"current_steps": 10580, "total_steps": 10798, "loss": 1.8931, "reward": null, "learning_rate": 1.0425768335375897e-06, "epoch": 1.96, "percentage": 97.98, "elapsed_time": "7:16:12", "remaining_time": "0:08:59"} +{"current_steps": 10580, "total_steps": 10798, "loss": 1.8931, "reward": null, "learning_rate": 1.0425768335375897e-06, "epoch": 1.96, "percentage": 97.98, "elapsed_time": "7:10:08", "remaining_time": "0:08:51"} +{"current_steps": 10580, "total_steps": 10798, "loss": 1.8931, "reward": null, "learning_rate": 1.0425768335375897e-06, "epoch": 1.96, "percentage": 97.98, "elapsed_time": "7:10:10", "remaining_time": "0:08:51"} +{"current_steps": 10580, "total_steps": 10798, "loss": 1.8931, "reward": null, "learning_rate": 1.0425768335375897e-06, "epoch": 1.96, "percentage": 97.98, "elapsed_time": "7:10:07", "remaining_time": "0:08:51"} +{"current_steps": 10590, "total_steps": 10798, "loss": 1.9034, "reward": null, "learning_rate": 9.507955487896291e-07, "epoch": 1.96, "percentage": 98.07, "elapsed_time": "7:16:37", "remaining_time": "0:08:34"} +{"current_steps": 10590, "total_steps": 10798, "loss": 1.9034, "reward": null, "learning_rate": 9.507955487896291e-07, "epoch": 1.96, "percentage": 98.07, "elapsed_time": "7:10:33", "remaining_time": "0:08:27"} +{"current_steps": 10590, "total_steps": 10798, "loss": 1.9034, "reward": null, "learning_rate": 9.507955487896291e-07, "epoch": 1.96, "percentage": 98.07, "elapsed_time": "7:10:36", "remaining_time": "0:08:27"} +{"current_steps": 10590, "total_steps": 10798, "loss": 1.9034, "reward": null, "learning_rate": 9.507955487896291e-07, "epoch": 1.96, "percentage": 98.07, "elapsed_time": "7:10:34", "remaining_time": "0:08:27"} +{"current_steps": 10600, "total_steps": 10798, "loss": 1.9457, "reward": null, "learning_rate": 8.632385777289087e-07, "epoch": 1.96, "percentage": 98.17, "elapsed_time": "7:10:58", "remaining_time": "0:08:03"} +{"current_steps": 10600, "total_steps": 10798, "loss": 1.9457, "reward": null, "learning_rate": 8.632385777289087e-07, "epoch": 1.96, "percentage": 98.17, "elapsed_time": "7:11:02", "remaining_time": "0:08:03"} +{"current_steps": 10600, "total_steps": 10798, "loss": 1.9457, "reward": null, "learning_rate": 8.632385777289087e-07, "epoch": 1.96, "percentage": 98.17, "elapsed_time": "7:11:00", "remaining_time": "0:08:03"} +{"current_steps": 10600, "total_steps": 10798, "loss": 1.9457, "reward": null, "learning_rate": 8.632385777289087e-07, "epoch": 1.96, "percentage": 98.17, "elapsed_time": "7:17:03", "remaining_time": "0:08:09"} +{"current_steps": 10610, "total_steps": 10798, "loss": 1.9204, "reward": null, "learning_rate": 7.799066615010175e-07, "epoch": 1.97, "percentage": 98.26, "elapsed_time": "7:11:22", "remaining_time": "0:07:38"} +{"current_steps": 10610, "total_steps": 10798, "loss": 1.9204, "reward": null, "learning_rate": 7.799066615010175e-07, "epoch": 1.97, "percentage": 98.26, "elapsed_time": "7:11:25", "remaining_time": "0:07:38"} +{"current_steps": 10610, "total_steps": 10798, "loss": 1.9204, "reward": null, "learning_rate": 7.799066615010175e-07, "epoch": 1.97, "percentage": 98.26, "elapsed_time": "7:11:24", "remaining_time": "0:07:38"} +{"current_steps": 10610, "total_steps": 10798, "loss": 1.9204, "reward": null, "learning_rate": 7.799066615010175e-07, "epoch": 1.97, "percentage": 98.26, "elapsed_time": "7:17:27", "remaining_time": "0:07:45"} +{"current_steps": 10620, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 7.008005054875422e-07, "epoch": 1.97, "percentage": 98.35, "elapsed_time": "7:17:52", "remaining_time": "0:07:20"} +{"current_steps": 10620, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 7.008005054875422e-07, "epoch": 1.97, "percentage": 98.35, "elapsed_time": "7:11:47", "remaining_time": "0:07:14"} +{"current_steps": 10620, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 7.008005054875422e-07, "epoch": 1.97, "percentage": 98.35, "elapsed_time": "7:11:50", "remaining_time": "0:07:14"} +{"current_steps": 10620, "total_steps": 10798, "loss": 1.9366, "reward": null, "learning_rate": 7.008005054875422e-07, "epoch": 1.97, "percentage": 98.35, "elapsed_time": "7:11:49", "remaining_time": "0:07:14"} +{"current_steps": 10630, "total_steps": 10798, "loss": 1.8985, "reward": null, "learning_rate": 6.259207793003486e-07, "epoch": 1.97, "percentage": 98.44, "elapsed_time": "7:12:15", "remaining_time": "0:06:49"} +{"current_steps": 10630, "total_steps": 10798, "loss": 1.8985, "reward": null, "learning_rate": 6.259207793003486e-07, "epoch": 1.97, "percentage": 98.44, "elapsed_time": "7:18:16", "remaining_time": "0:06:55"} +{"current_steps": 10630, "total_steps": 10798, "loss": 1.8985, "reward": null, "learning_rate": 6.259207793003486e-07, "epoch": 1.97, "percentage": 98.44, "elapsed_time": "7:12:11", "remaining_time": "0:06:49"} +{"current_steps": 10630, "total_steps": 10798, "loss": 1.8985, "reward": null, "learning_rate": 6.259207793003486e-07, "epoch": 1.97, "percentage": 98.44, "elapsed_time": "7:12:13", "remaining_time": "0:06:49"} +{"current_steps": 10640, "total_steps": 10798, "loss": 1.9348, "reward": null, "learning_rate": 5.552681167755868e-07, "epoch": 1.97, "percentage": 98.54, "elapsed_time": "7:18:40", "remaining_time": "0:06:30"} +{"current_steps": 10640, "total_steps": 10798, "loss": 1.9348, "reward": null, "learning_rate": 5.552681167755868e-07, "epoch": 1.97, "percentage": 98.54, "elapsed_time": "7:12:35", "remaining_time": "0:06:25"} +{"current_steps": 10640, "total_steps": 10798, "loss": 1.9348, "reward": null, "learning_rate": 5.552681167755868e-07, "epoch": 1.97, "percentage": 98.54, "elapsed_time": "7:12:37", "remaining_time": "0:06:25"} +{"current_steps": 10640, "total_steps": 10798, "loss": 1.9348, "reward": null, "learning_rate": 5.552681167755868e-07, "epoch": 1.97, "percentage": 98.54, "elapsed_time": "7:12:38", "remaining_time": "0:06:25"} +{"current_steps": 10650, "total_steps": 10798, "loss": 1.9268, "reward": null, "learning_rate": 4.888431159685291e-07, "epoch": 1.97, "percentage": 98.63, "elapsed_time": "7:13:00", "remaining_time": "0:06:01"} +{"current_steps": 10650, "total_steps": 10798, "loss": 1.9268, "reward": null, "learning_rate": 4.888431159685291e-07, "epoch": 1.97, "percentage": 98.63, "elapsed_time": "7:19:05", "remaining_time": "0:06:06"} +{"current_steps": 10650, "total_steps": 10798, "loss": 1.9268, "reward": null, "learning_rate": 4.888431159685291e-07, "epoch": 1.97, "percentage": 98.63, "elapsed_time": "7:13:02", "remaining_time": "0:06:01"} +{"current_steps": 10650, "total_steps": 10798, "loss": 1.9268, "reward": null, "learning_rate": 4.888431159685291e-07, "epoch": 1.97, "percentage": 98.63, "elapsed_time": "7:13:03", "remaining_time": "0:06:01"} +{"current_steps": 10660, "total_steps": 10798, "loss": 1.9166, "reward": null, "learning_rate": 4.266463391484621e-07, "epoch": 1.97, "percentage": 98.72, "elapsed_time": "7:19:30", "remaining_time": "0:05:41"} +{"current_steps": 10660, "total_steps": 10798, "loss": 1.9166, "reward": null, "learning_rate": 4.266463391484621e-07, "epoch": 1.97, "percentage": 98.72, "elapsed_time": "7:13:27", "remaining_time": "0:05:36"} +{"current_steps": 10660, "total_steps": 10798, "loss": 1.9166, "reward": null, "learning_rate": 4.266463391484621e-07, "epoch": 1.97, "percentage": 98.72, "elapsed_time": "7:13:25", "remaining_time": "0:05:36"} +{"current_steps": 10660, "total_steps": 10798, "loss": 1.9166, "reward": null, "learning_rate": 4.266463391484621e-07, "epoch": 1.97, "percentage": 98.72, "elapsed_time": "7:13:29", "remaining_time": "0:05:36"} +{"current_steps": 10670, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 3.6867831279396856e-07, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "7:19:55", "remaining_time": "0:05:16"} +{"current_steps": 10670, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 3.6867831279396856e-07, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "7:13:53", "remaining_time": "0:05:12"} +{"current_steps": 10670, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 3.6867831279396856e-07, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "7:13:52", "remaining_time": "0:05:12"} +{"current_steps": 10670, "total_steps": 10798, "loss": 1.9312, "reward": null, "learning_rate": 3.6867831279396856e-07, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "7:13:50", "remaining_time": "0:05:12"} +{"current_steps": 10680, "total_steps": 10798, "loss": 1.9247, "reward": null, "learning_rate": 3.1493952758832046e-07, "epoch": 1.98, "percentage": 98.91, "elapsed_time": "7:20:19", "remaining_time": "0:04:51"} +{"current_steps": 10680, "total_steps": 10798, "loss": 1.9247, "reward": null, "learning_rate": 3.1493952758832046e-07, "epoch": 1.98, "percentage": 98.91, "elapsed_time": "7:14:14", "remaining_time": "0:04:47"} +{"current_steps": 10680, "total_steps": 10798, "loss": 1.9247, "reward": null, "learning_rate": 3.1493952758832046e-07, "epoch": 1.98, "percentage": 98.91, "elapsed_time": "7:14:16", "remaining_time": "0:04:47"} +{"current_steps": 10680, "total_steps": 10798, "loss": 1.9247, "reward": null, "learning_rate": 3.1493952758832046e-07, "epoch": 1.98, "percentage": 98.91, "elapsed_time": "7:14:18", "remaining_time": "0:04:47"} +{"current_steps": 10690, "total_steps": 10798, "loss": 1.917, "reward": null, "learning_rate": 2.6543043841548153e-07, "epoch": 1.98, "percentage": 99.0, "elapsed_time": "7:20:44", "remaining_time": "0:04:27"} +{"current_steps": 10690, "total_steps": 10798, "loss": 1.917, "reward": null, "learning_rate": 2.6543043841548153e-07, "epoch": 1.98, "percentage": 99.0, "elapsed_time": "7:14:39", "remaining_time": "0:04:23"} +{"current_steps": 10690, "total_steps": 10798, "loss": 1.917, "reward": null, "learning_rate": 2.6543043841548153e-07, "epoch": 1.98, "percentage": 99.0, "elapsed_time": "7:14:41", "remaining_time": "0:04:23"} +{"current_steps": 10690, "total_steps": 10798, "loss": 1.917, "reward": null, "learning_rate": 2.6543043841548153e-07, "epoch": 1.98, "percentage": 99.0, "elapsed_time": "7:14:42", "remaining_time": "0:04:23"} +{"current_steps": 10700, "total_steps": 10798, "loss": 1.8837, "reward": null, "learning_rate": 2.2015146435627742e-07, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "7:21:08", "remaining_time": "0:04:02"} +{"current_steps": 10700, "total_steps": 10798, "loss": 1.8837, "reward": null, "learning_rate": 2.2015146435627742e-07, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "7:15:05", "remaining_time": "0:03:59"} +{"current_steps": 10700, "total_steps": 10798, "loss": 1.8837, "reward": null, "learning_rate": 2.2015146435627742e-07, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "7:15:03", "remaining_time": "0:03:59"} +{"current_steps": 10700, "total_steps": 10798, "loss": 1.8837, "reward": null, "learning_rate": 2.2015146435627742e-07, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "7:15:07", "remaining_time": "0:03:59"} +{"current_steps": 10710, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 1.7910298868467623e-07, "epoch": 1.98, "percentage": 99.19, "elapsed_time": "7:15:32", "remaining_time": "0:03:34"} +{"current_steps": 10710, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 1.7910298868467623e-07, "epoch": 1.98, "percentage": 99.19, "elapsed_time": "7:15:29", "remaining_time": "0:03:34"} +{"current_steps": 10710, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 1.7910298868467623e-07, "epoch": 1.98, "percentage": 99.19, "elapsed_time": "7:15:30", "remaining_time": "0:03:34"} +{"current_steps": 10710, "total_steps": 10798, "loss": 1.9174, "reward": null, "learning_rate": 1.7910298868467623e-07, "epoch": 1.98, "percentage": 99.19, "elapsed_time": "7:21:33", "remaining_time": "0:03:37"} +{"current_steps": 10720, "total_steps": 10798, "loss": 1.9107, "reward": null, "learning_rate": 1.422853588647355e-07, "epoch": 1.99, "percentage": 99.28, "elapsed_time": "7:21:59", "remaining_time": "0:03:12"} +{"current_steps": 10720, "total_steps": 10798, "loss": 1.9107, "reward": null, "learning_rate": 1.422853588647355e-07, "epoch": 1.99, "percentage": 99.28, "elapsed_time": "7:15:55", "remaining_time": "0:03:10"} +{"current_steps": 10720, "total_steps": 10798, "loss": 1.9107, "reward": null, "learning_rate": 1.422853588647355e-07, "epoch": 1.99, "percentage": 99.28, "elapsed_time": "7:15:57", "remaining_time": "0:03:10"} +{"current_steps": 10720, "total_steps": 10798, "loss": 1.9107, "reward": null, "learning_rate": 1.422853588647355e-07, "epoch": 1.99, "percentage": 99.28, "elapsed_time": "7:15:54", "remaining_time": "0:03:10"} +{"current_steps": 10730, "total_steps": 10798, "loss": 1.9253, "reward": null, "learning_rate": 1.0969888654749349e-07, "epoch": 1.99, "percentage": 99.37, "elapsed_time": "7:22:25", "remaining_time": "0:02:48"} +{"current_steps": 10730, "total_steps": 10798, "loss": 1.9253, "reward": null, "learning_rate": 1.0969888654749349e-07, "epoch": 1.99, "percentage": 99.37, "elapsed_time": "7:16:20", "remaining_time": "0:02:45"} +{"current_steps": 10730, "total_steps": 10798, "loss": 1.9253, "reward": null, "learning_rate": 1.0969888654749349e-07, "epoch": 1.99, "percentage": 99.37, "elapsed_time": "7:16:22", "remaining_time": "0:02:45"} +{"current_steps": 10730, "total_steps": 10798, "loss": 1.9253, "reward": null, "learning_rate": 1.0969888654749349e-07, "epoch": 1.99, "percentage": 99.37, "elapsed_time": "7:16:23", "remaining_time": "0:02:45"} +{"current_steps": 10740, "total_steps": 10798, "loss": 1.9154, "reward": null, "learning_rate": 8.134384756841584e-08, "epoch": 1.99, "percentage": 99.46, "elapsed_time": "7:22:48", "remaining_time": "0:02:23"} +{"current_steps": 10740, "total_steps": 10798, "loss": 1.9154, "reward": null, "learning_rate": 8.134384756841584e-08, "epoch": 1.99, "percentage": 99.46, "elapsed_time": "7:16:43", "remaining_time": "0:02:21"} +{"current_steps": 10740, "total_steps": 10798, "loss": 1.9154, "reward": null, "learning_rate": 8.134384756841584e-08, "epoch": 1.99, "percentage": 99.46, "elapsed_time": "7:16:45", "remaining_time": "0:02:21"} +{"current_steps": 10740, "total_steps": 10798, "loss": 1.9154, "reward": null, "learning_rate": 8.134384756841584e-08, "epoch": 1.99, "percentage": 99.46, "elapsed_time": "7:16:47", "remaining_time": "0:02:21"} +{"current_steps": 10750, "total_steps": 10798, "loss": 1.893, "reward": null, "learning_rate": 5.722048194511942e-08, "epoch": 1.99, "percentage": 99.56, "elapsed_time": "7:23:13", "remaining_time": "0:01:58"} +{"current_steps": 10750, "total_steps": 10798, "loss": 1.893, "reward": null, "learning_rate": 5.722048194511942e-08, "epoch": 1.99, "percentage": 99.56, "elapsed_time": "7:17:08", "remaining_time": "0:01:57"} +{"current_steps": 10750, "total_steps": 10798, "loss": 1.893, "reward": null, "learning_rate": 5.722048194511942e-08, "epoch": 1.99, "percentage": 99.56, "elapsed_time": "7:17:12", "remaining_time": "0:01:57"} +{"current_steps": 10750, "total_steps": 10798, "loss": 1.893, "reward": null, "learning_rate": 5.722048194511942e-08, "epoch": 1.99, "percentage": 99.56, "elapsed_time": "7:17:10", "remaining_time": "0:01:57"} +{"current_steps": 10760, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 3.73289938752075e-08, "epoch": 1.99, "percentage": 99.65, "elapsed_time": "7:23:37", "remaining_time": "0:01:34"} +{"current_steps": 10760, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 3.73289938752075e-08, "epoch": 1.99, "percentage": 99.65, "elapsed_time": "7:17:36", "remaining_time": "0:01:32"} +{"current_steps": 10760, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 3.73289938752075e-08, "epoch": 1.99, "percentage": 99.65, "elapsed_time": "7:17:33", "remaining_time": "0:01:32"} +{"current_steps": 10760, "total_steps": 10798, "loss": 1.91, "reward": null, "learning_rate": 3.73289938752075e-08, "epoch": 1.99, "percentage": 99.65, "elapsed_time": "7:17:34", "remaining_time": "0:01:32"} +{"current_steps": 10770, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 2.1669551734604385e-08, "epoch": 1.99, "percentage": 99.74, "elapsed_time": "7:24:03", "remaining_time": "0:01:09"} +{"current_steps": 10770, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 2.1669551734604385e-08, "epoch": 1.99, "percentage": 99.74, "elapsed_time": "7:17:58", "remaining_time": "0:01:08"} +{"current_steps": 10770, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 2.1669551734604385e-08, "epoch": 1.99, "percentage": 99.74, "elapsed_time": "7:18:01", "remaining_time": "0:01:08"} +{"current_steps": 10770, "total_steps": 10798, "loss": 1.9416, "reward": null, "learning_rate": 2.1669551734604385e-08, "epoch": 1.99, "percentage": 99.74, "elapsed_time": "7:18:00", "remaining_time": "0:01:08"} +{"current_steps": 10780, "total_steps": 10798, "loss": 1.9549, "reward": null, "learning_rate": 1.0242288076223182e-08, "epoch": 2.0, "percentage": 99.83, "elapsed_time": "7:24:28", "remaining_time": "0:00:44"} +{"current_steps": 10780, "total_steps": 10798, "loss": 1.9549, "reward": null, "learning_rate": 1.0242288076223182e-08, "epoch": 2.0, "percentage": 99.83, "elapsed_time": "7:18:24", "remaining_time": "0:00:43"} +{"current_steps": 10780, "total_steps": 10798, "loss": 1.9549, "reward": null, "learning_rate": 1.0242288076223182e-08, "epoch": 2.0, "percentage": 99.83, "elapsed_time": "7:18:23", "remaining_time": "0:00:43"} +{"current_steps": 10780, "total_steps": 10798, "loss": 1.9549, "reward": null, "learning_rate": 1.0242288076223182e-08, "epoch": 2.0, "percentage": 99.83, "elapsed_time": "7:18:26", "remaining_time": "0:00:43"} +{"current_steps": 10790, "total_steps": 10798, "loss": 1.9516, "reward": null, "learning_rate": 3.047299628633482e-09, "epoch": 2.0, "percentage": 99.93, "elapsed_time": "7:24:53", "remaining_time": "0:00:19"} +{"current_steps": 10790, "total_steps": 10798, "loss": 1.9516, "reward": null, "learning_rate": 3.047299628633482e-09, "epoch": 2.0, "percentage": 99.93, "elapsed_time": "7:18:48", "remaining_time": "0:00:19"} +{"current_steps": 10790, "total_steps": 10798, "loss": 1.9516, "reward": null, "learning_rate": 3.047299628633482e-09, "epoch": 2.0, "percentage": 99.93, "elapsed_time": "7:18:50", "remaining_time": "0:00:19"} +{"current_steps": 10790, "total_steps": 10798, "loss": 1.9516, "reward": null, "learning_rate": 3.047299628633482e-09, "epoch": 2.0, "percentage": 99.93, "elapsed_time": "7:18:51", "remaining_time": "0:00:19"} diff --git a/trainer_state.json b/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..a22339fad4a77b31851d6c82c18aba70403be560 --- /dev/null +++ b/trainer_state.json @@ -0,0 +1,6499 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 2.0, + "global_step": 10798, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0009999978838190456, + "loss": 2.9794, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0009999915352940948, + "loss": 2.3885, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999980954478887, + "loss": 2.3057, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999966141462985, + "loss": 2.2692, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 0.000999947096371777, + "loss": 2.2576, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009999238193664748, + "loss": 2.2388, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998963106441117, + "loss": 2.2523, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.0009998645704375414, + "loss": 2.218, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999828599015436, + "loss": 2.2457, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997883966822835, + "loss": 2.198, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009997439637783859, + "loss": 2.2013, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 0.000999695300679855, + "loss": 2.1765, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 0.0009996424077986109, + "loss": 2.1741, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999585285582377, + "loss": 2.1898, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009995239345146772, + "loss": 2.1466, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009994583551148314, + "loss": 2.1423, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0009993885479379506, + "loss": 2.1451, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 0.000999314513574934, + "loss": 2.202, + "step": 180 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009992362526524616, + "loss": 2.1208, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009991537658329906, + "loss": 2.1591, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 0.000999067053814749, + "loss": 2.1788, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 0.0009989761173317304, + "loss": 2.147, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998880957153687, + "loss": 2.1249, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 0.000998781574086123, + "loss": 2.165, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 0.000998677968970289, + "loss": 2.1428, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009985701426831735, + "loss": 2.1384, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009984580961374964, + "loss": 2.1585, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009983418302817008, + "loss": 2.1156, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 0.0009982213460999448, + "loss": 2.0811, + "step": 290 + }, + { + "epoch": 0.06, + "learning_rate": 0.000998096644612094, + "loss": 2.1081, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009979677268737118, + "loss": 2.1246, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009978345939760515, + "loss": 2.1229, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997697247046046, + "loss": 2.1033, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0009975556872462994, + "loss": 2.0931, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 0.000997409915775076, + "loss": 2.1206, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009972599338662915, + "loss": 2.0537, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009971057427895012, + "loss": 2.0762, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009969473438498897, + "loss": 2.0883, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009967847383882604, + "loss": 2.1174, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 0.0009966179277810239, + "loss": 2.1111, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009964469134401855, + "loss": 2.1288, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009962716968133346, + "loss": 2.0967, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009960922793836318, + "loss": 2.1216, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009959086626697955, + "loss": 2.0924, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 0.0009957208482260908, + "loss": 2.0809, + "step": 450 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009955288376423152, + "loss": 2.1082, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009953326325437852, + "loss": 2.0885, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009951322345913224, + "loss": 2.1133, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009949276454812408, + "loss": 2.0844, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00099471886694533, + "loss": 2.0796, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0009945059007508434, + "loss": 2.1255, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009942887487004804, + "loss": 2.0913, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009940674126323733, + "loss": 2.1003, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009938418944200709, + "loss": 2.0541, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009936121959725223, + "loss": 2.0523, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 0.0009933783192340618, + "loss": 2.1225, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009931402661843911, + "loss": 2.0446, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 0.000992898038838564, + "loss": 2.0921, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009926516392469674, + "loss": 2.1081, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009924010694953064, + "loss": 2.0734, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009921463317045843, + "loss": 2.0652, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 0.0009918874280310862, + "loss": 2.0818, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009916243606663605, + "loss": 2.0776, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009913571318371994, + "loss": 2.1025, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009910857438056215, + "loss": 2.066, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009908101988688512, + "loss": 2.0575, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0009905304993593008, + "loss": 2.1269, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009902466476445486, + "loss": 2.0518, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009899586461273218, + "loss": 2.0698, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 0.000989666497245473, + "loss": 2.0988, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009893702034719624, + "loss": 2.0986, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0009890697673148345, + "loss": 2.0237, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009887651913171986, + "loss": 2.0027, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009884564780572064, + "loss": 2.0563, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009881436301480305, + "loss": 2.0624, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987826650237842, + "loss": 2.0926, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 0.000987505541009788, + "loss": 2.0585, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0009871803051819696, + "loss": 2.0494, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009868509455074183, + "loss": 2.0106, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009865174647740729, + "loss": 2.0861, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009861798658047556, + "loss": 2.0478, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0009858381514571484, + "loss": 2.0469, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 0.000985492324623769, + "loss": 2.0671, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009851423882319458, + "loss": 2.0808, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009847883452437937, + "loss": 2.0331, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009844301986561893, + "loss": 2.0295, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 0.000984067951500744, + "loss": 2.0873, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 0.00098370160684378, + "loss": 2.1038, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 0.0009833311677863042, + "loss": 2.0337, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009829566374639801, + "loss": 2.0407, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009825780190471042, + "loss": 2.1049, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 0.000982195315740576, + "loss": 2.0475, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0009818085307838741, + "loss": 2.0624, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 0.000981417667451026, + "loss": 2.0714, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009810227290505816, + "loss": 2.0947, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009806237189255859, + "loss": 2.0591, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009802206404535489, + "loss": 2.0301, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 0.000979813497046419, + "loss": 2.0556, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 0.0009794022921505523, + "loss": 2.0753, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 0.000978987029246685, + "loss": 2.0898, + "step": 1000 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009785677118499029, + "loss": 2.0464, + "step": 1010 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009781443435096116, + "loss": 2.0828, + "step": 1020 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009777169278095074, + "loss": 2.1137, + "step": 1030 + }, + { + "epoch": 0.19, + "learning_rate": 0.0009772854683675462, + "loss": 2.0167, + "step": 1040 + }, + { + "epoch": 0.19, + "learning_rate": 0.000976849968835913, + "loss": 2.07, + "step": 1050 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009764104329009909, + "loss": 2.0409, + "step": 1060 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009759668642833304, + "loss": 2.015, + "step": 1070 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009755192667376173, + "loss": 2.0175, + "step": 1080 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009750676440526411, + "loss": 2.0773, + "step": 1090 + }, + { + "epoch": 0.2, + "learning_rate": 0.0009746120000512632, + "loss": 2.0245, + "step": 1100 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009741523385903841, + "loss": 2.094, + "step": 1110 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009736886635609112, + "loss": 2.0506, + "step": 1120 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009732209788877258, + "loss": 2.0287, + "step": 1130 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009727492885296489, + "loss": 2.1162, + "step": 1140 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009722735964794099, + "loss": 2.1096, + "step": 1150 + }, + { + "epoch": 0.21, + "learning_rate": 0.0009717939067636099, + "loss": 2.0621, + "step": 1160 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009713102234426903, + "loss": 2.0796, + "step": 1170 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009708225506108965, + "loss": 2.0565, + "step": 1180 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009703308923962447, + "loss": 2.0669, + "step": 1190 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009698352529604857, + "loss": 2.0638, + "step": 1200 + }, + { + "epoch": 0.22, + "learning_rate": 0.0009693356364990705, + "loss": 2.0358, + "step": 1210 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009688320472411143, + "loss": 2.0859, + "step": 1220 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009683244894493613, + "loss": 2.0932, + "step": 1230 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009678129674201479, + "loss": 2.0129, + "step": 1240 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009672974854833669, + "loss": 2.055, + "step": 1250 + }, + { + "epoch": 0.23, + "learning_rate": 0.0009667780480024304, + "loss": 2.0665, + "step": 1260 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009662546593742334, + "loss": 2.0488, + "step": 1270 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009657273240291159, + "loss": 2.0543, + "step": 1280 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009651960464308261, + "loss": 2.0418, + "step": 1290 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009646608310764819, + "loss": 2.033, + "step": 1300 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009641216824965338, + "loss": 2.1034, + "step": 1310 + }, + { + "epoch": 0.24, + "learning_rate": 0.0009635786052547253, + "loss": 2.0866, + "step": 1320 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009630316039480556, + "loss": 2.0607, + "step": 1330 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009624806832067394, + "loss": 2.0457, + "step": 1340 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009619258476941686, + "loss": 2.032, + "step": 1350 + }, + { + "epoch": 0.25, + "learning_rate": 0.000961367102106873, + "loss": 2.0519, + "step": 1360 + }, + { + "epoch": 0.25, + "learning_rate": 0.0009608044511744791, + "loss": 2.0449, + "step": 1370 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009602378996596721, + "loss": 1.9949, + "step": 1380 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009596674523581539, + "loss": 2.0394, + "step": 1390 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009590931140986035, + "loss": 2.0386, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009585148897426354, + "loss": 2.0254, + "step": 1410 + }, + { + "epoch": 0.26, + "learning_rate": 0.0009579327841847593, + "loss": 2.0238, + "step": 1420 + }, + { + "epoch": 0.26, + "learning_rate": 0.000957346802352338, + "loss": 2.0509, + "step": 1430 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009567569492055456, + "loss": 2.0004, + "step": 1440 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009561632297373263, + "loss": 2.0203, + "step": 1450 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009555656489733513, + "loss": 2.0182, + "step": 1460 + }, + { + "epoch": 0.27, + "learning_rate": 0.000954964211971977, + "loss": 1.9754, + "step": 1470 + }, + { + "epoch": 0.27, + "learning_rate": 0.0009543589238242012, + "loss": 2.0374, + "step": 1480 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953749789653621, + "loss": 2.0367, + "step": 1490 + }, + { + "epoch": 0.28, + "learning_rate": 0.000953136814616389, + "loss": 2.0866, + "step": 1500 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009525200039011694, + "loss": 2.0083, + "step": 1510 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009518993627290948, + "loss": 2.0525, + "step": 1520 + }, + { + "epoch": 0.28, + "learning_rate": 0.0009512748963537212, + "loss": 2.0636, + "step": 1530 + }, + { + "epoch": 0.29, + "learning_rate": 0.000950646610060984, + "loss": 2.0522, + "step": 1540 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009500145091691532, + "loss": 2.05, + "step": 1550 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009493785990287882, + "loss": 1.9887, + "step": 1560 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009487388850226926, + "loss": 2.0309, + "step": 1570 + }, + { + "epoch": 0.29, + "learning_rate": 0.000948095372565869, + "loss": 1.9954, + "step": 1580 + }, + { + "epoch": 0.29, + "learning_rate": 0.0009474480671054726, + "loss": 2.0078, + "step": 1590 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009467969741207652, + "loss": 2.0395, + "step": 1600 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009461420991230693, + "loss": 2.0415, + "step": 1610 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009454834476557207, + "loss": 2.0308, + "step": 1620 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009448210252940223, + "loss": 2.0826, + "step": 1630 + }, + { + "epoch": 0.3, + "learning_rate": 0.0009441548376451963, + "loss": 2.0424, + "step": 1640 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009434848903483373, + "loss": 2.0125, + "step": 1650 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009428111890743639, + "loss": 2.0139, + "step": 1660 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009421337395259717, + "loss": 2.0682, + "step": 1670 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009414525474375837, + "loss": 2.0577, + "step": 1680 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009407676185753029, + "loss": 2.0262, + "step": 1690 + }, + { + "epoch": 0.31, + "learning_rate": 0.0009400789587368632, + "loss": 2.0515, + "step": 1700 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009393865737515794, + "loss": 2.0398, + "step": 1710 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009386904694802997, + "loss": 2.0146, + "step": 1720 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009379906518153543, + "loss": 2.0438, + "step": 1730 + }, + { + "epoch": 0.32, + "learning_rate": 0.0009372871266805063, + "loss": 2.0377, + "step": 1740 + }, + { + "epoch": 0.32, + "learning_rate": 0.000936579900030902, + "loss": 2.0789, + "step": 1750 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009358689778530193, + "loss": 2.0201, + "step": 1760 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009351543661646185, + "loss": 2.0114, + "step": 1770 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009344360710146898, + "loss": 2.0242, + "step": 1780 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009337140984834034, + "loss": 2.0436, + "step": 1790 + }, + { + "epoch": 0.33, + "learning_rate": 0.0009329884546820572, + "loss": 2.0452, + "step": 1800 + }, + { + "epoch": 0.34, + "learning_rate": 0.000932259145753026, + "loss": 2.0254, + "step": 1810 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009315261778697083, + "loss": 2.0409, + "step": 1820 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009307895572364746, + "loss": 2.0301, + "step": 1830 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009300492900886154, + "loss": 2.0078, + "step": 1840 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009293053826922873, + "loss": 1.9851, + "step": 1850 + }, + { + "epoch": 0.34, + "learning_rate": 0.0009285578413444613, + "loss": 1.9947, + "step": 1860 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009278066723728682, + "loss": 2.0331, + "step": 1870 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009270518821359461, + "loss": 2.0058, + "step": 1880 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009262934770227858, + "loss": 2.05, + "step": 1890 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009255314634530771, + "loss": 2.0444, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 0.0009247658478770543, + "loss": 2.0045, + "step": 1910 + }, + { + "epoch": 0.36, + "learning_rate": 0.000923996636775442, + "loss": 2.0211, + "step": 1920 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009232238366593997, + "loss": 2.0124, + "step": 1930 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009224474540704671, + "loss": 2.0067, + "step": 1940 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009216674955805079, + "loss": 2.0247, + "step": 1950 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009208839677916557, + "loss": 2.0314, + "step": 1960 + }, + { + "epoch": 0.36, + "learning_rate": 0.0009200968773362568, + "loss": 2.067, + "step": 1970 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009193062308768145, + "loss": 2.0168, + "step": 1980 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009185120351059326, + "loss": 2.0649, + "step": 1990 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009177142967462591, + "loss": 2.0208, + "step": 2000 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009169130225504289, + "loss": 2.016, + "step": 2010 + }, + { + "epoch": 0.37, + "learning_rate": 0.0009161082193010066, + "loss": 2.0331, + "step": 2020 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009152998938104296, + "loss": 2.0757, + "step": 2030 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009144880529209498, + "loss": 2.0093, + "step": 2040 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009136727035045765, + "loss": 1.954, + "step": 2050 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009128538524630167, + "loss": 2.0062, + "step": 2060 + }, + { + "epoch": 0.38, + "learning_rate": 0.0009120315067276187, + "loss": 2.0179, + "step": 2070 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009112056732593119, + "loss": 2.0301, + "step": 2080 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009103763590485488, + "loss": 2.0223, + "step": 2090 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009095435711152449, + "loss": 2.0208, + "step": 2100 + }, + { + "epoch": 0.39, + "learning_rate": 0.00090870731650872, + "loss": 2.0492, + "step": 2110 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009078676023076385, + "loss": 1.9917, + "step": 2120 + }, + { + "epoch": 0.39, + "learning_rate": 0.0009070244356199492, + "loss": 2.0235, + "step": 2130 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009061778235828253, + "loss": 2.01, + "step": 2140 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009054129328980229, + "loss": 1.9999, + "step": 2150 + }, + { + "epoch": 0.4, + "learning_rate": 0.000904559794464287, + "loss": 2.0022, + "step": 2160 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009037032315436229, + "loss": 2.0004, + "step": 2170 + }, + { + "epoch": 0.4, + "learning_rate": 0.0009028432513865994, + "loss": 1.9936, + "step": 2180 + }, + { + "epoch": 0.41, + "learning_rate": 0.000901979861272711, + "loss": 2.0098, + "step": 2190 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009011130685103166, + "loss": 1.9829, + "step": 2200 + }, + { + "epoch": 0.41, + "learning_rate": 0.0009002428804365775, + "loss": 2.0135, + "step": 2210 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008993693044173954, + "loss": 2.0526, + "step": 2220 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008984923478473499, + "loss": 2.0145, + "step": 2230 + }, + { + "epoch": 0.41, + "learning_rate": 0.0008976120181496365, + "loss": 2.0364, + "step": 2240 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008967283227760028, + "loss": 2.019, + "step": 2250 + }, + { + "epoch": 0.42, + "learning_rate": 0.000895841269206686, + "loss": 1.9874, + "step": 2260 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008949508649503495, + "loss": 2.0699, + "step": 2270 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008940571175440196, + "loss": 2.0407, + "step": 2280 + }, + { + "epoch": 0.42, + "learning_rate": 0.0008931600345530213, + "loss": 2.0176, + "step": 2290 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008922596235709142, + "loss": 2.0235, + "step": 2300 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008913558922194287, + "loss": 2.0268, + "step": 2310 + }, + { + "epoch": 0.43, + "learning_rate": 0.000890448848148401, + "loss": 2.0279, + "step": 2320 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008895384990357087, + "loss": 2.0073, + "step": 2330 + }, + { + "epoch": 0.43, + "learning_rate": 0.0008886248525872056, + "loss": 2.0262, + "step": 2340 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008877079165366566, + "loss": 2.0112, + "step": 2350 + }, + { + "epoch": 0.44, + "learning_rate": 0.000886787698645672, + "loss": 2.042, + "step": 2360 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008858642067036424, + "loss": 2.0129, + "step": 2370 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008849374485276715, + "loss": 2.0264, + "step": 2380 + }, + { + "epoch": 0.44, + "learning_rate": 0.000884007431962512, + "loss": 2.0211, + "step": 2390 + }, + { + "epoch": 0.44, + "learning_rate": 0.0008830741648804967, + "loss": 2.0175, + "step": 2400 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008821376551814739, + "loss": 2.0423, + "step": 2410 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008811979107927396, + "loss": 2.0112, + "step": 2420 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008802549396689705, + "loss": 2.0422, + "step": 2430 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008793087497921566, + "loss": 2.0075, + "step": 2440 + }, + { + "epoch": 0.45, + "learning_rate": 0.0008784544334882426, + "loss": 1.9958, + "step": 2450 + }, + { + "epoch": 0.46, + "learning_rate": 0.000877502150068553, + "loss": 2.0348, + "step": 2460 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008765466711974225, + "loss": 2.0232, + "step": 2470 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008755880049627157, + "loss": 1.9953, + "step": 2480 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008746261594792776, + "loss": 2.0223, + "step": 2490 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008736611428888644, + "loss": 2.0332, + "step": 2500 + }, + { + "epoch": 0.46, + "learning_rate": 0.0008726929633600753, + "loss": 2.0075, + "step": 2510 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008717216290882824, + "loss": 2.002, + "step": 2520 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008707471482955622, + "loss": 2.0594, + "step": 2530 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008697695292306253, + "loss": 2.0214, + "step": 2540 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008687887801687473, + "loss": 1.994, + "step": 2550 + }, + { + "epoch": 0.47, + "learning_rate": 0.0008678049094116979, + "loss": 2.0338, + "step": 2560 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008668179252876714, + "loss": 2.0176, + "step": 2570 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008658278361512161, + "loss": 2.0013, + "step": 2580 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008648346503831627, + "loss": 2.0141, + "step": 2590 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008638383763905546, + "loss": 1.9655, + "step": 2600 + }, + { + "epoch": 0.48, + "learning_rate": 0.0008628390226065761, + "loss": 2.039, + "step": 2610 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008618365974904808, + "loss": 1.9418, + "step": 2620 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008608311095275205, + "loss": 2.011, + "step": 2630 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008598225672288731, + "loss": 2.0174, + "step": 2640 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008588109791315707, + "loss": 1.984, + "step": 2650 + }, + { + "epoch": 0.49, + "learning_rate": 0.000857796353798427, + "loss": 2.0437, + "step": 2660 + }, + { + "epoch": 0.49, + "learning_rate": 0.0008567786998179654, + "loss": 2.0255, + "step": 2670 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008557580258043459, + "loss": 2.0067, + "step": 2680 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008547343403972918, + "loss": 2.0201, + "step": 2690 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008537076522620175, + "loss": 2.0258, + "step": 2700 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008526779700891545, + "loss": 1.9977, + "step": 2710 + }, + { + "epoch": 0.5, + "learning_rate": 0.0008516453025946781, + "loss": 1.9835, + "step": 2720 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008506096585198333, + "loss": 2.0428, + "step": 2730 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008495710466310613, + "loss": 1.9554, + "step": 2740 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008485294757199248, + "loss": 2.0497, + "step": 2750 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008474849546030339, + "loss": 2.001, + "step": 2760 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008464374921219714, + "loss": 1.9824, + "step": 2770 + }, + { + "epoch": 0.51, + "learning_rate": 0.0008453870971432179, + "loss": 2.0378, + "step": 2780 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008443337785580769, + "loss": 1.9756, + "step": 2790 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008432775452825992, + "loss": 2.0563, + "step": 2800 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008422184062575077, + "loss": 2.0115, + "step": 2810 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008411563704481217, + "loss": 2.0301, + "step": 2820 + }, + { + "epoch": 0.52, + "learning_rate": 0.0008400914468442814, + "loss": 1.9912, + "step": 2830 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008390236444602706, + "loss": 2.0669, + "step": 2840 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008379529723347417, + "loss": 2.0138, + "step": 2850 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008368794395306386, + "loss": 2.0486, + "step": 2860 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008358030551351199, + "loss": 2.0342, + "step": 2870 + }, + { + "epoch": 0.53, + "learning_rate": 0.0008347238282594823, + "loss": 2.0474, + "step": 2880 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008336417680390829, + "loss": 2.006, + "step": 2890 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008325568836332633, + "loss": 1.99, + "step": 2900 + }, + { + "epoch": 0.54, + "learning_rate": 0.00083146918422527, + "loss": 2.0148, + "step": 2910 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008303786790221778, + "loss": 2.0381, + "step": 2920 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008292853772548126, + "loss": 2.0591, + "step": 2930 + }, + { + "epoch": 0.54, + "learning_rate": 0.0008281892881776714, + "loss": 2.0238, + "step": 2940 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008270904210688459, + "loss": 1.9939, + "step": 2950 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008259887852299427, + "loss": 1.9941, + "step": 2960 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008248843899860045, + "loss": 2.0193, + "step": 2970 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008237772446854325, + "loss": 2.0166, + "step": 2980 + }, + { + "epoch": 0.55, + "learning_rate": 0.0008226673586999058, + "loss": 2.0219, + "step": 2990 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008215547414243025, + "loss": 2.0078, + "step": 3000 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008204394022766208, + "loss": 2.0022, + "step": 3010 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008193213506978983, + "loss": 2.0009, + "step": 3020 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008182005961521331, + "loss": 2.0197, + "step": 3030 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008170771481262027, + "loss": 2.0101, + "step": 3040 + }, + { + "epoch": 0.56, + "learning_rate": 0.0008159510161297846, + "loss": 2.0307, + "step": 3050 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008148222096952748, + "loss": 2.0075, + "step": 3060 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008136907383777081, + "loss": 2.0415, + "step": 3070 + }, + { + "epoch": 0.57, + "learning_rate": 0.000812556611754677, + "loss": 2.0031, + "step": 3080 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008114198394262497, + "loss": 2.0025, + "step": 3090 + }, + { + "epoch": 0.57, + "learning_rate": 0.0008102804310148905, + "loss": 1.983, + "step": 3100 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008091383961653765, + "loss": 2.0056, + "step": 3110 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008079937445447175, + "loss": 1.9679, + "step": 3120 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008068464858420732, + "loss": 1.9897, + "step": 3130 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008056966297686717, + "loss": 1.9833, + "step": 3140 + }, + { + "epoch": 0.58, + "learning_rate": 0.0008045441860577273, + "loss": 2.0088, + "step": 3150 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008033891644643576, + "loss": 1.9985, + "step": 3160 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008022315747655011, + "loss": 2.013, + "step": 3170 + }, + { + "epoch": 0.59, + "learning_rate": 0.0008010714267598354, + "loss": 1.9902, + "step": 3180 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007999087302676926, + "loss": 2.0133, + "step": 3190 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007987434951309774, + "loss": 2.0092, + "step": 3200 + }, + { + "epoch": 0.59, + "learning_rate": 0.0007975757312130836, + "loss": 1.9894, + "step": 3210 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007964054483988103, + "loss": 1.9742, + "step": 3220 + }, + { + "epoch": 0.6, + "learning_rate": 0.000795232656594278, + "loss": 2.016, + "step": 3230 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007940573657268458, + "loss": 2.0386, + "step": 3240 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007928795857450259, + "loss": 1.9602, + "step": 3250 + }, + { + "epoch": 0.6, + "learning_rate": 0.0007916993266184007, + "loss": 1.9681, + "step": 3260 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007905165983375379, + "loss": 2.0326, + "step": 3270 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007893314109139058, + "loss": 1.9958, + "step": 3280 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007881437743797882, + "loss": 2.0077, + "step": 3290 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007869536987882008, + "loss": 1.9813, + "step": 3300 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007857611942128044, + "loss": 1.9538, + "step": 3310 + }, + { + "epoch": 0.61, + "learning_rate": 0.0007845662707478214, + "loss": 1.9919, + "step": 3320 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007833689385079485, + "loss": 1.9922, + "step": 3330 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007821692076282725, + "loss": 1.9973, + "step": 3340 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007809670882641842, + "loss": 2.0231, + "step": 3350 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007797625905912915, + "loss": 1.9971, + "step": 3360 + }, + { + "epoch": 0.62, + "learning_rate": 0.0007785557248053351, + "loss": 1.9934, + "step": 3370 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007773465011221002, + "loss": 1.9855, + "step": 3380 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007761349297773315, + "loss": 2.0421, + "step": 3390 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007749210210266457, + "loss": 1.9795, + "step": 3400 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007737047851454451, + "loss": 2.0006, + "step": 3410 + }, + { + "epoch": 0.63, + "learning_rate": 0.0007724862324288309, + "loss": 2.011, + "step": 3420 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007712653731915147, + "loss": 1.9969, + "step": 3430 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007700422177677331, + "loss": 1.9581, + "step": 3440 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007688167765111592, + "loss": 1.9858, + "step": 3450 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007675890597948141, + "loss": 1.9945, + "step": 3460 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007663590780109814, + "loss": 2.0116, + "step": 3470 + }, + { + "epoch": 0.64, + "learning_rate": 0.0007651268415711168, + "loss": 1.9831, + "step": 3480 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007638923609057616, + "loss": 2.0113, + "step": 3490 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007626556464644538, + "loss": 1.9927, + "step": 3500 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007614167087156393, + "loss": 2.0209, + "step": 3510 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007601755581465844, + "loss": 1.9941, + "step": 3520 + }, + { + "epoch": 0.65, + "learning_rate": 0.0007589322052632855, + "loss": 2.0443, + "step": 3530 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007576866605903812, + "loss": 1.975, + "step": 3540 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007564389346710638, + "loss": 1.9655, + "step": 3550 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007551890380669879, + "loss": 2.0034, + "step": 3560 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007539369813581836, + "loss": 1.953, + "step": 3570 + }, + { + "epoch": 0.66, + "learning_rate": 0.000752682775142965, + "loss": 2.0162, + "step": 3580 + }, + { + "epoch": 0.66, + "learning_rate": 0.0007514264300378411, + "loss": 2.0096, + "step": 3590 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007501679566774267, + "loss": 2.0431, + "step": 3600 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007489073657143506, + "loss": 1.961, + "step": 3610 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007476446678191676, + "loss": 2.0179, + "step": 3620 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007463798736802665, + "loss": 1.9885, + "step": 3630 + }, + { + "epoch": 0.67, + "learning_rate": 0.0007451129940037804, + "loss": 1.9955, + "step": 3640 + }, + { + "epoch": 0.68, + "learning_rate": 0.000743844039513496, + "loss": 1.9671, + "step": 3650 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007425730209507622, + "loss": 1.9866, + "step": 3660 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007412999490744008, + "loss": 1.9508, + "step": 3670 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007400248346606129, + "loss": 2.0261, + "step": 3680 + }, + { + "epoch": 0.68, + "learning_rate": 0.0007387476885028902, + "loss": 1.9946, + "step": 3690 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007374685214119221, + "loss": 1.969, + "step": 3700 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007361873442155049, + "loss": 1.9802, + "step": 3710 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007349041677584496, + "loss": 1.9739, + "step": 3720 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007336190029024907, + "loss": 1.964, + "step": 3730 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007323318605261933, + "loss": 2.0009, + "step": 3740 + }, + { + "epoch": 0.69, + "learning_rate": 0.0007310427515248626, + "loss": 1.9825, + "step": 3750 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007297516868104501, + "loss": 1.9744, + "step": 3760 + }, + { + "epoch": 0.7, + "learning_rate": 0.000728458677311462, + "loss": 2.0197, + "step": 3770 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007271637339728667, + "loss": 2.0016, + "step": 3780 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007258668677560019, + "loss": 1.9721, + "step": 3790 + }, + { + "epoch": 0.7, + "learning_rate": 0.0007245680896384818, + "loss": 1.9591, + "step": 3800 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007232674106141048, + "loss": 1.9762, + "step": 3810 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007219648416927592, + "loss": 2.0026, + "step": 3820 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007206603939003314, + "loss": 1.9876, + "step": 3830 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007193540782786117, + "loss": 1.9991, + "step": 3840 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007180459058852011, + "loss": 1.9897, + "step": 3850 + }, + { + "epoch": 0.71, + "learning_rate": 0.0007167358877934176, + "loss": 2.0581, + "step": 3860 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007154240350922025, + "loss": 1.9588, + "step": 3870 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007141103588860265, + "loss": 2.0151, + "step": 3880 + }, + { + "epoch": 0.72, + "learning_rate": 0.000712794870294796, + "loss": 1.9494, + "step": 3890 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007114775804537586, + "loss": 1.9936, + "step": 3900 + }, + { + "epoch": 0.72, + "learning_rate": 0.0007101585005134088, + "loss": 2.0016, + "step": 3910 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007088376416393944, + "loss": 1.9628, + "step": 3920 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007075150150124208, + "loss": 1.9955, + "step": 3930 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007061906318281568, + "loss": 1.9731, + "step": 3940 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007048645032971407, + "loss": 1.9554, + "step": 3950 + }, + { + "epoch": 0.73, + "learning_rate": 0.0007035366406446839, + "loss": 1.985, + "step": 3960 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007022070551107774, + "loss": 1.9961, + "step": 3970 + }, + { + "epoch": 0.74, + "learning_rate": 0.0007008757579499954, + "loss": 2.0112, + "step": 3980 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006995427604314004, + "loss": 2.0086, + "step": 3990 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006982080738384487, + "loss": 2.019, + "step": 4000 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006968717094688933, + "loss": 1.9983, + "step": 4010 + }, + { + "epoch": 0.74, + "learning_rate": 0.0006955336786346898, + "loss": 1.981, + "step": 4020 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006941939926618997, + "loss": 1.9878, + "step": 4030 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006928526628905942, + "loss": 2.0067, + "step": 4040 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006915097006747601, + "loss": 2.035, + "step": 4050 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006901651173822013, + "loss": 1.9614, + "step": 4060 + }, + { + "epoch": 0.75, + "learning_rate": 0.0006888189243944439, + "loss": 1.9655, + "step": 4070 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006874711331066401, + "loss": 1.9692, + "step": 4080 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006861217549274705, + "loss": 1.9791, + "step": 4090 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006847708012790492, + "loss": 1.9804, + "step": 4100 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006834182835968253, + "loss": 1.9973, + "step": 4110 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006820642133294876, + "loss": 2.0153, + "step": 4120 + }, + { + "epoch": 0.76, + "learning_rate": 0.0006807086019388669, + "loss": 1.9639, + "step": 4130 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006793514608998393, + "loss": 2.0162, + "step": 4140 + }, + { + "epoch": 0.77, + "learning_rate": 0.000677992801700229, + "loss": 1.994, + "step": 4150 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006766326358407104, + "loss": 1.9992, + "step": 4160 + }, + { + "epoch": 0.77, + "learning_rate": 0.0006752709748347125, + "loss": 1.976, + "step": 4170 + }, + { + "epoch": 0.77, + "learning_rate": 0.000673907830208319, + "loss": 1.9452, + "step": 4180 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006725432135001732, + "loss": 1.9982, + "step": 4190 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006711771362613785, + "loss": 1.9766, + "step": 4200 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006698096100554014, + "loss": 1.9838, + "step": 4210 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006684406464579735, + "loss": 1.9746, + "step": 4220 + }, + { + "epoch": 0.78, + "learning_rate": 0.0006670702570569937, + "loss": 1.9838, + "step": 4230 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006656984534524296, + "loss": 1.9747, + "step": 4240 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006643252472562201, + "loss": 1.9896, + "step": 4250 + }, + { + "epoch": 0.79, + "learning_rate": 0.000662950650092176, + "loss": 1.9607, + "step": 4260 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006615746735958832, + "loss": 2.0075, + "step": 4270 + }, + { + "epoch": 0.79, + "learning_rate": 0.0006603351250463683, + "loss": 1.9918, + "step": 4280 + }, + { + "epoch": 0.79, + "learning_rate": 0.000658956559916577, + "loss": 1.9669, + "step": 4290 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006575766492634068, + "loss": 1.9645, + "step": 4300 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006561954047674206, + "loss": 1.9511, + "step": 4310 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006548128381204714, + "loss": 1.9934, + "step": 4320 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006534289610256039, + "loss": 1.9973, + "step": 4330 + }, + { + "epoch": 0.8, + "learning_rate": 0.0006520437851969557, + "loss": 1.9983, + "step": 4340 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006506573223596575, + "loss": 1.9906, + "step": 4350 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006492695842497347, + "loss": 1.9392, + "step": 4360 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006478805826140066, + "loss": 2.0015, + "step": 4370 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006464903292099886, + "loss": 2.0168, + "step": 4380 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006450988358057919, + "loss": 1.9676, + "step": 4390 + }, + { + "epoch": 0.81, + "learning_rate": 0.0006437061141800238, + "loss": 1.9798, + "step": 4400 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006423121761216881, + "loss": 1.9753, + "step": 4410 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006409170334300858, + "loss": 1.9965, + "step": 4420 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006395206979147141, + "loss": 1.9532, + "step": 4430 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006381231813951678, + "loss": 1.9962, + "step": 4440 + }, + { + "epoch": 0.82, + "learning_rate": 0.0006367244957010379, + "loss": 1.9758, + "step": 4450 + }, + { + "epoch": 0.83, + "learning_rate": 0.000635324652671813, + "loss": 1.9606, + "step": 4460 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006339236641567774, + "loss": 1.9785, + "step": 4470 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006325215420149119, + "loss": 1.9334, + "step": 4480 + }, + { + "epoch": 0.83, + "learning_rate": 0.0006311182981147935, + "loss": 1.9829, + "step": 4490 + }, + { + "epoch": 0.83, + "learning_rate": 0.000629713944334494, + "loss": 1.9671, + "step": 4500 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006283084925614805, + "loss": 2.0108, + "step": 4510 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006269019546925139, + "loss": 1.9341, + "step": 4520 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006254943426335488, + "loss": 1.9378, + "step": 4530 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006240856682996326, + "loss": 1.9619, + "step": 4540 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006226759436148044, + "loss": 1.9516, + "step": 4550 + }, + { + "epoch": 0.84, + "learning_rate": 0.0006212651805119946, + "loss": 1.9882, + "step": 4560 + }, + { + "epoch": 0.85, + "learning_rate": 0.000619853390932923, + "loss": 1.9636, + "step": 4570 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006184405868279985, + "loss": 1.9894, + "step": 4580 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006170267801562176, + "loss": 1.9365, + "step": 4590 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006156119828850633, + "loss": 2.0264, + "step": 4600 + }, + { + "epoch": 0.85, + "learning_rate": 0.0006141962069904041, + "loss": 1.9659, + "step": 4610 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006127794644563915, + "loss": 1.9368, + "step": 4620 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006113617672753598, + "loss": 1.959, + "step": 4630 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006099431274477245, + "loss": 1.9832, + "step": 4640 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006085235569818795, + "loss": 1.9572, + "step": 4650 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006071030678940969, + "loss": 1.99, + "step": 4660 + }, + { + "epoch": 0.86, + "learning_rate": 0.0006056816722084248, + "loss": 1.9963, + "step": 4670 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006042593819565846, + "loss": 1.9997, + "step": 4680 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006028362091778706, + "loss": 1.9221, + "step": 4690 + }, + { + "epoch": 0.87, + "learning_rate": 0.0006014121659190476, + "loss": 1.9623, + "step": 4700 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005999872642342484, + "loss": 1.9949, + "step": 4710 + }, + { + "epoch": 0.87, + "learning_rate": 0.0005985615161848721, + "loss": 1.9688, + "step": 4720 + }, + { + "epoch": 0.88, + "learning_rate": 0.000597134933839482, + "loss": 1.975, + "step": 4730 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005957075292737042, + "loss": 2.0048, + "step": 4740 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005942793145701235, + "loss": 1.9591, + "step": 4750 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005928503018181833, + "loss": 1.9957, + "step": 4760 + }, + { + "epoch": 0.88, + "learning_rate": 0.0005914205031140819, + "loss": 1.9823, + "step": 4770 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005899899305606703, + "loss": 2.0032, + "step": 4780 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005885585962673501, + "loss": 1.9722, + "step": 4790 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005871265123499708, + "loss": 1.9903, + "step": 4800 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005856936909307273, + "loss": 2.0258, + "step": 4810 + }, + { + "epoch": 0.89, + "learning_rate": 0.000584260144138057, + "loss": 2.0444, + "step": 4820 + }, + { + "epoch": 0.89, + "learning_rate": 0.0005828258841065377, + "loss": 1.968, + "step": 4830 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005813909229767846, + "loss": 1.9598, + "step": 4840 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005799552728953472, + "loss": 2.0047, + "step": 4850 + }, + { + "epoch": 0.9, + "learning_rate": 0.000578518946014607, + "loss": 1.939, + "step": 4860 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005770819544926741, + "loss": 1.9835, + "step": 4870 + }, + { + "epoch": 0.9, + "learning_rate": 0.0005756443104932852, + "loss": 2.028, + "step": 4880 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005742060261856996, + "loss": 1.973, + "step": 4890 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005727671137445967, + "loss": 1.9734, + "step": 4900 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005713275853499729, + "loss": 1.9921, + "step": 4910 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005698874531870386, + "loss": 1.9607, + "step": 4920 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005684467294461146, + "loss": 1.9468, + "step": 4930 + }, + { + "epoch": 0.91, + "learning_rate": 0.0005670054263225297, + "loss": 1.9524, + "step": 4940 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005655635560165166, + "loss": 1.9737, + "step": 4950 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005641211307331093, + "loss": 1.9532, + "step": 4960 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005626781626820395, + "loss": 2.0048, + "step": 4970 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005612346640776331, + "loss": 2.0276, + "step": 4980 + }, + { + "epoch": 0.92, + "learning_rate": 0.0005597906471387074, + "loss": 1.9476, + "step": 4990 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005583461240884666, + "loss": 1.943, + "step": 5000 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005569011071543997, + "loss": 1.9859, + "step": 5010 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005554556085681757, + "loss": 1.9607, + "step": 5020 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005540096405655409, + "loss": 1.9825, + "step": 5030 + }, + { + "epoch": 0.93, + "learning_rate": 0.0005525632153862152, + "loss": 1.9875, + "step": 5040 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005511163452737884, + "loss": 2.0051, + "step": 5050 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005496690424756164, + "loss": 2.0089, + "step": 5060 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005482213192427174, + "loss": 1.9495, + "step": 5070 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005467731878296688, + "loss": 1.9701, + "step": 5080 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005453246604945034, + "loss": 1.9588, + "step": 5090 + }, + { + "epoch": 0.94, + "learning_rate": 0.0005438757494986044, + "loss": 1.9833, + "step": 5100 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005424264671066038, + "loss": 1.9974, + "step": 5110 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005409768255862766, + "loss": 1.9746, + "step": 5120 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005395268372084378, + "loss": 1.9757, + "step": 5130 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005380765142468387, + "loss": 1.9908, + "step": 5140 + }, + { + "epoch": 0.95, + "learning_rate": 0.0005366258689780625, + "loss": 2.006, + "step": 5150 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005351749136814208, + "loss": 1.9957, + "step": 5160 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005337236606388495, + "loss": 1.959, + "step": 5170 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005322721221348047, + "loss": 2.0027, + "step": 5180 + }, + { + "epoch": 0.96, + "learning_rate": 0.000530820310456159, + "loss": 1.9248, + "step": 5190 + }, + { + "epoch": 0.96, + "learning_rate": 0.0005293682378920974, + "loss": 1.9742, + "step": 5200 + }, + { + "epoch": 0.96, + "learning_rate": 0.000527915916734013, + "loss": 1.9844, + "step": 5210 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005264633592754035, + "loss": 1.9985, + "step": 5220 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005250105778117661, + "loss": 2.0074, + "step": 5230 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005235575846404952, + "loss": 1.9901, + "step": 5240 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005221043920607763, + "loss": 1.9861, + "step": 5250 + }, + { + "epoch": 0.97, + "learning_rate": 0.0005206510123734837, + "loss": 1.9576, + "step": 5260 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005191974578810746, + "loss": 1.9741, + "step": 5270 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005177437408874868, + "loss": 1.9794, + "step": 5280 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005162898736980327, + "loss": 1.9883, + "step": 5290 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005148358686192967, + "loss": 1.969, + "step": 5300 + }, + { + "epoch": 0.98, + "learning_rate": 0.0005133817379590302, + "loss": 2.0018, + "step": 5310 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005119274940260476, + "loss": 1.971, + "step": 5320 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005104731491301225, + "loss": 1.9564, + "step": 5330 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005090187155818823, + "loss": 1.9798, + "step": 5340 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005075642056927057, + "loss": 2.0331, + "step": 5350 + }, + { + "epoch": 0.99, + "learning_rate": 0.000506109631774617, + "loss": 1.9505, + "step": 5360 + }, + { + "epoch": 0.99, + "learning_rate": 0.0005046550061401825, + "loss": 1.9348, + "step": 5370 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005032003411024067, + "loss": 2.0099, + "step": 5380 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005017456489746275, + "loss": 1.9756, + "step": 5390 + }, + { + "epoch": 1.0, + "learning_rate": 0.0005002909420704116, + "loss": 1.9444, + "step": 5400 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004988362327034516, + "loss": 1.976, + "step": 5410 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004973815331874603, + "loss": 1.9593, + "step": 5420 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004959268558360675, + "loss": 1.9251, + "step": 5430 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004944722129627151, + "loss": 1.972, + "step": 5440 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004930176168805531, + "loss": 1.9307, + "step": 5450 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004915630799023359, + "loss": 1.9541, + "step": 5460 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004901086143403172, + "loss": 1.9212, + "step": 5470 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004886542325061464, + "loss": 1.965, + "step": 5480 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004871999467107639, + "loss": 2.0083, + "step": 5490 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004857457692642974, + "loss": 1.9676, + "step": 5500 + }, + { + "epoch": 1.02, + "learning_rate": 0.000484291712475957, + "loss": 1.9384, + "step": 5510 + }, + { + "epoch": 1.02, + "learning_rate": 0.00048283778865393243, + "loss": 1.9339, + "step": 5520 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004813840101052869, + "loss": 2.0182, + "step": 5530 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004799303891358545, + "loss": 1.9262, + "step": 5540 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004784769380501352, + "loss": 1.9397, + "step": 5550 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004770236691511908, + "loss": 1.9404, + "step": 5560 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004755705947405417, + "loss": 1.9415, + "step": 5570 + }, + { + "epoch": 1.03, + "learning_rate": 0.00047411772711806105, + "loss": 1.9292, + "step": 5580 + }, + { + "epoch": 1.04, + "learning_rate": 0.000472665078581872, + "loss": 1.9487, + "step": 5590 + }, + { + "epoch": 1.04, + "learning_rate": 0.00047121266142824354, + "loss": 1.9435, + "step": 5600 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004697604879514853, + "loss": 1.9145, + "step": 5610 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004683085704438451, + "loss": 1.9975, + "step": 5620 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046685692119540357, + "loss": 1.9696, + "step": 5630 + }, + { + "epoch": 1.04, + "learning_rate": 0.00046540555249397056, + "loss": 1.9598, + "step": 5640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046395447662498117, + "loss": 1.9366, + "step": 5650 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046250370587139206, + "loss": 1.9748, + "step": 5660 + }, + { + "epoch": 1.05, + "learning_rate": 0.00046105325251357695, + "loss": 1.9125, + "step": 5670 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045960312882922306, + "loss": 1.9595, + "step": 5680 + }, + { + "epoch": 1.05, + "learning_rate": 0.00045815334709322665, + "loss": 1.9369, + "step": 5690 + }, + { + "epoch": 1.06, + "learning_rate": 0.0004567039195775899, + "loss": 1.9564, + "step": 5700 + }, + { + "epoch": 1.06, + "learning_rate": 0.000455254858551316, + "loss": 1.9274, + "step": 5710 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045380617628030693, + "loss": 1.9366, + "step": 5720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045235788502725777, + "loss": 1.9446, + "step": 5730 + }, + { + "epoch": 1.06, + "learning_rate": 0.00045090999705155383, + "loss": 1.9236, + "step": 5740 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004494625246091672, + "loss": 1.9397, + "step": 5750 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044801547995255194, + "loss": 1.9849, + "step": 5760 + }, + { + "epoch": 1.07, + "learning_rate": 0.00044656887533054193, + "loss": 1.9367, + "step": 5770 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004451227229882455, + "loss": 1.9451, + "step": 5780 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004436770351669429, + "loss": 1.9578, + "step": 5790 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004422318241039821, + "loss": 1.9095, + "step": 5800 + }, + { + "epoch": 1.08, + "learning_rate": 0.00044078710203267576, + "loss": 1.9337, + "step": 5810 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004393428811821971, + "loss": 1.9904, + "step": 5820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043789917377747695, + "loss": 1.9569, + "step": 5830 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004364559920390996, + "loss": 1.9423, + "step": 5840 + }, + { + "epoch": 1.08, + "learning_rate": 0.00043501334818320004, + "loss": 2.0013, + "step": 5850 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004335712544213597, + "loss": 1.9585, + "step": 5860 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004321297229605044, + "loss": 1.9148, + "step": 5870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00043068876600279964, + "loss": 1.9558, + "step": 5880 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004292483957455482, + "loss": 1.9899, + "step": 5890 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042780862438108655, + "loss": 1.9597, + "step": 5900 + }, + { + "epoch": 1.09, + "learning_rate": 0.00042636946409668123, + "loss": 1.9603, + "step": 5910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042493092707442717, + "loss": 1.9771, + "step": 5920 + }, + { + "epoch": 1.1, + "learning_rate": 0.0004234930254911427, + "loss": 1.9416, + "step": 5930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042205577151826747, + "loss": 1.9417, + "step": 5940 + }, + { + "epoch": 1.1, + "learning_rate": 0.00042061917732175966, + "loss": 1.9636, + "step": 5950 + }, + { + "epoch": 1.1, + "learning_rate": 0.000419183255061992, + "loss": 1.966, + "step": 5960 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004177480168936504, + "loss": 1.9885, + "step": 5970 + }, + { + "epoch": 1.11, + "learning_rate": 0.00041631347496562913, + "loss": 1.9525, + "step": 5980 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004148796414209297, + "loss": 1.9809, + "step": 5990 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004134465283965568, + "loss": 1.8982, + "step": 6000 + }, + { + "epoch": 1.11, + "learning_rate": 0.00041201414802341643, + "loss": 1.8978, + "step": 6010 + }, + { + "epoch": 1.12, + "learning_rate": 0.00041058251242621295, + "loss": 1.9406, + "step": 6020 + }, + { + "epoch": 1.12, + "learning_rate": 0.0004091516337233464, + "loss": 1.919, + "step": 6030 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040772152402680973, + "loss": 1.9897, + "step": 6040 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040629219544208644, + "loss": 1.9473, + "step": 6050 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040486366006804817, + "loss": 1.9589, + "step": 6060 + }, + { + "epoch": 1.12, + "learning_rate": 0.00040343592999685264, + "loss": 1.8972, + "step": 6070 + }, + { + "epoch": 1.13, + "learning_rate": 0.0004020090173138404, + "loss": 1.9611, + "step": 6080 + }, + { + "epoch": 1.13, + "learning_rate": 0.00040058293409743316, + "loss": 1.9164, + "step": 6090 + }, + { + "epoch": 1.13, + "learning_rate": 0.00039915769241903175, + "loss": 1.939, + "step": 6100 + }, + { + "epoch": 1.13, + "learning_rate": 0.0003977333043429129, + "loss": 1.9233, + "step": 6110 + }, + { + "epoch": 1.13, + "learning_rate": 0.0003963097819261288, + "loss": 1.9742, + "step": 6120 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003948871372184033, + "loss": 1.9719, + "step": 6130 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003934653822620309, + "loss": 1.9861, + "step": 6140 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003920445290917747, + "loss": 1.9514, + "step": 6150 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003906245897347643, + "loss": 2.0047, + "step": 6160 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003892055762103943, + "loss": 1.934, + "step": 6170 + }, + { + "epoch": 1.14, + "learning_rate": 0.0003877875005302223, + "loss": 1.9619, + "step": 6180 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038637037469786727, + "loss": 1.9085, + "step": 6190 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038495421070890796, + "loss": 1.9222, + "step": 6200 + }, + { + "epoch": 1.15, + "learning_rate": 0.0003835390205507812, + "loss": 1.9409, + "step": 6210 + }, + { + "epoch": 1.15, + "learning_rate": 0.00038212481620268125, + "loss": 1.9439, + "step": 6220 + }, + { + "epoch": 1.15, + "learning_rate": 0.000380711609635457, + "loss": 1.974, + "step": 6230 + }, + { + "epoch": 1.16, + "learning_rate": 0.000379299412811512, + "loss": 1.9141, + "step": 6240 + }, + { + "epoch": 1.16, + "learning_rate": 0.00037788823768470227, + "loss": 1.8982, + "step": 6250 + }, + { + "epoch": 1.16, + "learning_rate": 0.0003764780962002352, + "loss": 1.9384, + "step": 6260 + }, + { + "epoch": 1.16, + "learning_rate": 0.0003750690002945695, + "loss": 1.9174, + "step": 6270 + }, + { + "epoch": 1.16, + "learning_rate": 0.00037366096189531253, + "loss": 1.927, + "step": 6280 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003722539929211205, + "loss": 1.9449, + "step": 6290 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003708481052815973, + "loss": 2.008, + "step": 6300 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003694433108771933, + "loss": 1.9345, + "step": 6310 + }, + { + "epoch": 1.17, + "learning_rate": 0.00036803962159910543, + "loss": 1.8619, + "step": 6320 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003666370493291757, + "loss": 1.9612, + "step": 6330 + }, + { + "epoch": 1.17, + "learning_rate": 0.0003652356059397909, + "loss": 1.9371, + "step": 6340 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036383530329378225, + "loss": 1.9193, + "step": 6350 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036243615324432494, + "loss": 1.9509, + "step": 6360 + }, + { + "epoch": 1.18, + "learning_rate": 0.00036103816763483775, + "loss": 1.9517, + "step": 6370 + }, + { + "epoch": 1.18, + "learning_rate": 0.00035964135829888287, + "loss": 1.9141, + "step": 6380 + }, + { + "epoch": 1.18, + "learning_rate": 0.00035824573706006547, + "loss": 1.9985, + "step": 6390 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035685131573193386, + "loss": 1.9791, + "step": 6400 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035545810611787925, + "loss": 1.8865, + "step": 6410 + }, + { + "epoch": 1.19, + "learning_rate": 0.0003540661200110367, + "loss": 1.9409, + "step": 6420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035267536919418395, + "loss": 1.9928, + "step": 6430 + }, + { + "epoch": 1.19, + "learning_rate": 0.00035128586543964243, + "loss": 1.9149, + "step": 6440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00034989762050917784, + "loss": 1.9837, + "step": 6450 + }, + { + "epoch": 1.2, + "learning_rate": 0.0003485106461538999, + "loss": 1.9142, + "step": 6460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034712495411416385, + "loss": 1.9284, + "step": 6470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034574055611946984, + "loss": 1.8848, + "step": 6480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034435746388836457, + "loss": 1.9295, + "step": 6490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00034297568912834177, + "loss": 1.9635, + "step": 6500 + }, + { + "epoch": 1.21, + "learning_rate": 0.0003415952435357431, + "loss": 1.9794, + "step": 6510 + }, + { + "epoch": 1.21, + "learning_rate": 0.00034021613879565944, + "loss": 1.9347, + "step": 6520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00033883838658183154, + "loss": 1.9282, + "step": 6530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00033746199855655125, + "loss": 1.9973, + "step": 6540 + }, + { + "epoch": 1.21, + "learning_rate": 0.000336086986370563, + "loss": 1.9718, + "step": 6550 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003347133616629652, + "loss": 1.9157, + "step": 6560 + }, + { + "epoch": 1.22, + "learning_rate": 0.00033334113606111194, + "loss": 1.9528, + "step": 6570 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003319703211805135, + "loss": 1.9369, + "step": 6580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00033060092862473967, + "loss": 1.9552, + "step": 6590 + }, + { + "epoch": 1.22, + "learning_rate": 0.00032923296998532003, + "loss": 1.9581, + "step": 6600 + }, + { + "epoch": 1.22, + "learning_rate": 0.0003278664568416465, + "loss": 1.9406, + "step": 6610 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003265014007608758, + "loss": 1.9672, + "step": 6620 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003251378132978304, + "loss": 1.9166, + "step": 6630 + }, + { + "epoch": 1.23, + "learning_rate": 0.00032377570599490164, + "loss": 1.9356, + "step": 6640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00032241509038195165, + "loss": 1.9092, + "step": 6650 + }, + { + "epoch": 1.23, + "learning_rate": 0.0003210559779762157, + "loss": 1.9343, + "step": 6660 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031969838028220513, + "loss": 1.9796, + "step": 6670 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031834230879160947, + "loss": 1.8932, + "step": 6680 + }, + { + "epoch": 1.24, + "learning_rate": 0.0003169877749831993, + "loss": 1.9279, + "step": 6690 + }, + { + "epoch": 1.24, + "learning_rate": 0.000315634790322729, + "loss": 1.9444, + "step": 6700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031428336626284037, + "loss": 1.9296, + "step": 6710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00031293351424296467, + "loss": 1.9341, + "step": 6720 + }, + { + "epoch": 1.25, + "learning_rate": 0.00031158524568922663, + "loss": 1.9589, + "step": 6730 + }, + { + "epoch": 1.25, + "learning_rate": 0.00031023857201434703, + "loss": 1.8997, + "step": 6740 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003088935046175466, + "loss": 1.9417, + "step": 6750 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003075500548844492, + "loss": 1.9058, + "step": 6760 + }, + { + "epoch": 1.25, + "learning_rate": 0.0003062082341869862, + "loss": 1.9511, + "step": 6770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00030486805388329894, + "loss": 1.922, + "step": 6780 + }, + { + "epoch": 1.26, + "learning_rate": 0.00030352952531764363, + "loss": 1.9634, + "step": 6790 + }, + { + "epoch": 1.26, + "learning_rate": 0.0003021926598202949, + "loss": 1.9555, + "step": 6800 + }, + { + "epoch": 1.26, + "learning_rate": 0.0003008574687074498, + "loss": 1.9254, + "step": 6810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00029952396328113265, + "loss": 1.9211, + "step": 6820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029819215482909846, + "loss": 1.9504, + "step": 6830 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029686205462473784, + "loss": 1.9174, + "step": 6840 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029553367392698177, + "loss": 1.9368, + "step": 6850 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029420702398020595, + "loss": 1.8939, + "step": 6860 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029288211601413586, + "loss": 1.9097, + "step": 6870 + }, + { + "epoch": 1.27, + "learning_rate": 0.00029155896124375156, + "loss": 1.9885, + "step": 6880 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002902375708691925, + "loss": 1.9752, + "step": 6890 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002889179560756634, + "loss": 1.9321, + "step": 6900 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002876001280333391, + "loss": 1.9345, + "step": 6910 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002862840978972698, + "loss": 1.9192, + "step": 6920 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002849698768072877, + "loss": 1.9499, + "step": 6930 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002836574758879107, + "loss": 1.9217, + "step": 6940 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002823469062482503, + "loss": 1.9318, + "step": 6950 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002810381789819167, + "loss": 1.9422, + "step": 6960 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002797313051669247, + "loss": 1.9562, + "step": 6970 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002784262958656003, + "loss": 1.9189, + "step": 6980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00027712316212448663, + "loss": 1.9453, + "step": 6990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027582191497425114, + "loss": 1.9335, + "step": 7000 + }, + { + "epoch": 1.3, + "learning_rate": 0.000274522565429591, + "loss": 1.9724, + "step": 7010 + }, + { + "epoch": 1.3, + "learning_rate": 0.0002732251244891421, + "loss": 1.9236, + "step": 7020 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027192960313538307, + "loss": 1.9407, + "step": 7030 + }, + { + "epoch": 1.3, + "learning_rate": 0.0002706360123345445, + "loss": 1.8948, + "step": 7040 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026934436303651554, + "loss": 1.9354, + "step": 7050 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026805466617475007, + "loss": 1.955, + "step": 7060 + }, + { + "epoch": 1.31, + "learning_rate": 0.0002667669326661767, + "loss": 1.9595, + "step": 7070 + }, + { + "epoch": 1.31, + "learning_rate": 0.0002654811734111033, + "loss": 1.9766, + "step": 7080 + }, + { + "epoch": 1.31, + "learning_rate": 0.00026419739929312713, + "loss": 1.9626, + "step": 7090 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002629156211790417, + "loss": 1.9096, + "step": 7100 + }, + { + "epoch": 1.32, + "learning_rate": 0.00026163584991874413, + "loss": 1.9522, + "step": 7110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00026035809634514543, + "loss": 1.9387, + "step": 7120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00025908237127407626, + "loss": 1.8788, + "step": 7130 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002578086855041973, + "loss": 1.9326, + "step": 7140 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002565370498169064, + "loss": 1.92, + "step": 7150 + }, + { + "epoch": 1.33, + "learning_rate": 0.0002552674749762487, + "loss": 1.9131, + "step": 7160 + }, + { + "epoch": 1.33, + "learning_rate": 0.0002539999717288246, + "loss": 1.9263, + "step": 7170 + }, + { + "epoch": 1.33, + "learning_rate": 0.00025286099888629365, + "loss": 1.919, + "step": 7180 + }, + { + "epoch": 1.33, + "learning_rate": 0.000251597461210021, + "loss": 1.9281, + "step": 7190 + }, + { + "epoch": 1.33, + "learning_rate": 0.00025033602619263507, + "loss": 1.9831, + "step": 7200 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024907670451183454, + "loss": 1.9535, + "step": 7210 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024781950682742983, + "loss": 1.8798, + "step": 7220 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024656444378125204, + "loss": 1.9124, + "step": 7230 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024531152599706346, + "loss": 1.9472, + "step": 7240 + }, + { + "epoch": 1.34, + "learning_rate": 0.0002440607640804668, + "loss": 1.9697, + "step": 7250 + }, + { + "epoch": 1.34, + "learning_rate": 0.00024281216861881633, + "loss": 1.938, + "step": 7260 + }, + { + "epoch": 1.35, + "learning_rate": 0.00024156575018112787, + "loss": 1.9035, + "step": 7270 + }, + { + "epoch": 1.35, + "learning_rate": 0.00024032151931798918, + "loss": 1.9379, + "step": 7280 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002390794865614711, + "loss": 1.9176, + "step": 7290 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002378396624250375, + "loss": 1.9392, + "step": 7300 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002366020574034576, + "loss": 1.9235, + "step": 7310 + }, + { + "epoch": 1.36, + "learning_rate": 0.00023536668197271588, + "loss": 1.939, + "step": 7320 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002341335465899243, + "loss": 1.889, + "step": 7330 + }, + { + "epoch": 1.36, + "learning_rate": 0.00023290266169323354, + "loss": 1.9247, + "step": 7340 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002316740377017438, + "loss": 1.935, + "step": 7350 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002304476850154183, + "loss": 1.9198, + "step": 7360 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022922361401499325, + "loss": 1.9068, + "step": 7370 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022800183506189238, + "loss": 1.9505, + "step": 7380 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022678235849813645, + "loss": 1.9459, + "step": 7390 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022556519464625807, + "loss": 1.9302, + "step": 7400 + }, + { + "epoch": 1.37, + "learning_rate": 0.00022435035380921321, + "loss": 1.9345, + "step": 7410 + }, + { + "epoch": 1.37, + "learning_rate": 0.0002231378462702935, + "loss": 1.9304, + "step": 7420 + }, + { + "epoch": 1.38, + "learning_rate": 0.00022192768229304107, + "loss": 1.9457, + "step": 7430 + }, + { + "epoch": 1.38, + "learning_rate": 0.0002207198721211593, + "loss": 1.9395, + "step": 7440 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021951442597842785, + "loss": 1.9867, + "step": 7450 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021831135406861558, + "loss": 1.9217, + "step": 7460 + }, + { + "epoch": 1.38, + "learning_rate": 0.00021711066657539342, + "loss": 1.991, + "step": 7470 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021591237366225008, + "loss": 1.9492, + "step": 7480 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021471648547240365, + "loss": 1.9376, + "step": 7490 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021352301212871762, + "loss": 1.9436, + "step": 7500 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021233196373361397, + "loss": 1.9267, + "step": 7510 + }, + { + "epoch": 1.39, + "learning_rate": 0.00021114335036898852, + "loss": 1.9483, + "step": 7520 + }, + { + "epoch": 1.39, + "learning_rate": 0.0002099571820961252, + "loss": 1.9485, + "step": 7530 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020877346895561082, + "loss": 1.9607, + "step": 7540 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020759222096725034, + "loss": 1.9665, + "step": 7550 + }, + { + "epoch": 1.4, + "learning_rate": 0.0002064134481299814, + "loss": 1.9202, + "step": 7560 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020523716042179075, + "loss": 1.9375, + "step": 7570 + }, + { + "epoch": 1.4, + "learning_rate": 0.00020406336779962888, + "loss": 1.9406, + "step": 7580 + }, + { + "epoch": 1.41, + "learning_rate": 0.00020289208019932635, + "loss": 1.9357, + "step": 7590 + }, + { + "epoch": 1.41, + "learning_rate": 0.0002017233075355089, + "loss": 1.9432, + "step": 7600 + }, + { + "epoch": 1.41, + "learning_rate": 0.0002005570597015145, + "loss": 1.962, + "step": 7610 + }, + { + "epoch": 1.41, + "learning_rate": 0.00019939334656930892, + "loss": 1.9237, + "step": 7620 + }, + { + "epoch": 1.41, + "learning_rate": 0.00019823217798940247, + "loss": 1.9688, + "step": 7630 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019707356379076668, + "loss": 1.9524, + "step": 7640 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019591751378075035, + "loss": 1.981, + "step": 7650 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019476403774499774, + "loss": 1.9405, + "step": 7660 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001936131454473649, + "loss": 1.9, + "step": 7670 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019246484662983733, + "loss": 1.8852, + "step": 7680 + }, + { + "epoch": 1.42, + "learning_rate": 0.00019131915101244752, + "loss": 1.9447, + "step": 7690 + }, + { + "epoch": 1.43, + "learning_rate": 0.00019017606829319205, + "loss": 1.9221, + "step": 7700 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018903560814795086, + "loss": 1.9481, + "step": 7710 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018789778023040355, + "loss": 1.8919, + "step": 7720 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001867625941719499, + "loss": 1.94, + "step": 7730 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018563005958162587, + "loss": 1.9089, + "step": 7740 + }, + { + "epoch": 1.44, + "learning_rate": 0.00018450018604602414, + "loss": 1.9105, + "step": 7750 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001833729831292123, + "loss": 1.9568, + "step": 7760 + }, + { + "epoch": 1.44, + "learning_rate": 0.00018224846037265125, + "loss": 1.9156, + "step": 7770 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001811266272951162, + "loss": 1.9445, + "step": 7780 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001800074933926138, + "loss": 1.8871, + "step": 7790 + }, + { + "epoch": 1.44, + "learning_rate": 0.00017889106813830363, + "loss": 1.9684, + "step": 7800 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001777773609824173, + "loss": 1.9411, + "step": 7810 + }, + { + "epoch": 1.45, + "learning_rate": 0.00017666638135217783, + "loss": 1.9295, + "step": 7820 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001755581386517216, + "loss": 1.9499, + "step": 7830 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001744526422620165, + "loss": 1.9499, + "step": 7840 + }, + { + "epoch": 1.45, + "learning_rate": 0.00017334990154078446, + "loss": 1.9262, + "step": 7850 + }, + { + "epoch": 1.46, + "learning_rate": 0.00017224992582242076, + "loss": 1.9554, + "step": 7860 + }, + { + "epoch": 1.46, + "learning_rate": 0.00017115272441791635, + "loss": 1.9685, + "step": 7870 + }, + { + "epoch": 1.46, + "learning_rate": 0.000170058306614778, + "loss": 1.9021, + "step": 7880 + }, + { + "epoch": 1.46, + "learning_rate": 0.00016896668167695018, + "loss": 1.8804, + "step": 7890 + }, + { + "epoch": 1.46, + "learning_rate": 0.00016787785884473665, + "loss": 1.9164, + "step": 7900 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016679184733472163, + "loss": 1.9409, + "step": 7910 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016570865633969283, + "loss": 1.9329, + "step": 7920 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016462829502856286, + "loss": 1.9518, + "step": 7930 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016355077254629196, + "loss": 1.9494, + "step": 7940 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016247609801381003, + "loss": 1.9376, + "step": 7950 + }, + { + "epoch": 1.47, + "learning_rate": 0.00016140428052794042, + "loss": 1.9312, + "step": 7960 + }, + { + "epoch": 1.48, + "learning_rate": 0.00016033532916132203, + "loss": 1.9528, + "step": 7970 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015926925296233296, + "loss": 1.9698, + "step": 7980 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015820606095501405, + "loss": 1.936, + "step": 7990 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015714576213899167, + "loss": 1.962, + "step": 8000 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015608836548940252, + "loss": 1.9439, + "step": 8010 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015503387995681732, + "loss": 1.9274, + "step": 8020 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001539823144671648, + "loss": 1.9029, + "step": 8030 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015293367792165664, + "loss": 1.928, + "step": 8040 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015188797919671115, + "loss": 1.9405, + "step": 8050 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015084522714387967, + "loss": 1.909, + "step": 8060 + }, + { + "epoch": 1.49, + "learning_rate": 0.00014980543058976977, + "loss": 1.9286, + "step": 8070 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014876859833597278, + "loss": 1.9358, + "step": 8080 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014773473915898695, + "loss": 1.9073, + "step": 8090 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014670386181014477, + "loss": 1.9044, + "step": 8100 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014567597501553847, + "loss": 1.9133, + "step": 8110 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001446510874759454, + "loss": 1.9583, + "step": 8120 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014362920786675616, + "loss": 1.9381, + "step": 8130 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014261034483789892, + "loss": 1.951, + "step": 8140 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014159450701376803, + "loss": 1.9806, + "step": 8150 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014058170299315027, + "loss": 1.9101, + "step": 8160 + }, + { + "epoch": 1.51, + "learning_rate": 0.00013957194134915147, + "loss": 1.9122, + "step": 8170 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013856523062912569, + "loss": 1.91, + "step": 8180 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001375615793546006, + "loss": 1.9182, + "step": 8190 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013656099602120752, + "loss": 1.9312, + "step": 8200 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013556348909860762, + "loss": 1.9327, + "step": 8210 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013456906703042165, + "loss": 1.9184, + "step": 8220 + }, + { + "epoch": 1.52, + "learning_rate": 0.00013357773823415782, + "loss": 1.8876, + "step": 8230 + }, + { + "epoch": 1.53, + "learning_rate": 0.00013258951110114054, + "loss": 1.927, + "step": 8240 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001316043939964398, + "loss": 1.9525, + "step": 8250 + }, + { + "epoch": 1.53, + "learning_rate": 0.00013062239525879943, + "loss": 1.8933, + "step": 8260 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001296435232005677, + "loss": 1.9433, + "step": 8270 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001286677861076263, + "loss": 1.9306, + "step": 8280 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012769519223932034, + "loss": 1.8962, + "step": 8290 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012672574982838802, + "loss": 1.9322, + "step": 8300 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012575946708089176, + "loss": 1.9191, + "step": 8310 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001247963521761481, + "loss": 1.9308, + "step": 8320 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012383641326665874, + "loss": 1.8876, + "step": 8330 + }, + { + "epoch": 1.54, + "learning_rate": 0.00012287965847804162, + "loss": 1.9103, + "step": 8340 + }, + { + "epoch": 1.55, + "learning_rate": 0.00012192609590896142, + "loss": 1.8804, + "step": 8350 + }, + { + "epoch": 1.55, + "learning_rate": 0.00012097573363106218, + "loss": 1.944, + "step": 8360 + }, + { + "epoch": 1.55, + "learning_rate": 0.00012002857968889797, + "loss": 1.9259, + "step": 8370 + }, + { + "epoch": 1.55, + "learning_rate": 0.00011908464209986541, + "loss": 1.9421, + "step": 8380 + }, + { + "epoch": 1.55, + "learning_rate": 0.00011814392885413567, + "loss": 1.9251, + "step": 8390 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011720644791458623, + "loss": 1.9106, + "step": 8400 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011627220721673459, + "loss": 1.8928, + "step": 8410 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011534121466866986, + "loss": 1.9323, + "step": 8420 + }, + { + "epoch": 1.56, + "learning_rate": 0.00011441347815098735, + "loss": 1.9238, + "step": 8430 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001134890055167201, + "loss": 1.9831, + "step": 8440 + }, + { + "epoch": 1.57, + "learning_rate": 0.00011256780459127374, + "loss": 1.85, + "step": 8450 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001116498831723598, + "loss": 1.9391, + "step": 8460 + }, + { + "epoch": 1.57, + "learning_rate": 0.00011073524902992921, + "loss": 1.9071, + "step": 8470 + }, + { + "epoch": 1.57, + "learning_rate": 0.00010982390990610791, + "loss": 1.9538, + "step": 8480 + }, + { + "epoch": 1.57, + "learning_rate": 0.00010891587351512949, + "loss": 1.8972, + "step": 8490 + }, + { + "epoch": 1.57, + "learning_rate": 0.00010801114754327135, + "loss": 1.9184, + "step": 8500 + }, + { + "epoch": 1.58, + "learning_rate": 0.00010710973964878906, + "loss": 1.9567, + "step": 8510 + }, + { + "epoch": 1.58, + "learning_rate": 0.00010621165746185113, + "loss": 1.9755, + "step": 8520 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001053169085844758, + "loss": 1.9256, + "step": 8530 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001044255005904648, + "loss": 1.9742, + "step": 8540 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001035374410253408, + "loss": 1.9562, + "step": 8550 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001026527374062825, + "loss": 1.9432, + "step": 8560 + }, + { + "epoch": 1.59, + "learning_rate": 0.00010177139722206191, + "loss": 1.9007, + "step": 8570 + }, + { + "epoch": 1.59, + "learning_rate": 0.00010089342793298028, + "loss": 1.9834, + "step": 8580 + }, + { + "epoch": 1.59, + "learning_rate": 0.00010001883697080504, + "loss": 1.9063, + "step": 8590 + }, + { + "epoch": 1.59, + "learning_rate": 9.914763173870738e-05, + "loss": 1.9063, + "step": 8600 + }, + { + "epoch": 1.59, + "learning_rate": 9.827981961119869e-05, + "loss": 1.9149, + "step": 8610 + }, + { + "epoch": 1.6, + "learning_rate": 9.741540793406911e-05, + "loss": 1.9096, + "step": 8620 + }, + { + "epoch": 1.6, + "learning_rate": 9.655440402432464e-05, + "loss": 1.8657, + "step": 8630 + }, + { + "epoch": 1.6, + "learning_rate": 9.569681517012585e-05, + "loss": 1.9237, + "step": 8640 + }, + { + "epoch": 1.6, + "learning_rate": 9.484264863072523e-05, + "loss": 1.9739, + "step": 8650 + }, + { + "epoch": 1.6, + "learning_rate": 9.399191163640675e-05, + "loss": 1.9199, + "step": 8660 + }, + { + "epoch": 1.61, + "learning_rate": 9.314461138842406e-05, + "loss": 1.9639, + "step": 8670 + }, + { + "epoch": 1.61, + "learning_rate": 9.230075505893987e-05, + "loss": 1.9391, + "step": 8680 + }, + { + "epoch": 1.61, + "learning_rate": 9.146034979096496e-05, + "loss": 1.9326, + "step": 8690 + }, + { + "epoch": 1.61, + "learning_rate": 9.06234026982976e-05, + "loss": 1.9501, + "step": 8700 + }, + { + "epoch": 1.61, + "learning_rate": 8.9789920865464e-05, + "loss": 1.9041, + "step": 8710 + }, + { + "epoch": 1.62, + "learning_rate": 8.895991134765758e-05, + "loss": 1.931, + "step": 8720 + }, + { + "epoch": 1.62, + "learning_rate": 8.813338117067965e-05, + "loss": 1.9589, + "step": 8730 + }, + { + "epoch": 1.62, + "learning_rate": 8.731033733088012e-05, + "loss": 1.9226, + "step": 8740 + }, + { + "epoch": 1.62, + "learning_rate": 8.649078679509742e-05, + "loss": 1.911, + "step": 8750 + }, + { + "epoch": 1.62, + "learning_rate": 8.567473650060082e-05, + "loss": 1.9641, + "step": 8760 + }, + { + "epoch": 1.62, + "learning_rate": 8.486219335503026e-05, + "loss": 1.8924, + "step": 8770 + }, + { + "epoch": 1.63, + "learning_rate": 8.405316423633958e-05, + "loss": 1.9583, + "step": 8780 + }, + { + "epoch": 1.63, + "learning_rate": 8.324765599273649e-05, + "loss": 1.9399, + "step": 8790 + }, + { + "epoch": 1.63, + "learning_rate": 8.244567544262588e-05, + "loss": 1.9362, + "step": 8800 + }, + { + "epoch": 1.63, + "learning_rate": 8.164722937455177e-05, + "loss": 1.9283, + "step": 8810 + }, + { + "epoch": 1.63, + "learning_rate": 8.08523245471392e-05, + "loss": 1.9588, + "step": 8820 + }, + { + "epoch": 1.64, + "learning_rate": 8.006096768903848e-05, + "loss": 1.9126, + "step": 8830 + }, + { + "epoch": 1.64, + "learning_rate": 7.927316549886659e-05, + "loss": 1.9331, + "step": 8840 + }, + { + "epoch": 1.64, + "learning_rate": 7.84889246451515e-05, + "loss": 1.8967, + "step": 8850 + }, + { + "epoch": 1.64, + "learning_rate": 7.77082517662756e-05, + "loss": 1.927, + "step": 8860 + }, + { + "epoch": 1.64, + "learning_rate": 7.693115347041884e-05, + "loss": 1.8978, + "step": 8870 + }, + { + "epoch": 1.64, + "learning_rate": 7.615763633550421e-05, + "loss": 1.9142, + "step": 8880 + }, + { + "epoch": 1.65, + "learning_rate": 7.538770690914015e-05, + "loss": 1.9001, + "step": 8890 + }, + { + "epoch": 1.65, + "learning_rate": 7.462137170856698e-05, + "loss": 1.8979, + "step": 8900 + }, + { + "epoch": 1.65, + "learning_rate": 7.385863722060022e-05, + "loss": 1.892, + "step": 8910 + }, + { + "epoch": 1.65, + "learning_rate": 7.309950990157677e-05, + "loss": 1.9496, + "step": 8920 + }, + { + "epoch": 1.65, + "learning_rate": 7.234399617729976e-05, + "loss": 1.8879, + "step": 8930 + }, + { + "epoch": 1.66, + "learning_rate": 7.159210244298414e-05, + "loss": 1.921, + "step": 8940 + }, + { + "epoch": 1.66, + "learning_rate": 7.084383506320291e-05, + "loss": 1.9408, + "step": 8950 + }, + { + "epoch": 1.66, + "learning_rate": 7.009920037183248e-05, + "loss": 1.9258, + "step": 8960 + }, + { + "epoch": 1.66, + "learning_rate": 6.935820467200005e-05, + "loss": 1.9182, + "step": 8970 + }, + { + "epoch": 1.66, + "learning_rate": 6.862085423602955e-05, + "loss": 1.9668, + "step": 8980 + }, + { + "epoch": 1.67, + "learning_rate": 6.78871553053888e-05, + "loss": 1.898, + "step": 8990 + }, + { + "epoch": 1.67, + "learning_rate": 6.715711409063652e-05, + "loss": 1.9261, + "step": 9000 + }, + { + "epoch": 1.67, + "learning_rate": 6.643073677136996e-05, + "loss": 1.9167, + "step": 9010 + }, + { + "epoch": 1.67, + "learning_rate": 6.570802949617261e-05, + "loss": 1.9066, + "step": 9020 + }, + { + "epoch": 1.67, + "learning_rate": 6.49889983825619e-05, + "loss": 1.9091, + "step": 9030 + }, + { + "epoch": 1.67, + "learning_rate": 6.427364951693776e-05, + "loss": 1.8853, + "step": 9040 + }, + { + "epoch": 1.68, + "learning_rate": 6.356198895453053e-05, + "loss": 1.9459, + "step": 9050 + }, + { + "epoch": 1.68, + "learning_rate": 6.285402271935048e-05, + "loss": 1.9073, + "step": 9060 + }, + { + "epoch": 1.68, + "learning_rate": 6.214975680413621e-05, + "loss": 1.902, + "step": 9070 + }, + { + "epoch": 1.68, + "learning_rate": 6.144919717030417e-05, + "loss": 1.8812, + "step": 9080 + }, + { + "epoch": 1.68, + "learning_rate": 6.075234974789839e-05, + "loss": 1.8672, + "step": 9090 + }, + { + "epoch": 1.69, + "learning_rate": 6.005922043553952e-05, + "loss": 1.9297, + "step": 9100 + }, + { + "epoch": 1.69, + "learning_rate": 5.9369815100376037e-05, + "loss": 1.8775, + "step": 9110 + }, + { + "epoch": 1.69, + "learning_rate": 5.868413957803331e-05, + "loss": 1.8831, + "step": 9120 + }, + { + "epoch": 1.69, + "learning_rate": 5.800219967256576e-05, + "loss": 1.9026, + "step": 9130 + }, + { + "epoch": 1.69, + "learning_rate": 5.7324001156406014e-05, + "loss": 1.8944, + "step": 9140 + }, + { + "epoch": 1.69, + "learning_rate": 5.664954977031733e-05, + "loss": 1.9154, + "step": 9150 + }, + { + "epoch": 1.7, + "learning_rate": 5.5978851223344455e-05, + "loss": 1.8994, + "step": 9160 + }, + { + "epoch": 1.7, + "learning_rate": 5.531191119276513e-05, + "loss": 1.9397, + "step": 9170 + }, + { + "epoch": 1.7, + "learning_rate": 5.4648735324042855e-05, + "loss": 1.9416, + "step": 9180 + }, + { + "epoch": 1.7, + "learning_rate": 5.398932923077793e-05, + "loss": 1.9207, + "step": 9190 + }, + { + "epoch": 1.7, + "learning_rate": 5.333369849466091e-05, + "loss": 1.9061, + "step": 9200 + }, + { + "epoch": 1.71, + "learning_rate": 5.268184866542502e-05, + "loss": 1.8861, + "step": 9210 + }, + { + "epoch": 1.71, + "learning_rate": 5.2033785260798716e-05, + "loss": 1.9433, + "step": 9220 + }, + { + "epoch": 1.71, + "learning_rate": 5.138951376646012e-05, + "loss": 1.9158, + "step": 9230 + }, + { + "epoch": 1.71, + "learning_rate": 5.074903963598926e-05, + "loss": 1.8898, + "step": 9240 + }, + { + "epoch": 1.71, + "learning_rate": 5.0112368290822885e-05, + "loss": 1.9041, + "step": 9250 + }, + { + "epoch": 1.72, + "learning_rate": 4.9479505120207934e-05, + "loss": 1.9605, + "step": 9260 + }, + { + "epoch": 1.72, + "learning_rate": 4.885045548115646e-05, + "loss": 1.8975, + "step": 9270 + }, + { + "epoch": 1.72, + "learning_rate": 4.822522469839996e-05, + "loss": 1.9396, + "step": 9280 + }, + { + "epoch": 1.72, + "learning_rate": 4.760381806434427e-05, + "loss": 1.9263, + "step": 9290 + }, + { + "epoch": 1.72, + "learning_rate": 4.698624083902503e-05, + "loss": 1.948, + "step": 9300 + }, + { + "epoch": 1.72, + "learning_rate": 4.637249825006273e-05, + "loss": 1.9206, + "step": 9310 + }, + { + "epoch": 1.73, + "learning_rate": 4.5762595492618906e-05, + "loss": 1.9129, + "step": 9320 + }, + { + "epoch": 1.73, + "learning_rate": 4.515653772935207e-05, + "loss": 1.9036, + "step": 9330 + }, + { + "epoch": 1.73, + "learning_rate": 4.455433009037385e-05, + "loss": 1.928, + "step": 9340 + }, + { + "epoch": 1.73, + "learning_rate": 4.395597767320536e-05, + "loss": 1.9427, + "step": 9350 + }, + { + "epoch": 1.73, + "learning_rate": 4.336148554273467e-05, + "loss": 1.8882, + "step": 9360 + }, + { + "epoch": 1.74, + "learning_rate": 4.277085873117354e-05, + "loss": 1.9412, + "step": 9370 + }, + { + "epoch": 1.74, + "learning_rate": 4.218410223801472e-05, + "loss": 1.9014, + "step": 9380 + }, + { + "epoch": 1.74, + "learning_rate": 4.1601221029989976e-05, + "loss": 1.9056, + "step": 9390 + }, + { + "epoch": 1.74, + "learning_rate": 4.102222004102768e-05, + "loss": 1.9665, + "step": 9400 + }, + { + "epoch": 1.74, + "learning_rate": 4.04471041722112e-05, + "loss": 1.8911, + "step": 9410 + }, + { + "epoch": 1.74, + "learning_rate": 3.987587829173772e-05, + "loss": 1.885, + "step": 9420 + }, + { + "epoch": 1.75, + "learning_rate": 3.930854723487642e-05, + "loss": 1.8958, + "step": 9430 + }, + { + "epoch": 1.75, + "learning_rate": 3.874511580392814e-05, + "loss": 1.9197, + "step": 9440 + }, + { + "epoch": 1.75, + "learning_rate": 3.818558876818418e-05, + "loss": 1.9174, + "step": 9450 + }, + { + "epoch": 1.75, + "learning_rate": 3.762997086388653e-05, + "loss": 1.9321, + "step": 9460 + }, + { + "epoch": 1.75, + "learning_rate": 3.707826679418702e-05, + "loss": 1.8835, + "step": 9470 + }, + { + "epoch": 1.76, + "learning_rate": 3.653048122910862e-05, + "loss": 1.9083, + "step": 9480 + }, + { + "epoch": 1.76, + "learning_rate": 3.598661880550452e-05, + "loss": 1.9082, + "step": 9490 + }, + { + "epoch": 1.76, + "learning_rate": 3.544668412702007e-05, + "loss": 1.9696, + "step": 9500 + }, + { + "epoch": 1.76, + "learning_rate": 3.491068176405326e-05, + "loss": 1.9232, + "step": 9510 + }, + { + "epoch": 1.76, + "learning_rate": 3.43786162537158e-05, + "loss": 1.8944, + "step": 9520 + }, + { + "epoch": 1.77, + "learning_rate": 3.385049209979568e-05, + "loss": 1.9341, + "step": 9530 + }, + { + "epoch": 1.77, + "learning_rate": 3.3326313772717667e-05, + "loss": 1.9, + "step": 9540 + }, + { + "epoch": 1.77, + "learning_rate": 3.2806085709506716e-05, + "loss": 1.9157, + "step": 9550 + }, + { + "epoch": 1.77, + "learning_rate": 3.228981231374972e-05, + "loss": 1.9287, + "step": 9560 + }, + { + "epoch": 1.77, + "learning_rate": 3.177749795555812e-05, + "loss": 1.9375, + "step": 9570 + }, + { + "epoch": 1.77, + "learning_rate": 3.126914697153182e-05, + "loss": 1.9171, + "step": 9580 + }, + { + "epoch": 1.78, + "learning_rate": 3.076476366472131e-05, + "loss": 1.8778, + "step": 9590 + }, + { + "epoch": 1.78, + "learning_rate": 3.0264352304592123e-05, + "loss": 1.919, + "step": 9600 + }, + { + "epoch": 1.78, + "learning_rate": 2.9767917126987952e-05, + "loss": 1.891, + "step": 9610 + }, + { + "epoch": 1.78, + "learning_rate": 2.927546233409567e-05, + "loss": 1.921, + "step": 9620 + }, + { + "epoch": 1.78, + "learning_rate": 2.8786992094409102e-05, + "loss": 1.9178, + "step": 9630 + }, + { + "epoch": 1.79, + "learning_rate": 2.8302510542693782e-05, + "loss": 1.8917, + "step": 9640 + }, + { + "epoch": 1.79, + "learning_rate": 2.7822021779952467e-05, + "loss": 1.9141, + "step": 9650 + }, + { + "epoch": 1.79, + "learning_rate": 2.7345529873389618e-05, + "loss": 1.8737, + "step": 9660 + }, + { + "epoch": 1.79, + "learning_rate": 2.687303885637765e-05, + "loss": 1.9349, + "step": 9670 + }, + { + "epoch": 1.79, + "learning_rate": 2.6404552728422625e-05, + "loss": 1.919, + "step": 9680 + }, + { + "epoch": 1.79, + "learning_rate": 2.5940075455130217e-05, + "loss": 1.9411, + "step": 9690 + }, + { + "epoch": 1.8, + "learning_rate": 2.547961096817214e-05, + "loss": 1.9616, + "step": 9700 + }, + { + "epoch": 1.8, + "learning_rate": 2.5023163165253272e-05, + "loss": 1.9431, + "step": 9710 + }, + { + "epoch": 1.8, + "learning_rate": 2.4570735910078078e-05, + "loss": 1.9488, + "step": 9720 + }, + { + "epoch": 1.8, + "learning_rate": 2.4122333032318367e-05, + "loss": 1.9376, + "step": 9730 + }, + { + "epoch": 1.8, + "learning_rate": 2.3677958327580683e-05, + "loss": 1.9038, + "step": 9740 + }, + { + "epoch": 1.81, + "learning_rate": 2.3237615557374137e-05, + "loss": 1.91, + "step": 9750 + }, + { + "epoch": 1.81, + "learning_rate": 2.2801308449078684e-05, + "loss": 1.9058, + "step": 9760 + }, + { + "epoch": 1.81, + "learning_rate": 2.2369040695913445e-05, + "loss": 1.9275, + "step": 9770 + }, + { + "epoch": 1.81, + "learning_rate": 2.1940815956905612e-05, + "loss": 1.9646, + "step": 9780 + }, + { + "epoch": 1.81, + "learning_rate": 2.1516637856859422e-05, + "loss": 1.9127, + "step": 9790 + }, + { + "epoch": 1.82, + "learning_rate": 2.109650998632512e-05, + "loss": 1.9564, + "step": 9800 + }, + { + "epoch": 1.82, + "learning_rate": 2.068043590156926e-05, + "loss": 1.929, + "step": 9810 + }, + { + "epoch": 1.82, + "learning_rate": 2.0268419124544078e-05, + "loss": 1.9185, + "step": 9820 + }, + { + "epoch": 1.82, + "learning_rate": 1.986046314285772e-05, + "loss": 1.8714, + "step": 9830 + }, + { + "epoch": 1.82, + "learning_rate": 1.9456571409744938e-05, + "loss": 1.9149, + "step": 9840 + }, + { + "epoch": 1.82, + "learning_rate": 1.9056747344037616e-05, + "loss": 1.8945, + "step": 9850 + }, + { + "epoch": 1.83, + "learning_rate": 1.8660994330136184e-05, + "loss": 1.9634, + "step": 9860 + }, + { + "epoch": 1.83, + "learning_rate": 1.8269315717980518e-05, + "loss": 1.9449, + "step": 9870 + }, + { + "epoch": 1.83, + "learning_rate": 1.7881714823021976e-05, + "loss": 1.8911, + "step": 9880 + }, + { + "epoch": 1.83, + "learning_rate": 1.7498194926194978e-05, + "loss": 1.9169, + "step": 9890 + }, + { + "epoch": 1.83, + "learning_rate": 1.7118759273889615e-05, + "loss": 1.8699, + "step": 9900 + }, + { + "epoch": 1.84, + "learning_rate": 1.674341107792382e-05, + "loss": 1.9187, + "step": 9910 + }, + { + "epoch": 1.84, + "learning_rate": 1.6372153515516463e-05, + "loss": 1.8754, + "step": 9920 + }, + { + "epoch": 1.84, + "learning_rate": 1.600498972926029e-05, + "loss": 1.9913, + "step": 9930 + }, + { + "epoch": 1.84, + "learning_rate": 1.5641922827095256e-05, + "loss": 1.9162, + "step": 9940 + }, + { + "epoch": 1.84, + "learning_rate": 1.528295588228251e-05, + "loss": 1.9475, + "step": 9950 + }, + { + "epoch": 1.84, + "learning_rate": 1.4928091933378018e-05, + "loss": 1.8907, + "step": 9960 + }, + { + "epoch": 1.85, + "learning_rate": 1.4577333984207186e-05, + "loss": 1.9031, + "step": 9970 + }, + { + "epoch": 1.85, + "learning_rate": 1.4230685003839117e-05, + "loss": 1.8969, + "step": 9980 + }, + { + "epoch": 1.85, + "learning_rate": 1.3888147926561733e-05, + "loss": 1.9272, + "step": 9990 + }, + { + "epoch": 1.85, + "learning_rate": 1.3549725651856804e-05, + "loss": 1.9313, + "step": 10000 + }, + { + "epoch": 1.85, + "learning_rate": 1.3215421044375287e-05, + "loss": 1.8596, + "step": 10010 + }, + { + "epoch": 1.86, + "learning_rate": 1.288523693391358e-05, + "loss": 1.9298, + "step": 10020 + }, + { + "epoch": 1.86, + "learning_rate": 1.255917611538876e-05, + "loss": 1.9298, + "step": 10030 + }, + { + "epoch": 1.86, + "learning_rate": 1.2237241348815765e-05, + "loss": 1.9296, + "step": 10040 + }, + { + "epoch": 1.86, + "learning_rate": 1.1919435359283414e-05, + "loss": 1.876, + "step": 10050 + }, + { + "epoch": 1.86, + "learning_rate": 1.16057608369316e-05, + "loss": 1.9207, + "step": 10060 + }, + { + "epoch": 1.87, + "learning_rate": 1.1296220436928629e-05, + "loss": 1.9311, + "step": 10070 + }, + { + "epoch": 1.87, + "learning_rate": 1.0990816779448353e-05, + "loss": 1.9274, + "step": 10080 + }, + { + "epoch": 1.87, + "learning_rate": 1.0689552449648587e-05, + "loss": 1.9191, + "step": 10090 + }, + { + "epoch": 1.87, + "learning_rate": 1.03924299976485e-05, + "loss": 1.915, + "step": 10100 + }, + { + "epoch": 1.87, + "learning_rate": 1.0099451938507642e-05, + "loss": 1.9141, + "step": 10110 + }, + { + "epoch": 1.87, + "learning_rate": 9.810620752204346e-06, + "loss": 1.9291, + "step": 10120 + }, + { + "epoch": 1.88, + "learning_rate": 9.525938883614915e-06, + "loss": 1.9239, + "step": 10130 + }, + { + "epoch": 1.88, + "learning_rate": 9.24540874249269e-06, + "loss": 1.9016, + "step": 10140 + }, + { + "epoch": 1.88, + "learning_rate": 8.969032703447843e-06, + "loss": 1.9208, + "step": 10150 + }, + { + "epoch": 1.88, + "learning_rate": 8.69681310592718e-06, + "loss": 1.9126, + "step": 10160 + }, + { + "epoch": 1.88, + "learning_rate": 8.428752254194427e-06, + "loss": 1.9194, + "step": 10170 + }, + { + "epoch": 1.89, + "learning_rate": 8.164852417310742e-06, + "loss": 1.9257, + "step": 10180 + }, + { + "epoch": 1.89, + "learning_rate": 7.905115829115238e-06, + "loss": 1.8922, + "step": 10190 + }, + { + "epoch": 1.89, + "learning_rate": 7.6495446882065e-06, + "loss": 1.8865, + "step": 10200 + }, + { + "epoch": 1.89, + "learning_rate": 7.398141157923588e-06, + "loss": 1.9282, + "step": 10210 + }, + { + "epoch": 1.89, + "learning_rate": 7.150907366327952e-06, + "loss": 1.9036, + "step": 10220 + }, + { + "epoch": 1.89, + "learning_rate": 6.907845406185387e-06, + "loss": 1.9347, + "step": 10230 + }, + { + "epoch": 1.9, + "learning_rate": 6.6689573349482666e-06, + "loss": 1.9144, + "step": 10240 + }, + { + "epoch": 1.9, + "learning_rate": 6.434245174738063e-06, + "loss": 1.9082, + "step": 10250 + }, + { + "epoch": 1.9, + "learning_rate": 6.203710912328464e-06, + "loss": 1.8831, + "step": 10260 + }, + { + "epoch": 1.9, + "learning_rate": 5.9773564991283395e-06, + "loss": 1.9163, + "step": 10270 + }, + { + "epoch": 1.9, + "learning_rate": 5.755183851165246e-06, + "loss": 1.8726, + "step": 10280 + }, + { + "epoch": 1.91, + "learning_rate": 5.537194849069283e-06, + "loss": 1.9452, + "step": 10290 + }, + { + "epoch": 1.91, + "learning_rate": 5.323391338057204e-06, + "loss": 1.9356, + "step": 10300 + }, + { + "epoch": 1.91, + "learning_rate": 5.113775127916553e-06, + "loss": 1.8665, + "step": 10310 + }, + { + "epoch": 1.91, + "learning_rate": 4.908347992990836e-06, + "loss": 1.9132, + "step": 10320 + }, + { + "epoch": 1.91, + "learning_rate": 4.7071116721638104e-06, + "loss": 1.912, + "step": 10330 + }, + { + "epoch": 1.92, + "learning_rate": 4.5100678688455576e-06, + "loss": 1.9069, + "step": 10340 + }, + { + "epoch": 1.92, + "learning_rate": 4.317218250957322e-06, + "loss": 1.9197, + "step": 10350 + }, + { + "epoch": 1.92, + "learning_rate": 4.12856445091786e-06, + "loss": 1.8681, + "step": 10360 + }, + { + "epoch": 1.92, + "learning_rate": 3.944108065629559e-06, + "loss": 1.9463, + "step": 10370 + }, + { + "epoch": 1.92, + "learning_rate": 3.763850656464729e-06, + "loss": 1.8796, + "step": 10380 + }, + { + "epoch": 1.92, + "learning_rate": 3.58779374925261e-06, + "loss": 1.8699, + "step": 10390 + }, + { + "epoch": 1.93, + "learning_rate": 3.415938834266219e-06, + "loss": 1.951, + "step": 10400 + }, + { + "epoch": 1.93, + "learning_rate": 3.248287366209912e-06, + "loss": 1.9231, + "step": 10410 + }, + { + "epoch": 1.93, + "learning_rate": 3.0848407642072306e-06, + "loss": 1.9204, + "step": 10420 + }, + { + "epoch": 1.93, + "learning_rate": 2.9256004117883538e-06, + "loss": 1.9499, + "step": 10430 + }, + { + "epoch": 1.93, + "learning_rate": 2.770567656878997e-06, + "loss": 1.9403, + "step": 10440 + }, + { + "epoch": 1.94, + "learning_rate": 2.6197438117885884e-06, + "loss": 1.9381, + "step": 10450 + }, + { + "epoch": 1.94, + "learning_rate": 2.4731301531992214e-06, + "loss": 1.9282, + "step": 10460 + }, + { + "epoch": 1.94, + "learning_rate": 2.3307279221551623e-06, + "loss": 1.9598, + "step": 10470 + }, + { + "epoch": 1.94, + "learning_rate": 2.192538324051918e-06, + "loss": 1.8994, + "step": 10480 + }, + { + "epoch": 1.94, + "learning_rate": 2.05856252862624e-06, + "loss": 1.8849, + "step": 10490 + }, + { + "epoch": 1.94, + "learning_rate": 1.9288016699463006e-06, + "loss": 1.9451, + "step": 10500 + }, + { + "epoch": 1.95, + "learning_rate": 1.8032568464018129e-06, + "loss": 1.8973, + "step": 10510 + }, + { + "epoch": 1.95, + "learning_rate": 1.681929120695147e-06, + "loss": 1.9224, + "step": 10520 + }, + { + "epoch": 1.95, + "learning_rate": 1.564819519832006e-06, + "loss": 1.9441, + "step": 10530 + }, + { + "epoch": 1.95, + "learning_rate": 1.451929035112709e-06, + "loss": 1.9274, + "step": 10540 + }, + { + "epoch": 1.95, + "learning_rate": 1.3432586221240884e-06, + "loss": 1.9057, + "step": 10550 + }, + { + "epoch": 1.96, + "learning_rate": 1.2388092007312169e-06, + "loss": 1.9153, + "step": 10560 + }, + { + "epoch": 1.96, + "learning_rate": 1.138581655069526e-06, + "loss": 1.878, + "step": 10570 + }, + { + "epoch": 1.96, + "learning_rate": 1.0425768335375897e-06, + "loss": 1.8931, + "step": 10580 + }, + { + "epoch": 1.96, + "learning_rate": 9.507955487896291e-07, + "loss": 1.9034, + "step": 10590 + }, + { + "epoch": 1.96, + "learning_rate": 8.632385777289087e-07, + "loss": 1.9457, + "step": 10600 + }, + { + "epoch": 1.97, + "learning_rate": 7.799066615010175e-07, + "loss": 1.9204, + "step": 10610 + }, + { + "epoch": 1.97, + "learning_rate": 7.008005054875422e-07, + "loss": 1.9366, + "step": 10620 + }, + { + "epoch": 1.97, + "learning_rate": 6.259207793003486e-07, + "loss": 1.8985, + "step": 10630 + }, + { + "epoch": 1.97, + "learning_rate": 5.552681167755868e-07, + "loss": 1.9348, + "step": 10640 + }, + { + "epoch": 1.97, + "learning_rate": 4.888431159685291e-07, + "loss": 1.9268, + "step": 10650 + }, + { + "epoch": 1.97, + "learning_rate": 4.266463391484621e-07, + "loss": 1.9166, + "step": 10660 + }, + { + "epoch": 1.98, + "learning_rate": 3.6867831279396856e-07, + "loss": 1.9312, + "step": 10670 + }, + { + "epoch": 1.98, + "learning_rate": 3.1493952758832046e-07, + "loss": 1.9247, + "step": 10680 + }, + { + "epoch": 1.98, + "learning_rate": 2.6543043841548153e-07, + "loss": 1.917, + "step": 10690 + }, + { + "epoch": 1.98, + "learning_rate": 2.2015146435627742e-07, + "loss": 1.8837, + "step": 10700 + }, + { + "epoch": 1.98, + "learning_rate": 1.7910298868467623e-07, + "loss": 1.9174, + "step": 10710 + }, + { + "epoch": 1.99, + "learning_rate": 1.422853588647355e-07, + "loss": 1.9107, + "step": 10720 + }, + { + "epoch": 1.99, + "learning_rate": 1.0969888654749349e-07, + "loss": 1.9253, + "step": 10730 + }, + { + "epoch": 1.99, + "learning_rate": 8.134384756841584e-08, + "loss": 1.9154, + "step": 10740 + }, + { + "epoch": 1.99, + "learning_rate": 5.722048194511942e-08, + "loss": 1.893, + "step": 10750 + }, + { + "epoch": 1.99, + "learning_rate": 3.73289938752075e-08, + "loss": 1.91, + "step": 10760 + }, + { + "epoch": 1.99, + "learning_rate": 2.1669551734604385e-08, + "loss": 1.9416, + "step": 10770 + }, + { + "epoch": 2.0, + "learning_rate": 1.0242288076223182e-08, + "loss": 1.9549, + "step": 10780 + }, + { + "epoch": 2.0, + "learning_rate": 3.047299628633482e-09, + "loss": 1.9516, + "step": 10790 + }, + { + "epoch": 2.0, + "step": 10798, + "total_flos": 1.0247474124569969e+19, + "train_loss": 1.978195481530868, + "train_runtime": 26343.521, + "train_samples_per_second": 26.232, + "train_steps_per_second": 0.41 + } + ], + "max_steps": 10798, + "num_train_epochs": 2, + "total_flos": 1.0247474124569969e+19, + "trial_name": null, + "trial_params": null +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b097aab2293da043bc99abba38a0ed7c4525140a --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8813832b030b0a678cb3ad0abd28db5000bdb8bb1708e45ba10cfda908fcc38 +size 3305