{ "best_metric": 0.5099431818181818, "best_model_checkpoint": "/scratch/elec/puhe/p/palp3/sami_ASR/base_model_output/wav2vec2-base-sami-cont-pt-22k/outputs/shuff_1048/ftpseudowr30esp5/checkpoint-5400", "epoch": 8.0, "eval_steps": 500, "global_step": 8640, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 105.84375762939453, "learning_rate": 2.7391975308641977e-05, "loss": 5346.3694, "step": 1080 }, { "epoch": 1.0, "eval_cer": 1.0, "eval_loss": 1150.5341796875, "eval_runtime": 29.9293, "eval_samples_per_second": 29.737, "eval_steps_per_second": 3.742, "eval_wer": 1.0, "step": 1080 }, { "epoch": 2.0, "grad_norm": 54.39596176147461, "learning_rate": 5.5169753086419756e-05, "loss": 3391.3456, "step": 2160 }, { "epoch": 2.0, "eval_cer": 0.9995307019710518, "eval_loss": 1049.42236328125, "eval_runtime": 29.5506, "eval_samples_per_second": 30.118, "eval_steps_per_second": 3.79, "eval_wer": 1.0, "step": 2160 }, { "epoch": 3.0, "grad_norm": 268.0443115234375, "learning_rate": 8.294753086419752e-05, "loss": 1439.7179, "step": 3240 }, { "epoch": 3.0, "eval_cer": 0.1837178283851208, "eval_loss": 304.00048828125, "eval_runtime": 29.4915, "eval_samples_per_second": 30.178, "eval_steps_per_second": 3.798, "eval_wer": 0.5744949494949495, "step": 3240 }, { "epoch": 4.0, "grad_norm": 176.8555908203125, "learning_rate": 0.00011072530864197532, "loss": 662.4384, "step": 4320 }, { "epoch": 4.0, "eval_cer": 0.1842859259991108, "eval_loss": 300.4794921875, "eval_runtime": 30.2589, "eval_samples_per_second": 29.413, "eval_steps_per_second": 3.701, "eval_wer": 0.53125, "step": 4320 }, { "epoch": 5.0, "grad_norm": 394.7081298828125, "learning_rate": 0.0001385030864197531, "loss": 544.894, "step": 5400 }, { "epoch": 5.0, "eval_cer": 0.1691448895914637, "eval_loss": 301.7199401855469, "eval_runtime": 31.6348, "eval_samples_per_second": 28.134, "eval_steps_per_second": 3.54, "eval_wer": 0.5099431818181818, "step": 5400 }, { "epoch": 6.0, "grad_norm": 226.64849853515625, "learning_rate": 0.00016628086419753085, "loss": 527.8369, "step": 6480 }, { "epoch": 6.0, "eval_cer": 0.20328014622338586, "eval_loss": 351.5502014160156, "eval_runtime": 29.8883, "eval_samples_per_second": 29.778, "eval_steps_per_second": 3.747, "eval_wer": 0.5779671717171717, "step": 6480 }, { "epoch": 7.0, "grad_norm": 586.9916381835938, "learning_rate": 0.0001940329218106996, "loss": 484.5173, "step": 7560 }, { "epoch": 7.0, "eval_cer": 0.18781801116435312, "eval_loss": 340.1422119140625, "eval_runtime": 29.5073, "eval_samples_per_second": 30.162, "eval_steps_per_second": 3.796, "eval_wer": 0.5186237373737373, "step": 7560 }, { "epoch": 8.0, "grad_norm": 9.222601890563965, "learning_rate": 0.0002218106995884774, "loss": 492.0863, "step": 8640 }, { "epoch": 8.0, "eval_cer": 0.2231635627130366, "eval_loss": 426.72216796875, "eval_runtime": 31.2147, "eval_samples_per_second": 28.512, "eval_steps_per_second": 3.588, "eval_wer": 0.5787563131313131, "step": 8640 }, { "epoch": 8.0, "step": 8640, "total_flos": 7.357190851535068e+18, "train_loss": 1611.1507269965277, "train_runtime": 7095.9649, "train_samples_per_second": 146.001, "train_steps_per_second": 9.132 } ], "logging_steps": 500, "max_steps": 64800, "num_input_tokens_seen": 0, "num_train_epochs": 60, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 3, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 3 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 7.357190851535068e+18, "train_batch_size": 16, "trial_name": null, "trial_params": null }