{ "best_global_step": 24, "best_metric": 31.195335276967928, "best_model_checkpoint": "/data/hungnm/unisentiment/roberta-base-sentiment/checkpoint-24", "epoch": 4.181818181818182, "eval_steps": 500, "global_step": 25, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.9090909090909091, "grad_norm": 0.0, "learning_rate": 0.0, "loss": 1.9456, "step": 5 }, { "epoch": 1.0, "eval_loss": 1.943359375, "eval_macro_f1": 9.432731429418082, "eval_macro_precision": 17.25200652415304, "eval_macro_recall": 13.460980331549635, "eval_micro_f1": 18.221574344023324, "eval_micro_precision": 18.221574344023324, "eval_micro_recall": 18.221574344023324, "eval_runtime": 0.1703, "eval_samples_per_second": 4027.509, "eval_steps_per_second": 11.742, "step": 6 }, { "epoch": 1.7272727272727273, "grad_norm": 0.0, "learning_rate": 0.0, "loss": 1.7519, "step": 10 }, { "epoch": 2.0, "eval_loss": 1.943359375, "eval_macro_f1": 9.432731429418082, "eval_macro_precision": 17.25200652415304, "eval_macro_recall": 13.460980331549635, "eval_micro_f1": 18.221574344023324, "eval_micro_precision": 18.221574344023324, "eval_micro_recall": 18.221574344023324, "eval_runtime": 0.1648, "eval_samples_per_second": 4161.491, "eval_steps_per_second": 12.133, "step": 12 }, { "epoch": 2.5454545454545454, "grad_norm": 0.0, "learning_rate": 0.0, "loss": 1.7517, "step": 15 }, { "epoch": 3.0, "eval_loss": 1.943359375, "eval_macro_f1": 9.432731429418082, "eval_macro_precision": 17.25200652415304, "eval_macro_recall": 13.460980331549635, "eval_micro_f1": 18.221574344023324, "eval_micro_precision": 18.221574344023324, "eval_micro_recall": 18.221574344023324, "eval_runtime": 0.1698, "eval_samples_per_second": 4040.415, "eval_steps_per_second": 11.78, "step": 18 }, { "epoch": 3.3636363636363638, "grad_norm": 1.8663069009780884, "learning_rate": 5e-05, "loss": 1.7491, "step": 20 }, { "epoch": 4.0, "eval_loss": 1.7236328125, "eval_macro_f1": 6.7936507936507935, "eval_macro_precision": 4.456476468138275, "eval_macro_recall": 14.285714285714285, "eval_micro_f1": 31.195335276967928, "eval_micro_precision": 31.195335276967928, "eval_micro_recall": 31.195335276967928, "eval_runtime": 0.1645, "eval_samples_per_second": 4170.418, "eval_steps_per_second": 12.159, "step": 24 }, { "epoch": 4.181818181818182, "grad_norm": 2.6474199295043945, "learning_rate": 4.4833833507280884e-05, "loss": 1.6352, "step": 25 }, { "epoch": 4.181818181818182, "eval_loss": 1.7158203125, "eval_macro_f1": 6.7936507936507935, "eval_macro_precision": 4.456476468138275, "eval_macro_recall": 14.285714285714285, "eval_micro_f1": 31.195335276967928, "eval_micro_precision": 31.195335276967928, "eval_micro_recall": 31.195335276967928, "eval_runtime": 0.1665, "eval_samples_per_second": 4120.855, "eval_steps_per_second": 12.014, "step": 25 }, { "epoch": 4.181818181818182, "step": 25, "total_flos": 1301189864980480.0, "train_loss": 1.7666796875, "train_runtime": 35.9676, "train_samples_per_second": 771.25, "train_steps_per_second": 0.695 } ], "logging_steps": 5, "max_steps": 25, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 5.0, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1301189864980480.0, "train_batch_size": 512, "trial_name": null, "trial_params": null }