Theoreticallyhugo's picture
Training in progress, epoch 2, checkpoint
0555d17 verified
{
"best_metric": 0.47574615478515625,
"best_model_checkpoint": "longformer-full_labels/checkpoint-82",
"epoch": 2.0,
"eval_steps": 500,
"global_step": 82,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_B-Claim": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 284.0
},
"eval_B-MajorClaim": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 141.0
},
"eval_B-Premise": {
"f1-score": 0.12010443864229765,
"precision": 0.7931034482758621,
"recall": 0.06497175141242938,
"support": 708.0
},
"eval_I-Claim": {
"f1-score": 0.15241779497098645,
"precision": 0.35688405797101447,
"recall": 0.09690113133300542,
"support": 4066.0
},
"eval_I-MajorClaim": {
"f1-score": 0.4055459272097054,
"precision": 0.4854771784232365,
"recall": 0.3482142857142857,
"support": 2016.0
},
"eval_I-Premise": {
"f1-score": 0.8243874805268375,
"precision": 0.7254034519284691,
"recall": 0.9546535465354653,
"support": 12195.0
},
"eval_O": {
"f1-score": 0.8527010510877536,
"precision": 0.8224254998113919,
"recall": 0.8852908334179271,
"support": 9851.0
},
"eval_accuracy": 0.7349372885410614,
"eval_loss": 0.7363316416740417,
"eval_macro avg": {
"f1-score": 0.3364509560625115,
"precision": 0.4547562337728534,
"recall": 0.3357187926304447,
"support": 29261.0
},
"eval_runtime": 1.4874,
"eval_samples_per_second": 53.786,
"eval_steps_per_second": 6.723,
"eval_weighted avg": {
"f1-score": 0.6826734788782265,
"precision": 0.6814305221181916,
"recall": 0.7349372885410614,
"support": 29261.0
},
"step": 41
},
{
"epoch": 2.0,
"eval_B-Claim": {
"f1-score": 0.020905923344947737,
"precision": 1.0,
"recall": 0.01056338028169014,
"support": 284.0
},
"eval_B-MajorClaim": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 141.0
},
"eval_B-Premise": {
"f1-score": 0.7109756097560975,
"precision": 0.6255364806866953,
"recall": 0.8234463276836158,
"support": 708.0
},
"eval_I-Claim": {
"f1-score": 0.5191693290734825,
"precision": 0.5658734764944864,
"recall": 0.4795868175110674,
"support": 4066.0
},
"eval_I-MajorClaim": {
"f1-score": 0.6294067067927773,
"precision": 0.745417515274949,
"recall": 0.5446428571428571,
"support": 2016.0
},
"eval_I-Premise": {
"f1-score": 0.8761396663614285,
"precision": 0.8514935768456895,
"recall": 0.9022550225502255,
"support": 12195.0
},
"eval_O": {
"f1-score": 0.931648308418568,
"precision": 0.9034811635670005,
"recall": 0.9616282610902447,
"support": 9851.0
},
"eval_accuracy": 0.8239636376063703,
"eval_loss": 0.47574615478515625,
"eval_macro avg": {
"f1-score": 0.5268922205353288,
"precision": 0.6702574589812601,
"recall": 0.5317318094656714,
"support": 29261.0
},
"eval_runtime": 1.5047,
"eval_samples_per_second": 53.167,
"eval_steps_per_second": 6.646,
"eval_weighted avg": {
"f1-score": 0.8117058591419718,
"precision": 0.8138696629123667,
"recall": 0.8239636376063703,
"support": 29261.0
},
"step": 82
}
],
"logging_steps": 500,
"max_steps": 205,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 287581625436000.0,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}