yueqis commited on
Commit
3ad0854
·
verified ·
1 Parent(s): c0c2a3d

Upload trainer_state.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. trainer_state.json +92 -0
trainer_state.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 1.9759229534510432,
6
+ "eval_steps": 1000,
7
+ "global_step": 76,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.2568218298555377,
14
+ "grad_norm": 0.6396063311539051,
15
+ "learning_rate": 9.881480035599667e-06,
16
+ "loss": 0.4811,
17
+ "step": 10
18
+ },
19
+ {
20
+ "epoch": 0.5136436597110754,
21
+ "grad_norm": 0.3654983268045694,
22
+ "learning_rate": 8.966766701456177e-06,
23
+ "loss": 0.2451,
24
+ "step": 20
25
+ },
26
+ {
27
+ "epoch": 0.7704654895666132,
28
+ "grad_norm": 0.28676240172292244,
29
+ "learning_rate": 7.308743066175172e-06,
30
+ "loss": 0.2084,
31
+ "step": 30
32
+ },
33
+ {
34
+ "epoch": 1.0513643659711076,
35
+ "grad_norm": 0.26759225032608386,
36
+ "learning_rate": 5.218096936826681e-06,
37
+ "loss": 0.2115,
38
+ "step": 40
39
+ },
40
+ {
41
+ "epoch": 1.3081861958266452,
42
+ "grad_norm": 0.2861632997496441,
43
+ "learning_rate": 3.0865828381745515e-06,
44
+ "loss": 0.1767,
45
+ "step": 50
46
+ },
47
+ {
48
+ "epoch": 1.565008025682183,
49
+ "grad_norm": 0.2683730583281023,
50
+ "learning_rate": 1.3136133159493803e-06,
51
+ "loss": 0.1714,
52
+ "step": 60
53
+ },
54
+ {
55
+ "epoch": 1.8218298555377208,
56
+ "grad_norm": 0.2705392147351614,
57
+ "learning_rate": 2.314152462588659e-07,
58
+ "loss": 0.1742,
59
+ "step": 70
60
+ },
61
+ {
62
+ "epoch": 1.9759229534510432,
63
+ "step": 76,
64
+ "total_flos": 283081697132544.0,
65
+ "train_loss": 0.23416273531160856,
66
+ "train_runtime": 4543.5593,
67
+ "train_samples_per_second": 2.194,
68
+ "train_steps_per_second": 0.017
69
+ }
70
+ ],
71
+ "logging_steps": 10,
72
+ "max_steps": 76,
73
+ "num_input_tokens_seen": 0,
74
+ "num_train_epochs": 2,
75
+ "save_steps": 100,
76
+ "stateful_callbacks": {
77
+ "TrainerControl": {
78
+ "args": {
79
+ "should_epoch_stop": false,
80
+ "should_evaluate": false,
81
+ "should_log": false,
82
+ "should_save": true,
83
+ "should_training_stop": true
84
+ },
85
+ "attributes": {}
86
+ }
87
+ },
88
+ "total_flos": 283081697132544.0,
89
+ "train_batch_size": 1,
90
+ "trial_name": null,
91
+ "trial_params": null
92
+ }