Theoreticallyhugo commited on
Commit
1b537d3
·
verified ·
1 Parent(s): fa7ece3

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-41/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd33ff53c0edd4d359980f27f4afa194ec5b807febef7f4cbaefde162b633c4b
3
  size 592330980
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88c07cbc53c51f5c54df711ef5979bc1f3418049f6d85a04b3dbda81a97924a1
3
  size 592330980
checkpoint-41/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab3510262bc219de46e870072b2a617000c0c57c3d0baaaf87394856c91f5477
3
  size 1014670074
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:607460e5b1146da32c681dd270585cfb7f0e8ea70592e43e5c102d6094ae78cc
3
  size 1014670074
checkpoint-41/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b75d0f85c6e5f43bda08f24453a869f5d0b5d0d33d936ef1b542f406f081347
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a939982f711c8a91f0893b4f281f0db4fd89d7ca52de2aed82098ef9ff76ea2
3
  size 14244
checkpoint-41/trainer_state.json CHANGED
@@ -14,60 +14,60 @@
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
- "support": 339.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
- "support": 160.0
24
  },
25
  "eval_B-Premise": {
26
- "f1-score": 0.22426470588235295,
27
- "precision": 0.8299319727891157,
28
- "recall": 0.12964930924548354,
29
- "support": 941.0
30
  },
31
  "eval_I-Claim": {
32
- "f1-score": 0.38247663551401867,
33
- "precision": 0.423873640600725,
34
- "recall": 0.348446147296722,
35
- "support": 4698.0
36
  },
37
  "eval_I-MajorClaim": {
38
- "f1-score": 0.3634627625716104,
39
- "precision": 0.5125673249551167,
40
- "recall": 0.28155818540433925,
41
- "support": 2028.0
42
  },
43
  "eval_I-Premise": {
44
- "f1-score": 0.8298935191271198,
45
- "precision": 0.8110747093209996,
46
- "recall": 0.8496063521970257,
47
- "support": 14861.0
48
  },
49
  "eval_O": {
50
- "f1-score": 0.8121805609242796,
51
- "precision": 0.7380952380952381,
52
- "recall": 0.9027976701995608,
53
- "support": 10473.0
54
  },
55
- "eval_accuracy": 0.7286865671641791,
56
- "eval_loss": 0.763540506362915,
57
  "eval_macro avg": {
58
- "f1-score": 0.3731825977170545,
59
- "precision": 0.47364898368017067,
60
- "recall": 0.3588653806204473,
61
- "support": 33500.0
62
  },
63
- "eval_runtime": 1.4539,
64
- "eval_samples_per_second": 55.714,
65
- "eval_steps_per_second": 7.566,
66
  "eval_weighted avg": {
67
- "f1-score": 0.7040007584084623,
68
- "precision": 0.7043362259324342,
69
- "recall": 0.7286865671641791,
70
- "support": 33500.0
71
  },
72
  "step": 41
73
  }
@@ -77,7 +77,7 @@
77
  "num_input_tokens_seen": 0,
78
  "num_train_epochs": 16,
79
  "save_steps": 500,
80
- "total_flos": 143344257399000.0,
81
  "train_batch_size": 8,
82
  "trial_name": null,
83
  "trial_params": null
 
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
+ "support": 271.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
+ "support": 139.0
24
  },
25
  "eval_B-Premise": {
26
+ "f1-score": 0.22222222222222218,
27
+ "precision": 0.780952380952381,
28
+ "recall": 0.12954186413902052,
29
+ "support": 633.0
30
  },
31
  "eval_I-Claim": {
32
+ "f1-score": 0.3239807781739265,
33
+ "precision": 0.42653061224489797,
34
+ "recall": 0.26118470382404396,
35
+ "support": 4001.0
36
  },
37
  "eval_I-MajorClaim": {
38
+ "f1-score": 0.43526510480887787,
39
+ "precision": 0.5735174654752234,
40
+ "recall": 0.35072031793343267,
41
+ "support": 2013.0
42
  },
43
  "eval_I-Premise": {
44
+ "f1-score": 0.8370338686471983,
45
+ "precision": 0.7484180515958556,
46
+ "recall": 0.9494530698659139,
47
+ "support": 11336.0
48
  },
49
  "eval_O": {
50
+ "f1-score": 0.8603704893457543,
51
+ "precision": 0.8500846381718155,
52
+ "recall": 0.8709083026230219,
53
+ "support": 9226.0
54
  },
55
+ "eval_accuracy": 0.7469857706651218,
56
+ "eval_loss": 0.6934069395065308,
57
  "eval_macro avg": {
58
+ "f1-score": 0.3826960661711399,
59
+ "precision": 0.48278616406288194,
60
+ "recall": 0.3659726083407761,
61
+ "support": 27619.0
62
  },
63
+ "eval_runtime": 1.3993,
64
+ "eval_samples_per_second": 57.171,
65
+ "eval_steps_per_second": 7.146,
66
  "eval_weighted avg": {
67
+ "f1-score": 0.7147071394985115,
68
+ "precision": 0.7126373293529855,
69
+ "recall": 0.7469857706651218,
70
+ "support": 27619.0
71
  },
72
  "step": 41
73
  }
 
77
  "num_input_tokens_seen": 0,
78
  "num_train_epochs": 16,
79
  "save_steps": 500,
80
+ "total_flos": 143790812718000.0,
81
  "train_batch_size": 8,
82
  "trial_name": null,
83
  "trial_params": null
checkpoint-41/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:920ab155975bf66f694757fefb246b73b0d1489bdf4f03eda383fa028f5d083a
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea7dd3e20b3e160af2247e96dc319ccd6cb101ae7dc47f0b44b05679d4ad74d7
3
  size 4664