cite-text-analysis committed on
Commit
d01bcb9
·
verified ·
1 Parent(s): 33856c2

Upload folder using huggingface_hub

Browse files
training_checkpoints/checkpoint-1344/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c430c4d9702a4baeddeda050750525b96e67993b8d70503cb410e99320c4837e
3
  size 263153912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67e50219101fbea3214dc9145442b79a48812f4963baedfc9291fea52ef51357
3
  size 263153912
training_checkpoints/checkpoint-1344/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:734af6d9db80f4a6443e449bc11d79d50c0dae777c6d736264f6472948e95e62
3
  size 526369978
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1d97977ce160bcbb3e666517f9e5421c05f6ae11b442586ece81bdfa3fcf925
3
  size 526369978
training_checkpoints/checkpoint-1344/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dad5f7ec57203a8e28a98d2deddbfa247195c6ec01360dd1d5e15f1d4acae5f3
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edb0cda888f21bb982e8535b7efa97ccc6b83590128f4f956d586c2cf11bf6a9
3
  size 1064
training_checkpoints/checkpoint-1344/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.6190547468267676,
3
- "best_model_checkpoint": "case-analysis-distilbert-base-cased/checkpoint-1344",
4
  "epoch": 6.0,
5
  "eval_steps": 500,
6
  "global_step": 1344,
@@ -10,148 +10,148 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.7683741648106904,
14
- "eval_f1_macro": 0.5345911091709411,
15
- "eval_f1_micro": 0.7683741648106904,
16
- "eval_f1_weighted": 0.7419347573003691,
17
- "eval_loss": 0.6746780872344971,
18
- "eval_macro_fpr": 0.12600030005040652,
19
- "eval_macro_sensitivity": 0.5319427525309879,
20
- "eval_macro_specificity": 0.8890561890350515,
21
- "eval_precision": 0.723734857424959,
22
- "eval_precision_macro": 0.5435421823199279,
23
- "eval_recall": 0.7683741648106904,
24
- "eval_recall_macro": 0.5319427525309879,
25
- "eval_runtime": 5.5739,
26
- "eval_samples_per_second": 80.554,
27
- "eval_steps_per_second": 10.226,
28
- "eval_weighted_fpr": 0.0913081650570676,
29
- "eval_weighted_sensitivity": 0.7683741648106904,
30
- "eval_weighted_specificity": 0.7878505913295152,
31
  "step": 224
32
  },
33
  {
34
  "epoch": 2.0,
35
- "eval_accuracy": 0.8151447661469933,
36
- "eval_f1_macro": 0.6006365232660228,
37
- "eval_f1_micro": 0.8151447661469933,
38
- "eval_f1_weighted": 0.7944989450754872,
39
- "eval_loss": 0.6685805916786194,
40
- "eval_macro_fpr": 0.09260504201680672,
41
- "eval_macro_sensitivity": 0.6135692606280841,
42
- "eval_macro_specificity": 0.9160924396038365,
43
- "eval_precision": 0.775170081701242,
44
- "eval_precision_macro": 0.5885022601098201,
45
- "eval_recall": 0.8151447661469933,
46
- "eval_recall_macro": 0.6135692606280841,
47
- "eval_runtime": 22.918,
48
- "eval_samples_per_second": 19.592,
49
- "eval_steps_per_second": 2.487,
50
- "eval_weighted_fpr": 0.07027942421676546,
51
- "eval_weighted_sensitivity": 0.8151447661469933,
52
- "eval_weighted_specificity": 0.8492249922683526,
53
  "step": 448
54
  },
55
  {
56
  "epoch": 2.232142857142857,
57
- "grad_norm": 15.72251033782959,
58
- "learning_rate": 4.6302083333333335e-05,
59
- "loss": 0.6982,
60
  "step": 500
61
  },
62
  {
63
  "epoch": 3.0,
64
- "eval_accuracy": 0.8106904231625836,
65
- "eval_f1_macro": 0.5965678894021851,
66
- "eval_f1_micro": 0.8106904231625834,
67
- "eval_f1_weighted": 0.789500666861841,
68
- "eval_loss": 0.7899503111839294,
69
- "eval_macro_fpr": 0.09825302902225978,
70
- "eval_macro_sensitivity": 0.6052493478964067,
71
- "eval_macro_specificity": 0.910687377505773,
72
- "eval_precision": 0.7758060756348297,
73
- "eval_precision_macro": 0.5947486579771227,
74
- "eval_recall": 0.8106904231625836,
75
- "eval_recall_macro": 0.6052493478964067,
76
- "eval_runtime": 22.9183,
77
- "eval_samples_per_second": 19.591,
78
- "eval_steps_per_second": 2.487,
79
- "eval_weighted_fpr": 0.07221750212404418,
80
- "eval_weighted_sensitivity": 0.8106904231625836,
81
- "eval_weighted_specificity": 0.8320590868605084,
82
  "step": 672
83
  },
84
  {
85
  "epoch": 4.0,
86
- "eval_accuracy": 0.8129175946547884,
87
- "eval_f1_macro": 0.6024092775980217,
88
- "eval_f1_micro": 0.8129175946547884,
89
- "eval_f1_weighted": 0.7934058050292863,
90
- "eval_loss": 0.8377446532249451,
91
- "eval_macro_fpr": 0.10023342701741786,
92
- "eval_macro_sensitivity": 0.5950729186023304,
93
- "eval_macro_specificity": 0.9076308769469239,
94
- "eval_precision": 0.7822520571931126,
95
- "eval_precision_macro": 0.6157741567498898,
96
- "eval_recall": 0.8129175946547884,
97
- "eval_recall_macro": 0.5950729186023304,
98
- "eval_runtime": 23.0602,
99
- "eval_samples_per_second": 19.471,
100
- "eval_steps_per_second": 2.472,
101
- "eval_weighted_fpr": 0.07124681933842239,
102
- "eval_weighted_sensitivity": 0.8129175946547884,
103
- "eval_weighted_specificity": 0.8176059131329072,
104
  "step": 896
105
  },
106
  {
107
  "epoch": 4.464285714285714,
108
- "grad_norm": 3.802079200744629,
109
- "learning_rate": 4.259672619047619e-05,
110
- "loss": 0.3797,
111
  "step": 1000
112
  },
113
  {
114
  "epoch": 5.0,
115
- "eval_accuracy": 0.8195991091314031,
116
- "eval_f1_macro": 0.6096395609968126,
117
- "eval_f1_micro": 0.8195991091314031,
118
- "eval_f1_weighted": 0.8009201487061303,
119
- "eval_loss": 0.9637371897697449,
120
- "eval_macro_fpr": 0.09298523725810875,
121
- "eval_macro_sensitivity": 0.6097056758821464,
122
- "eval_macro_specificity": 0.9156101048565789,
123
- "eval_precision": 0.7852664668210015,
124
- "eval_precision_macro": 0.6117719622096018,
125
- "eval_recall": 0.8195991091314031,
126
- "eval_recall_macro": 0.6097056758821464,
127
- "eval_runtime": 24.1336,
128
- "eval_samples_per_second": 18.605,
129
- "eval_steps_per_second": 2.362,
130
- "eval_weighted_fpr": 0.06835443037974684,
131
- "eval_weighted_sensitivity": 0.8195991091314031,
132
- "eval_weighted_specificity": 0.8428413102949123,
133
  "step": 1120
134
  },
135
  {
136
  "epoch": 6.0,
137
- "eval_accuracy": 0.799554565701559,
138
- "eval_f1_macro": 0.6190547468267676,
139
- "eval_f1_micro": 0.799554565701559,
140
- "eval_f1_weighted": 0.8002581826434487,
141
- "eval_loss": 1.0848541259765625,
142
- "eval_macro_fpr": 0.09461858568722545,
143
- "eval_macro_sensitivity": 0.6154274977804389,
144
- "eval_macro_specificity": 0.9173876054987379,
145
- "eval_precision": 0.8024626803020691,
146
- "eval_precision_macro": 0.6242875164499879,
147
- "eval_recall": 0.799554565701559,
148
- "eval_recall_macro": 0.6154274977804389,
149
- "eval_runtime": 26.5504,
150
- "eval_samples_per_second": 16.911,
151
- "eval_steps_per_second": 2.147,
152
- "eval_weighted_fpr": 0.07712082262210797,
153
- "eval_weighted_sensitivity": 0.799554565701559,
154
- "eval_weighted_specificity": 0.8699958562933927,
155
  "step": 1344
156
  }
157
  ],
 
1
  {
2
+ "best_metric": 0.6301119928151375,
3
+ "best_model_checkpoint": "case-analysis-distilbert-base-cased/checkpoint-896",
4
  "epoch": 6.0,
5
  "eval_steps": 500,
6
  "global_step": 1344,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.7661469933184856,
14
+ "eval_f1_macro": 0.5270352134866867,
15
+ "eval_f1_micro": 0.7661469933184856,
16
+ "eval_f1_weighted": 0.7333313004442764,
17
+ "eval_loss": 0.7000867128372192,
18
+ "eval_macro_fpr": 0.1330263157894737,
19
+ "eval_macro_sensitivity": 0.5137440725676019,
20
+ "eval_macro_specificity": 0.8818942592408516,
21
+ "eval_precision": 0.7310834070149471,
22
+ "eval_precision_macro": 0.5790641299401408,
23
+ "eval_recall": 0.7661469933184856,
24
+ "eval_recall_macro": 0.5137440725676019,
25
+ "eval_runtime": 5.4998,
26
+ "eval_samples_per_second": 81.639,
27
+ "eval_steps_per_second": 10.364,
28
+ "eval_weighted_fpr": 0.09234828496042216,
29
+ "eval_weighted_sensitivity": 0.7661469933184856,
30
+ "eval_weighted_specificity": 0.761430043644921,
31
  "step": 224
32
  },
33
  {
34
  "epoch": 2.0,
35
+ "eval_accuracy": 0.7750556792873051,
36
+ "eval_f1_macro": 0.5486718521990608,
37
+ "eval_f1_micro": 0.775055679287305,
38
+ "eval_f1_weighted": 0.7492575717498114,
39
+ "eval_loss": 0.7387592792510986,
40
+ "eval_macro_fpr": 0.12078200823200373,
41
+ "eval_macro_sensitivity": 0.5464266787796199,
42
+ "eval_macro_specificity": 0.8914743027952345,
43
+ "eval_precision": 0.7315284458297402,
44
+ "eval_precision_macro": 0.5585311316366537,
45
+ "eval_recall": 0.7750556792873051,
46
+ "eval_recall_macro": 0.5464266787796199,
47
+ "eval_runtime": 23.5227,
48
+ "eval_samples_per_second": 19.088,
49
+ "eval_steps_per_second": 2.423,
50
+ "eval_weighted_fpr": 0.08820960698689956,
51
+ "eval_weighted_sensitivity": 0.7750556792873051,
52
+ "eval_weighted_specificity": 0.7908415318936333,
53
  "step": 448
54
  },
55
  {
56
  "epoch": 2.232142857142857,
57
+ "grad_norm": 22.91168785095215,
58
+ "learning_rate": 4.629464285714286e-05,
59
+ "loss": 0.7066,
60
  "step": 500
61
  },
62
  {
63
  "epoch": 3.0,
64
+ "eval_accuracy": 0.8017817371937639,
65
+ "eval_f1_macro": 0.576677451756589,
66
+ "eval_f1_micro": 0.8017817371937639,
67
+ "eval_f1_weighted": 0.7759761601356532,
68
+ "eval_loss": 0.7228724956512451,
69
+ "eval_macro_fpr": 0.10757194512338594,
70
+ "eval_macro_sensitivity": 0.5707859310800487,
71
+ "eval_macro_specificity": 0.9026901603449184,
72
+ "eval_precision": 0.7604834726234316,
73
+ "eval_precision_macro": 0.5932281353135314,
74
+ "eval_recall": 0.8017817371937639,
75
+ "eval_recall_macro": 0.5707859310800487,
76
+ "eval_runtime": 17.5142,
77
+ "eval_samples_per_second": 25.636,
78
+ "eval_steps_per_second": 3.254,
79
+ "eval_weighted_fpr": 0.07613344739093242,
80
+ "eval_weighted_sensitivity": 0.8017817371937639,
81
+ "eval_weighted_specificity": 0.8089789041859096,
82
  "step": 672
83
  },
84
  {
85
  "epoch": 4.0,
86
+ "eval_accuracy": 0.8062360801781737,
87
+ "eval_f1_macro": 0.6301119928151375,
88
+ "eval_f1_micro": 0.8062360801781738,
89
+ "eval_f1_weighted": 0.7933630533945198,
90
+ "eval_loss": 0.8331468105316162,
91
+ "eval_macro_fpr": 0.10175133159747105,
92
+ "eval_macro_sensitivity": 0.6114882070764424,
93
+ "eval_macro_specificity": 0.9069973738423197,
94
+ "eval_precision": 0.7896315051078991,
95
+ "eval_precision_macro": 0.6674639062867935,
96
+ "eval_recall": 0.8062360801781737,
97
+ "eval_recall_macro": 0.6114882070764424,
98
+ "eval_runtime": 17.9901,
99
+ "eval_samples_per_second": 24.958,
100
+ "eval_steps_per_second": 3.168,
101
+ "eval_weighted_fpr": 0.0741687979539642,
102
+ "eval_weighted_sensitivity": 0.8062360801781737,
103
+ "eval_weighted_specificity": 0.8217534151911048,
104
  "step": 896
105
  },
106
  {
107
  "epoch": 4.464285714285714,
108
+ "grad_norm": 0.23617026209831238,
109
+ "learning_rate": 4.258184523809524e-05,
110
+ "loss": 0.3654,
111
  "step": 1000
112
  },
113
  {
114
  "epoch": 5.0,
115
+ "eval_accuracy": 0.7683741648106904,
116
+ "eval_f1_macro": 0.5896043825978781,
117
+ "eval_f1_micro": 0.7683741648106904,
118
+ "eval_f1_weighted": 0.7610828501277613,
119
+ "eval_loss": 1.2299734354019165,
120
+ "eval_macro_fpr": 0.10662840460883276,
121
+ "eval_macro_sensitivity": 0.6130556645262528,
122
+ "eval_macro_specificity": 0.9056447032260023,
123
+ "eval_precision": 0.7698582566254396,
124
+ "eval_precision_macro": 0.6085394130060126,
125
+ "eval_recall": 0.7683741648106904,
126
+ "eval_recall_macro": 0.6130556645262528,
127
+ "eval_runtime": 19.5517,
128
+ "eval_samples_per_second": 22.965,
129
+ "eval_steps_per_second": 2.915,
130
+ "eval_weighted_fpr": 0.0913081650570676,
131
+ "eval_weighted_sensitivity": 0.7683741648106904,
132
+ "eval_weighted_specificity": 0.8542046480933186,
133
  "step": 1120
134
  },
135
  {
136
  "epoch": 6.0,
137
+ "eval_accuracy": 0.8129175946547884,
138
+ "eval_f1_macro": 0.6299577384875399,
139
+ "eval_f1_micro": 0.8129175946547884,
140
+ "eval_f1_weighted": 0.7972266629935387,
141
+ "eval_loss": 1.0698440074920654,
142
+ "eval_macro_fpr": 0.09572659519735909,
143
+ "eval_macro_sensitivity": 0.6152769461592991,
144
+ "eval_macro_specificity": 0.9133810019905357,
145
+ "eval_precision": 0.7940368363876591,
146
+ "eval_precision_macro": 0.6863588955891834,
147
+ "eval_recall": 0.8129175946547884,
148
+ "eval_recall_macro": 0.6152769461592991,
149
+ "eval_runtime": 21.7346,
150
+ "eval_samples_per_second": 20.658,
151
+ "eval_steps_per_second": 2.623,
152
+ "eval_weighted_fpr": 0.07124681933842239,
153
+ "eval_weighted_sensitivity": 0.8129175946547884,
154
+ "eval_weighted_specificity": 0.8406064133073544,
155
  "step": 1344
156
  }
157
  ],
training_checkpoints/checkpoint-1344/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e69a367f465c21d14de763eeb210a4f6dfdc2d5d36a7fd05f0a714a904e7ac23
3
  size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3168244efe16c0aeafe631cea29ca8c9c2bbb665a169c0d40c2e4d22eaca40d9
3
  size 5048