cite-text-analysis commited on
Commit
98a8616
·
verified ·
1 Parent(s): dffd72f

Upload folder using huggingface_hub

Browse files
training_checkpoints/checkpoint-896/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3e6a7c5d1c27702eb8d330734d18f23742e98f508adf53bfdd9413b63abeef8
3
  size 263153912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90f5ef9f5d276a78267327ec8a95aa6241ecf8a143980441f2cba144697856ca
3
  size 263153912
training_checkpoints/checkpoint-896/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b04ec52267e9c5bd381895ce71cd0b5293855ea2f99f325017cd832e9a1bcc0a
3
  size 526369978
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:253c4164af19b7d9bd0614206f385d6f4c16f0d1c86ec9725c911c6331665a96
3
  size 526369978
training_checkpoints/checkpoint-896/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b2e6138ae63585e8c8bbcdcdb3858d2d30fa7bbfeadc6bfa779f56f19a9bb51
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7154bdee52043f7cd3e4c7a117179ff9946879418b8b87d8fcc7a318873ba73
3
  size 1064
training_checkpoints/checkpoint-896/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.6024092775980217,
3
  "best_model_checkpoint": "case-analysis-distilbert-base-cased/checkpoint-896",
4
  "epoch": 4.0,
5
  "eval_steps": 500,
@@ -10,97 +10,97 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.7683741648106904,
14
- "eval_f1_macro": 0.5345911091709411,
15
- "eval_f1_micro": 0.7683741648106904,
16
- "eval_f1_weighted": 0.7419347573003691,
17
- "eval_loss": 0.6746780872344971,
18
- "eval_macro_fpr": 0.12600030005040652,
19
- "eval_macro_sensitivity": 0.5319427525309879,
20
- "eval_macro_specificity": 0.8890561890350515,
21
- "eval_precision": 0.723734857424959,
22
- "eval_precision_macro": 0.5435421823199279,
23
- "eval_recall": 0.7683741648106904,
24
- "eval_recall_macro": 0.5319427525309879,
25
- "eval_runtime": 5.5739,
26
- "eval_samples_per_second": 80.554,
27
- "eval_steps_per_second": 10.226,
28
- "eval_weighted_fpr": 0.0913081650570676,
29
- "eval_weighted_sensitivity": 0.7683741648106904,
30
- "eval_weighted_specificity": 0.7878505913295152,
31
  "step": 224
32
  },
33
  {
34
  "epoch": 2.0,
35
- "eval_accuracy": 0.8151447661469933,
36
- "eval_f1_macro": 0.6006365232660228,
37
- "eval_f1_micro": 0.8151447661469933,
38
- "eval_f1_weighted": 0.7944989450754872,
39
- "eval_loss": 0.6685805916786194,
40
- "eval_macro_fpr": 0.09260504201680672,
41
- "eval_macro_sensitivity": 0.6135692606280841,
42
- "eval_macro_specificity": 0.9160924396038365,
43
- "eval_precision": 0.775170081701242,
44
- "eval_precision_macro": 0.5885022601098201,
45
- "eval_recall": 0.8151447661469933,
46
- "eval_recall_macro": 0.6135692606280841,
47
- "eval_runtime": 22.918,
48
- "eval_samples_per_second": 19.592,
49
- "eval_steps_per_second": 2.487,
50
- "eval_weighted_fpr": 0.07027942421676546,
51
- "eval_weighted_sensitivity": 0.8151447661469933,
52
- "eval_weighted_specificity": 0.8492249922683526,
53
  "step": 448
54
  },
55
  {
56
  "epoch": 2.232142857142857,
57
- "grad_norm": 15.72251033782959,
58
- "learning_rate": 4.6302083333333335e-05,
59
- "loss": 0.6982,
60
  "step": 500
61
  },
62
  {
63
  "epoch": 3.0,
64
- "eval_accuracy": 0.8106904231625836,
65
- "eval_f1_macro": 0.5965678894021851,
66
- "eval_f1_micro": 0.8106904231625834,
67
- "eval_f1_weighted": 0.789500666861841,
68
- "eval_loss": 0.7899503111839294,
69
- "eval_macro_fpr": 0.09825302902225978,
70
- "eval_macro_sensitivity": 0.6052493478964067,
71
- "eval_macro_specificity": 0.910687377505773,
72
- "eval_precision": 0.7758060756348297,
73
- "eval_precision_macro": 0.5947486579771227,
74
- "eval_recall": 0.8106904231625836,
75
- "eval_recall_macro": 0.6052493478964067,
76
- "eval_runtime": 22.9183,
77
- "eval_samples_per_second": 19.591,
78
- "eval_steps_per_second": 2.487,
79
- "eval_weighted_fpr": 0.07221750212404418,
80
- "eval_weighted_sensitivity": 0.8106904231625836,
81
- "eval_weighted_specificity": 0.8320590868605084,
82
  "step": 672
83
  },
84
  {
85
  "epoch": 4.0,
86
- "eval_accuracy": 0.8129175946547884,
87
- "eval_f1_macro": 0.6024092775980217,
88
- "eval_f1_micro": 0.8129175946547884,
89
- "eval_f1_weighted": 0.7934058050292863,
90
- "eval_loss": 0.8377446532249451,
91
- "eval_macro_fpr": 0.10023342701741786,
92
- "eval_macro_sensitivity": 0.5950729186023304,
93
- "eval_macro_specificity": 0.9076308769469239,
94
- "eval_precision": 0.7822520571931126,
95
- "eval_precision_macro": 0.6157741567498898,
96
- "eval_recall": 0.8129175946547884,
97
- "eval_recall_macro": 0.5950729186023304,
98
- "eval_runtime": 23.0602,
99
- "eval_samples_per_second": 19.471,
100
- "eval_steps_per_second": 2.472,
101
- "eval_weighted_fpr": 0.07124681933842239,
102
- "eval_weighted_sensitivity": 0.8129175946547884,
103
- "eval_weighted_specificity": 0.8176059131329072,
104
  "step": 896
105
  }
106
  ],
 
1
  {
2
+ "best_metric": 0.6301119928151375,
3
  "best_model_checkpoint": "case-analysis-distilbert-base-cased/checkpoint-896",
4
  "epoch": 4.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.7661469933184856,
14
+ "eval_f1_macro": 0.5270352134866867,
15
+ "eval_f1_micro": 0.7661469933184856,
16
+ "eval_f1_weighted": 0.7333313004442764,
17
+ "eval_loss": 0.7000867128372192,
18
+ "eval_macro_fpr": 0.1330263157894737,
19
+ "eval_macro_sensitivity": 0.5137440725676019,
20
+ "eval_macro_specificity": 0.8818942592408516,
21
+ "eval_precision": 0.7310834070149471,
22
+ "eval_precision_macro": 0.5790641299401408,
23
+ "eval_recall": 0.7661469933184856,
24
+ "eval_recall_macro": 0.5137440725676019,
25
+ "eval_runtime": 5.4998,
26
+ "eval_samples_per_second": 81.639,
27
+ "eval_steps_per_second": 10.364,
28
+ "eval_weighted_fpr": 0.09234828496042216,
29
+ "eval_weighted_sensitivity": 0.7661469933184856,
30
+ "eval_weighted_specificity": 0.761430043644921,
31
  "step": 224
32
  },
33
  {
34
  "epoch": 2.0,
35
+ "eval_accuracy": 0.7750556792873051,
36
+ "eval_f1_macro": 0.5486718521990608,
37
+ "eval_f1_micro": 0.775055679287305,
38
+ "eval_f1_weighted": 0.7492575717498114,
39
+ "eval_loss": 0.7387592792510986,
40
+ "eval_macro_fpr": 0.12078200823200373,
41
+ "eval_macro_sensitivity": 0.5464266787796199,
42
+ "eval_macro_specificity": 0.8914743027952345,
43
+ "eval_precision": 0.7315284458297402,
44
+ "eval_precision_macro": 0.5585311316366537,
45
+ "eval_recall": 0.7750556792873051,
46
+ "eval_recall_macro": 0.5464266787796199,
47
+ "eval_runtime": 23.5227,
48
+ "eval_samples_per_second": 19.088,
49
+ "eval_steps_per_second": 2.423,
50
+ "eval_weighted_fpr": 0.08820960698689956,
51
+ "eval_weighted_sensitivity": 0.7750556792873051,
52
+ "eval_weighted_specificity": 0.7908415318936333,
53
  "step": 448
54
  },
55
  {
56
  "epoch": 2.232142857142857,
57
+ "grad_norm": 22.91168785095215,
58
+ "learning_rate": 4.629464285714286e-05,
59
+ "loss": 0.7066,
60
  "step": 500
61
  },
62
  {
63
  "epoch": 3.0,
64
+ "eval_accuracy": 0.8017817371937639,
65
+ "eval_f1_macro": 0.576677451756589,
66
+ "eval_f1_micro": 0.8017817371937639,
67
+ "eval_f1_weighted": 0.7759761601356532,
68
+ "eval_loss": 0.7228724956512451,
69
+ "eval_macro_fpr": 0.10757194512338594,
70
+ "eval_macro_sensitivity": 0.5707859310800487,
71
+ "eval_macro_specificity": 0.9026901603449184,
72
+ "eval_precision": 0.7604834726234316,
73
+ "eval_precision_macro": 0.5932281353135314,
74
+ "eval_recall": 0.8017817371937639,
75
+ "eval_recall_macro": 0.5707859310800487,
76
+ "eval_runtime": 17.5142,
77
+ "eval_samples_per_second": 25.636,
78
+ "eval_steps_per_second": 3.254,
79
+ "eval_weighted_fpr": 0.07613344739093242,
80
+ "eval_weighted_sensitivity": 0.8017817371937639,
81
+ "eval_weighted_specificity": 0.8089789041859096,
82
  "step": 672
83
  },
84
  {
85
  "epoch": 4.0,
86
+ "eval_accuracy": 0.8062360801781737,
87
+ "eval_f1_macro": 0.6301119928151375,
88
+ "eval_f1_micro": 0.8062360801781738,
89
+ "eval_f1_weighted": 0.7933630533945198,
90
+ "eval_loss": 0.8331468105316162,
91
+ "eval_macro_fpr": 0.10175133159747105,
92
+ "eval_macro_sensitivity": 0.6114882070764424,
93
+ "eval_macro_specificity": 0.9069973738423197,
94
+ "eval_precision": 0.7896315051078991,
95
+ "eval_precision_macro": 0.6674639062867935,
96
+ "eval_recall": 0.8062360801781737,
97
+ "eval_recall_macro": 0.6114882070764424,
98
+ "eval_runtime": 17.9901,
99
+ "eval_samples_per_second": 24.958,
100
+ "eval_steps_per_second": 3.168,
101
+ "eval_weighted_fpr": 0.0741687979539642,
102
+ "eval_weighted_sensitivity": 0.8062360801781737,
103
+ "eval_weighted_specificity": 0.8217534151911048,
104
  "step": 896
105
  }
106
  ],
training_checkpoints/checkpoint-896/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e69a367f465c21d14de763eeb210a4f6dfdc2d5d36a7fd05f0a714a904e7ac23
3
  size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3168244efe16c0aeafe631cea29ca8c9c2bbb665a169c0d40c2e4d22eaca40d9
3
  size 5048