cite-text-analysis committed on
Commit
9d78109
·
verified ·
1 Parent(s): a6dd692

Upload folder using huggingface_hub

Browse files
training_checkpoints/checkpoint-672/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ccda723584e3f87851c6d4fa0f6803e6221bdeb3c0c197f068753d04dde2a2e
3
  size 263153912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1e0f5580b2a53015b1aa305dfc568132ece5f07f42a25b73141736125dbcdc8
3
  size 263153912
training_checkpoints/checkpoint-672/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c2e3f894ac3f2bbcddf38637802cc895b46d7a1caf11b92cddc570828fa5cfb
3
  size 526369978
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a34b910c835c7d0ef8353a77bbd9df684d8992cd488f28de461ed8d415a4d122
3
  size 526369978
training_checkpoints/checkpoint-672/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f9a3f98e11364f5e565bedc0bb8b71f97fbe5f7fd840035411aad27e961fa46
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f26db89cf369108ce9c528bb27f1cd8769dd7803aebee3a7068e32131e1fee3
3
  size 1064
training_checkpoints/checkpoint-672/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.6006365232660228,
3
- "best_model_checkpoint": "case-analysis-distilbert-base-cased/checkpoint-448",
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
  "global_step": 672,
@@ -10,75 +10,75 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.7683741648106904,
14
- "eval_f1_macro": 0.5345911091709411,
15
- "eval_f1_micro": 0.7683741648106904,
16
- "eval_f1_weighted": 0.7419347573003691,
17
- "eval_loss": 0.6746780872344971,
18
- "eval_macro_fpr": 0.12600030005040652,
19
- "eval_macro_sensitivity": 0.5319427525309879,
20
- "eval_macro_specificity": 0.8890561890350515,
21
- "eval_precision": 0.723734857424959,
22
- "eval_precision_macro": 0.5435421823199279,
23
- "eval_recall": 0.7683741648106904,
24
- "eval_recall_macro": 0.5319427525309879,
25
- "eval_runtime": 5.5739,
26
- "eval_samples_per_second": 80.554,
27
- "eval_steps_per_second": 10.226,
28
- "eval_weighted_fpr": 0.0913081650570676,
29
- "eval_weighted_sensitivity": 0.7683741648106904,
30
- "eval_weighted_specificity": 0.7878505913295152,
31
  "step": 224
32
  },
33
  {
34
  "epoch": 2.0,
35
- "eval_accuracy": 0.8151447661469933,
36
- "eval_f1_macro": 0.6006365232660228,
37
- "eval_f1_micro": 0.8151447661469933,
38
- "eval_f1_weighted": 0.7944989450754872,
39
- "eval_loss": 0.6685805916786194,
40
- "eval_macro_fpr": 0.09260504201680672,
41
- "eval_macro_sensitivity": 0.6135692606280841,
42
- "eval_macro_specificity": 0.9160924396038365,
43
- "eval_precision": 0.775170081701242,
44
- "eval_precision_macro": 0.5885022601098201,
45
- "eval_recall": 0.8151447661469933,
46
- "eval_recall_macro": 0.6135692606280841,
47
- "eval_runtime": 22.918,
48
- "eval_samples_per_second": 19.592,
49
- "eval_steps_per_second": 2.487,
50
- "eval_weighted_fpr": 0.07027942421676546,
51
- "eval_weighted_sensitivity": 0.8151447661469933,
52
- "eval_weighted_specificity": 0.8492249922683526,
53
  "step": 448
54
  },
55
  {
56
  "epoch": 2.232142857142857,
57
- "grad_norm": 15.72251033782959,
58
- "learning_rate": 4.6302083333333335e-05,
59
- "loss": 0.6982,
60
  "step": 500
61
  },
62
  {
63
  "epoch": 3.0,
64
- "eval_accuracy": 0.8106904231625836,
65
- "eval_f1_macro": 0.5965678894021851,
66
- "eval_f1_micro": 0.8106904231625834,
67
- "eval_f1_weighted": 0.789500666861841,
68
- "eval_loss": 0.7899503111839294,
69
- "eval_macro_fpr": 0.09825302902225978,
70
- "eval_macro_sensitivity": 0.6052493478964067,
71
- "eval_macro_specificity": 0.910687377505773,
72
- "eval_precision": 0.7758060756348297,
73
- "eval_precision_macro": 0.5947486579771227,
74
- "eval_recall": 0.8106904231625836,
75
- "eval_recall_macro": 0.6052493478964067,
76
- "eval_runtime": 22.9183,
77
- "eval_samples_per_second": 19.591,
78
- "eval_steps_per_second": 2.487,
79
- "eval_weighted_fpr": 0.07221750212404418,
80
- "eval_weighted_sensitivity": 0.8106904231625836,
81
- "eval_weighted_specificity": 0.8320590868605084,
82
  "step": 672
83
  }
84
  ],
 
1
  {
2
+ "best_metric": 0.576677451756589,
3
+ "best_model_checkpoint": "case-analysis-distilbert-base-cased/checkpoint-672",
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
  "global_step": 672,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.7661469933184856,
14
+ "eval_f1_macro": 0.5270352134866867,
15
+ "eval_f1_micro": 0.7661469933184856,
16
+ "eval_f1_weighted": 0.7333313004442764,
17
+ "eval_loss": 0.7000867128372192,
18
+ "eval_macro_fpr": 0.1330263157894737,
19
+ "eval_macro_sensitivity": 0.5137440725676019,
20
+ "eval_macro_specificity": 0.8818942592408516,
21
+ "eval_precision": 0.7310834070149471,
22
+ "eval_precision_macro": 0.5790641299401408,
23
+ "eval_recall": 0.7661469933184856,
24
+ "eval_recall_macro": 0.5137440725676019,
25
+ "eval_runtime": 5.4998,
26
+ "eval_samples_per_second": 81.639,
27
+ "eval_steps_per_second": 10.364,
28
+ "eval_weighted_fpr": 0.09234828496042216,
29
+ "eval_weighted_sensitivity": 0.7661469933184856,
30
+ "eval_weighted_specificity": 0.761430043644921,
31
  "step": 224
32
  },
33
  {
34
  "epoch": 2.0,
35
+ "eval_accuracy": 0.7750556792873051,
36
+ "eval_f1_macro": 0.5486718521990608,
37
+ "eval_f1_micro": 0.775055679287305,
38
+ "eval_f1_weighted": 0.7492575717498114,
39
+ "eval_loss": 0.7387592792510986,
40
+ "eval_macro_fpr": 0.12078200823200373,
41
+ "eval_macro_sensitivity": 0.5464266787796199,
42
+ "eval_macro_specificity": 0.8914743027952345,
43
+ "eval_precision": 0.7315284458297402,
44
+ "eval_precision_macro": 0.5585311316366537,
45
+ "eval_recall": 0.7750556792873051,
46
+ "eval_recall_macro": 0.5464266787796199,
47
+ "eval_runtime": 23.5227,
48
+ "eval_samples_per_second": 19.088,
49
+ "eval_steps_per_second": 2.423,
50
+ "eval_weighted_fpr": 0.08820960698689956,
51
+ "eval_weighted_sensitivity": 0.7750556792873051,
52
+ "eval_weighted_specificity": 0.7908415318936333,
53
  "step": 448
54
  },
55
  {
56
  "epoch": 2.232142857142857,
57
+ "grad_norm": 22.91168785095215,
58
+ "learning_rate": 4.629464285714286e-05,
59
+ "loss": 0.7066,
60
  "step": 500
61
  },
62
  {
63
  "epoch": 3.0,
64
+ "eval_accuracy": 0.8017817371937639,
65
+ "eval_f1_macro": 0.576677451756589,
66
+ "eval_f1_micro": 0.8017817371937639,
67
+ "eval_f1_weighted": 0.7759761601356532,
68
+ "eval_loss": 0.7228724956512451,
69
+ "eval_macro_fpr": 0.10757194512338594,
70
+ "eval_macro_sensitivity": 0.5707859310800487,
71
+ "eval_macro_specificity": 0.9026901603449184,
72
+ "eval_precision": 0.7604834726234316,
73
+ "eval_precision_macro": 0.5932281353135314,
74
+ "eval_recall": 0.8017817371937639,
75
+ "eval_recall_macro": 0.5707859310800487,
76
+ "eval_runtime": 17.5142,
77
+ "eval_samples_per_second": 25.636,
78
+ "eval_steps_per_second": 3.254,
79
+ "eval_weighted_fpr": 0.07613344739093242,
80
+ "eval_weighted_sensitivity": 0.8017817371937639,
81
+ "eval_weighted_specificity": 0.8089789041859096,
82
  "step": 672
83
  }
84
  ],
training_checkpoints/checkpoint-672/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e69a367f465c21d14de763eeb210a4f6dfdc2d5d36a7fd05f0a714a904e7ac23
3
  size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3168244efe16c0aeafe631cea29ca8c9c2bbb665a169c0d40c2e4d22eaca40d9
3
  size 5048