JhonMR committed on
Commit
2b40310
·
verified ·
1 Parent(s): b2aa4f3

End of training

Browse files
Files changed (5) hide show
  1. README.md +10 -14
  2. all_results.json +4 -4
  3. eval_results.json +4 -8
  4. model.safetensors +1 -1
  5. trainer_state.json +13 -248
README.md CHANGED
@@ -3,11 +3,6 @@ library_name: transformers
3
  base_model: dccuchile/bert-base-spanish-wwm-uncased
4
  tags:
5
  - generated_from_trainer
6
- metrics:
7
- - accuracy
8
- - f1
9
- - precision
10
- - recall
11
  model-index:
12
  - name: Bert_v11
13
  results: []
@@ -20,11 +15,16 @@ should probably proofread and complete it, then remove this comment. -->
20
 
21
  This model is a fine-tuned version of [dccuchile/bert-base-spanish-wwm-uncased](https://huggingface.co/dccuchile/bert-base-spanish-wwm-uncased) on the None dataset.
22
  It achieves the following results on the evaluation set:
23
- - Accuracy: 0.9032
24
- - F1: 0.9018
25
- - Precision: 0.9036
26
- - Recall: 0.9021
27
- - Loss: 0.4583
 
 
 
 
 
28
 
29
  ## Model description
30
 
@@ -52,10 +52,6 @@ The following hyperparameters were used during training:
52
  - lr_scheduler_warmup_steps: 200
53
  - num_epochs: 15
54
 
55
- ### Training results
56
-
57
-
58
-
59
  ### Framework versions
60
 
61
  - Transformers 4.44.2
 
3
  base_model: dccuchile/bert-base-spanish-wwm-uncased
4
  tags:
5
  - generated_from_trainer
 
 
 
 
 
6
  model-index:
7
  - name: Bert_v11
8
  results: []
 
15
 
16
  This model is a fine-tuned version of [dccuchile/bert-base-spanish-wwm-uncased](https://huggingface.co/dccuchile/bert-base-spanish-wwm-uncased) on the None dataset.
17
  It achieves the following results on the evaluation set:
18
+ - eval_accuracy: 0.9032
19
+ - eval_f1: 0.9017
20
+ - eval_precision: 0.9035
21
+ - eval_recall: 0.9020
22
+ - eval_loss: 0.4575
23
+ - eval_runtime: 116.6553
24
+ - eval_samples_per_second: 32.403
25
+ - eval_steps_per_second: 1.02
26
+ - epoch: 0.0725
27
+ - step: 20
28
 
29
  ## Model description
30
 
 
52
  - lr_scheduler_warmup_steps: 200
53
  - num_epochs: 15
54
 
 
 
 
 
55
  ### Framework versions
56
 
57
  - Transformers 4.44.2
all_results.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
  "epoch": 8.0,
3
  "eval_accuracy": 0.9031746031746032,
4
- "eval_f1": 0.9017850721426728,
5
- "eval_loss": 0.45825621485710144,
6
- "eval_precision": 0.9036277073612298,
7
- "eval_recall": 0.902066631184587,
8
  "eval_runtime": 124.5942,
9
  "eval_samples_per_second": 30.339,
10
  "eval_steps_per_second": 0.955,
 
1
  {
2
  "epoch": 8.0,
3
  "eval_accuracy": 0.9031746031746032,
4
+ "eval_f1": 0.9017334623312502,
5
+ "eval_loss": 0.45751890540122986,
6
+ "eval_precision": 0.9035223833704444,
7
+ "eval_recall": 0.9020339725952946,
8
  "eval_runtime": 124.5942,
9
  "eval_samples_per_second": 30.339,
10
  "eval_steps_per_second": 0.955,
eval_results.json CHANGED
@@ -1,11 +1,7 @@
1
  {
2
- "epoch": 8.0,
3
  "eval_accuracy": 0.9031746031746032,
4
- "eval_f1": 0.9017850721426728,
5
- "eval_loss": 0.45825621485710144,
6
- "eval_precision": 0.9036277073612298,
7
- "eval_recall": 0.902066631184587,
8
- "eval_runtime": 124.5942,
9
- "eval_samples_per_second": 30.339,
10
- "eval_steps_per_second": 0.955
11
  }
 
1
  {
 
2
  "eval_accuracy": 0.9031746031746032,
3
+ "eval_f1": 0.9017334623312502,
4
+ "eval_loss": 0.45751890540122986,
5
+ "eval_precision": 0.9035223833704444,
6
+ "eval_recall": 0.9020339725952946
 
 
 
7
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ae9181229b9a85fc8a5f5f1ceccc19ea785e7ebdad58a1654cbd5f950dd48a7
3
  size 439556248
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44da92d9231f6cb9360bf8c4dca271d6427081cbbbc94ce8f35217eb6c5b2f91
3
  size 439556248
trainer_state.json CHANGED
@@ -1,259 +1,24 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 8.0,
5
  "eval_steps": 500,
6
- "global_step": 2208,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 1.0,
13
- "step": 276,
14
- "train_eval_accuracy": 0.7003401360544218,
15
- "train_eval_f1": 0.6599009769808177,
16
- "train_eval_loss": 1.0742188692092896,
17
- "train_eval_precision": 0.7685367987097715,
18
- "train_eval_recall": 0.7009459009381873,
19
- "train_loss": 1.074218988418579,
20
- "train_runtime": 292.4292,
21
- "train_samples_per_second": 30.161,
22
- "train_steps_per_second": 0.944
23
- },
24
- {
25
- "epoch": 1.0,
26
- "eval_accuracy": 0.6865079365079365,
27
- "eval_f1": 0.6448401353068663,
28
- "eval_loss": 1.1159266233444214,
29
- "eval_precision": 0.7389370546469851,
30
- "eval_recall": 0.685088186510769,
31
- "eval_runtime": 125.2302,
32
- "eval_samples_per_second": 30.184,
33
- "eval_steps_per_second": 0.95,
34
- "step": 276
35
- },
36
- {
37
- "epoch": 2.0,
38
- "step": 552,
39
- "train_eval_accuracy": 0.9049886621315193,
40
- "train_eval_f1": 0.9047389370162652,
41
- "train_eval_loss": 0.3874468207359314,
42
- "train_eval_precision": 0.9101320070777226,
43
- "train_eval_recall": 0.9053131019265812,
44
- "train_loss": 0.3874468505382538,
45
- "train_runtime": 292.6477,
46
- "train_samples_per_second": 30.139,
47
- "train_steps_per_second": 0.943
48
- },
49
- {
50
- "epoch": 2.0,
51
- "eval_accuracy": 0.873015873015873,
52
- "eval_f1": 0.8716046163578155,
53
- "eval_loss": 0.4920203685760498,
54
- "eval_precision": 0.8781278884267814,
55
- "eval_recall": 0.8725450168508944,
56
- "eval_runtime": 125.7044,
57
- "eval_samples_per_second": 30.071,
58
- "eval_steps_per_second": 0.947,
59
- "step": 552
60
- },
61
- {
62
- "epoch": 3.0,
63
- "step": 828,
64
- "train_eval_accuracy": 0.9286848072562358,
65
- "train_eval_f1": 0.9285171455529603,
66
- "train_eval_loss": 0.27065399289131165,
67
- "train_eval_precision": 0.9322649415650033,
68
- "train_eval_recall": 0.9289123109383434,
69
- "train_loss": 0.27065402269363403,
70
- "train_runtime": 292.5422,
71
- "train_samples_per_second": 30.149,
72
- "train_steps_per_second": 0.943
73
- },
74
- {
75
- "epoch": 3.0,
76
- "eval_accuracy": 0.8973544973544973,
77
- "eval_f1": 0.8961220197070991,
78
- "eval_loss": 0.42477917671203613,
79
- "eval_precision": 0.9011567773926408,
80
- "eval_recall": 0.8971253090647534,
81
- "eval_runtime": 125.1591,
82
- "eval_samples_per_second": 30.202,
83
- "eval_steps_per_second": 0.951,
84
- "step": 828
85
- },
86
- {
87
- "epoch": 4.0,
88
- "step": 1104,
89
- "train_eval_accuracy": 0.9471655328798186,
90
- "train_eval_f1": 0.947517595979444,
91
- "train_eval_loss": 0.2088230848312378,
92
- "train_eval_precision": 0.9488916851742717,
93
- "train_eval_recall": 0.9477037054061244,
94
- "train_loss": 0.2088230848312378,
95
- "train_runtime": 292.1312,
96
- "train_samples_per_second": 30.192,
97
- "train_steps_per_second": 0.945
98
- },
99
- {
100
- "epoch": 4.0,
101
- "eval_accuracy": 0.9010582010582011,
102
- "eval_f1": 0.8999224906052751,
103
- "eval_loss": 0.41053256392478943,
104
- "eval_precision": 0.9025635496532717,
105
- "eval_recall": 0.9002552887231217,
106
- "eval_runtime": 125.1369,
107
- "eval_samples_per_second": 30.207,
108
- "eval_steps_per_second": 0.951,
109
- "step": 1104
110
- },
111
- {
112
- "epoch": 5.0,
113
- "step": 1380,
114
- "train_eval_accuracy": 0.9515873015873015,
115
- "train_eval_f1": 0.9516673939530801,
116
- "train_eval_loss": 0.17656771838665009,
117
- "train_eval_precision": 0.9539169437133798,
118
- "train_eval_recall": 0.9520537526614696,
119
- "train_loss": 0.1765676885843277,
120
- "train_runtime": 292.8194,
121
- "train_samples_per_second": 30.121,
122
- "train_steps_per_second": 0.943
123
- },
124
- {
125
- "epoch": 5.0,
126
- "eval_accuracy": 0.9063492063492063,
127
- "eval_f1": 0.9046138481463505,
128
- "eval_loss": 0.41682690382003784,
129
- "eval_precision": 0.9088264652953383,
130
- "eval_recall": 0.9051041885149284,
131
- "eval_runtime": 125.6464,
132
- "eval_samples_per_second": 30.084,
133
- "eval_steps_per_second": 0.947,
134
- "step": 1380
135
- },
136
- {
137
- "epoch": 6.0,
138
- "step": 1656,
139
- "train_eval_accuracy": 0.9654195011337868,
140
- "train_eval_f1": 0.9656476663607069,
141
- "train_eval_loss": 0.12671761214733124,
142
- "train_eval_precision": 0.9666620904833755,
143
- "train_eval_recall": 0.9657485060432522,
144
- "train_loss": 0.12671762704849243,
145
- "train_runtime": 292.8539,
146
- "train_samples_per_second": 30.117,
147
- "train_steps_per_second": 0.942
148
- },
149
- {
150
- "epoch": 6.0,
151
- "eval_accuracy": 0.9084656084656084,
152
- "eval_f1": 0.9069212907450369,
153
- "eval_loss": 0.41428086161613464,
154
- "eval_precision": 0.909310676401177,
155
- "eval_recall": 0.9074800568136571,
156
- "eval_runtime": 125.6663,
157
- "eval_samples_per_second": 30.08,
158
- "eval_steps_per_second": 0.947,
159
- "step": 1656
160
- },
161
- {
162
- "epoch": 7.0,
163
- "step": 1932,
164
- "train_eval_accuracy": 0.9712018140589569,
165
- "train_eval_f1": 0.9713117879463059,
166
- "train_eval_loss": 0.10472333431243896,
167
- "train_eval_precision": 0.9726857205787973,
168
- "train_eval_recall": 0.9716513762432712,
169
- "train_loss": 0.10472334921360016,
170
- "train_runtime": 293.0912,
171
- "train_samples_per_second": 30.093,
172
- "train_steps_per_second": 0.942
173
- },
174
- {
175
- "epoch": 7.0,
176
- "eval_accuracy": 0.9058201058201059,
177
- "eval_f1": 0.9040971215004513,
178
- "eval_loss": 0.4402031898498535,
179
- "eval_precision": 0.9063334381728124,
180
- "eval_recall": 0.9047346717153943,
181
- "eval_runtime": 125.6961,
182
- "eval_samples_per_second": 30.073,
183
- "eval_steps_per_second": 0.947,
184
- "step": 1932
185
- },
186
- {
187
- "epoch": 8.0,
188
- "step": 2208,
189
- "train_eval_accuracy": 0.977437641723356,
190
- "train_eval_f1": 0.9777628423711627,
191
- "train_eval_loss": 0.08053447306156158,
192
- "train_eval_precision": 0.9778969889316966,
193
- "train_eval_recall": 0.9778987153746018,
194
- "train_loss": 0.08053448051214218,
195
- "train_runtime": 293.5192,
196
- "train_samples_per_second": 30.049,
197
- "train_steps_per_second": 0.94
198
- },
199
- {
200
- "epoch": 8.0,
201
  "eval_accuracy": 0.9031746031746032,
202
- "eval_f1": 0.9017850721426728,
203
- "eval_loss": 0.45825621485710144,
204
- "eval_precision": 0.9036277073612298,
205
- "eval_recall": 0.902066631184587,
206
- "eval_runtime": 125.7628,
207
- "eval_samples_per_second": 30.057,
208
- "eval_steps_per_second": 0.946,
209
- "step": 2208
210
- },
211
- {
212
- "epoch": 8.0,
213
- "step": 2208,
214
- "total_flos": 1.85717836136448e+16,
215
- "train_loss": 0.5860137939453125,
216
- "train_runtime": 10564.8969,
217
- "train_samples_per_second": 12.523,
218
- "train_steps_per_second": 0.392
219
- },
220
- {
221
- "epoch": 8.0,
222
- "eval_accuracy": 0.9031746031746032,
223
- "eval_f1": 0.9017850721426728,
224
- "eval_loss": 0.45825621485710144,
225
- "eval_precision": 0.9036277073612298,
226
- "eval_recall": 0.902066631184587,
227
- "eval_runtime": 125.8523,
228
- "eval_samples_per_second": 30.035,
229
- "eval_steps_per_second": 0.946,
230
- "step": 2208
231
- },
232
- {
233
- "epoch": 8.0,
234
- "step": 2208,
235
- "train_en_eval_accuracy": 0.977437641723356,
236
- "train_en_eval_f1": 0.9777628423711627,
237
- "train_en_eval_loss": 0.08053447306156158,
238
- "train_en_eval_precision": 0.9778969889316966,
239
- "train_en_eval_recall": 0.9778987153746018,
240
- "train_en_loss": 0.08053448051214218,
241
- "train_en_runtime": 292.6514,
242
- "train_en_samples_per_second": 30.138,
243
- "train_en_steps_per_second": 0.943
244
- },
245
- {
246
- "epoch": 8.0,
247
- "step": 2208,
248
- "test_en_eval_accuracy": 0.9031746031746032,
249
- "test_en_eval_f1": 0.9017850721426728,
250
- "test_en_eval_loss": 0.45825621485710144,
251
- "test_en_eval_precision": 0.9036277073612298,
252
- "test_en_eval_recall": 0.902066631184587,
253
- "test_en_loss": 0.45825621485710144,
254
- "test_en_runtime": 125.7293,
255
- "test_en_samples_per_second": 30.065,
256
- "test_en_steps_per_second": 0.946
257
  }
258
  ],
259
  "logging_steps": 500,
@@ -267,13 +32,13 @@
267
  "should_epoch_stop": false,
268
  "should_evaluate": false,
269
  "should_log": false,
270
- "should_save": true,
271
  "should_training_stop": true
272
  },
273
  "attributes": {}
274
  }
275
  },
276
- "total_flos": 1.85717836136448e+16,
277
  "train_batch_size": 32,
278
  "trial_name": null,
279
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.07246376811594203,
5
  "eval_steps": 500,
6
+ "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.07246376811594203,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  "eval_accuracy": 0.9031746031746032,
14
+ "eval_f1": 0.9017334623312502,
15
+ "eval_loss": 0.45751890540122986,
16
+ "eval_precision": 0.9035223833704444,
17
+ "eval_recall": 0.9020339725952946,
18
+ "eval_runtime": 116.6553,
19
+ "eval_samples_per_second": 32.403,
20
+ "eval_steps_per_second": 1.02,
21
+ "step": 20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
22
  }
23
  ],
24
  "logging_steps": 500,
 
32
  "should_epoch_stop": false,
33
  "should_evaluate": false,
34
  "should_log": false,
35
+ "should_save": false,
36
  "should_training_stop": true
37
  },
38
  "attributes": {}
39
  }
40
  },
41
+ "total_flos": 0,
42
  "train_batch_size": 32,
43
  "trial_name": null,
44
  "trial_params": null