Motahar committed on
Commit
4b5a3e4
·
1 Parent(s): 4bd27f1

fbert-base-multilingual-cased

Browse files
bert-base-multilingual-cased/checkpoint-9000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05474ea02f6de2e39478b040f7c3f5af3a30763c083cf8672d82203ccc67312b
3
+ size 1418230501
bert-base-multilingual-cased/checkpoint-9000/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c82a7bec2885a88508bd05d5d1ef496b819ed5f71b1facf4221da0b356bb828e
3
+ size 711504429
bert-base-multilingual-cased/checkpoint-9000/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fac2e9cf43457983ddb611e0c6de63b60076585533fc091849adf1c21c4d867
3
+ size 14503
bert-base-multilingual-cased/checkpoint-9000/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f11c7c5e98873df1990f182ce66597c230d8887be63584ee197c1fa7ad0cda0
3
+ size 559
bert-base-multilingual-cased/checkpoint-9000/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c67d19c658494bfed58b35e2f3bc9b0395b4a894282a2f96d1cd187bb0d0c52e
3
+ size 623
bert-base-multilingual-cased/checkpoint-9000/special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
bert-base-multilingual-cased/checkpoint-9000/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
bert-base-multilingual-cased/checkpoint-9000/tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"do_lower_case": false, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "bert-base-multilingual-cased", "tokenizer_class": "BertTokenizer"}
bert-base-multilingual-cased/checkpoint-9000/trainer_state.json ADDED
@@ -0,0 +1,262 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.675603217158177,
3
+ "best_model_checkpoint": "./clickbait_identification/bert-base-multilingual-cased/checkpoint-9000",
4
+ "epoch": 5.948446794448117,
5
+ "global_step": 9000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.33,
12
+ "eval_accuracy": 0.6998514115898959,
13
+ "eval_f1": 0.30344827586206896,
14
+ "eval_loss": 0.5864189863204956,
15
+ "eval_precision": 0.7652173913043478,
16
+ "eval_recall": 0.18924731182795698,
17
+ "eval_runtime": 33.712,
18
+ "eval_samples_per_second": 39.926,
19
+ "eval_steps_per_second": 5.013,
20
+ "step": 500
21
+ },
22
+ {
23
+ "epoch": 0.66,
24
+ "eval_accuracy": 0.6790490341753344,
25
+ "eval_f1": 0.5893536121673003,
26
+ "eval_loss": 0.6001235842704773,
27
+ "eval_precision": 0.5281090289608177,
28
+ "eval_recall": 0.6666666666666666,
29
+ "eval_runtime": 29.7806,
30
+ "eval_samples_per_second": 45.197,
31
+ "eval_steps_per_second": 5.675,
32
+ "step": 1000
33
+ },
34
+ {
35
+ "epoch": 0.99,
36
+ "eval_accuracy": 0.7199108469539376,
37
+ "eval_f1": 0.5701254275940707,
38
+ "eval_loss": 0.5445224642753601,
39
+ "eval_precision": 0.6067961165048543,
40
+ "eval_recall": 0.5376344086021505,
41
+ "eval_runtime": 29.7385,
42
+ "eval_samples_per_second": 45.261,
43
+ "eval_steps_per_second": 5.683,
44
+ "step": 1500
45
+ },
46
+ {
47
+ "epoch": 1.0,
48
+ "learning_rate": 1.900198281559815e-05,
49
+ "loss": 0.6004,
50
+ "step": 1513
51
+ },
52
+ {
53
+ "epoch": 1.32,
54
+ "eval_accuracy": 0.7295690936106983,
55
+ "eval_f1": 0.5368956743002544,
56
+ "eval_loss": 0.5386852025985718,
57
+ "eval_precision": 0.6573208722741433,
58
+ "eval_recall": 0.45376344086021503,
59
+ "eval_runtime": 29.9406,
60
+ "eval_samples_per_second": 44.956,
61
+ "eval_steps_per_second": 5.645,
62
+ "step": 2000
63
+ },
64
+ {
65
+ "epoch": 1.65,
66
+ "eval_accuracy": 0.725854383358098,
67
+ "eval_f1": 0.6407010710808179,
68
+ "eval_loss": 0.5663045048713684,
69
+ "eval_precision": 0.5854092526690391,
70
+ "eval_recall": 0.7075268817204301,
71
+ "eval_runtime": 30.3062,
72
+ "eval_samples_per_second": 44.413,
73
+ "eval_steps_per_second": 5.576,
74
+ "step": 2500
75
+ },
76
+ {
77
+ "epoch": 1.98,
78
+ "eval_accuracy": 0.7421991084695394,
79
+ "eval_f1": 0.5873959571938168,
80
+ "eval_loss": 0.5486178994178772,
81
+ "eval_precision": 0.6569148936170213,
82
+ "eval_recall": 0.5311827956989247,
83
+ "eval_runtime": 29.7471,
84
+ "eval_samples_per_second": 45.248,
85
+ "eval_steps_per_second": 5.681,
86
+ "step": 3000
87
+ },
88
+ {
89
+ "epoch": 2.0,
90
+ "learning_rate": 1.8002643754130865e-05,
91
+ "loss": 0.5474,
92
+ "step": 3026
93
+ },
94
+ {
95
+ "epoch": 2.31,
96
+ "eval_accuracy": 0.7325408618127786,
97
+ "eval_f1": 0.5324675324675324,
98
+ "eval_loss": 0.5591620206832886,
99
+ "eval_precision": 0.6721311475409836,
100
+ "eval_recall": 0.44086021505376344,
101
+ "eval_runtime": 29.7683,
102
+ "eval_samples_per_second": 45.216,
103
+ "eval_steps_per_second": 5.677,
104
+ "step": 3500
105
+ },
106
+ {
107
+ "epoch": 2.64,
108
+ "eval_accuracy": 0.7310549777117384,
109
+ "eval_f1": 0.6387225548902197,
110
+ "eval_loss": 0.5655362606048584,
111
+ "eval_precision": 0.595903165735568,
112
+ "eval_recall": 0.6881720430107527,
113
+ "eval_runtime": 29.9403,
114
+ "eval_samples_per_second": 44.956,
115
+ "eval_steps_per_second": 5.645,
116
+ "step": 4000
117
+ },
118
+ {
119
+ "epoch": 2.97,
120
+ "eval_accuracy": 0.7511144130757801,
121
+ "eval_f1": 0.6447507953340403,
122
+ "eval_loss": 0.5128304362297058,
123
+ "eval_precision": 0.6359832635983264,
124
+ "eval_recall": 0.6537634408602151,
125
+ "eval_runtime": 30.3031,
126
+ "eval_samples_per_second": 44.418,
127
+ "eval_steps_per_second": 5.577,
128
+ "step": 4500
129
+ },
130
+ {
131
+ "epoch": 3.0,
132
+ "learning_rate": 1.7003304692663586e-05,
133
+ "loss": 0.5233,
134
+ "step": 4539
135
+ },
136
+ {
137
+ "epoch": 3.3,
138
+ "eval_accuracy": 0.7288261515601783,
139
+ "eval_f1": 0.6473429951690822,
140
+ "eval_loss": 0.5453668236732483,
141
+ "eval_precision": 0.5877192982456141,
142
+ "eval_recall": 0.7204301075268817,
143
+ "eval_runtime": 29.7531,
144
+ "eval_samples_per_second": 45.239,
145
+ "eval_steps_per_second": 5.68,
146
+ "step": 5000
147
+ },
148
+ {
149
+ "epoch": 3.64,
150
+ "eval_accuracy": 0.7139673105497771,
151
+ "eval_f1": 0.6471127406049496,
152
+ "eval_loss": 0.5753292441368103,
153
+ "eval_precision": 0.5638977635782748,
154
+ "eval_recall": 0.7591397849462366,
155
+ "eval_runtime": 29.7709,
156
+ "eval_samples_per_second": 45.212,
157
+ "eval_steps_per_second": 5.677,
158
+ "step": 5500
159
+ },
160
+ {
161
+ "epoch": 3.97,
162
+ "eval_accuracy": 0.7459138187221397,
163
+ "eval_f1": 0.6633858267716536,
164
+ "eval_loss": 0.5507068634033203,
165
+ "eval_precision": 0.6116152450090744,
166
+ "eval_recall": 0.7247311827956989,
167
+ "eval_runtime": 29.958,
168
+ "eval_samples_per_second": 44.93,
169
+ "eval_steps_per_second": 5.641,
170
+ "step": 6000
171
+ },
172
+ {
173
+ "epoch": 4.0,
174
+ "learning_rate": 1.60039656311963e-05,
175
+ "loss": 0.508,
176
+ "step": 6052
177
+ },
178
+ {
179
+ "epoch": 4.3,
180
+ "eval_accuracy": 0.7399702823179792,
181
+ "eval_f1": 0.6478873239436621,
182
+ "eval_loss": 0.5609683394432068,
183
+ "eval_precision": 0.6086956521739131,
184
+ "eval_recall": 0.6924731182795699,
185
+ "eval_runtime": 30.321,
186
+ "eval_samples_per_second": 44.392,
187
+ "eval_steps_per_second": 5.574,
188
+ "step": 6500
189
+ },
190
+ {
191
+ "epoch": 4.63,
192
+ "eval_accuracy": 0.7555720653789004,
193
+ "eval_f1": 0.6496272630457934,
194
+ "eval_loss": 0.5197449326515198,
195
+ "eval_precision": 0.6434599156118144,
196
+ "eval_recall": 0.6559139784946236,
197
+ "eval_runtime": 29.7694,
198
+ "eval_samples_per_second": 45.214,
199
+ "eval_steps_per_second": 5.677,
200
+ "step": 7000
201
+ },
202
+ {
203
+ "epoch": 4.96,
204
+ "eval_accuracy": 0.7555720653789004,
205
+ "eval_f1": 0.6404371584699454,
206
+ "eval_loss": 0.5097370147705078,
207
+ "eval_precision": 0.6511111111111111,
208
+ "eval_recall": 0.6301075268817204,
209
+ "eval_runtime": 29.7687,
210
+ "eval_samples_per_second": 45.215,
211
+ "eval_steps_per_second": 5.677,
212
+ "step": 7500
213
+ },
214
+ {
215
+ "epoch": 5.0,
216
+ "learning_rate": 1.50039656311963e-05,
217
+ "loss": 0.4929,
218
+ "step": 7565
219
+ },
220
+ {
221
+ "epoch": 5.29,
222
+ "eval_accuracy": 0.7421991084695394,
223
+ "eval_f1": 0.669838249286394,
224
+ "eval_loss": 0.5773559212684631,
225
+ "eval_precision": 0.6006825938566553,
226
+ "eval_recall": 0.7569892473118279,
227
+ "eval_runtime": 29.971,
228
+ "eval_samples_per_second": 44.91,
229
+ "eval_steps_per_second": 5.639,
230
+ "step": 8000
231
+ },
232
+ {
233
+ "epoch": 5.62,
234
+ "eval_accuracy": 0.7444279346210996,
235
+ "eval_f1": 0.6614173228346457,
236
+ "eval_loss": 0.5227199792861938,
237
+ "eval_precision": 0.6098003629764065,
238
+ "eval_recall": 0.7225806451612903,
239
+ "eval_runtime": 30.0099,
240
+ "eval_samples_per_second": 44.852,
241
+ "eval_steps_per_second": 5.631,
242
+ "step": 8500
243
+ },
244
+ {
245
+ "epoch": 5.95,
246
+ "eval_accuracy": 0.7303120356612184,
247
+ "eval_f1": 0.675603217158177,
248
+ "eval_loss": 0.5550133585929871,
249
+ "eval_precision": 0.5779816513761468,
250
+ "eval_recall": 0.8129032258064516,
251
+ "eval_runtime": 30.134,
252
+ "eval_samples_per_second": 44.667,
253
+ "eval_steps_per_second": 5.608,
254
+ "step": 9000
255
+ }
256
+ ],
257
+ "max_steps": 30260,
258
+ "num_train_epochs": 20,
259
+ "total_flos": 0.0,
260
+ "trial_name": null,
261
+ "trial_params": null
262
+ }
bert-base-multilingual-cased/checkpoint-9000/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:192706f865a7bca1b262339da824cc7edc0bced2eebaf146f2e2bc22537dc94c
3
+ size 3055
bert-base-multilingual-cased/checkpoint-9000/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
bert-base-multilingual-cased/runs/Jan13_09-50-21_22ece1fdce42/1642067432.1696281/events.out.tfevents.1642067432.22ece1fdce42.3471.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3267e2981dc9d92193e3d13d4525b70e94786068d39876e4c59f3fdff862293
3
+ size 4845
bert-base-multilingual-cased/runs/Jan13_09-50-21_22ece1fdce42/events.out.tfevents.1642067432.22ece1fdce42.3471.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d24ef3f85fbd1fa87fdd7feefaa7d59e7469d73a2b85aa472d8fff7a0a04e7b1
3
+ size 12572