Training in progress, epoch 1
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- model.safetensors +1 -1
- run-0/checkpoint-117/model.safetensors +1 -1
- run-0/checkpoint-117/optimizer.pt +1 -1
- run-0/checkpoint-117/scheduler.pt +1 -1
- run-0/checkpoint-117/trainer_state.json +20 -20
- run-0/checkpoint-117/training_args.bin +1 -1
- run-0/checkpoint-156/model.safetensors +1 -1
- run-0/checkpoint-156/optimizer.pt +1 -1
- run-0/checkpoint-156/scheduler.pt +1 -1
- run-0/checkpoint-156/trainer_state.json +24 -24
- run-0/checkpoint-156/training_args.bin +1 -1
- run-0/checkpoint-195/model.safetensors +1 -1
- run-0/checkpoint-195/optimizer.pt +1 -1
- run-0/checkpoint-195/scheduler.pt +1 -1
- run-0/checkpoint-195/trainer_state.json +29 -29
- run-0/checkpoint-195/training_args.bin +1 -1
- run-0/checkpoint-78/model.safetensors +1 -1
- run-0/checkpoint-78/optimizer.pt +1 -1
- run-0/checkpoint-78/scheduler.pt +1 -1
- run-0/checkpoint-78/trainer_state.json +16 -16
- run-0/checkpoint-78/training_args.bin +1 -1
- run-1/checkpoint-117/model.safetensors +1 -1
- run-1/checkpoint-117/optimizer.pt +1 -1
- run-1/checkpoint-117/trainer_state.json +17 -17
- run-1/checkpoint-117/training_args.bin +1 -1
- run-1/checkpoint-156/model.safetensors +1 -1
- run-1/checkpoint-156/optimizer.pt +1 -1
- run-1/checkpoint-156/trainer_state.json +22 -22
- run-1/checkpoint-156/training_args.bin +1 -1
- run-1/checkpoint-195/model.safetensors +1 -1
- run-1/checkpoint-195/optimizer.pt +1 -1
- run-1/checkpoint-195/trainer_state.json +27 -27
- run-1/checkpoint-195/training_args.bin +1 -1
- run-1/checkpoint-39/model.safetensors +1 -1
- run-1/checkpoint-39/optimizer.pt +1 -1
- run-1/checkpoint-39/trainer_state.json +6 -6
- run-1/checkpoint-39/training_args.bin +1 -1
- run-1/checkpoint-78/model.safetensors +1 -1
- run-1/checkpoint-78/optimizer.pt +1 -1
- run-1/checkpoint-78/trainer_state.json +11 -11
- run-1/checkpoint-78/training_args.bin +1 -1
- run-2/checkpoint-117/model.safetensors +1 -1
- run-2/checkpoint-117/optimizer.pt +1 -1
- run-2/checkpoint-117/trainer_state.json +16 -16
- run-2/checkpoint-117/training_args.bin +1 -1
- run-2/checkpoint-156/model.safetensors +1 -1
- run-2/checkpoint-156/optimizer.pt +1 -1
- run-2/checkpoint-156/trainer_state.json +23 -23
- run-2/checkpoint-156/training_args.bin +1 -1
- run-2/checkpoint-195/model.safetensors +1 -1
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:037031c0588abe3648a2177d448c4f64586291910d904d4aeedabe446ba66111
|
3 |
size 437958648
|
run-0/checkpoint-117/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c802ec515bc86042cdf8b15c8b139fa0f9cf6ca850b5573e82a8a229503bd37
|
3 |
size 437958648
|
run-0/checkpoint-117/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e87c9c15e82618884edf2708969a5b156acbfe11a90c8b8aff20c1bec639402e
|
3 |
size 876038394
|
run-0/checkpoint-117/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b52c2b12734a8e47563cebc4f66b329836ea028b2a85fbfd91dadd377531bfe
|
3 |
size 1064
|
run-0/checkpoint-117/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"best_global_step": 117,
|
3 |
-
"best_metric": 0.
|
4 |
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-117",
|
5 |
"epoch": 3.0,
|
6 |
"eval_steps": 500,
|
@@ -11,36 +11,36 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second": 14.
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second": 14.
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
-
"eval_accuracy": 0.
|
33 |
-
"eval_loss": 0.
|
34 |
-
"eval_runtime": 0.
|
35 |
-
"eval_samples_per_second":
|
36 |
-
"eval_steps_per_second":
|
37 |
"step": 117
|
38 |
}
|
39 |
],
|
40 |
"logging_steps": 500,
|
41 |
-
"max_steps":
|
42 |
"num_input_tokens_seen": 0,
|
43 |
-
"num_train_epochs":
|
44 |
"save_steps": 500,
|
45 |
"stateful_callbacks": {
|
46 |
"TrainerControl": {
|
@@ -49,7 +49,7 @@
|
|
49 |
"should_evaluate": false,
|
50 |
"should_log": false,
|
51 |
"should_save": true,
|
52 |
-
"should_training_stop":
|
53 |
},
|
54 |
"attributes": {}
|
55 |
}
|
@@ -61,7 +61,7 @@
|
|
61 |
"dropout_rate": 0.0134,
|
62 |
"learning_rate": 0.0001,
|
63 |
"max_length": 32,
|
64 |
-
"num_train_epochs":
|
65 |
"per_device_train_batch_size": 64
|
66 |
}
|
67 |
}
|
|
|
1 |
{
|
2 |
"best_global_step": 117,
|
3 |
+
"best_metric": 0.6931407942238267,
|
4 |
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-117",
|
5 |
"epoch": 3.0,
|
6 |
"eval_steps": 500,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6245487364620939,
|
15 |
+
"eval_loss": 0.6344426274299622,
|
16 |
+
"eval_runtime": 0.6369,
|
17 |
+
"eval_samples_per_second": 434.892,
|
18 |
+
"eval_steps_per_second": 14.13,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6606498194945848,
|
24 |
+
"eval_loss": 0.6399555802345276,
|
25 |
+
"eval_runtime": 0.6384,
|
26 |
+
"eval_samples_per_second": 433.892,
|
27 |
+
"eval_steps_per_second": 14.098,
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
+
"eval_accuracy": 0.6931407942238267,
|
33 |
+
"eval_loss": 0.7489305734634399,
|
34 |
+
"eval_runtime": 0.6376,
|
35 |
+
"eval_samples_per_second": 434.416,
|
36 |
+
"eval_steps_per_second": 14.115,
|
37 |
"step": 117
|
38 |
}
|
39 |
],
|
40 |
"logging_steps": 500,
|
41 |
+
"max_steps": 195,
|
42 |
"num_input_tokens_seen": 0,
|
43 |
+
"num_train_epochs": 5,
|
44 |
"save_steps": 500,
|
45 |
"stateful_callbacks": {
|
46 |
"TrainerControl": {
|
|
|
49 |
"should_evaluate": false,
|
50 |
"should_log": false,
|
51 |
"should_save": true,
|
52 |
+
"should_training_stop": false
|
53 |
},
|
54 |
"attributes": {}
|
55 |
}
|
|
|
61 |
"dropout_rate": 0.0134,
|
62 |
"learning_rate": 0.0001,
|
63 |
"max_length": 32,
|
64 |
+
"num_train_epochs": 5,
|
65 |
"per_device_train_batch_size": 64
|
66 |
}
|
67 |
}
|
run-0/checkpoint-117/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638657d2294b16b6a018ef8c4921c705157459687a72f242b7f437400a9b1e8a
|
3 |
size 5432
|
run-0/checkpoint-156/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5db92fb8a00f8c2455466018148153ef5f020c57f80a395281a30e8736e91a23
|
3 |
size 437958648
|
run-0/checkpoint-156/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a0751d6ff4e94e130c1204c790ff869f7b223d5558f613fd95b01591686a496
|
3 |
size 876038394
|
run-0/checkpoint-156/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64871ea17abfaf974175c856702e9195f2d949b9a3207a0265bff73135f4adeb
|
3 |
size 1064
|
run-0/checkpoint-156/trainer_state.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"best_global_step":
|
3 |
-
"best_metric": 0.
|
4 |
-
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-
|
5 |
"epoch": 4.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 156,
|
@@ -11,38 +11,38 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second": 14.
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss":
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second": 14.
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
-
"eval_accuracy": 0.
|
33 |
-
"eval_loss": 0.
|
34 |
-
"eval_runtime": 0.
|
35 |
-
"eval_samples_per_second":
|
36 |
-
"eval_steps_per_second": 14.
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
-
"eval_accuracy": 0.
|
42 |
-
"eval_loss": 0.
|
43 |
-
"eval_runtime": 0.
|
44 |
-
"eval_samples_per_second":
|
45 |
-
"eval_steps_per_second": 14.
|
46 |
"step": 156
|
47 |
}
|
48 |
],
|
@@ -68,7 +68,7 @@
|
|
68 |
"trial_name": null,
|
69 |
"trial_params": {
|
70 |
"dropout_rate": 0.0134,
|
71 |
-
"learning_rate": 0.
|
72 |
"max_length": 32,
|
73 |
"num_train_epochs": 5,
|
74 |
"per_device_train_batch_size": 64
|
|
|
1 |
{
|
2 |
+
"best_global_step": 156,
|
3 |
+
"best_metric": 0.7111913357400722,
|
4 |
+
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-156",
|
5 |
"epoch": 4.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 156,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6245487364620939,
|
15 |
+
"eval_loss": 0.6344426274299622,
|
16 |
+
"eval_runtime": 0.6369,
|
17 |
+
"eval_samples_per_second": 434.892,
|
18 |
+
"eval_steps_per_second": 14.13,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6606498194945848,
|
24 |
+
"eval_loss": 0.6399555802345276,
|
25 |
+
"eval_runtime": 0.6384,
|
26 |
+
"eval_samples_per_second": 433.892,
|
27 |
+
"eval_steps_per_second": 14.098,
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
+
"eval_accuracy": 0.6931407942238267,
|
33 |
+
"eval_loss": 0.7489305734634399,
|
34 |
+
"eval_runtime": 0.6376,
|
35 |
+
"eval_samples_per_second": 434.416,
|
36 |
+
"eval_steps_per_second": 14.115,
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
+
"eval_accuracy": 0.7111913357400722,
|
42 |
+
"eval_loss": 0.9546563029289246,
|
43 |
+
"eval_runtime": 0.6421,
|
44 |
+
"eval_samples_per_second": 431.374,
|
45 |
+
"eval_steps_per_second": 14.016,
|
46 |
"step": 156
|
47 |
}
|
48 |
],
|
|
|
68 |
"trial_name": null,
|
69 |
"trial_params": {
|
70 |
"dropout_rate": 0.0134,
|
71 |
+
"learning_rate": 0.0001,
|
72 |
"max_length": 32,
|
73 |
"num_train_epochs": 5,
|
74 |
"per_device_train_batch_size": 64
|
run-0/checkpoint-156/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638657d2294b16b6a018ef8c4921c705157459687a72f242b7f437400a9b1e8a
|
3 |
size 5432
|
run-0/checkpoint-195/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:617e561d87a0a00190966fad2e666cfc7c7511275a22ab5451714d514b3d047c
|
3 |
size 437958648
|
run-0/checkpoint-195/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd14c0c2fd8af6ba25e630124589880ec3c065718165595a3f67e870ae299b5f
|
3 |
size 876038394
|
run-0/checkpoint-195/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7535d6d6d3346211338a559c66a34e5433ea456734f0f5c94e8703828d95ba57
|
3 |
size 1064
|
run-0/checkpoint-195/trainer_state.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"best_global_step":
|
3 |
-
"best_metric": 0.
|
4 |
-
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-
|
5 |
"epoch": 5.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 195,
|
@@ -11,47 +11,47 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second": 14.
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss":
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second": 14.
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
-
"eval_accuracy": 0.
|
33 |
-
"eval_loss": 0.
|
34 |
-
"eval_runtime": 0.
|
35 |
-
"eval_samples_per_second":
|
36 |
-
"eval_steps_per_second": 14.
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
-
"eval_accuracy": 0.
|
42 |
-
"eval_loss": 0.
|
43 |
-
"eval_runtime": 0.
|
44 |
-
"eval_samples_per_second":
|
45 |
-
"eval_steps_per_second": 14.
|
46 |
"step": 156
|
47 |
},
|
48 |
{
|
49 |
"epoch": 5.0,
|
50 |
-
"eval_accuracy": 0.
|
51 |
-
"eval_loss":
|
52 |
-
"eval_runtime": 0.
|
53 |
-
"eval_samples_per_second":
|
54 |
-
"eval_steps_per_second":
|
55 |
"step": 195
|
56 |
}
|
57 |
],
|
@@ -77,7 +77,7 @@
|
|
77 |
"trial_name": null,
|
78 |
"trial_params": {
|
79 |
"dropout_rate": 0.0134,
|
80 |
-
"learning_rate": 0.
|
81 |
"max_length": 32,
|
82 |
"num_train_epochs": 5,
|
83 |
"per_device_train_batch_size": 64
|
|
|
1 |
{
|
2 |
+
"best_global_step": 156,
|
3 |
+
"best_metric": 0.7111913357400722,
|
4 |
+
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-156",
|
5 |
"epoch": 5.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 195,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6245487364620939,
|
15 |
+
"eval_loss": 0.6344426274299622,
|
16 |
+
"eval_runtime": 0.6369,
|
17 |
+
"eval_samples_per_second": 434.892,
|
18 |
+
"eval_steps_per_second": 14.13,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6606498194945848,
|
24 |
+
"eval_loss": 0.6399555802345276,
|
25 |
+
"eval_runtime": 0.6384,
|
26 |
+
"eval_samples_per_second": 433.892,
|
27 |
+
"eval_steps_per_second": 14.098,
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
+
"eval_accuracy": 0.6931407942238267,
|
33 |
+
"eval_loss": 0.7489305734634399,
|
34 |
+
"eval_runtime": 0.6376,
|
35 |
+
"eval_samples_per_second": 434.416,
|
36 |
+
"eval_steps_per_second": 14.115,
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
+
"eval_accuracy": 0.7111913357400722,
|
42 |
+
"eval_loss": 0.9546563029289246,
|
43 |
+
"eval_runtime": 0.6421,
|
44 |
+
"eval_samples_per_second": 431.374,
|
45 |
+
"eval_steps_per_second": 14.016,
|
46 |
"step": 156
|
47 |
},
|
48 |
{
|
49 |
"epoch": 5.0,
|
50 |
+
"eval_accuracy": 0.703971119133574,
|
51 |
+
"eval_loss": 1.0655008554458618,
|
52 |
+
"eval_runtime": 0.6437,
|
53 |
+
"eval_samples_per_second": 430.356,
|
54 |
+
"eval_steps_per_second": 13.983,
|
55 |
"step": 195
|
56 |
}
|
57 |
],
|
|
|
77 |
"trial_name": null,
|
78 |
"trial_params": {
|
79 |
"dropout_rate": 0.0134,
|
80 |
+
"learning_rate": 0.0001,
|
81 |
"max_length": 32,
|
82 |
"num_train_epochs": 5,
|
83 |
"per_device_train_batch_size": 64
|
run-0/checkpoint-195/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638657d2294b16b6a018ef8c4921c705157459687a72f242b7f437400a9b1e8a
|
3 |
size 5432
|
run-0/checkpoint-78/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:095c36a06fc2953f3fa1e12dc8abd3e9cb7f7fc377af4df1c2846b1e859eac15
|
3 |
size 437958648
|
run-0/checkpoint-78/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ebe11ec5538d8ded7bd7bc7188f64ccb65bcd4808f2f1e366db5c204845b326
|
3 |
size 876038394
|
run-0/checkpoint-78/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb667ae3b67495afb6dd345289d7886f47c7be4d88545cef5fd8a2859941ae93
|
3 |
size 1064
|
run-0/checkpoint-78/trainer_state.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"best_global_step":
|
3 |
-
"best_metric": 0.
|
4 |
-
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-
|
5 |
"epoch": 2.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 78,
|
@@ -11,27 +11,27 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second": 14.
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second": 14.
|
28 |
"step": 78
|
29 |
}
|
30 |
],
|
31 |
"logging_steps": 500,
|
32 |
-
"max_steps":
|
33 |
"num_input_tokens_seen": 0,
|
34 |
-
"num_train_epochs":
|
35 |
"save_steps": 500,
|
36 |
"stateful_callbacks": {
|
37 |
"TrainerControl": {
|
@@ -52,7 +52,7 @@
|
|
52 |
"dropout_rate": 0.0134,
|
53 |
"learning_rate": 0.0001,
|
54 |
"max_length": 32,
|
55 |
-
"num_train_epochs":
|
56 |
"per_device_train_batch_size": 64
|
57 |
}
|
58 |
}
|
|
|
1 |
{
|
2 |
+
"best_global_step": 78,
|
3 |
+
"best_metric": 0.6606498194945848,
|
4 |
+
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-78",
|
5 |
"epoch": 2.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 78,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6245487364620939,
|
15 |
+
"eval_loss": 0.6344426274299622,
|
16 |
+
"eval_runtime": 0.6369,
|
17 |
+
"eval_samples_per_second": 434.892,
|
18 |
+
"eval_steps_per_second": 14.13,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6606498194945848,
|
24 |
+
"eval_loss": 0.6399555802345276,
|
25 |
+
"eval_runtime": 0.6384,
|
26 |
+
"eval_samples_per_second": 433.892,
|
27 |
+
"eval_steps_per_second": 14.098,
|
28 |
"step": 78
|
29 |
}
|
30 |
],
|
31 |
"logging_steps": 500,
|
32 |
+
"max_steps": 195,
|
33 |
"num_input_tokens_seen": 0,
|
34 |
+
"num_train_epochs": 5,
|
35 |
"save_steps": 500,
|
36 |
"stateful_callbacks": {
|
37 |
"TrainerControl": {
|
|
|
52 |
"dropout_rate": 0.0134,
|
53 |
"learning_rate": 0.0001,
|
54 |
"max_length": 32,
|
55 |
+
"num_train_epochs": 5,
|
56 |
"per_device_train_batch_size": 64
|
57 |
}
|
58 |
}
|
run-0/checkpoint-78/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638657d2294b16b6a018ef8c4921c705157459687a72f242b7f437400a9b1e8a
|
3 |
size 5432
|
run-1/checkpoint-117/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:679e027e39e2e1b7b9e1240bb8d9f42125967b9daf06e4768ab77daf28fa7315
|
3 |
size 437958648
|
run-1/checkpoint-117/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f80bde91e09964025f09bae3e83f85e29f7fea36ff0e59ca2d24f18de39b3e34
|
3 |
size 876038394
|
run-1/checkpoint-117/trainer_state.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"best_global_step":
|
3 |
"best_metric": 0.6895306859205776,
|
4 |
-
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-1/checkpoint-
|
5 |
"epoch": 3.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 117,
|
@@ -11,29 +11,29 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second": 14.
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second": 14.
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
-
"eval_accuracy": 0.
|
33 |
-
"eval_loss": 0.
|
34 |
-
"eval_runtime": 0.
|
35 |
-
"eval_samples_per_second":
|
36 |
-
"eval_steps_per_second":
|
37 |
"step": 117
|
38 |
}
|
39 |
],
|
|
|
1 |
{
|
2 |
+
"best_global_step": 78,
|
3 |
"best_metric": 0.6895306859205776,
|
4 |
+
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-1/checkpoint-78",
|
5 |
"epoch": 3.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 117,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6570397111913358,
|
15 |
+
"eval_loss": 0.6302457451820374,
|
16 |
+
"eval_runtime": 0.6387,
|
17 |
+
"eval_samples_per_second": 433.698,
|
18 |
+
"eval_steps_per_second": 14.091,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6895306859205776,
|
24 |
+
"eval_loss": 0.6575530171394348,
|
25 |
+
"eval_runtime": 0.6355,
|
26 |
+
"eval_samples_per_second": 435.845,
|
27 |
+
"eval_steps_per_second": 14.161,
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
+
"eval_accuracy": 0.6714801444043321,
|
33 |
+
"eval_loss": 0.7819653749465942,
|
34 |
+
"eval_runtime": 0.6474,
|
35 |
+
"eval_samples_per_second": 427.864,
|
36 |
+
"eval_steps_per_second": 13.902,
|
37 |
"step": 117
|
38 |
}
|
39 |
],
|
run-1/checkpoint-117/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638657d2294b16b6a018ef8c4921c705157459687a72f242b7f437400a9b1e8a
|
3 |
size 5432
|
run-1/checkpoint-156/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7a529cdb7fd45102ca4e5cb191f5b15052e08493cc3b511561fe9e04e22fa30
|
3 |
size 437958648
|
run-1/checkpoint-156/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c36cbf4150836ab18a04c1215688af6efe06fb5929a0244861ffd82e52fd8f64
|
3 |
size 876038394
|
run-1/checkpoint-156/trainer_state.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"best_global_step":
|
3 |
"best_metric": 0.6895306859205776,
|
4 |
-
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-1/checkpoint-
|
5 |
"epoch": 4.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 156,
|
@@ -11,38 +11,38 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second": 14.
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second": 14.
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
-
"eval_accuracy": 0.
|
33 |
-
"eval_loss": 0.
|
34 |
-
"eval_runtime": 0.
|
35 |
-
"eval_samples_per_second":
|
36 |
-
"eval_steps_per_second":
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
-
"eval_accuracy": 0.
|
42 |
-
"eval_loss":
|
43 |
-
"eval_runtime": 0.
|
44 |
-
"eval_samples_per_second":
|
45 |
-
"eval_steps_per_second":
|
46 |
"step": 156
|
47 |
}
|
48 |
],
|
|
|
1 |
{
|
2 |
+
"best_global_step": 78,
|
3 |
"best_metric": 0.6895306859205776,
|
4 |
+
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-1/checkpoint-78",
|
5 |
"epoch": 4.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 156,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6570397111913358,
|
15 |
+
"eval_loss": 0.6302457451820374,
|
16 |
+
"eval_runtime": 0.6387,
|
17 |
+
"eval_samples_per_second": 433.698,
|
18 |
+
"eval_steps_per_second": 14.091,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6895306859205776,
|
24 |
+
"eval_loss": 0.6575530171394348,
|
25 |
+
"eval_runtime": 0.6355,
|
26 |
+
"eval_samples_per_second": 435.845,
|
27 |
+
"eval_steps_per_second": 14.161,
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
+
"eval_accuracy": 0.6714801444043321,
|
33 |
+
"eval_loss": 0.7819653749465942,
|
34 |
+
"eval_runtime": 0.6474,
|
35 |
+
"eval_samples_per_second": 427.864,
|
36 |
+
"eval_steps_per_second": 13.902,
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
+
"eval_accuracy": 0.6859205776173285,
|
42 |
+
"eval_loss": 1.0000327825546265,
|
43 |
+
"eval_runtime": 0.6479,
|
44 |
+
"eval_samples_per_second": 427.507,
|
45 |
+
"eval_steps_per_second": 13.89,
|
46 |
"step": 156
|
47 |
}
|
48 |
],
|
run-1/checkpoint-156/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638657d2294b16b6a018ef8c4921c705157459687a72f242b7f437400a9b1e8a
|
3 |
size 5432
|
run-1/checkpoint-195/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f5f943346824275e0a0240c4c5c24abddae8a7d72a96a13f1cfb452f98b188e
|
3 |
size 437958648
|
run-1/checkpoint-195/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66c84c6a45cf5fb5f95ce3b7f54adabe8e2019bcda952dbcb3aca1ace4fccb6d
|
3 |
size 876038394
|
run-1/checkpoint-195/trainer_state.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"best_global_step":
|
3 |
"best_metric": 0.6895306859205776,
|
4 |
-
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-1/checkpoint-
|
5 |
"epoch": 5.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 195,
|
@@ -11,47 +11,47 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second": 14.
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second": 14.
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
-
"eval_accuracy": 0.
|
33 |
-
"eval_loss": 0.
|
34 |
-
"eval_runtime": 0.
|
35 |
-
"eval_samples_per_second":
|
36 |
-
"eval_steps_per_second":
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
-
"eval_accuracy": 0.
|
42 |
-
"eval_loss":
|
43 |
-
"eval_runtime": 0.
|
44 |
-
"eval_samples_per_second":
|
45 |
-
"eval_steps_per_second":
|
46 |
"step": 156
|
47 |
},
|
48 |
{
|
49 |
"epoch": 5.0,
|
50 |
-
"eval_accuracy": 0.
|
51 |
-
"eval_loss": 1.
|
52 |
-
"eval_runtime": 0.
|
53 |
-
"eval_samples_per_second":
|
54 |
-
"eval_steps_per_second": 14.
|
55 |
"step": 195
|
56 |
}
|
57 |
],
|
|
|
1 |
{
|
2 |
+
"best_global_step": 78,
|
3 |
"best_metric": 0.6895306859205776,
|
4 |
+
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-1/checkpoint-78",
|
5 |
"epoch": 5.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 195,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6570397111913358,
|
15 |
+
"eval_loss": 0.6302457451820374,
|
16 |
+
"eval_runtime": 0.6387,
|
17 |
+
"eval_samples_per_second": 433.698,
|
18 |
+
"eval_steps_per_second": 14.091,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6895306859205776,
|
24 |
+
"eval_loss": 0.6575530171394348,
|
25 |
+
"eval_runtime": 0.6355,
|
26 |
+
"eval_samples_per_second": 435.845,
|
27 |
+
"eval_steps_per_second": 14.161,
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
+
"eval_accuracy": 0.6714801444043321,
|
33 |
+
"eval_loss": 0.7819653749465942,
|
34 |
+
"eval_runtime": 0.6474,
|
35 |
+
"eval_samples_per_second": 427.864,
|
36 |
+
"eval_steps_per_second": 13.902,
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
+
"eval_accuracy": 0.6859205776173285,
|
42 |
+
"eval_loss": 1.0000327825546265,
|
43 |
+
"eval_runtime": 0.6479,
|
44 |
+
"eval_samples_per_second": 427.507,
|
45 |
+
"eval_steps_per_second": 13.89,
|
46 |
"step": 156
|
47 |
},
|
48 |
{
|
49 |
"epoch": 5.0,
|
50 |
+
"eval_accuracy": 0.6750902527075813,
|
51 |
+
"eval_loss": 1.1014820337295532,
|
52 |
+
"eval_runtime": 0.637,
|
53 |
+
"eval_samples_per_second": 434.837,
|
54 |
+
"eval_steps_per_second": 14.128,
|
55 |
"step": 195
|
56 |
}
|
57 |
],
|
run-1/checkpoint-195/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638657d2294b16b6a018ef8c4921c705157459687a72f242b7f437400a9b1e8a
|
3 |
size 5432
|
run-1/checkpoint-39/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4950ee24f30f03a15da573885ef4f5a550ec43401bd10183ed896ec546cb2b94
|
3 |
size 437958648
|
run-1/checkpoint-39/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:454df7d9bd4efad84c1ff895b9d617d3ea94beba61c8912b16c69a42d94a254a
|
3 |
size 876038394
|
run-1/checkpoint-39/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"best_global_step": 39,
|
3 |
-
"best_metric": 0.
|
4 |
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-1/checkpoint-39",
|
5 |
"epoch": 1.0,
|
6 |
"eval_steps": 500,
|
@@ -11,11 +11,11 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second": 14.
|
19 |
"step": 39
|
20 |
}
|
21 |
],
|
|
|
1 |
{
|
2 |
"best_global_step": 39,
|
3 |
+
"best_metric": 0.6570397111913358,
|
4 |
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-1/checkpoint-39",
|
5 |
"epoch": 1.0,
|
6 |
"eval_steps": 500,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6570397111913358,
|
15 |
+
"eval_loss": 0.6302457451820374,
|
16 |
+
"eval_runtime": 0.6387,
|
17 |
+
"eval_samples_per_second": 433.698,
|
18 |
+
"eval_steps_per_second": 14.091,
|
19 |
"step": 39
|
20 |
}
|
21 |
],
|
run-1/checkpoint-39/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638657d2294b16b6a018ef8c4921c705157459687a72f242b7f437400a9b1e8a
|
3 |
size 5432
|
run-1/checkpoint-78/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf1e36fde00996e3f2b73551fcd782119ce7c5d0a6afaa777a1c8449968bf933
|
3 |
size 437958648
|
run-1/checkpoint-78/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ea17d384de4432779b205f7807510f44ae5c1174daabaaf9f252bfed0a817a6
|
3 |
size 876038394
|
run-1/checkpoint-78/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"best_global_step": 78,
|
3 |
-
"best_metric": 0.
|
4 |
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-1/checkpoint-78",
|
5 |
"epoch": 2.0,
|
6 |
"eval_steps": 500,
|
@@ -11,20 +11,20 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second": 14.
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second": 14.
|
28 |
"step": 78
|
29 |
}
|
30 |
],
|
|
|
1 |
{
|
2 |
"best_global_step": 78,
|
3 |
+
"best_metric": 0.6895306859205776,
|
4 |
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-1/checkpoint-78",
|
5 |
"epoch": 2.0,
|
6 |
"eval_steps": 500,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6570397111913358,
|
15 |
+
"eval_loss": 0.6302457451820374,
|
16 |
+
"eval_runtime": 0.6387,
|
17 |
+
"eval_samples_per_second": 433.698,
|
18 |
+
"eval_steps_per_second": 14.091,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6895306859205776,
|
24 |
+
"eval_loss": 0.6575530171394348,
|
25 |
+
"eval_runtime": 0.6355,
|
26 |
+
"eval_samples_per_second": 435.845,
|
27 |
+
"eval_steps_per_second": 14.161,
|
28 |
"step": 78
|
29 |
}
|
30 |
],
|
run-1/checkpoint-78/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638657d2294b16b6a018ef8c4921c705157459687a72f242b7f437400a9b1e8a
|
3 |
size 5432
|
run-2/checkpoint-117/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:908f5f76525e7b3ec579e59ddb340c506d961630672efe1f4f731a2a14813c5d
|
3 |
size 437958648
|
run-2/checkpoint-117/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b61bb77c00282985cf555c2428aeed3ddb9dd975bf4e47ef8332af46e78eb903
|
3 |
size 876038394
|
run-2/checkpoint-117/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"best_global_step": 117,
|
3 |
-
"best_metric": 0.
|
4 |
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-2/checkpoint-117",
|
5 |
"epoch": 3.0,
|
6 |
"eval_steps": 500,
|
@@ -11,29 +11,29 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second": 435.
|
18 |
-
"eval_steps_per_second": 14.
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second": 14.
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
-
"eval_accuracy": 0.
|
33 |
-
"eval_loss": 0.
|
34 |
-
"eval_runtime": 0.
|
35 |
-
"eval_samples_per_second":
|
36 |
-
"eval_steps_per_second":
|
37 |
"step": 117
|
38 |
}
|
39 |
],
|
|
|
1 |
{
|
2 |
"best_global_step": 117,
|
3 |
+
"best_metric": 0.6678700361010831,
|
4 |
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-2/checkpoint-117",
|
5 |
"epoch": 3.0,
|
6 |
"eval_steps": 500,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6570397111913358,
|
15 |
+
"eval_loss": 0.6299930810928345,
|
16 |
+
"eval_runtime": 0.636,
|
17 |
+
"eval_samples_per_second": 435.504,
|
18 |
+
"eval_steps_per_second": 14.15,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6606498194945848,
|
24 |
+
"eval_loss": 0.701384961605072,
|
25 |
+
"eval_runtime": 0.6379,
|
26 |
+
"eval_samples_per_second": 434.232,
|
27 |
+
"eval_steps_per_second": 14.109,
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
+
"eval_accuracy": 0.6678700361010831,
|
33 |
+
"eval_loss": 0.7389248609542847,
|
34 |
+
"eval_runtime": 0.6433,
|
35 |
+
"eval_samples_per_second": 430.624,
|
36 |
+
"eval_steps_per_second": 13.991,
|
37 |
"step": 117
|
38 |
}
|
39 |
],
|
run-2/checkpoint-117/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638657d2294b16b6a018ef8c4921c705157459687a72f242b7f437400a9b1e8a
|
3 |
size 5432
|
run-2/checkpoint-156/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f1d4e1e1573d4c23e702a54e2c50b2d056566e3092df8f470ebf1561daf60bc
|
3 |
size 437958648
|
run-2/checkpoint-156/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:266d8385b6d55e9347537874355cb10632a22bf69f183d8631ea5e7ba89d3fb2
|
3 |
size 876038394
|
run-2/checkpoint-156/trainer_state.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"best_global_step":
|
3 |
-
"best_metric": 0.
|
4 |
-
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-2/checkpoint-
|
5 |
"epoch": 4.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 156,
|
@@ -11,38 +11,38 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second": 435.
|
18 |
-
"eval_steps_per_second": 14.
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second": 14.
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
-
"eval_accuracy": 0.
|
33 |
-
"eval_loss": 0.
|
34 |
-
"eval_runtime": 0.
|
35 |
-
"eval_samples_per_second":
|
36 |
-
"eval_steps_per_second":
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
-
"eval_accuracy": 0.
|
42 |
-
"eval_loss": 0.
|
43 |
-
"eval_runtime": 0.
|
44 |
-
"eval_samples_per_second": 431.
|
45 |
-
"eval_steps_per_second": 14.
|
46 |
"step": 156
|
47 |
}
|
48 |
],
|
|
|
1 |
{
|
2 |
+
"best_global_step": 156,
|
3 |
+
"best_metric": 0.6931407942238267,
|
4 |
+
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-2/checkpoint-156",
|
5 |
"epoch": 4.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 156,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6570397111913358,
|
15 |
+
"eval_loss": 0.6299930810928345,
|
16 |
+
"eval_runtime": 0.636,
|
17 |
+
"eval_samples_per_second": 435.504,
|
18 |
+
"eval_steps_per_second": 14.15,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6606498194945848,
|
24 |
+
"eval_loss": 0.701384961605072,
|
25 |
+
"eval_runtime": 0.6379,
|
26 |
+
"eval_samples_per_second": 434.232,
|
27 |
+
"eval_steps_per_second": 14.109,
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
+
"eval_accuracy": 0.6678700361010831,
|
33 |
+
"eval_loss": 0.7389248609542847,
|
34 |
+
"eval_runtime": 0.6433,
|
35 |
+
"eval_samples_per_second": 430.624,
|
36 |
+
"eval_steps_per_second": 13.991,
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
+
"eval_accuracy": 0.6931407942238267,
|
42 |
+
"eval_loss": 0.9925442337989807,
|
43 |
+
"eval_runtime": 0.6423,
|
44 |
+
"eval_samples_per_second": 431.287,
|
45 |
+
"eval_steps_per_second": 14.013,
|
46 |
"step": 156
|
47 |
}
|
48 |
],
|
run-2/checkpoint-156/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638657d2294b16b6a018ef8c4921c705157459687a72f242b7f437400a9b1e8a
|
3 |
size 5432
|
run-2/checkpoint-195/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e0a5f90545a9de75f3d982220c600765a5bcd444a868ce7fae7fb1a9113b668
|
3 |
size 437958648
|