Training in progress, epoch 1
Browse files- model.safetensors +1 -1
- run-5/checkpoint-117/config.json +1 -1
- run-5/checkpoint-117/model.safetensors +1 -1
- run-5/checkpoint-117/optimizer.pt +1 -1
- run-5/checkpoint-117/scheduler.pt +1 -1
- run-5/checkpoint-117/trainer_state.json +22 -20
- run-5/checkpoint-117/training_args.bin +1 -1
- run-5/checkpoint-156/config.json +1 -1
- run-5/checkpoint-156/model.safetensors +1 -1
- run-5/checkpoint-156/optimizer.pt +1 -1
- run-5/checkpoint-156/scheduler.pt +1 -1
- run-5/checkpoint-156/trainer_state.json +29 -27
- run-5/checkpoint-156/training_args.bin +1 -1
- run-5/checkpoint-195/config.json +1 -1
- run-5/checkpoint-195/model.safetensors +1 -1
- run-5/checkpoint-195/optimizer.pt +1 -1
- run-5/checkpoint-195/scheduler.pt +1 -1
- run-5/checkpoint-195/trainer_state.json +35 -33
- run-5/checkpoint-195/training_args.bin +1 -1
- runs/Apr03_17-48-13_677fb5893cf0/events.out.tfevents.1743717028.677fb5893cf0.2669.36 +3 -0
- runs/Apr03_17-48-13_677fb5893cf0/events.out.tfevents.1743717051.677fb5893cf0.2669.37 +3 -0
- runs/Apr03_17-48-13_677fb5893cf0/events.out.tfevents.1743717074.677fb5893cf0.2669.38 +3 -0
- runs/Apr03_17-48-13_677fb5893cf0/events.out.tfevents.1743717096.677fb5893cf0.2669.39 +3 -0
- runs/Apr03_17-48-13_677fb5893cf0/events.out.tfevents.1743717372.677fb5893cf0.2669.40 +3 -0
- training_args.bin +1 -1
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:051cea0219c05c88062053d4125e94a53939800f3ac2ef703a3ed1c1e6511cbf
|
3 |
size 437958648
|
run-5/checkpoint-117/config.json
CHANGED
@@ -19,7 +19,7 @@
|
|
19 |
"position_embedding_type": "absolute",
|
20 |
"problem_type": "single_label_classification",
|
21 |
"torch_dtype": "float32",
|
22 |
-
"transformers_version": "4.50.
|
23 |
"type_vocab_size": 2,
|
24 |
"use_cache": true,
|
25 |
"vocab_size": 30522
|
|
|
19 |
"position_embedding_type": "absolute",
|
20 |
"problem_type": "single_label_classification",
|
21 |
"torch_dtype": "float32",
|
22 |
+
"transformers_version": "4.50.3",
|
23 |
"type_vocab_size": 2,
|
24 |
"use_cache": true,
|
25 |
"vocab_size": 30522
|
run-5/checkpoint-117/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98cc438e7dfc5491ae782202f415d63e4e2f7c257182591919e76cb9e6817f3b
|
3 |
size 437958648
|
run-5/checkpoint-117/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb4a8fb16dfe5b553a0b64713d3e0db0abf908945279f6aed14c6bec3ec5f47d
|
3 |
size 876038394
|
run-5/checkpoint-117/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6ae0df3dcc77291d5111438baa3e28157dd68485e127efa4307b87edaaaace0
|
3 |
size 1064
|
run-5/checkpoint-117/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"best_global_step": 117,
|
3 |
-
"best_metric": 0.
|
4 |
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-5/checkpoint-117",
|
5 |
"epoch": 3.0,
|
6 |
"eval_steps": 500,
|
@@ -11,36 +11,36 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second":
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second":
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
-
"eval_accuracy": 0.
|
33 |
-
"eval_loss": 0.
|
34 |
-
"eval_runtime": 0.
|
35 |
-
"eval_samples_per_second":
|
36 |
-
"eval_steps_per_second": 13.
|
37 |
"step": 117
|
38 |
}
|
39 |
],
|
40 |
"logging_steps": 500,
|
41 |
-
"max_steps":
|
42 |
"num_input_tokens_seen": 0,
|
43 |
-
"num_train_epochs":
|
44 |
"save_steps": 500,
|
45 |
"stateful_callbacks": {
|
46 |
"TrainerControl": {
|
@@ -58,8 +58,10 @@
|
|
58 |
"train_batch_size": 64,
|
59 |
"trial_name": null,
|
60 |
"trial_params": {
|
61 |
-
"
|
62 |
-
"
|
|
|
|
|
63 |
"per_device_train_batch_size": 64
|
64 |
}
|
65 |
}
|
|
|
1 |
{
|
2 |
"best_global_step": 117,
|
3 |
+
"best_metric": 0.6462093862815884,
|
4 |
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-5/checkpoint-117",
|
5 |
"epoch": 3.0,
|
6 |
"eval_steps": 500,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6245487364620939,
|
15 |
+
"eval_loss": 0.6697127819061279,
|
16 |
+
"eval_runtime": 0.6455,
|
17 |
+
"eval_samples_per_second": 429.108,
|
18 |
+
"eval_steps_per_second": 13.942,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6173285198555957,
|
24 |
+
"eval_loss": 0.6653470993041992,
|
25 |
+
"eval_runtime": 0.6465,
|
26 |
+
"eval_samples_per_second": 428.491,
|
27 |
+
"eval_steps_per_second": 13.922,
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
+
"eval_accuracy": 0.6462093862815884,
|
33 |
+
"eval_loss": 0.6471791863441467,
|
34 |
+
"eval_runtime": 0.6482,
|
35 |
+
"eval_samples_per_second": 427.345,
|
36 |
+
"eval_steps_per_second": 13.885,
|
37 |
"step": 117
|
38 |
}
|
39 |
],
|
40 |
"logging_steps": 500,
|
41 |
+
"max_steps": 195,
|
42 |
"num_input_tokens_seen": 0,
|
43 |
+
"num_train_epochs": 5,
|
44 |
"save_steps": 500,
|
45 |
"stateful_callbacks": {
|
46 |
"TrainerControl": {
|
|
|
58 |
"train_batch_size": 64,
|
59 |
"trial_name": null,
|
60 |
"trial_params": {
|
61 |
+
"dropout_rate": 0.0134,
|
62 |
+
"learning_rate": 2.6344508518520418e-05,
|
63 |
+
"max_length": 32,
|
64 |
+
"num_train_epochs": 5,
|
65 |
"per_device_train_batch_size": 64
|
66 |
}
|
67 |
}
|
run-5/checkpoint-117/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7917deeac7fb94209a1ee4626c629b8767972d103256b1daf4cf2460cf8fc397
|
3 |
size 5432
|
run-5/checkpoint-156/config.json
CHANGED
@@ -19,7 +19,7 @@
|
|
19 |
"position_embedding_type": "absolute",
|
20 |
"problem_type": "single_label_classification",
|
21 |
"torch_dtype": "float32",
|
22 |
-
"transformers_version": "4.50.
|
23 |
"type_vocab_size": 2,
|
24 |
"use_cache": true,
|
25 |
"vocab_size": 30522
|
|
|
19 |
"position_embedding_type": "absolute",
|
20 |
"problem_type": "single_label_classification",
|
21 |
"torch_dtype": "float32",
|
22 |
+
"transformers_version": "4.50.3",
|
23 |
"type_vocab_size": 2,
|
24 |
"use_cache": true,
|
25 |
"vocab_size": 30522
|
run-5/checkpoint-156/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:699cb5a8a2b395bae13740d67cad52a787e452716c8bce97126d62fcbbd448f4
|
3 |
size 437958648
|
run-5/checkpoint-156/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2c85ecce3ad489617c49ac805b32922fa87bc1e623e04d387ce64d911ccadd5
|
3 |
size 876038394
|
run-5/checkpoint-156/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:207ce3a72ea6f8b5696a7d7d9bbd3121caaa776bb13247589131051d1e72878d
|
3 |
size 1064
|
run-5/checkpoint-156/trainer_state.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"best_global_step":
|
3 |
-
"best_metric": 0.
|
4 |
-
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-5/checkpoint-
|
5 |
"epoch": 4.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 156,
|
@@ -11,45 +11,45 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second":
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second":
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
-
"eval_accuracy": 0.
|
33 |
-
"eval_loss": 0.
|
34 |
-
"eval_runtime": 0.
|
35 |
-
"eval_samples_per_second":
|
36 |
-
"eval_steps_per_second": 13.
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
-
"eval_accuracy": 0.
|
42 |
-
"eval_loss": 0.
|
43 |
-
"eval_runtime": 0.
|
44 |
-
"eval_samples_per_second":
|
45 |
-
"eval_steps_per_second": 14.
|
46 |
"step": 156
|
47 |
}
|
48 |
],
|
49 |
"logging_steps": 500,
|
50 |
-
"max_steps":
|
51 |
"num_input_tokens_seen": 0,
|
52 |
-
"num_train_epochs":
|
53 |
"save_steps": 500,
|
54 |
"stateful_callbacks": {
|
55 |
"TrainerControl": {
|
@@ -67,8 +67,10 @@
|
|
67 |
"train_batch_size": 64,
|
68 |
"trial_name": null,
|
69 |
"trial_params": {
|
70 |
-
"
|
71 |
-
"
|
|
|
|
|
72 |
"per_device_train_batch_size": 64
|
73 |
}
|
74 |
}
|
|
|
1 |
{
|
2 |
+
"best_global_step": 117,
|
3 |
+
"best_metric": 0.6462093862815884,
|
4 |
+
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-5/checkpoint-117",
|
5 |
"epoch": 4.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 156,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6245487364620939,
|
15 |
+
"eval_loss": 0.6697127819061279,
|
16 |
+
"eval_runtime": 0.6455,
|
17 |
+
"eval_samples_per_second": 429.108,
|
18 |
+
"eval_steps_per_second": 13.942,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6173285198555957,
|
24 |
+
"eval_loss": 0.6653470993041992,
|
25 |
+
"eval_runtime": 0.6465,
|
26 |
+
"eval_samples_per_second": 428.491,
|
27 |
+
"eval_steps_per_second": 13.922,
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
+
"eval_accuracy": 0.6462093862815884,
|
33 |
+
"eval_loss": 0.6471791863441467,
|
34 |
+
"eval_runtime": 0.6482,
|
35 |
+
"eval_samples_per_second": 427.345,
|
36 |
+
"eval_steps_per_second": 13.885,
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
+
"eval_accuracy": 0.6425992779783394,
|
42 |
+
"eval_loss": 0.7032743692398071,
|
43 |
+
"eval_runtime": 0.6412,
|
44 |
+
"eval_samples_per_second": 431.983,
|
45 |
+
"eval_steps_per_second": 14.036,
|
46 |
"step": 156
|
47 |
}
|
48 |
],
|
49 |
"logging_steps": 500,
|
50 |
+
"max_steps": 195,
|
51 |
"num_input_tokens_seen": 0,
|
52 |
+
"num_train_epochs": 5,
|
53 |
"save_steps": 500,
|
54 |
"stateful_callbacks": {
|
55 |
"TrainerControl": {
|
|
|
67 |
"train_batch_size": 64,
|
68 |
"trial_name": null,
|
69 |
"trial_params": {
|
70 |
+
"dropout_rate": 0.0134,
|
71 |
+
"learning_rate": 2.6344508518520418e-05,
|
72 |
+
"max_length": 32,
|
73 |
+
"num_train_epochs": 5,
|
74 |
"per_device_train_batch_size": 64
|
75 |
}
|
76 |
}
|
run-5/checkpoint-156/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7917deeac7fb94209a1ee4626c629b8767972d103256b1daf4cf2460cf8fc397
|
3 |
size 5432
|
run-5/checkpoint-195/config.json
CHANGED
@@ -19,7 +19,7 @@
|
|
19 |
"position_embedding_type": "absolute",
|
20 |
"problem_type": "single_label_classification",
|
21 |
"torch_dtype": "float32",
|
22 |
-
"transformers_version": "4.50.
|
23 |
"type_vocab_size": 2,
|
24 |
"use_cache": true,
|
25 |
"vocab_size": 30522
|
|
|
19 |
"position_embedding_type": "absolute",
|
20 |
"problem_type": "single_label_classification",
|
21 |
"torch_dtype": "float32",
|
22 |
+
"transformers_version": "4.50.3",
|
23 |
"type_vocab_size": 2,
|
24 |
"use_cache": true,
|
25 |
"vocab_size": 30522
|
run-5/checkpoint-195/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437958648
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d690aa49d748bed346152dd8d411d500271814260a9e22c48bbe63faf711e37
|
3 |
size 437958648
|
run-5/checkpoint-195/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 876038394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8009bbaeb8a151943fc432bc1dcdc737d596f0ebb50de8d48262f8172414dc5
|
3 |
size 876038394
|
run-5/checkpoint-195/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7ca426136780e5123882a2de71f9961eb1444076226a5a757f36e08f1a88f24
|
3 |
size 1064
|
run-5/checkpoint-195/trainer_state.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"best_global_step":
|
3 |
-
"best_metric": 0.
|
4 |
-
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-5/checkpoint-
|
5 |
"epoch": 5.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 195,
|
@@ -11,54 +11,54 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
-
"eval_accuracy": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_runtime": 0.
|
17 |
-
"eval_samples_per_second":
|
18 |
-
"eval_steps_per_second":
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
-
"eval_accuracy": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 0.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second":
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
-
"eval_accuracy": 0.
|
33 |
-
"eval_loss": 0.
|
34 |
-
"eval_runtime": 0.
|
35 |
-
"eval_samples_per_second":
|
36 |
-
"eval_steps_per_second": 13.
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
-
"eval_accuracy": 0.
|
42 |
-
"eval_loss": 0.
|
43 |
-
"eval_runtime": 0.
|
44 |
-
"eval_samples_per_second":
|
45 |
-
"eval_steps_per_second": 14.
|
46 |
"step": 156
|
47 |
},
|
48 |
{
|
49 |
"epoch": 5.0,
|
50 |
-
"eval_accuracy": 0.
|
51 |
-
"eval_loss":
|
52 |
-
"eval_runtime": 0.
|
53 |
-
"eval_samples_per_second":
|
54 |
-
"eval_steps_per_second":
|
55 |
"step": 195
|
56 |
}
|
57 |
],
|
58 |
"logging_steps": 500,
|
59 |
-
"max_steps":
|
60 |
"num_input_tokens_seen": 0,
|
61 |
-
"num_train_epochs":
|
62 |
"save_steps": 500,
|
63 |
"stateful_callbacks": {
|
64 |
"TrainerControl": {
|
@@ -67,7 +67,7 @@
|
|
67 |
"should_evaluate": false,
|
68 |
"should_log": false,
|
69 |
"should_save": true,
|
70 |
-
"should_training_stop":
|
71 |
},
|
72 |
"attributes": {}
|
73 |
}
|
@@ -76,8 +76,10 @@
|
|
76 |
"train_batch_size": 64,
|
77 |
"trial_name": null,
|
78 |
"trial_params": {
|
79 |
-
"
|
80 |
-
"
|
|
|
|
|
81 |
"per_device_train_batch_size": 64
|
82 |
}
|
83 |
}
|
|
|
1 |
{
|
2 |
+
"best_global_step": 195,
|
3 |
+
"best_metric": 0.6678700361010831,
|
4 |
+
"best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-5/checkpoint-195",
|
5 |
"epoch": 5.0,
|
6 |
"eval_steps": 500,
|
7 |
"global_step": 195,
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.6245487364620939,
|
15 |
+
"eval_loss": 0.6697127819061279,
|
16 |
+
"eval_runtime": 0.6455,
|
17 |
+
"eval_samples_per_second": 429.108,
|
18 |
+
"eval_steps_per_second": 13.942,
|
19 |
"step": 39
|
20 |
},
|
21 |
{
|
22 |
"epoch": 2.0,
|
23 |
+
"eval_accuracy": 0.6173285198555957,
|
24 |
+
"eval_loss": 0.6653470993041992,
|
25 |
+
"eval_runtime": 0.6465,
|
26 |
+
"eval_samples_per_second": 428.491,
|
27 |
+
"eval_steps_per_second": 13.922,
|
28 |
"step": 78
|
29 |
},
|
30 |
{
|
31 |
"epoch": 3.0,
|
32 |
+
"eval_accuracy": 0.6462093862815884,
|
33 |
+
"eval_loss": 0.6471791863441467,
|
34 |
+
"eval_runtime": 0.6482,
|
35 |
+
"eval_samples_per_second": 427.345,
|
36 |
+
"eval_steps_per_second": 13.885,
|
37 |
"step": 117
|
38 |
},
|
39 |
{
|
40 |
"epoch": 4.0,
|
41 |
+
"eval_accuracy": 0.6425992779783394,
|
42 |
+
"eval_loss": 0.7032743692398071,
|
43 |
+
"eval_runtime": 0.6412,
|
44 |
+
"eval_samples_per_second": 431.983,
|
45 |
+
"eval_steps_per_second": 14.036,
|
46 |
"step": 156
|
47 |
},
|
48 |
{
|
49 |
"epoch": 5.0,
|
50 |
+
"eval_accuracy": 0.6678700361010831,
|
51 |
+
"eval_loss": 0.7250702977180481,
|
52 |
+
"eval_runtime": 0.6441,
|
53 |
+
"eval_samples_per_second": 430.034,
|
54 |
+
"eval_steps_per_second": 13.972,
|
55 |
"step": 195
|
56 |
}
|
57 |
],
|
58 |
"logging_steps": 500,
|
59 |
+
"max_steps": 195,
|
60 |
"num_input_tokens_seen": 0,
|
61 |
+
"num_train_epochs": 5,
|
62 |
"save_steps": 500,
|
63 |
"stateful_callbacks": {
|
64 |
"TrainerControl": {
|
|
|
67 |
"should_evaluate": false,
|
68 |
"should_log": false,
|
69 |
"should_save": true,
|
70 |
+
"should_training_stop": true
|
71 |
},
|
72 |
"attributes": {}
|
73 |
}
|
|
|
76 |
"train_batch_size": 64,
|
77 |
"trial_name": null,
|
78 |
"trial_params": {
|
79 |
+
"dropout_rate": 0.0134,
|
80 |
+
"learning_rate": 2.6344508518520418e-05,
|
81 |
+
"max_length": 32,
|
82 |
+
"num_train_epochs": 5,
|
83 |
"per_device_train_batch_size": 64
|
84 |
}
|
85 |
}
|
run-5/checkpoint-195/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7917deeac7fb94209a1ee4626c629b8767972d103256b1daf4cf2460cf8fc397
|
3 |
size 5432
|
runs/Apr03_17-48-13_677fb5893cf0/events.out.tfevents.1743717028.677fb5893cf0.2669.36
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:029604126a877beb35be813d3848bf3ee597e1d61f07154eb95bf5fd6edd8388
|
3 |
+
size 5418
|
runs/Apr03_17-48-13_677fb5893cf0/events.out.tfevents.1743717051.677fb5893cf0.2669.37
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9c0e4a9b8c72b580f1ad1dccd16168c5aec953ece2a97c39a61f3569d00a5f0
|
3 |
+
size 5419
|
runs/Apr03_17-48-13_677fb5893cf0/events.out.tfevents.1743717074.677fb5893cf0.2669.38
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:696e557175f4f5a9b7e35164503ea3c1cfde6b7e2eacc7ab0c8eca8dc5acce45
|
3 |
+
size 5418
|
runs/Apr03_17-48-13_677fb5893cf0/events.out.tfevents.1743717096.677fb5893cf0.2669.39
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb808169465a1f4417beaab7ae068a37d2e58ebc800e5235990a788649802789
|
3 |
+
size 5418
|
runs/Apr03_17-48-13_677fb5893cf0/events.out.tfevents.1743717372.677fb5893cf0.2669.40
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f525cc7da0d341de466be931de19e02d9d1f9f8811c6f660f2721fc11fbd78a
|
3 |
+
size 7052
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbea049dc6efc74c0d7885710ece1a927b118d7bd83967aa580756e6dd000b3e
|
3 |
size 5432
|