samil24 commited on
Commit
565e9b7
·
verified ·
1 Parent(s): 6e9f684

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aca61fdfa6931d9f3560deed6c44b32707d9fab0df28c139275244ffa76072d8
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77a1db500591369d0e6d7f7a2a040bfa60647f0b57ba372d76c961375a165f87
3
  size 437958648
run-3/checkpoint-195/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ef7a96a393735b725e146d321a6f6dc41c06d36d33265d8af6aa586197251a1
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cc6a53b787dca1a8fd5968d7713e0bdc4cb03fe0b0ffc027a1a38f588787720
3
  size 437958648
run-3/checkpoint-195/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a51d64cc22fb9d505be4305a4ace9b12a66a9968ab937f17a9dd23e995240cb1
3
  size 876038394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b168f2d67bf89ef6265a4d7d4988ef9ae0e5835e4fda333d485b338efd59518
3
  size 876038394
run-3/checkpoint-195/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:675f1463f743ae2eb6e82532e7f83c82034a00c6beaef47454d1a0f0ab6ea1d0
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c481cea2d473218259260c74bb2a405cbdfc1493d220688497623f197c9473f8
3
  size 1064
run-3/checkpoint-195/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a54d1e9a16102072f117ac90cba2c8de9da1d67b974b29749928b6494fcb115
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a31e11225076494526a7157d904c355e54980b239c63149e5cb6bd46c8e0ca9c
3
  size 5432
run-3/checkpoint-234/config.json CHANGED
@@ -19,7 +19,7 @@
19
  "position_embedding_type": "absolute",
20
  "problem_type": "single_label_classification",
21
  "torch_dtype": "float32",
22
- "transformers_version": "4.50.2",
23
  "type_vocab_size": 2,
24
  "use_cache": true,
25
  "vocab_size": 30522
 
19
  "position_embedding_type": "absolute",
20
  "problem_type": "single_label_classification",
21
  "torch_dtype": "float32",
22
+ "transformers_version": "4.50.3",
23
  "type_vocab_size": 2,
24
  "use_cache": true,
25
  "vocab_size": 30522
run-3/checkpoint-234/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45cd8daabde69408f195fd28e4b853be07e30a9106ff1566429456998cbc8c92
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90ec478c4f4d76515e1d41b69e27e91521687063de38e4906930256c18c4fc7d
3
  size 437958648
run-3/checkpoint-234/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46bd481d79c4c5ae8a6d5a200655bf1640484b70d772a9745a261a01ca30e715
3
  size 876038394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40ad820918273930bc861db241dff5536746b9d30d16746fcfcb7ef7dee31a0d
3
  size 876038394
run-3/checkpoint-234/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b778235f2c6be8dc1444821cb28b8aa66138c940d71270633f893f1e9dcc897f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fafdc9d67bc99334116e96a009c77a5be4c802d83fd0d02e557b73626be589e
3
  size 1064
run-3/checkpoint-234/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_global_step": 234,
3
- "best_metric": 0.7003610108303249,
4
  "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-3/checkpoint-234",
5
  "epoch": 6.0,
6
  "eval_steps": 500,
@@ -11,63 +11,63 @@
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
- "eval_accuracy": 0.6028880866425993,
15
- "eval_loss": 0.6455268263816833,
16
- "eval_runtime": 0.6422,
17
- "eval_samples_per_second": 431.339,
18
- "eval_steps_per_second": 14.015,
19
  "step": 39
20
  },
21
  {
22
  "epoch": 2.0,
23
- "eval_accuracy": 0.5992779783393501,
24
- "eval_loss": 0.6891809701919556,
25
- "eval_runtime": 0.6455,
26
- "eval_samples_per_second": 429.15,
27
- "eval_steps_per_second": 13.944,
28
  "step": 78
29
  },
30
  {
31
  "epoch": 3.0,
32
- "eval_accuracy": 0.6425992779783394,
33
- "eval_loss": 0.8288224935531616,
34
- "eval_runtime": 0.6442,
35
- "eval_samples_per_second": 429.982,
36
- "eval_steps_per_second": 13.971,
37
  "step": 117
38
  },
39
  {
40
  "epoch": 4.0,
41
- "eval_accuracy": 0.6823104693140795,
42
- "eval_loss": 0.9376588463783264,
43
- "eval_runtime": 0.6392,
44
- "eval_samples_per_second": 433.358,
45
- "eval_steps_per_second": 14.08,
46
  "step": 156
47
  },
48
  {
49
  "epoch": 5.0,
50
- "eval_accuracy": 0.6642599277978339,
51
- "eval_loss": 1.4554625749588013,
52
- "eval_runtime": 0.6427,
53
- "eval_samples_per_second": 430.994,
54
- "eval_steps_per_second": 14.003,
55
  "step": 195
56
  },
57
  {
58
  "epoch": 6.0,
59
- "eval_accuracy": 0.7003610108303249,
60
- "eval_loss": 1.4293187856674194,
61
- "eval_runtime": 0.6389,
62
- "eval_samples_per_second": 433.574,
63
- "eval_steps_per_second": 14.087,
64
  "step": 234
65
  }
66
  ],
67
  "logging_steps": 500,
68
- "max_steps": 585,
69
  "num_input_tokens_seen": 0,
70
- "num_train_epochs": 15,
71
  "save_steps": 500,
72
  "stateful_callbacks": {
73
  "TrainerControl": {
@@ -85,8 +85,10 @@
85
  "train_batch_size": 64,
86
  "trial_name": null,
87
  "trial_params": {
88
- "learning_rate": 5.296158019829305e-05,
89
- "num_train_epochs": 15,
 
 
90
  "per_device_train_batch_size": 64
91
  }
92
  }
 
1
  {
2
  "best_global_step": 234,
3
+ "best_metric": 0.7111913357400722,
4
  "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-3/checkpoint-234",
5
  "epoch": 6.0,
6
  "eval_steps": 500,
 
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
+ "eval_accuracy": 0.5992779783393501,
15
+ "eval_loss": 0.6721181869506836,
16
+ "eval_runtime": 0.6383,
17
+ "eval_samples_per_second": 433.997,
18
+ "eval_steps_per_second": 14.101,
19
  "step": 39
20
  },
21
  {
22
  "epoch": 2.0,
23
+ "eval_accuracy": 0.628158844765343,
24
+ "eval_loss": 0.6599582433700562,
25
+ "eval_runtime": 0.636,
26
+ "eval_samples_per_second": 435.52,
27
+ "eval_steps_per_second": 14.15,
28
  "step": 78
29
  },
30
  {
31
  "epoch": 3.0,
32
+ "eval_accuracy": 0.6389891696750902,
33
+ "eval_loss": 0.7105341553688049,
34
+ "eval_runtime": 0.6384,
35
+ "eval_samples_per_second": 433.913,
36
+ "eval_steps_per_second": 14.098,
37
  "step": 117
38
  },
39
  {
40
  "epoch": 4.0,
41
+ "eval_accuracy": 0.6931407942238267,
42
+ "eval_loss": 0.9099717140197754,
43
+ "eval_runtime": 0.6379,
44
+ "eval_samples_per_second": 434.226,
45
+ "eval_steps_per_second": 14.108,
46
  "step": 156
47
  },
48
  {
49
  "epoch": 5.0,
50
+ "eval_accuracy": 0.6353790613718412,
51
+ "eval_loss": 1.4261176586151123,
52
+ "eval_runtime": 0.6382,
53
+ "eval_samples_per_second": 434.009,
54
+ "eval_steps_per_second": 14.101,
55
  "step": 195
56
  },
57
  {
58
  "epoch": 6.0,
59
+ "eval_accuracy": 0.7111913357400722,
60
+ "eval_loss": 1.1338996887207031,
61
+ "eval_runtime": 0.6397,
62
+ "eval_samples_per_second": 432.989,
63
+ "eval_steps_per_second": 14.068,
64
  "step": 234
65
  }
66
  ],
67
  "logging_steps": 500,
68
+ "max_steps": 273,
69
  "num_input_tokens_seen": 0,
70
+ "num_train_epochs": 7,
71
  "save_steps": 500,
72
  "stateful_callbacks": {
73
  "TrainerControl": {
 
85
  "train_batch_size": 64,
86
  "trial_name": null,
87
  "trial_params": {
88
+ "dropout_rate": 0.0134,
89
+ "learning_rate": 0.0001,
90
+ "max_length": 32,
91
+ "num_train_epochs": 7,
92
  "per_device_train_batch_size": 64
93
  }
94
  }
run-3/checkpoint-234/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1d7cd6cde9b143872fea17834d1d37a574e764e020936e4ec84f9f6dbbfb1fa
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a31e11225076494526a7157d904c355e54980b239c63149e5cb6bd46c8e0ca9c
3
  size 5432
run-3/checkpoint-273/config.json CHANGED
@@ -19,7 +19,7 @@
19
  "position_embedding_type": "absolute",
20
  "problem_type": "single_label_classification",
21
  "torch_dtype": "float32",
22
- "transformers_version": "4.50.2",
23
  "type_vocab_size": 2,
24
  "use_cache": true,
25
  "vocab_size": 30522
 
19
  "position_embedding_type": "absolute",
20
  "problem_type": "single_label_classification",
21
  "torch_dtype": "float32",
22
+ "transformers_version": "4.50.3",
23
  "type_vocab_size": 2,
24
  "use_cache": true,
25
  "vocab_size": 30522
run-3/checkpoint-273/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8ee8fbbf2add9264bfc97241fe76a6afcfd64b6d4a0a25f818965ce869e48f5
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79cc0c387248a83368ee577ad22685e93e409035a861137d8d04429041b4b883
3
  size 437958648
run-3/checkpoint-273/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:976f65a06b1402963db90008dbc5b7687e68793f8442fa5784a241a50182c59b
3
  size 876038394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64351c72515b55bf2c716320f06d028c08f8d27fadac655d08598f0605935b74
3
  size 876038394
run-3/checkpoint-273/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd47ea1d94a19fef46f4580027106ea139e893819b7396cf1b81508f158fb854
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3c171ceab3b90de030417936fdba57019f3ded92bc954fc958883932ab95e05
3
  size 1064
run-3/checkpoint-273/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_global_step": 234,
3
- "best_metric": 0.7003610108303249,
4
  "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-3/checkpoint-234",
5
  "epoch": 7.0,
6
  "eval_steps": 500,
@@ -11,72 +11,72 @@
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
- "eval_accuracy": 0.6028880866425993,
15
- "eval_loss": 0.6455268263816833,
16
- "eval_runtime": 0.6422,
17
- "eval_samples_per_second": 431.339,
18
- "eval_steps_per_second": 14.015,
19
  "step": 39
20
  },
21
  {
22
  "epoch": 2.0,
23
- "eval_accuracy": 0.5992779783393501,
24
- "eval_loss": 0.6891809701919556,
25
- "eval_runtime": 0.6455,
26
- "eval_samples_per_second": 429.15,
27
- "eval_steps_per_second": 13.944,
28
  "step": 78
29
  },
30
  {
31
  "epoch": 3.0,
32
- "eval_accuracy": 0.6425992779783394,
33
- "eval_loss": 0.8288224935531616,
34
- "eval_runtime": 0.6442,
35
- "eval_samples_per_second": 429.982,
36
- "eval_steps_per_second": 13.971,
37
  "step": 117
38
  },
39
  {
40
  "epoch": 4.0,
41
- "eval_accuracy": 0.6823104693140795,
42
- "eval_loss": 0.9376588463783264,
43
- "eval_runtime": 0.6392,
44
- "eval_samples_per_second": 433.358,
45
- "eval_steps_per_second": 14.08,
46
  "step": 156
47
  },
48
  {
49
  "epoch": 5.0,
50
- "eval_accuracy": 0.6642599277978339,
51
- "eval_loss": 1.4554625749588013,
52
- "eval_runtime": 0.6427,
53
- "eval_samples_per_second": 430.994,
54
- "eval_steps_per_second": 14.003,
55
  "step": 195
56
  },
57
  {
58
  "epoch": 6.0,
59
- "eval_accuracy": 0.7003610108303249,
60
- "eval_loss": 1.4293187856674194,
61
- "eval_runtime": 0.6389,
62
- "eval_samples_per_second": 433.574,
63
- "eval_steps_per_second": 14.087,
64
  "step": 234
65
  },
66
  {
67
  "epoch": 7.0,
68
- "eval_accuracy": 0.6895306859205776,
69
- "eval_loss": 1.7040148973464966,
70
- "eval_runtime": 0.6386,
71
- "eval_samples_per_second": 433.742,
72
- "eval_steps_per_second": 14.093,
73
  "step": 273
74
  }
75
  ],
76
  "logging_steps": 500,
77
- "max_steps": 585,
78
  "num_input_tokens_seen": 0,
79
- "num_train_epochs": 15,
80
  "save_steps": 500,
81
  "stateful_callbacks": {
82
  "TrainerControl": {
@@ -85,7 +85,7 @@
85
  "should_evaluate": false,
86
  "should_log": false,
87
  "should_save": true,
88
- "should_training_stop": false
89
  },
90
  "attributes": {}
91
  }
@@ -94,8 +94,10 @@
94
  "train_batch_size": 64,
95
  "trial_name": null,
96
  "trial_params": {
97
- "learning_rate": 5.296158019829305e-05,
98
- "num_train_epochs": 15,
 
 
99
  "per_device_train_batch_size": 64
100
  }
101
  }
 
1
  {
2
  "best_global_step": 234,
3
+ "best_metric": 0.7111913357400722,
4
  "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-3/checkpoint-234",
5
  "epoch": 7.0,
6
  "eval_steps": 500,
 
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
+ "eval_accuracy": 0.5992779783393501,
15
+ "eval_loss": 0.6721181869506836,
16
+ "eval_runtime": 0.6383,
17
+ "eval_samples_per_second": 433.997,
18
+ "eval_steps_per_second": 14.101,
19
  "step": 39
20
  },
21
  {
22
  "epoch": 2.0,
23
+ "eval_accuracy": 0.628158844765343,
24
+ "eval_loss": 0.6599582433700562,
25
+ "eval_runtime": 0.636,
26
+ "eval_samples_per_second": 435.52,
27
+ "eval_steps_per_second": 14.15,
28
  "step": 78
29
  },
30
  {
31
  "epoch": 3.0,
32
+ "eval_accuracy": 0.6389891696750902,
33
+ "eval_loss": 0.7105341553688049,
34
+ "eval_runtime": 0.6384,
35
+ "eval_samples_per_second": 433.913,
36
+ "eval_steps_per_second": 14.098,
37
  "step": 117
38
  },
39
  {
40
  "epoch": 4.0,
41
+ "eval_accuracy": 0.6931407942238267,
42
+ "eval_loss": 0.9099717140197754,
43
+ "eval_runtime": 0.6379,
44
+ "eval_samples_per_second": 434.226,
45
+ "eval_steps_per_second": 14.108,
46
  "step": 156
47
  },
48
  {
49
  "epoch": 5.0,
50
+ "eval_accuracy": 0.6353790613718412,
51
+ "eval_loss": 1.4261176586151123,
52
+ "eval_runtime": 0.6382,
53
+ "eval_samples_per_second": 434.009,
54
+ "eval_steps_per_second": 14.101,
55
  "step": 195
56
  },
57
  {
58
  "epoch": 6.0,
59
+ "eval_accuracy": 0.7111913357400722,
60
+ "eval_loss": 1.1338996887207031,
61
+ "eval_runtime": 0.6397,
62
+ "eval_samples_per_second": 432.989,
63
+ "eval_steps_per_second": 14.068,
64
  "step": 234
65
  },
66
  {
67
  "epoch": 7.0,
68
+ "eval_accuracy": 0.7075812274368231,
69
+ "eval_loss": 1.221158742904663,
70
+ "eval_runtime": 0.6395,
71
+ "eval_samples_per_second": 433.117,
72
+ "eval_steps_per_second": 14.072,
73
  "step": 273
74
  }
75
  ],
76
  "logging_steps": 500,
77
+ "max_steps": 273,
78
  "num_input_tokens_seen": 0,
79
+ "num_train_epochs": 7,
80
  "save_steps": 500,
81
  "stateful_callbacks": {
82
  "TrainerControl": {
 
85
  "should_evaluate": false,
86
  "should_log": false,
87
  "should_save": true,
88
+ "should_training_stop": true
89
  },
90
  "attributes": {}
91
  }
 
94
  "train_batch_size": 64,
95
  "trial_name": null,
96
  "trial_params": {
97
+ "dropout_rate": 0.0134,
98
+ "learning_rate": 0.0001,
99
+ "max_length": 32,
100
+ "num_train_epochs": 7,
101
  "per_device_train_batch_size": 64
102
  }
103
  }
run-3/checkpoint-273/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1d7cd6cde9b143872fea17834d1d37a574e764e020936e4ec84f9f6dbbfb1fa
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a31e11225076494526a7157d904c355e54980b239c63149e5cb6bd46c8e0ca9c
3
  size 5432
run-4/checkpoint-39/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3fb45e76350b9c813d1fad11ba64ae690635e5381b8ba1aee7be80f6d2f22e49
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77a1db500591369d0e6d7f7a2a040bfa60647f0b57ba372d76c961375a165f87
3
  size 437958648
run-4/checkpoint-39/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3b3aac8275d08ddfa154a8eb29c8aca0ad27c54705712bd55a1bec7871c63a0
3
  size 876038394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f29b3441008d4a261724b0ded94ccf789ae193c4bc68c832853899208c5537b6
3
  size 876038394
run-4/checkpoint-39/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a7bd3ac89cc6f989a2b823bb8bde976a5355b84b9a51281486645c8df8e47b9
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e78d5e09340c0681df725fbe1595e157ca67a75816fc394229ff49b11a9add2
3
  size 1064
run-4/checkpoint-39/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_global_step": 39,
3
- "best_metric": 0.4729241877256318,
4
  "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-4/checkpoint-39",
5
  "epoch": 1.0,
6
  "eval_steps": 500,
@@ -11,18 +11,18 @@
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
- "eval_accuracy": 0.4729241877256318,
15
- "eval_loss": 0.6936286687850952,
16
- "eval_runtime": 0.6353,
17
- "eval_samples_per_second": 436.012,
18
- "eval_steps_per_second": 14.166,
19
  "step": 39
20
  }
21
  ],
22
  "logging_steps": 500,
23
- "max_steps": 195,
24
  "num_input_tokens_seen": 0,
25
- "num_train_epochs": 5,
26
  "save_steps": 500,
27
  "stateful_callbacks": {
28
  "TrainerControl": {
@@ -31,7 +31,7 @@
31
  "should_evaluate": false,
32
  "should_log": false,
33
  "should_save": true,
34
- "should_training_stop": false
35
  },
36
  "attributes": {}
37
  }
@@ -41,9 +41,9 @@
41
  "trial_name": null,
42
  "trial_params": {
43
  "dropout_rate": 0.0134,
44
- "learning_rate": 0.0005,
45
  "max_length": 32,
46
- "num_train_epochs": 5,
47
  "per_device_train_batch_size": 64
48
  }
49
  }
 
1
  {
2
  "best_global_step": 39,
3
+ "best_metric": 0.6389891696750902,
4
  "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-4/checkpoint-39",
5
  "epoch": 1.0,
6
  "eval_steps": 500,
 
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
+ "eval_accuracy": 0.6389891696750902,
15
+ "eval_loss": 0.6387895345687866,
16
+ "eval_runtime": 0.6355,
17
+ "eval_samples_per_second": 435.878,
18
+ "eval_steps_per_second": 14.162,
19
  "step": 39
20
  }
21
  ],
22
  "logging_steps": 500,
23
+ "max_steps": 39,
24
  "num_input_tokens_seen": 0,
25
+ "num_train_epochs": 1,
26
  "save_steps": 500,
27
  "stateful_callbacks": {
28
  "TrainerControl": {
 
31
  "should_evaluate": false,
32
  "should_log": false,
33
  "should_save": true,
34
+ "should_training_stop": true
35
  },
36
  "attributes": {}
37
  }
 
41
  "trial_name": null,
42
  "trial_params": {
43
  "dropout_rate": 0.0134,
44
+ "learning_rate": 0.0001,
45
  "max_length": 32,
46
+ "num_train_epochs": 1,
47
  "per_device_train_batch_size": 64
48
  }
49
  }
run-4/checkpoint-39/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9370cb350f581377d77550ad98e0d71f735e273933b1b105b3b4564570e10207
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f321d5971ff6ba91e19e8f1139788c24314fbde22665abea04b8ef44596c5939
3
  size 5432
runs/Apr04_16-57-59_5bdb2d0e2198/events.out.tfevents.1743793224.5bdb2d0e2198.1206.41 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5885f3f2919be7322a7254bcb7aea8ccb82698c5348ebbca622714ab941e1a15
3
+ size 5751
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a31e11225076494526a7157d904c355e54980b239c63149e5cb6bd46c8e0ca9c
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f321d5971ff6ba91e19e8f1139788c24314fbde22665abea04b8ef44596c5939
3
  size 5432