End of training
Browse files
- README.md +2 -2
- logs/events.out.tfevents.1709200952.a7a08a4788fa.738.1 +3 -0
- model.safetensors +1 -1
- tokenizer_config.json +7 -0
- training_args.bin +1 -1
README.md
CHANGED
|
@@ -32,13 +32,13 @@ More information needed
|
|
| 32 |
### Training hyperparameters
|
| 33 |
|
| 34 |
The following hyperparameters were used during training:
|
| 35 |
-
- learning_rate: 0.
|
| 36 |
- train_batch_size: 8
|
| 37 |
- eval_batch_size: 8
|
| 38 |
- seed: 42
|
| 39 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
| 40 |
- lr_scheduler_type: linear
|
| 41 |
-
- num_epochs:
|
| 42 |
|
| 43 |
### Training results
|
| 44 |
|
|
|
|
| 32 |
### Training hyperparameters
|
| 33 |
|
| 34 |
The following hyperparameters were used during training:
|
| 35 |
+
- learning_rate: 0.0005
|
| 36 |
- train_batch_size: 8
|
| 37 |
- eval_batch_size: 8
|
| 38 |
- seed: 42
|
| 39 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
| 40 |
- lr_scheduler_type: linear
|
| 41 |
+
- num_epochs: 10
|
| 42 |
|
| 43 |
### Training results
|
| 44 |
|
logs/events.out.tfevents.1709200952.a7a08a4788fa.738.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4243cf0745ad07afa701e576a992eb48a23ca8bc951e4835f939fb687cad41d3
|
| 3 |
+
size 7250
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 990345064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e7986a098d3918ddf468a2e09f20d35666582f40c27dbc6090e4cd6c777aa7d2
|
| 3 |
size 990345064
|
tokenizer_config.json
CHANGED
|
@@ -930,9 +930,16 @@
|
|
| 930 |
"clean_up_tokenization_spaces": true,
|
| 931 |
"eos_token": "</s>",
|
| 932 |
"extra_ids": 100,
|
|
|
|
| 933 |
"model_max_length": 512,
|
|
|
|
| 934 |
"pad_token": "<pad>",
|
|
|
|
|
|
|
| 935 |
"sp_model_kwargs": {},
|
|
|
|
| 936 |
"tokenizer_class": "T5Tokenizer",
|
|
|
|
|
|
|
| 937 |
"unk_token": "<unk>"
|
| 938 |
}
|
|
|
|
| 930 |
"clean_up_tokenization_spaces": true,
|
| 931 |
"eos_token": "</s>",
|
| 932 |
"extra_ids": 100,
|
| 933 |
+
"max_length": 7,
|
| 934 |
"model_max_length": 512,
|
| 935 |
+
"pad_to_multiple_of": null,
|
| 936 |
"pad_token": "<pad>",
|
| 937 |
+
"pad_token_type_id": 0,
|
| 938 |
+
"padding_side": "right",
|
| 939 |
"sp_model_kwargs": {},
|
| 940 |
+
"stride": 0,
|
| 941 |
"tokenizer_class": "T5Tokenizer",
|
| 942 |
+
"truncation_side": "right",
|
| 943 |
+
"truncation_strategy": "longest_first",
|
| 944 |
"unk_token": "<unk>"
|
| 945 |
}
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4856
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7cc7887b932d1cd8a641005ba327d392d8f47b9ecb467482b336c0e93e1f1b11
|
| 3 |
size 4856
|