Commit
·
2f95a71
1
Parent(s):
6aef9d7
Upload folder using huggingface_hub
Browse files- all_results.json +1 -0
- config.json +27 -0
- pytorch_model.bin +3 -0
- special_tokens_map.json +6 -0
- step_0/optimizer.bin +3 -0
- step_0/pytorch_model.bin +3 -0
- step_0/random_states_0.pkl +3 -0
- step_0/random_states_1.pkl +3 -0
- step_0/random_states_2.pkl +3 -0
- step_0/random_states_3.pkl +3 -0
- step_0/random_states_4.pkl +3 -0
- step_0/random_states_5.pkl +3 -0
- step_0/random_states_6.pkl +3 -0
- step_0/random_states_7.pkl +3 -0
- step_0/scaler.pt +3 -0
- step_0/scheduler.bin +3 -0
- step_20000/optimizer.bin +3 -0
- step_20000/pytorch_model.bin +3 -0
- step_20000/random_states_0.pkl +3 -0
- step_20000/random_states_1.pkl +3 -0
- step_20000/random_states_2.pkl +3 -0
- step_20000/random_states_3.pkl +3 -0
- step_20000/random_states_4.pkl +3 -0
- step_20000/random_states_5.pkl +3 -0
- step_20000/scaler.pt +3 -0
- step_20000/scheduler.bin +3 -0
- step_40000/optimizer.bin +3 -0
- step_40000/pytorch_model.bin +3 -0
- step_40000/random_states_0.pkl +3 -0
- step_40000/random_states_1.pkl +3 -0
- step_40000/random_states_2.pkl +3 -0
- step_40000/random_states_3.pkl +3 -0
- step_40000/random_states_4.pkl +3 -0
- step_40000/random_states_5.pkl +3 -0
- step_40000/scaler.pt +3 -0
- step_40000/scheduler.bin +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +9 -0
all_results.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"perplexity": 5.52966697436367}
|
config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "./config_base.json",
|
3 |
+
"architectures": [
|
4 |
+
"RobertaForMaskedLM"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"bos_token_id": "None",
|
8 |
+
"classifier_dropout": null,
|
9 |
+
"eos_token_id": "None",
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 768,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 3072,
|
15 |
+
"layer_norm_eps": 1e-05,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "roberta",
|
18 |
+
"num_attention_heads": 12,
|
19 |
+
"num_hidden_layers": 12,
|
20 |
+
"pad_token_id": 0,
|
21 |
+
"position_embedding_type": "absolute",
|
22 |
+
"torch_dtype": "float32",
|
23 |
+
"transformers_version": "4.30.0.dev0",
|
24 |
+
"type_vocab_size": 1,
|
25 |
+
"use_cache": true,
|
26 |
+
"vocab_size": 50000
|
27 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10d13f0c9faabdf08f650ff35b5a98e7246cbc0678fef03b0c8c0c2391e05e0c
|
3 |
+
size 498042169
|
special_tokens_map.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "<cls>",
|
3 |
+
"mask_token": "<mask>",
|
4 |
+
"pad_token": "<pad>",
|
5 |
+
"sep_token": "<sep>"
|
6 |
+
}
|
step_0/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cb9dab095f7c783ddcd9c01f29bd8cb94966c10921a9d5ad1a283776ac413b6
|
3 |
+
size 1203
|
step_0/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b1634d9e2ba3e44e7361af09e9e7a6f7ddf592ee6dac3708ec13360e43f035e
|
3 |
+
size 498057081
|
step_0/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b2ecc836ffbf7b4e933d3b0e0dd4755cb7b46539d191d1848bab57f41eee2bf
|
3 |
+
size 19739
|
step_0/random_states_1.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fbe7c991914ffd5bc19aaa0d0e6a9eb07b95ad477c4c940375f2b73d70f7847
|
3 |
+
size 19739
|
step_0/random_states_2.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a610c833c1e2f80fac8e759cb7a25c1465b02f608d927cb34e6e6b475935b4d
|
3 |
+
size 19739
|
step_0/random_states_3.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c7a400533239b9e1ffe34e3661734fc7c2cac3fc4522ec3dc01f99dc960b2fb
|
3 |
+
size 19739
|
step_0/random_states_4.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bc70b28a5855215e11a8a86cb6aaba74199314803e8804f3da1ada30045a78f
|
3 |
+
size 19739
|
step_0/random_states_5.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed25756ddeeb6711d4f99641e4c04c51e6e34158e4d1b7f7b5de0e90281b576a
|
3 |
+
size 19739
|
step_0/random_states_6.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42cd90d1414d21c8ef2a8035d7c2a084a0ab89e369908eb9a9f1f8eed3af0b23
|
3 |
+
size 21731
|
step_0/random_states_7.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d3752519998d07ca14cad333a86e920f2dc1526f38bf449ce4df998714f1142
|
3 |
+
size 21731
|
step_0/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e73131f210099e8e2bd443b421a6ae3bb8ea2ba0864fd725775cb155699d69a
|
3 |
+
size 557
|
step_0/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1623030e8989ea5d77dc27c9afbcf93f77adee2336300f5b2c82d9101cd4486b
|
3 |
+
size 627
|
step_20000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4dd40c72eb61da0d89a79f2b53a4045382b0a8e473f652b58bc2f33d57a457ea
|
3 |
+
size 996105413
|
step_20000/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d35ca54f559c554e2f8e36c85517677536c59da5e0405f6ea974f359eaf0aa3
|
3 |
+
size 498057081
|
step_20000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:485dabf0861c25ecf6be972a8623e124071890fd38741c66c417955645ed9fdc
|
3 |
+
size 19739
|
step_20000/random_states_1.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5dfa4ae207e33dba3b1046851944c19a719d7d23251b496022255acde11d986
|
3 |
+
size 19739
|
step_20000/random_states_2.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a50a033d354e5c6c5b002405cb9277646612ef7acada13ec8b7c8d24ceffb7bc
|
3 |
+
size 19739
|
step_20000/random_states_3.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a571416cef03725f7a796f30a2f06b49fa8a6d2e285bde9099ca0e864453bfb9
|
3 |
+
size 19739
|
step_20000/random_states_4.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eeeba46fd4bc8d81dc854da4a2f97406038635db4a8e39cf42c392d1b84de4bf
|
3 |
+
size 19739
|
step_20000/random_states_5.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1476cee139a2b63831c89d7acdc89a7c5f1ade7757c053ea2a7ed745bba974f6
|
3 |
+
size 19739
|
step_20000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e131ffa76a6d668a1b432512f5183102514e603314c62c77693c07e17f6784b
|
3 |
+
size 557
|
step_20000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a0fa00fdb8bebf5836501e0e31515bb673702b6daaec2122677fa29e065346e
|
3 |
+
size 627
|
step_40000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6e8e166d34f58ae6f055d99b13d2dd59d5ab3e3213efdbeade6fdd22b87679d
|
3 |
+
size 996105413
|
step_40000/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f4a0b2a98c3ce985bc1d8ff0457c234177d2c0622de47cd882a8a26edcdb992
|
3 |
+
size 498057081
|
step_40000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d503a7d155b075dc4d726f4415eb697d923ac7ecbf16e8cf9262700a908cf475
|
3 |
+
size 19739
|
step_40000/random_states_1.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ef663e82b3f4ba435532314def42cea751713863742475e60a6f4b5a6cae85b
|
3 |
+
size 19739
|
step_40000/random_states_2.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b071feff06de42b0913c0ee0681d5b647766710975406c5c444fa1a25bb6cb0
|
3 |
+
size 19739
|
step_40000/random_states_3.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d69b3adb704ce9722f78d70c0b3d27188b8c1341cdbf8ac26feb7a27d9c0e1f1
|
3 |
+
size 19739
|
step_40000/random_states_4.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b42863ef041a1407634edf603b3bd68a5c93b78e1d8483c5c4ab38f12dcb139
|
3 |
+
size 19739
|
step_40000/random_states_5.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0a4281b93d81c0ffbfb030f7d1bb00ba35412ea90e2b565e3503b91e084ee66
|
3 |
+
size 19739
|
step_40000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c42f3b799628e875a386d8d29abd28869c9b252de1c32b1f225f2834a8a2aa8f
|
3 |
+
size 557
|
step_40000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31fcc4f51db45bb274bb420e9a3e573b010f19551d9e5376cb8ee299f52ee1f3
|
3 |
+
size 627
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"clean_up_tokenization_spaces": true,
|
3 |
+
"cls_token": "<cls>",
|
4 |
+
"mask_token": "<mask>",
|
5 |
+
"model_max_length": 512,
|
6 |
+
"pad_token": "<pad>",
|
7 |
+
"sep_token": "<sep>",
|
8 |
+
"tokenizer_class": "PreTrainedTokenizerFast"
|
9 |
+
}
|