Commit
·
64197a6
1
Parent(s):
7940c2d
Upload folder using huggingface_hub
Browse files
- all_results.json +1 -0
- config.json +27 -0
- pytorch_model.bin +3 -0
- special_tokens_map.json +6 -0
- step_0/optimizer.bin +3 -0
- step_0/pytorch_model.bin +3 -0
- step_0/random_states_0.pkl +3 -0
- step_0/random_states_1.pkl +3 -0
- step_0/random_states_2.pkl +3 -0
- step_0/random_states_3.pkl +3 -0
- step_0/random_states_4.pkl +3 -0
- step_0/random_states_5.pkl +3 -0
- step_0/scaler.pt +3 -0
- step_0/scheduler.bin +3 -0
- step_10000/optimizer.bin +3 -0
- step_10000/pytorch_model.bin +3 -0
- step_10000/random_states_0.pkl +3 -0
- step_10000/random_states_1.pkl +3 -0
- step_10000/random_states_2.pkl +3 -0
- step_10000/random_states_3.pkl +3 -0
- step_10000/random_states_4.pkl +3 -0
- step_10000/random_states_5.pkl +3 -0
- step_10000/scaler.pt +3 -0
- step_10000/scheduler.bin +3 -0
- step_20000/optimizer.bin +3 -0
- step_20000/pytorch_model.bin +3 -0
- step_20000/random_states_0.pkl +3 -0
- step_20000/random_states_1.pkl +3 -0
- step_20000/random_states_2.pkl +3 -0
- step_20000/random_states_3.pkl +3 -0
- step_20000/random_states_4.pkl +3 -0
- step_20000/random_states_5.pkl +3 -0
- step_20000/scaler.pt +3 -0
- step_20000/scheduler.bin +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +9 -0
all_results.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"perplexity": 5.348193740926849}
|
config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "./config_base.json",
|
3 |
+
"architectures": [
|
4 |
+
"RobertaForMaskedLM"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"bos_token_id": "None",
|
8 |
+
"classifier_dropout": null,
|
9 |
+
"eos_token_id": "None",
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 768,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 3072,
|
15 |
+
"layer_norm_eps": 1e-05,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "roberta",
|
18 |
+
"num_attention_heads": 12,
|
19 |
+
"num_hidden_layers": 12,
|
20 |
+
"pad_token_id": 0,
|
21 |
+
"position_embedding_type": "absolute",
|
22 |
+
"torch_dtype": "float32",
|
23 |
+
"transformers_version": "4.30.0.dev0",
|
24 |
+
"type_vocab_size": 1,
|
25 |
+
"use_cache": true,
|
26 |
+
"vocab_size": 50000
|
27 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d4ce99c2f58f1518a6cc7997362eb247ed19045d0fae497dc5d8c73a0aa3953
|
3 |
+
size 498042169
|
special_tokens_map.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "<cls>",
|
3 |
+
"mask_token": "<mask>",
|
4 |
+
"pad_token": "<pad>",
|
5 |
+
"sep_token": "<sep>"
|
6 |
+
}
|
step_0/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cb9dab095f7c783ddcd9c01f29bd8cb94966c10921a9d5ad1a283776ac413b6
|
3 |
+
size 1203
|
step_0/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b1634d9e2ba3e44e7361af09e9e7a6f7ddf592ee6dac3708ec13360e43f035e
|
3 |
+
size 498057081
|
step_0/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3572f9e20e6c4aad37daab6439b9054014c6793c97ddca9992827e1fabaf8da2
|
3 |
+
size 19739
|
step_0/random_states_1.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5a444bfbf639e2c7d62c7bcdb903c414d6ffbbe949d352c72f6405c04cd1798
|
3 |
+
size 19739
|
step_0/random_states_2.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48c932ac718b19c50732d48740fdcd297f64c430f5a9f3e4d6495cfb7100efc2
|
3 |
+
size 19739
|
step_0/random_states_3.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7c30897a57a6390f96bc6a9c3bf9fc01d5bbf884528db79624d282b9756f022
|
3 |
+
size 19739
|
step_0/random_states_4.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3b9790b81ec619f75f83f241122d5678141eba03ab2281729f7c33d0d719e8b
|
3 |
+
size 19739
|
step_0/random_states_5.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43684221310c8851e8023116109f96f51918191d5b259a2ab2774f5ba0fc7ada
|
3 |
+
size 19739
|
step_0/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e73131f210099e8e2bd443b421a6ae3bb8ea2ba0864fd725775cb155699d69a
|
3 |
+
size 557
|
step_0/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1623030e8989ea5d77dc27c9afbcf93f77adee2336300f5b2c82d9101cd4486b
|
3 |
+
size 627
|
step_10000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:035d119132d0d32c341ff113bf6c9fac5bd28538383244c19bc5add2b9abf9bc
|
3 |
+
size 996105413
|
step_10000/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95879dba2c3022e5b9a3fc7901143ac46d18bf7760057d6bfd7d5dd9298b1bee
|
3 |
+
size 498057081
|
step_10000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cc260e8365a23809cae8278d1d8acf3093a2959abe490050a4f0a04a8843d11
|
3 |
+
size 19739
|
step_10000/random_states_1.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc0d99722e88fd84cb26479454b588c891aee2832e04df4efa3cdb9bc6e6b539
|
3 |
+
size 19739
|
step_10000/random_states_2.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13968328726316b907fda74121e8059e5d232793c852726b90ff6add078f16d7
|
3 |
+
size 19739
|
step_10000/random_states_3.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4dc87a61748ee38d89db0379b68a24a5be7db42debee01aa64b698da50c3b22
|
3 |
+
size 19739
|
step_10000/random_states_4.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00acb5a187830b2fccc12c1a2311f7066bfb009734f340100a5ea27e82390298
|
3 |
+
size 19739
|
step_10000/random_states_5.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23f7937990b6ead6ce3b67aa7c3a3d569aff36337d7d937af2957af214fb6ce1
|
3 |
+
size 19739
|
step_10000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9be2ad76dcbc923b00e6a142f6db62aad4a46c47bb83864ccb68ddc899d0ce78
|
3 |
+
size 557
|
step_10000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:903f690bc25b62056715ef382e2712243ca76b534ddfc4f8c7975a4effa02ee6
|
3 |
+
size 627
|
step_20000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d7c52fcb7c02b730dc96ada66bff71910dc91efd022397902c97a1bbbeda7f7
|
3 |
+
size 996105413
|
step_20000/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3df1838d551e8900b23025bf3be371d8cdc8ef1725b9b0f89c3292d5a94e1c43
|
3 |
+
size 498057081
|
step_20000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67ae17e57d17d9a2f1480293768115342ea6b78897c16d24485abbac8dc99b11
|
3 |
+
size 19739
|
step_20000/random_states_1.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cac81cd0f6fc82a5461e8412774bb9c851d5b3e00c09f06696011a37a8d80c91
|
3 |
+
size 19739
|
step_20000/random_states_2.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d191924ee6fad4ae5966a86264316734ba574e9a5ab8108191a9187e31b12ee
|
3 |
+
size 19739
|
step_20000/random_states_3.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a34ab1dc4775addcd11b1a9f5225fa955706e3f2368c8cae8ba19e1f11738f0c
|
3 |
+
size 19739
|
step_20000/random_states_4.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d97bec246a1bcb2de990fbe8a82eb95447058166de891d5df712049bef9fa43
|
3 |
+
size 19739
|
step_20000/random_states_5.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f0765a58906169366e0b0cd3f510fed86d989322985da023e3b902d843467b3
|
3 |
+
size 19739
|
step_20000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16b712e95d6671e9667d1a2918b71781638ea5ffdc4c563ca255cddb1eae6886
|
3 |
+
size 557
|
step_20000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c61f065af635c948c0b0cc46dc52fcc60f9482a11ac5330e92ca358a6d63452e
|
3 |
+
size 627
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"clean_up_tokenization_spaces": true,
|
3 |
+
"cls_token": "<cls>",
|
4 |
+
"mask_token": "<mask>",
|
5 |
+
"model_max_length": 512,
|
6 |
+
"pad_token": "<pad>",
|
7 |
+
"sep_token": "<sep>",
|
8 |
+
"tokenizer_class": "PreTrainedTokenizerFast"
|
9 |
+
}
|