Commit
·
abe8c97
1
Parent(s):
8c93358
Upload folder using huggingface_hub
Browse files- config.json +9 -18
- generation_config.json +11 -4
- model-00001-of-00018.safetensors +3 -0
- model-00002-of-00018.safetensors +3 -0
- model-00003-of-00018.safetensors +3 -0
- model-00004-of-00018.safetensors +3 -0
- model-00005-of-00018.safetensors +3 -0
- model-00006-of-00018.safetensors +3 -0
- model-00007-of-00018.safetensors +3 -0
- model-00008-of-00018.safetensors +3 -0
- model-00009-of-00018.safetensors +3 -0
- model-00010-of-00018.safetensors +3 -0
- model-00011-of-00018.safetensors +3 -0
- model-00012-of-00018.safetensors +3 -0
- model-00013-of-00018.safetensors +3 -0
- model-00014-of-00018.safetensors +3 -0
- model-00015-of-00018.safetensors +3 -0
- model-00016-of-00018.safetensors +3 -0
- model-00017-of-00018.safetensors +3 -0
- model-00018-of-00018.safetensors +3 -0
- model.safetensors.index.json +0 -0
config.json
CHANGED
@@ -1,37 +1,28 @@
|
|
1 |
{
|
2 |
-
"_moe_implementation": "fused",
|
3 |
-
"_name_or_path": "/tmp/08513abd184b0668398ede78b54d60db/huggingface",
|
4 |
"architectures": [
|
5 |
-
"
|
6 |
],
|
7 |
-
"attention_bias": true,
|
8 |
"attention_dropout": 0.0,
|
9 |
-
"
|
10 |
-
"bos_token_id": 151644,
|
11 |
-
"embd_pdrop": 0.0,
|
12 |
"eos_token_id": 151645,
|
13 |
"hidden_act": "silu",
|
14 |
"hidden_size": 5120,
|
15 |
-
"initializer_range": 0.
|
16 |
"intermediate_size": 27648,
|
17 |
-
"layer_norm_eps": null,
|
18 |
"max_position_embeddings": 32768,
|
19 |
-
"
|
20 |
-
"model_type": "
|
21 |
"num_attention_heads": 40,
|
22 |
"num_hidden_layers": 64,
|
23 |
"num_key_value_heads": 8,
|
24 |
-
"pad_token_id": 151643,
|
25 |
-
"resid_pdrop": 0.0,
|
26 |
"rms_norm_eps": 1e-06,
|
27 |
-
"rope_scaling":
|
28 |
-
"factor": 1,
|
29 |
-
"rope_type": "default"
|
30 |
-
},
|
31 |
"rope_theta": 1000000.0,
|
|
|
32 |
"tie_word_embeddings": false,
|
33 |
"torch_dtype": "bfloat16",
|
34 |
-
"transformers_version": "4.
|
35 |
"use_cache": true,
|
|
|
36 |
"vocab_size": 152064
|
37 |
}
|
|
|
1 |
{
|
|
|
|
|
2 |
"architectures": [
|
3 |
+
"Qwen2ForCausalLM"
|
4 |
],
|
|
|
5 |
"attention_dropout": 0.0,
|
6 |
+
"bos_token_id": 151643,
|
|
|
|
|
7 |
"eos_token_id": 151645,
|
8 |
"hidden_act": "silu",
|
9 |
"hidden_size": 5120,
|
10 |
+
"initializer_range": 0.02,
|
11 |
"intermediate_size": 27648,
|
|
|
12 |
"max_position_embeddings": 32768,
|
13 |
+
"max_window_layers": 70,
|
14 |
+
"model_type": "qwen2",
|
15 |
"num_attention_heads": 40,
|
16 |
"num_hidden_layers": 64,
|
17 |
"num_key_value_heads": 8,
|
|
|
|
|
18 |
"rms_norm_eps": 1e-06,
|
19 |
+
"rope_scaling": null,
|
|
|
|
|
|
|
20 |
"rope_theta": 1000000.0,
|
21 |
+
"sliding_window": 131072,
|
22 |
"tie_word_embeddings": false,
|
23 |
"torch_dtype": "bfloat16",
|
24 |
+
"transformers_version": "4.51.3",
|
25 |
"use_cache": true,
|
26 |
+
"use_sliding_window": false,
|
27 |
"vocab_size": 152064
|
28 |
}
|
generation_config.json
CHANGED
@@ -1,7 +1,14 @@
|
|
1 |
{
|
2 |
-
"
|
3 |
-
"
|
4 |
-
"eos_token_id":
|
|
|
|
|
|
|
5 |
"pad_token_id": 151643,
|
6 |
-
"
|
|
|
|
|
|
|
|
|
7 |
}
|
|
|
1 |
{
|
2 |
+
"bos_token_id": 151643,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
151645,
|
6 |
+
151643
|
7 |
+
],
|
8 |
"pad_token_id": 151643,
|
9 |
+
"repetition_penalty": 1.05,
|
10 |
+
"temperature": 0.7,
|
11 |
+
"top_k": 20,
|
12 |
+
"top_p": 0.8,
|
13 |
+
"transformers_version": "4.51.3"
|
14 |
}
|
model-00001-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5edb2392f48755ecd48adfa08fc70709c7ac8f357aa97f0aadb3d8f96f495b6b
|
3 |
+
size 3633403488
|
model-00002-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca441d6c3cd7b1dbb179bbd7f8dd85ba3da59d8e85be3f8b29c206c7b51f7fec
|
3 |
+
size 3848418568
|
model-00003-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d64cc4165777c2f5c24037d0a5b320853d1fb49050f4d77df6e93a35d1264213
|
3 |
+
size 3890359432
|
model-00004-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8eca2c4f578940de0c7ed6513669cbb8aff1303e02094cd7aa3116638ef5d7ff
|
3 |
+
size 3890359488
|
model-00005-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f513361f1e6307402821df44661f787d15061e46040f2739d39eca5791dbd2a8
|
3 |
+
size 3848408256
|
model-00006-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd04e73731a50988b7cdfbe6e1c7bb986db411910f64d8f8a4c4793093d601db
|
3 |
+
size 3617711168
|
model-00007-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1cf3edd704e5dba77bfa79ca4bc7fccb9853f213aadfff5dd057c4c59f1822bb
|
3 |
+
size 3617731904
|
model-00008-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04bf406a5648460d6ac7a39859c6120fbf38797fb6606fdc62a622f1722f37b
|
3 |
+
size 3617731896
|
model-00009-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b9b9db48cd34d92a8b31733faed8ed7ea9dfd47b199da303589862eb1a8a206
|
3 |
+
size 3848418616
|
model-00010-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ce20cfb9134489dc1ca99486407399a4774cd36e07d11bec7dcc38c5901f38b
|
3 |
+
size 3890359496
|
model-00011-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b6355fef7bcce07f6c34fa2a2c91edb2b83225e92a8a9488044691fd67c984f
|
3 |
+
size 3890359488
|
model-00012-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef8027c404de6d881b371dc1a2098677a49c9d6d3ce924f4c85722c1e195c925
|
3 |
+
size 3848408256
|
model-00013-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:276f4716d448d01b871d2b16a19baf991cca68357dbf5f93da17e0f6fd5e6952
|
3 |
+
size 3617711168
|
model-00014-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:515549e49dc5df9b94dc7c1de7c47d59085edec64dadaf0109ff5cd7b2666ac6
|
3 |
+
size 3617731904
|
model-00015-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87a2a91fba6146433c5f6abad94fe18361b467a7af0553d9bcf65f295a726cfc
|
3 |
+
size 3617731896
|
model-00016-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebed8d541e9de007b28891547cf0fe2dbb6c1fdef374b268d4cd049d64a1c702
|
3 |
+
size 3848418616
|
model-00017-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94b75fc24621c193e0ea98458e3150e7e79e08bdff20e1395931593b0096b68f
|
3 |
+
size 3827442520
|
model-00018-of-00018.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2dab1e5cd953caf2c45870ae7c12c2d08f83845a2be901fd6c344c2849d269c
|
3 |
+
size 1557135488
|
model.safetensors.index.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|