Upload folder using huggingface_hub (#1)
Browse files- 3d0ce6cd0e6b546985ddb16a01943390228920dc1b731ec2dcd561a872be1eab (d73e990f139d2587e605d610cc2f99a9503ee8da)
- 70049e49239523459d6b0512e313093d62fa1226167d8bc3113f4b2549a5b181 (7de53c4b35c537ef06f892901618172f05d783ec)
- f041bc507380c5ed222012593418945fa7d8625a99d0ea505a24b7b1e7921ee6 (5d3a036e7b471d6147de5d0e66a1a8d0fa7c1582)
- 25399827b5344c6c7e08171dcd2cfa4c95481e3a157669a3215337388ff8ecc0 (df77c4666c768d33f452b79ee62ccc0851524fff)
- 9f8c11fc2c94705aec79550e4e434580e2fa74368d3066e9062f0030743e48e1 (c80cc56612b63e70c22221635a49f9ba6c087a95)
- c5b524d42ddb7ce593f8f64fc3ed76e80b97b8cc19a804e7918a42325c89f121 (c9a96087916ff5682b41eb261a87525d254bb723)
- config.json +40 -0
- generation_config.json +10 -0
- model-00001-of-00006.safetensors +3 -0
- model-00002-of-00006.safetensors +3 -0
- model-00003-of-00006.safetensors +3 -0
- model-00004-of-00006.safetensors +3 -0
- model-00005-of-00006.safetensors +3 -0
- model-00006-of-00006.safetensors +3 -0
- model.safetensors.index.json +0 -0
config.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "meta-llama/Llama-2-70b-hf",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"mlp_bias": false,
|
16 |
+
"model_type": "llama",
|
17 |
+
"num_attention_heads": 64,
|
18 |
+
"num_hidden_layers": 80,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"quip_params": {
|
22 |
+
"K": 3,
|
23 |
+
"L": 16,
|
24 |
+
"V": 2,
|
25 |
+
"codebook": "bitshift",
|
26 |
+
"codebook_version": 0,
|
27 |
+
"decode_mode": "quantlut_sym",
|
28 |
+
"td_x": 16,
|
29 |
+
"td_y": 16,
|
30 |
+
"tlut_bits": 9
|
31 |
+
},
|
32 |
+
"rms_norm_eps": 1e-05,
|
33 |
+
"rope_scaling": null,
|
34 |
+
"rope_theta": 10000.0,
|
35 |
+
"tie_word_embeddings": false,
|
36 |
+
"torch_dtype": "float16",
|
37 |
+
"transformers_version": "4.44.2",
|
38 |
+
"use_cache": true,
|
39 |
+
"vocab_size": 32000
|
40 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 1,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"max_length": 4096,
|
6 |
+
"pad_token_id": 0,
|
7 |
+
"temperature": 0.6,
|
8 |
+
"top_p": 0.9,
|
9 |
+
"transformers_version": "4.44.2"
|
10 |
+
}
|
model-00001-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f32416785c64814c52d5a262f4180c4be2afccaff522759206e529be62fcd988
|
3 |
+
size 4935769496
|
model-00002-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df252b6b980255fe3db6610c92d3461f8314dc8734316f268dbe341b6052bfc8
|
3 |
+
size 4966068848
|
model-00003-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adf3e716b9d58d25e777a9fee98cc6d71b12f92d13525067b3f0608c94d3e9a1
|
3 |
+
size 4997518464
|
model-00004-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbcbef064565299f79871501dd4717fd5604fdb79fab197394db0fb0aa6fafa2
|
3 |
+
size 4966068848
|
model-00005-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ecb1c39ba753bb1081f744dea742b9f41256182df4d239f3f3127f7a28c0c30
|
3 |
+
size 4997518464
|
model-00006-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b111bf083f770667c7a14b83f93df9c6d7be8ced0fce191e245ba6cd04f59cd
|
3 |
+
size 1898132784
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|