Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- config.json +40 -0
- model-00001-of-00062.safetensors +3 -0
- model-00002-of-00062.safetensors +3 -0
- model-00003-of-00062.safetensors +3 -0
- model-00004-of-00062.safetensors +3 -0
- model-00005-of-00062.safetensors +3 -0
- model-00006-of-00062.safetensors +3 -0
- model-00007-of-00062.safetensors +3 -0
- model-00008-of-00062.safetensors +3 -0
- model-00009-of-00062.safetensors +3 -0
- model-00010-of-00062.safetensors +3 -0
- model-00011-of-00062.safetensors +3 -0
- model-00012-of-00062.safetensors +3 -0
- model-00013-of-00062.safetensors +3 -0
- model-00014-of-00062.safetensors +3 -0
- model-00015-of-00062.safetensors +3 -0
- model-00016-of-00062.safetensors +3 -0
- model-00017-of-00062.safetensors +3 -0
- model-00018-of-00062.safetensors +3 -0
- model-00019-of-00062.safetensors +3 -0
- model-00020-of-00062.safetensors +3 -0
- model-00021-of-00062.safetensors +3 -0
- model-00022-of-00062.safetensors +3 -0
- model-00023-of-00062.safetensors +3 -0
- model-00024-of-00062.safetensors +3 -0
- model-00025-of-00062.safetensors +3 -0
- model-00026-of-00062.safetensors +3 -0
- model-00027-of-00062.safetensors +3 -0
- model-00028-of-00062.safetensors +3 -0
- model-00029-of-00062.safetensors +3 -0
- model-00030-of-00062.safetensors +3 -0
- model-00031-of-00062.safetensors +3 -0
- model-00032-of-00062.safetensors +3 -0
- model-00033-of-00062.safetensors +3 -0
- model-00034-of-00062.safetensors +3 -0
- model-00035-of-00062.safetensors +3 -0
- model-00036-of-00062.safetensors +3 -0
- model-00037-of-00062.safetensors +3 -0
- model-00038-of-00062.safetensors +3 -0
- model-00039-of-00062.safetensors +3 -0
- model-00040-of-00062.safetensors +3 -0
- model-00041-of-00062.safetensors +3 -0
- model-00042-of-00062.safetensors +3 -0
- model-00043-of-00062.safetensors +3 -0
- model-00044-of-00062.safetensors +3 -0
- model-00045-of-00062.safetensors +3 -0
- model-00046-of-00062.safetensors +3 -0
- model-00047-of-00062.safetensors +3 -0
- model-00048-of-00062.safetensors +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
config.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "Sao10K/Llama-3.3-70B-Vulpecula-r1",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": [
|
10 |
+
128001,
|
11 |
+
128008,
|
12 |
+
128009
|
13 |
+
],
|
14 |
+
"head_dim": 128,
|
15 |
+
"hidden_act": "silu",
|
16 |
+
"hidden_size": 8192,
|
17 |
+
"initializer_range": 0.02,
|
18 |
+
"intermediate_size": 28672,
|
19 |
+
"max_position_embeddings": 131072,
|
20 |
+
"mlp_bias": false,
|
21 |
+
"model_type": "llama",
|
22 |
+
"num_attention_heads": 64,
|
23 |
+
"num_hidden_layers": 80,
|
24 |
+
"num_key_value_heads": 8,
|
25 |
+
"pretraining_tp": 1,
|
26 |
+
"rms_norm_eps": 1e-05,
|
27 |
+
"rope_scaling": {
|
28 |
+
"factor": 8.0,
|
29 |
+
"high_freq_factor": 4.0,
|
30 |
+
"low_freq_factor": 1.0,
|
31 |
+
"original_max_position_embeddings": 8192,
|
32 |
+
"rope_type": "llama3"
|
33 |
+
},
|
34 |
+
"rope_theta": 500000.0,
|
35 |
+
"tie_word_embeddings": false,
|
36 |
+
"torch_dtype": "bfloat16",
|
37 |
+
"transformers_version": "4.49.0",
|
38 |
+
"use_cache": true,
|
39 |
+
"vocab_size": 128256
|
40 |
+
}
|
model-00001-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73f9d97400eb59d54f8c227bc9159e8b63886bdaa99715211014d8fbb19bd275
|
3 |
+
size 4202725616
|
model-00002-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:278fecac681b3b1b37944ea1e0d12422aa2d615c926203b232af83a1809a03bf
|
3 |
+
size 4202692744
|
model-00003-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2a6cb0a7c9e4f9c4b0f972f37f5f4218d51b41edb3ffa72e559feea77a03389
|
3 |
+
size 4362142872
|
model-00004-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29f0b1740b63e6084bf23ad8a857a80840f52fa07334efa98fae51e99f064d8f
|
3 |
+
size 4362175768
|
model-00005-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65667b6dd24a14140dad19c4cbfbafed82159574f32eb2bfa607005bbd598276
|
3 |
+
size 4966156008
|
model-00006-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbac993026afa7600801ce1dde91ddbfc47ce321f20a0b8d93f701007102ecdb
|
3 |
+
size 4362142888
|
model-00007-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91568a3f66b75468e3b10d8dbfdfb148701fbc4ed65be1103f0d90d82265159b
|
3 |
+
size 4362175776
|
model-00008-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afa25e40cc9bd5b6eb128e480e5b69a5e52fef0560e2d389941e2445624a82d1
|
3 |
+
size 4966156008
|
model-00009-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82f728a569283ec802895f88522f8f74ec2b46d43bbdcce298439da3a1dd21a3
|
3 |
+
size 4362142888
|
model-00010-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:651caebca29dfd2253dad6cb869152c1ee009a6b615c80bb1b0ec79f3a633a11
|
3 |
+
size 4362175776
|
model-00011-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb247a8cf552f645553e0270261c4d9f2b53d6b3890f32c17d46db507b001af1
|
3 |
+
size 4966156000
|
model-00012-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44a8c9fd72f28181f57364602c44cbc7a494a94976edb0f812ffdcd5ec6b03e4
|
3 |
+
size 4362142880
|
model-00013-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cb4b7dfae91aa2f3a35f1d2d72baf6470627a25228956c00e551f0eb4d462d7
|
3 |
+
size 4362175776
|
model-00014-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d2880607957d99700e4199171e4a8d49124d01c3ab412d2c9325799300c129e
|
3 |
+
size 4966156008
|
model-00015-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4154756c0c6f82ce428f6c8a366a47f3aa62178bd64b3b8b491a37a93a72555f
|
3 |
+
size 4362142888
|
model-00016-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d069485fc7058b78f29f076bd71d214bad50d1928d249515356ec74496fea2a
|
3 |
+
size 4362175776
|
model-00017-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e4d008ef0d75afbed0797a610f5287f2ea2401b688595cf07d410f57f30c5d1
|
3 |
+
size 4966156008
|
model-00018-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:145129f0f619526b160d1c1e5959f3793f9a1bc16522ffb42df4a0cb29f227a7
|
3 |
+
size 4362142888
|
model-00019-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1061d78dbb5fb18a98ad79f6a0c14d0145e02ea9958de0be64da7128a2daf447
|
3 |
+
size 4362175776
|
model-00020-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81a26d0177c230e4b375425ba65d4a9b76f6d186dbd9d49bdb014e6102175266
|
3 |
+
size 4966155992
|
model-00021-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:285bef6deef4071f57b2e83ec8c67698de0b58d31809cdb4c557d2f1409a4f81
|
3 |
+
size 4362142888
|
model-00022-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ada0b7d5a0ab25476a450c066a189860ef7abdf4fe0d095019f1711356c8894
|
3 |
+
size 4362175776
|
model-00023-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a17666d2283927e721d70395bc5889314b02adc735e2eb37c0bfe4ad2bce1a58
|
3 |
+
size 4966156008
|
model-00024-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ec5f66284d1dd89ea6546c8ab25646565817d8655e5e4c392a22c5698cf825d
|
3 |
+
size 4362142888
|
model-00025-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6387b90bcde8a4b2bdb60c7145e7c564164c8e2046a53135c42ad32b57818f6
|
3 |
+
size 4362175776
|
model-00026-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4e0b5c9489948fa76a8e11b5e34df3c8f6bc55b9761d8e80ad49e7f46b52ef7
|
3 |
+
size 4966156008
|
model-00027-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56d7aa5a3a95d3839602203b1769d1218c5840a696be15c66d8b6f33c80bb278
|
3 |
+
size 4362142888
|
model-00028-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b077d871ee079d28148c3b726294fb8fea84ce44c482b3ef765a66d2cf1dd7b
|
3 |
+
size 4362175768
|
model-00029-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b29ef4733019d16095a0d3af467b685c2a9d65650bfe1db344918dc128acadff
|
3 |
+
size 4966156000
|
model-00030-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaa4a93799a173e5559fbac11b59d130bf191131fff697e49b34b2d49ab1304
|
3 |
+
size 4362142888
|
model-00031-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f016e4d6e306cc3e037ab2ea287cc2e83016442f25db0930ead4fbcd985cb68f
|
3 |
+
size 4664165896
|
model-00032-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2e035aff865fcd46f3da82af0e4c8097f9ac31ce6403180fb734e6a08470fee
|
3 |
+
size 4664165880
|
model-00033-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e0cfeea50bb811d70317a1239e0e13d4bcb4b0844b88dc3ea7fa4cbb3ba4dce
|
3 |
+
size 4362142888
|
model-00034-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1eaccd9982d3ace47b17d97babbe0d6b5b746d406750177ccfdc808f226b4f02
|
3 |
+
size 4362175776
|
model-00035-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:455b7f67ce011f519a8ae60c76748d198747c4865c774c37ad931af62a116b4c
|
3 |
+
size 4966156008
|
model-00036-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6683488cca19b7949300cded8d018551d74ac37df3613fcd54118440ef88cd43
|
3 |
+
size 4362142880
|
model-00037-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd11a5800dabd5eaab77d5a52bc96b0eb4cc2449f0ac53b7c4b0228e16e9ba7e
|
3 |
+
size 4362175768
|
model-00038-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3017753f5e2e55d9cbade08015969564582df260607189355832e238372515e7
|
3 |
+
size 4966156008
|
model-00039-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3c56bfd4191535f1532e9d6e271be206b10d5e7a0a7ffcfe068e117a6e05695
|
3 |
+
size 4362142888
|
model-00040-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21e5b23ebcaff449d48f0daacf4e3d2c8ffe5bf5a81e97f5166b8fd054df2eaf
|
3 |
+
size 4362175776
|
model-00041-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1da243899403f21ddb72903592de7f2e416a951635fe0b7f8611f4b1f2abf933
|
3 |
+
size 4966156008
|
model-00042-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c46f54af97a9c67687f8a09f440dbf1c18f5b470cfae71a6e287ba54740a336
|
3 |
+
size 4362142888
|
model-00043-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:feab4d27f40f7b39724fcc679c475a83b8df1052f955232663b1a598aaa68859
|
3 |
+
size 4362175776
|
model-00044-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5616be4588517ea64afe6e61449960fd1cf11b0a364da44b576590228b93e1ea
|
3 |
+
size 4966156000
|
model-00045-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c177499ea41e69c5f7654109171a4d4218cebe9a86efd7630977b081ee270c5
|
3 |
+
size 4362142880
|
model-00046-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31295d8794996257fe4433844478ddf65b774af7a0d349b4d5142c6bf4c612ff
|
3 |
+
size 4362175776
|
model-00047-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66c82b513fcb17feab28ddec406f0d9d949bce67d1f502b892b3afd0356a3154
|
3 |
+
size 4966156008
|
model-00048-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b9b45832777ddc10ad82f3208314848d4c8a9bc6196b621ec76a7e1bc52e601
|
3 |
+
size 4362142888
|