deploy model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +41 -0
- generation_config.json +1 -0
- model-00001-of-00166.safetensors +3 -0
- model-00002-of-00166.safetensors +3 -0
- model-00003-of-00166.safetensors +3 -0
- model-00004-of-00166.safetensors +3 -0
- model-00005-of-00166.safetensors +3 -0
- model-00006-of-00166.safetensors +3 -0
- model-00007-of-00166.safetensors +3 -0
- model-00008-of-00166.safetensors +3 -0
- model-00009-of-00166.safetensors +3 -0
- model-00010-of-00166.safetensors +3 -0
- model-00011-of-00166.safetensors +3 -0
- model-00012-of-00166.safetensors +3 -0
- model-00013-of-00166.safetensors +3 -0
- model-00014-of-00166.safetensors +3 -0
- model-00015-of-00166.safetensors +3 -0
- model-00016-of-00166.safetensors +3 -0
- model-00017-of-00166.safetensors +3 -0
- model-00018-of-00166.safetensors +3 -0
- model-00019-of-00166.safetensors +3 -0
- model-00020-of-00166.safetensors +3 -0
- model-00021-of-00166.safetensors +3 -0
- model-00022-of-00166.safetensors +3 -0
- model-00023-of-00166.safetensors +3 -0
- model-00024-of-00166.safetensors +3 -0
- model-00025-of-00166.safetensors +3 -0
- model-00026-of-00166.safetensors +3 -0
- model-00027-of-00166.safetensors +3 -0
- model-00028-of-00166.safetensors +3 -0
- model-00029-of-00166.safetensors +3 -0
- model-00030-of-00166.safetensors +3 -0
- model-00031-of-00166.safetensors +3 -0
- model-00032-of-00166.safetensors +3 -0
- model-00033-of-00166.safetensors +3 -0
- model-00034-of-00166.safetensors +3 -0
- model-00035-of-00166.safetensors +3 -0
- model-00036-of-00166.safetensors +3 -0
- model-00037-of-00166.safetensors +3 -0
- model-00038-of-00166.safetensors +3 -0
- model-00039-of-00166.safetensors +3 -0
- model-00040-of-00166.safetensors +3 -0
- model-00041-of-00166.safetensors +3 -0
- model-00042-of-00166.safetensors +3 -0
- model-00043-of-00166.safetensors +3 -0
- model-00044-of-00166.safetensors +3 -0
- model-00045-of-00166.safetensors +3 -0
- model-00046-of-00166.safetensors +3 -0
- model-00047-of-00166.safetensors +3 -0
- model-00048-of-00166.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"JambaForCausalLM"
|
4 |
+
],
|
5 |
+
"attention_dropout": 0.0,
|
6 |
+
"attn_layer_offset": 4,
|
7 |
+
"attn_layer_period": 8,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"expert_layer_offset": 1,
|
11 |
+
"expert_layer_period": 2,
|
12 |
+
"hidden_act": "silu",
|
13 |
+
"hidden_size": 8192,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"intermediate_size": 24576,
|
16 |
+
"mamba_conv_bias": true,
|
17 |
+
"mamba_d_conv": 4,
|
18 |
+
"mamba_d_state": 16,
|
19 |
+
"mamba_dt_rank": 512,
|
20 |
+
"mamba_expand": 2,
|
21 |
+
"mamba_proj_bias": false,
|
22 |
+
"max_position_embeddings": 262144,
|
23 |
+
"model_type": "jamba",
|
24 |
+
"num_attention_heads": 64,
|
25 |
+
"num_experts": 16,
|
26 |
+
"num_experts_per_tok": 2,
|
27 |
+
"num_hidden_layers": 72,
|
28 |
+
"num_key_value_heads": 8,
|
29 |
+
"num_logits_to_keep": 1,
|
30 |
+
"output_router_logits": false,
|
31 |
+
"pad_token_id": 0,
|
32 |
+
"rms_norm_eps": 1e-06,
|
33 |
+
"router_aux_loss_coef": 0.001,
|
34 |
+
"sliding_window": null,
|
35 |
+
"tie_word_embeddings": false,
|
36 |
+
"torch_dtype": "bfloat16",
|
37 |
+
"transformers_version": "4.41.2",
|
38 |
+
"use_cache": true,
|
39 |
+
"use_mamba_kernels": true,
|
40 |
+
"vocab_size": 65536
|
41 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"_from_model_config": true, "bos_token_id": 1, "eos_token_id": [2, 518], "pad_token_id": 0, "transformers_version": "4.41.2"}
|
model-00001-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:359b87105d3c954dd994982d15489ab2bc96d6c4cc4565f045bd5be809ccb88c
|
3 |
+
size 4768634672
|
model-00002-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8c1351e315306d52da5f6499d62df2cc3a3efa56836e368e1bd0a00d3b18d30
|
3 |
+
size 4831839840
|
model-00003-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c405e01d931a815cc73eb9cffc086e5ef6ebd4e6aec1c521faecd3af3ca3bd03
|
3 |
+
size 4831839840
|
model-00004-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71e94b7669d33e5ad09bd05d92d3894d30dbbcc149b4652274a9aafffabb557c
|
3 |
+
size 4831839848
|
model-00005-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cbb6384c20042a8de8270edb4fa4feab32bc1cd7789f041662ae977d12ab5df
|
3 |
+
size 4867231656
|
model-00006-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87f2a409c6823652ec2a17b98891710459579a03c49f6b0b58bb211e7b656d64
|
3 |
+
size 4867493880
|
model-00007-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd8d4d86f51d42058d4413b277347b587a2bd4e43c3c6205f564fca73eaf7098
|
3 |
+
size 4831839840
|
model-00008-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bf5e4bc413ea78eb68eef804385e6463692d8e8545dea57159f66f28ae3e427
|
3 |
+
size 4831839840
|
model-00009-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31b952323f70082cfa4ee6ff0568f6f10650c022529865e09f69980a0e8d83af
|
3 |
+
size 4831839848
|
model-00010-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be5612a40e6a14657c2ec74587ef0bfcacd54d8ba95f4350d7442b1856967e44
|
3 |
+
size 4766863912
|
model-00011-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfc356f24a128181b2cbdf3a969b365d855718b64059690b69af6942315de448
|
3 |
+
size 4831839840
|
model-00012-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84bf53d9af9a1ec38f4bff3db37efb883057dd9590893a5ebd04421edda32ea9
|
3 |
+
size 4831839840
|
model-00013-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b8d93611cfe90838bdba298d7b10afd4d361192d8fadb7c5374c6ee79d5335d
|
3 |
+
size 4831839848
|
model-00014-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:817e74201449379f66e69ca5040c22dacc0b0ef9ccdb749ccf7e9529eca83821
|
3 |
+
size 4984637768
|
model-00015-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b64c2ecfa033225e338a65d2291ea771cada8eee4659a48692dac147c20e489
|
3 |
+
size 4750087760
|
model-00016-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28abceb15017bb4bf84b8c87e05d5403abe1f0398a8d9e22add4d322a00ce0ab
|
3 |
+
size 4831839840
|
model-00017-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ca2564152ff22684f4d70d61b32bc6baca802c283d3f02a15528da695a7118a
|
3 |
+
size 4831839840
|
model-00018-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20b4d26b6a47fcf464d14097687935de1bd90740f11d2dcd38ec7778749febe6
|
3 |
+
size 4831839848
|
model-00019-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:407b72a6a08eecb42df5b17f593e638600cf5c30b99c6eaba34b39d9de0cf618
|
3 |
+
size 4465332608
|
model-00020-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfe365c18a8bc8d478b255a06f208c6d951009d37e61661442df2c784a22591b
|
3 |
+
size 4866739600
|
model-00021-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e366daddd16cd92d9a62fdd70f1b9ccc17107df28028e8b6b0b582969f53d82c
|
3 |
+
size 4831839840
|
model-00022-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a70600ec3f75825f5c11ca21875162ede7356177825e9a06fb5d3170221ab95
|
3 |
+
size 4831839840
|
model-00023-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87609bd9e1969fa279a928bb9068796b856492f4af22231508a4118845b476eb
|
3 |
+
size 4831839848
|
model-00024-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ac6b6d820cd04b823b5964ceb4f816f13407b430f0c5d49fd8e3792ff71ebcc
|
3 |
+
size 4902885720
|
model-00025-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aec3e78a1b1d11d6af0f28110fb79b9bff69ef4d86528911af822adde4333b83
|
3 |
+
size 4831839848
|
model-00026-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2335e763dcd1bc209230b58586cf0e81e22cb54e54d8d10a6e84686e350fb87
|
3 |
+
size 4831839848
|
model-00027-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a65a7720da4e7cd7894b8c98404ee374fb897454a5e21a1e30ca7323b74dcb09
|
3 |
+
size 4831839856
|
model-00028-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f69ce5b37a402524d7a9e35e8ffb9d1fe8d61540f326f034a6a14b35f36317bf
|
3 |
+
size 4731209872
|
model-00029-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:165ca1395a26cb06effb80c683fd199061debee47eb13724e854c123f209f173
|
3 |
+
size 4867493920
|
model-00030-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36b3fafaf403129522ae47c6b4a4ab19f0ff2beac2552e9a1d62d446217835c6
|
3 |
+
size 4831839848
|
model-00031-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4fcbe84290fbf2f006dc6b8d0be2968e011372030f2c4f2cad517f9181120a55
|
3 |
+
size 4831839856
|
model-00032-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60acd4a51b343d70db1e87cf6f85ba6d1113e5755d81f32ed5dfd50888f4db71
|
3 |
+
size 4831839864
|
model-00033-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15511c932f9b9a4ff0118360dff394920461f378b7b6c4ebadd3155645912969
|
3 |
+
size 4902885720
|
model-00034-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dad09a79db18bbfe8f0fafe17546959454451dc8b4cc54f0ff73b7a978078996
|
3 |
+
size 4831839848
|
model-00035-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11a6c8db4175095eb9eff23de842546e96cb49556b5af1bd39e0bd163c5ad110
|
3 |
+
size 4831839848
|
model-00036-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:656a8dbadaca5c0257ce71e4ba43ab24fb613a7287a85a6533d615d2c272de55
|
3 |
+
size 4831839856
|
model-00037-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70f2b9fd621dd868adbe56b6b1a7d75c1ea27a453ff81d42562524c887c3b36e
|
3 |
+
size 4867231680
|
model-00038-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eace8f56109b06f8e42fcac004483beed4725acb1dd08f82ee2711fefab0218f
|
3 |
+
size 4867493904
|
model-00039-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb55aabad7b28bf7862647cb7a63d3b22f49674e736f67d282ef2c847b819576
|
3 |
+
size 4831839848
|
model-00040-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3221e0b80dc79abe7205af1a375f13e8f398598572cfe7d803f2092cd6753ed9
|
3 |
+
size 4831839848
|
model-00041-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2edabb942459f5f6112a65f26d3e0d68793da3c777d86f0dd420b44628a958e8
|
3 |
+
size 4831839864
|
model-00042-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9d12af53f2204119458e506faa79d9524f6b51e0ae9b99a1721b32af620b8d6
|
3 |
+
size 4902885728
|
model-00043-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:072f3ecd8901bb6d8abb863a44a001e57ebf1697f64158f0350b805850fafb7f
|
3 |
+
size 4831839848
|
model-00044-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65ad5054c3a3f5c09bd124b824747d530714e178acd065ffd5176a9bc2d4ff8d
|
3 |
+
size 4831839848
|
model-00045-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de5dfa5be219838e44b82ac3dfec471f0bdd9cb2dc570b42ccf55e4808ce75fa
|
3 |
+
size 4831839856
|
model-00046-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b46176416fa9de573cf6980c9c1118195ea2f50931715fe05f1cdf47f8fd51bd
|
3 |
+
size 4999645368
|
model-00047-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc3a7918317217f3e1dd493096c45995c65b7569bb3fcc0e371e5034339afc4f
|
3 |
+
size 4599058432
|
model-00048-of-00166.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03e50a52a7e3ac83585c59292e0eb441e04e55d21c30640ad878734bbbff4b02
|
3 |
+
size 4831839848
|