WoahMiri committed on
Commit
3ed18a6
·
1 Parent(s): 15390a5

deploy model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. config.json +41 -0
  2. generation_config.json +1 -0
  3. model-00001-of-00166.safetensors +3 -0
  4. model-00002-of-00166.safetensors +3 -0
  5. model-00003-of-00166.safetensors +3 -0
  6. model-00004-of-00166.safetensors +3 -0
  7. model-00005-of-00166.safetensors +3 -0
  8. model-00006-of-00166.safetensors +3 -0
  9. model-00007-of-00166.safetensors +3 -0
  10. model-00008-of-00166.safetensors +3 -0
  11. model-00009-of-00166.safetensors +3 -0
  12. model-00010-of-00166.safetensors +3 -0
  13. model-00011-of-00166.safetensors +3 -0
  14. model-00012-of-00166.safetensors +3 -0
  15. model-00013-of-00166.safetensors +3 -0
  16. model-00014-of-00166.safetensors +3 -0
  17. model-00015-of-00166.safetensors +3 -0
  18. model-00016-of-00166.safetensors +3 -0
  19. model-00017-of-00166.safetensors +3 -0
  20. model-00018-of-00166.safetensors +3 -0
  21. model-00019-of-00166.safetensors +3 -0
  22. model-00020-of-00166.safetensors +3 -0
  23. model-00021-of-00166.safetensors +3 -0
  24. model-00022-of-00166.safetensors +3 -0
  25. model-00023-of-00166.safetensors +3 -0
  26. model-00024-of-00166.safetensors +3 -0
  27. model-00025-of-00166.safetensors +3 -0
  28. model-00026-of-00166.safetensors +3 -0
  29. model-00027-of-00166.safetensors +3 -0
  30. model-00028-of-00166.safetensors +3 -0
  31. model-00029-of-00166.safetensors +3 -0
  32. model-00030-of-00166.safetensors +3 -0
  33. model-00031-of-00166.safetensors +3 -0
  34. model-00032-of-00166.safetensors +3 -0
  35. model-00033-of-00166.safetensors +3 -0
  36. model-00034-of-00166.safetensors +3 -0
  37. model-00035-of-00166.safetensors +3 -0
  38. model-00036-of-00166.safetensors +3 -0
  39. model-00037-of-00166.safetensors +3 -0
  40. model-00038-of-00166.safetensors +3 -0
  41. model-00039-of-00166.safetensors +3 -0
  42. model-00040-of-00166.safetensors +3 -0
  43. model-00041-of-00166.safetensors +3 -0
  44. model-00042-of-00166.safetensors +3 -0
  45. model-00043-of-00166.safetensors +3 -0
  46. model-00044-of-00166.safetensors +3 -0
  47. model-00045-of-00166.safetensors +3 -0
  48. model-00046-of-00166.safetensors +3 -0
  49. model-00047-of-00166.safetensors +3 -0
  50. model-00048-of-00166.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "JambaForCausalLM"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "attn_layer_offset": 4,
7
+ "attn_layer_period": 8,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 2,
10
+ "expert_layer_offset": 1,
11
+ "expert_layer_period": 2,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 8192,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 24576,
16
+ "mamba_conv_bias": true,
17
+ "mamba_d_conv": 4,
18
+ "mamba_d_state": 16,
19
+ "mamba_dt_rank": 512,
20
+ "mamba_expand": 2,
21
+ "mamba_proj_bias": false,
22
+ "max_position_embeddings": 262144,
23
+ "model_type": "jamba",
24
+ "num_attention_heads": 64,
25
+ "num_experts": 16,
26
+ "num_experts_per_tok": 2,
27
+ "num_hidden_layers": 72,
28
+ "num_key_value_heads": 8,
29
+ "num_logits_to_keep": 1,
30
+ "output_router_logits": false,
31
+ "pad_token_id": 0,
32
+ "rms_norm_eps": 1e-06,
33
+ "router_aux_loss_coef": 0.001,
34
+ "sliding_window": null,
35
+ "tie_word_embeddings": false,
36
+ "torch_dtype": "bfloat16",
37
+ "transformers_version": "4.41.2",
38
+ "use_cache": true,
39
+ "use_mamba_kernels": true,
40
+ "vocab_size": 65536
41
+ }
generation_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"_from_model_config": true, "bos_token_id": 1, "eos_token_id": [2, 518], "pad_token_id": 0, "transformers_version": "4.41.2"}
model-00001-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:359b87105d3c954dd994982d15489ab2bc96d6c4cc4565f045bd5be809ccb88c
3
+ size 4768634672
model-00002-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8c1351e315306d52da5f6499d62df2cc3a3efa56836e368e1bd0a00d3b18d30
3
+ size 4831839840
model-00003-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c405e01d931a815cc73eb9cffc086e5ef6ebd4e6aec1c521faecd3af3ca3bd03
3
+ size 4831839840
model-00004-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71e94b7669d33e5ad09bd05d92d3894d30dbbcc149b4652274a9aafffabb557c
3
+ size 4831839848
model-00005-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cbb6384c20042a8de8270edb4fa4feab32bc1cd7789f041662ae977d12ab5df
3
+ size 4867231656
model-00006-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87f2a409c6823652ec2a17b98891710459579a03c49f6b0b58bb211e7b656d64
3
+ size 4867493880
model-00007-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd8d4d86f51d42058d4413b277347b587a2bd4e43c3c6205f564fca73eaf7098
3
+ size 4831839840
model-00008-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bf5e4bc413ea78eb68eef804385e6463692d8e8545dea57159f66f28ae3e427
3
+ size 4831839840
model-00009-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31b952323f70082cfa4ee6ff0568f6f10650c022529865e09f69980a0e8d83af
3
+ size 4831839848
model-00010-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be5612a40e6a14657c2ec74587ef0bfcacd54d8ba95f4350d7442b1856967e44
3
+ size 4766863912
model-00011-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfc356f24a128181b2cbdf3a969b365d855718b64059690b69af6942315de448
3
+ size 4831839840
model-00012-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84bf53d9af9a1ec38f4bff3db37efb883057dd9590893a5ebd04421edda32ea9
3
+ size 4831839840
model-00013-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b8d93611cfe90838bdba298d7b10afd4d361192d8fadb7c5374c6ee79d5335d
3
+ size 4831839848
model-00014-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:817e74201449379f66e69ca5040c22dacc0b0ef9ccdb749ccf7e9529eca83821
3
+ size 4984637768
model-00015-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b64c2ecfa033225e338a65d2291ea771cada8eee4659a48692dac147c20e489
3
+ size 4750087760
model-00016-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28abceb15017bb4bf84b8c87e05d5403abe1f0398a8d9e22add4d322a00ce0ab
3
+ size 4831839840
model-00017-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ca2564152ff22684f4d70d61b32bc6baca802c283d3f02a15528da695a7118a
3
+ size 4831839840
model-00018-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20b4d26b6a47fcf464d14097687935de1bd90740f11d2dcd38ec7778749febe6
3
+ size 4831839848
model-00019-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:407b72a6a08eecb42df5b17f593e638600cf5c30b99c6eaba34b39d9de0cf618
3
+ size 4465332608
model-00020-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfe365c18a8bc8d478b255a06f208c6d951009d37e61661442df2c784a22591b
3
+ size 4866739600
model-00021-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e366daddd16cd92d9a62fdd70f1b9ccc17107df28028e8b6b0b582969f53d82c
3
+ size 4831839840
model-00022-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a70600ec3f75825f5c11ca21875162ede7356177825e9a06fb5d3170221ab95
3
+ size 4831839840
model-00023-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87609bd9e1969fa279a928bb9068796b856492f4af22231508a4118845b476eb
3
+ size 4831839848
model-00024-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ac6b6d820cd04b823b5964ceb4f816f13407b430f0c5d49fd8e3792ff71ebcc
3
+ size 4902885720
model-00025-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aec3e78a1b1d11d6af0f28110fb79b9bff69ef4d86528911af822adde4333b83
3
+ size 4831839848
model-00026-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2335e763dcd1bc209230b58586cf0e81e22cb54e54d8d10a6e84686e350fb87
3
+ size 4831839848
model-00027-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a65a7720da4e7cd7894b8c98404ee374fb897454a5e21a1e30ca7323b74dcb09
3
+ size 4831839856
model-00028-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f69ce5b37a402524d7a9e35e8ffb9d1fe8d61540f326f034a6a14b35f36317bf
3
+ size 4731209872
model-00029-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:165ca1395a26cb06effb80c683fd199061debee47eb13724e854c123f209f173
3
+ size 4867493920
model-00030-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36b3fafaf403129522ae47c6b4a4ab19f0ff2beac2552e9a1d62d446217835c6
3
+ size 4831839848
model-00031-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fcbe84290fbf2f006dc6b8d0be2968e011372030f2c4f2cad517f9181120a55
3
+ size 4831839856
model-00032-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60acd4a51b343d70db1e87cf6f85ba6d1113e5755d81f32ed5dfd50888f4db71
3
+ size 4831839864
model-00033-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15511c932f9b9a4ff0118360dff394920461f378b7b6c4ebadd3155645912969
3
+ size 4902885720
model-00034-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dad09a79db18bbfe8f0fafe17546959454451dc8b4cc54f0ff73b7a978078996
3
+ size 4831839848
model-00035-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11a6c8db4175095eb9eff23de842546e96cb49556b5af1bd39e0bd163c5ad110
3
+ size 4831839848
model-00036-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:656a8dbadaca5c0257ce71e4ba43ab24fb613a7287a85a6533d615d2c272de55
3
+ size 4831839856
model-00037-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70f2b9fd621dd868adbe56b6b1a7d75c1ea27a453ff81d42562524c887c3b36e
3
+ size 4867231680
model-00038-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eace8f56109b06f8e42fcac004483beed4725acb1dd08f82ee2711fefab0218f
3
+ size 4867493904
model-00039-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb55aabad7b28bf7862647cb7a63d3b22f49674e736f67d282ef2c847b819576
3
+ size 4831839848
model-00040-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3221e0b80dc79abe7205af1a375f13e8f398598572cfe7d803f2092cd6753ed9
3
+ size 4831839848
model-00041-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2edabb942459f5f6112a65f26d3e0d68793da3c777d86f0dd420b44628a958e8
3
+ size 4831839864
model-00042-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9d12af53f2204119458e506faa79d9524f6b51e0ae9b99a1721b32af620b8d6
3
+ size 4902885728
model-00043-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:072f3ecd8901bb6d8abb863a44a001e57ebf1697f64158f0350b805850fafb7f
3
+ size 4831839848
model-00044-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65ad5054c3a3f5c09bd124b824747d530714e178acd065ffd5176a9bc2d4ff8d
3
+ size 4831839848
model-00045-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de5dfa5be219838e44b82ac3dfec471f0bdd9cb2dc570b42ccf55e4808ce75fa
3
+ size 4831839856
model-00046-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b46176416fa9de573cf6980c9c1118195ea2f50931715fe05f1cdf47f8fd51bd
3
+ size 4999645368
model-00047-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc3a7918317217f3e1dd493096c45995c65b7569bb3fcc0e371e5034339afc4f
3
+ size 4599058432
model-00048-of-00166.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03e50a52a7e3ac83585c59292e0eb441e04e55d21c30640ad878734bbbff4b02
3
+ size 4831839848