Kaz-K committed on
Commit
ecb6624
·
verified ·
1 Parent(s): 9cccf50

Initial upload of SIP-jmed-llm-3-8x13b-OP-4k-base

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +32 -0
  2. model-00001-of-00061.safetensors +3 -0
  3. model-00002-of-00061.safetensors +3 -0
  4. model-00003-of-00061.safetensors +3 -0
  5. model-00004-of-00061.safetensors +3 -0
  6. model-00005-of-00061.safetensors +3 -0
  7. model-00006-of-00061.safetensors +3 -0
  8. model-00007-of-00061.safetensors +3 -0
  9. model-00008-of-00061.safetensors +3 -0
  10. model-00009-of-00061.safetensors +3 -0
  11. model-00010-of-00061.safetensors +3 -0
  12. model-00011-of-00061.safetensors +3 -0
  13. model-00012-of-00061.safetensors +3 -0
  14. model-00013-of-00061.safetensors +3 -0
  15. model-00014-of-00061.safetensors +3 -0
  16. model-00015-of-00061.safetensors +3 -0
  17. model-00016-of-00061.safetensors +3 -0
  18. model-00017-of-00061.safetensors +3 -0
  19. model-00018-of-00061.safetensors +3 -0
  20. model-00019-of-00061.safetensors +3 -0
  21. model-00020-of-00061.safetensors +3 -0
  22. model-00021-of-00061.safetensors +3 -0
  23. model-00022-of-00061.safetensors +3 -0
  24. model-00023-of-00061.safetensors +3 -0
  25. model-00024-of-00061.safetensors +3 -0
  26. model-00025-of-00061.safetensors +3 -0
  27. model-00026-of-00061.safetensors +3 -0
  28. model-00027-of-00061.safetensors +3 -0
  29. model-00028-of-00061.safetensors +3 -0
  30. model-00029-of-00061.safetensors +3 -0
  31. model-00030-of-00061.safetensors +3 -0
  32. model-00031-of-00061.safetensors +3 -0
  33. model-00032-of-00061.safetensors +3 -0
  34. model-00033-of-00061.safetensors +3 -0
  35. model-00034-of-00061.safetensors +3 -0
  36. model-00035-of-00061.safetensors +3 -0
  37. model-00036-of-00061.safetensors +3 -0
  38. model-00037-of-00061.safetensors +3 -0
  39. model-00038-of-00061.safetensors +3 -0
  40. model-00039-of-00061.safetensors +3 -0
  41. model-00040-of-00061.safetensors +3 -0
  42. model-00041-of-00061.safetensors +3 -0
  43. model-00042-of-00061.safetensors +3 -0
  44. model-00043-of-00061.safetensors +3 -0
  45. model-00044-of-00061.safetensors +3 -0
  46. model-00045-of-00061.safetensors +3 -0
  47. model-00046-of-00061.safetensors +3 -0
  48. model-00047-of-00061.safetensors +3 -0
  49. model-00048-of-00061.safetensors +3 -0
  50. model-00049-of-00061.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "MixtralForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 5120,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 13824,
13
+ "max_position_embeddings": 4096,
14
+ "mlp_bias": false,
15
+ "model_type": "mixtral",
16
+ "num_attention_heads": 40,
17
+ "num_experts_per_tok": 2,
18
+ "num_hidden_layers": 40,
19
+ "num_key_value_heads": 40,
20
+ "num_local_experts": 8,
21
+ "output_router_logits": false,
22
+ "rms_norm_eps": 1e-05,
23
+ "rope_theta": 10000,
24
+ "router_aux_loss_coef": 0.01,
25
+ "router_jitter_noise": 0.0,
26
+ "sliding_window": null,
27
+ "tie_word_embeddings": false,
28
+ "torch_dtype": "float32",
29
+ "transformers_version": "4.46.0",
30
+ "use_cache": true,
31
+ "vocab_size": 99584
32
+ }
model-00001-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0ec49fd80071ad29cb06d9d0f06385314b5247f045c158796dfa31673732a47
3
+ size 4976932536
model-00002-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e48d51dd5f8648066b5e8372cab6be2256efc324df05337232857b00a6a1058f
3
+ size 4939411512
model-00003-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:489a64baddb6723caaa1f9d5128036cfd2dd2907d8c0417559d2eb15fd812c8b
3
+ size 4812966080
model-00004-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a648c8e9aec8ee2ad75f79dcab3aa3ec30a257f32fba81a55a936b510a96036
3
+ size 4812966080
model-00005-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5861ccd7209319fd7302d7541dc4cc680fa3dd978db8ead47eb0a70887ec9c7d
3
+ size 4812966080
model-00006-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca5f01e65856f5dc5a5ebbeaa766e929f6426e9a820e3966348451f8aca10b3d
3
+ size 4812966080
model-00007-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c9159a934beec8d32ffdc5ac3f347ff5ba87073716c47ca48e3e5186e2814b3
3
+ size 4812966080
model-00008-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:660aedec961acc9099a491b470a48b278b6ec9c2556939b7fb02a83022c5c6a0
3
+ size 4812966080
model-00009-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c1bec802616b2bbf7d7417b3dc0cdff320a12cd7cf723b1048485d1f5705220
3
+ size 4812966080
model-00010-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53720b558dbfb77474ca39cd1396f399c2df448358f520411dc295f7ce390e6d
3
+ size 4812966080
model-00011-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b5bfc31aed2894289aee9c4ae65b0906b7764e190a39d65cce4d740e25b3e8c
3
+ size 4812966080
model-00012-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fc6e1194ee2cbb696f5e098710fd1fd003902cc78cd45069b834cb3b42e835a
3
+ size 4812966080
model-00013-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73829150b33f43e58e2eccbd4a15d5e9bbb5d0ab0c8df6c814b26a3b4ccecc99
3
+ size 4812966080
model-00014-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc0e244ef4b18641ab81f5be1b6a0b814ca3ebb73ecb64e1c29f6ad4e77c0ea7
3
+ size 4812966080
model-00015-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf50d8df298f57a135113c2abb73e3811e5b3cebf1954b463cc0aebb713f8d8d
3
+ size 4812966080
model-00016-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8fcb59037dd7916c6e041724cdc406002ed65bfc119bcdfe1aa044ab0400b3b
3
+ size 4950739752
model-00017-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a11a84ca90974245db2a558cea13ad51431a89a6f48f390a12e5684b80c15a6
3
+ size 4907933456
model-00018-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64c0cf1caaf5afe305badcf0eaf0de83fa4fddbc7b606d0bf890d421fa5b37cf
3
+ size 4812966096
model-00019-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a74e65bb211c9c0c76977de6f1a111963ac1c49ea59d7968c670a793b4e17d5b
3
+ size 4812966096
model-00020-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e473f13191059b2f79b93e966d65d035f21292b6ed7b51092bba2bcdf9f0fe4d
3
+ size 4812966096
model-00021-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a88c9197c00a8b27b243e587118d81a36c05e42896cf7bd981a092a75b255e27
3
+ size 4812966096
model-00022-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45d0bebc585baed0b643eeed11612797b46adc2dc8e6c50071b3cb024f590b00
3
+ size 4812966096
model-00023-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2f5757925f395e0e623b6abbc6df6cbfb929fbfa14bef4adb3619e59fc48f60
3
+ size 4812966096
model-00024-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6cd21d6f57376c318d3acdaf9622aefc7ccb29c2710438e38106a7065293f5a
3
+ size 4812966096
model-00025-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:846e9c9d28ca9c4015f5774ddfd9e0fbca8e480f81257a7041e1b1398fb5cd53
3
+ size 4812966096
model-00026-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bdc5a112a43e9916429390d85b978ace97da18838c1b37a112b50cc01c21d0b
3
+ size 4812966096
model-00027-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:746faf9adda23deb2ad7901c587bfffc81f8b5f2124eddb7a0786df13a010b30
3
+ size 4812966096
model-00028-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7beb924bd49d27773f55fa7a12a3a7315a04556e814ab284405e9c989539e59
3
+ size 4812966096
model-00029-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be98ee19dceecf8fc271381af4b2cd67e8d5f99c3cc0d08911683bec878d0f79
3
+ size 4812966096
model-00030-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:507fc691dca49c2c55d43503ce2df03ec0fa659d9aec9561626962e496d9506e
3
+ size 4812966096
model-00031-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8222a505026a4325037dd41e93599b349794316ea6b43f948feafff3ab85e1e7
3
+ size 4982402456
model-00032-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d989c427d948614a3f3fe4eecdaca6459a00aa5cc1da8a6e241e1e28a421873c
3
+ size 4876270808
model-00033-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3d14d01e588792f7da00b5b9e2a01795bcf9f9351e633eea0d79d3f5065c2a9
3
+ size 4812966096
model-00034-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff4acd37afb0c2ee4f98bc7dc10094d4360b9c73e4be0a448df390084c0e5563
3
+ size 4812966096
model-00035-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ddb5d770cf2bc2ce9b7f95407d2db30c1a794b4ad4577e9b0b55057e721503d
3
+ size 4812966096
model-00036-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:294e62c0ffc0b3589e32abe7aa9afe6d46753a6163f6b61733eed03dd131010b
3
+ size 4812966096
model-00037-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab45901cb1e06293bb7fdc30f8fbc89100503bb6eaacfa8105894087752254e0
3
+ size 4812966096
model-00038-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fc87435eeed9674cae77bf80465f29394cae101aef887118e778000aeba1c2c
3
+ size 4812966096
model-00039-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e992deb86ace83d3d2608d1ba95892ed5a16811e65fee53717c50918c8fa9276
3
+ size 4812966096
model-00040-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a3c9fbff2b43c3099caa7b6c19afbc652c6d44be1a92f8a00712e914735732f
3
+ size 4812966096
model-00041-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be31f58e31d045cba6e35d7c2766092e1a4cfb425e609d4537d658c5461844eb
3
+ size 4812966096
model-00042-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6af606fa639f82b962b6cdcfb9f2839a057c74ea7f9de6d0d7320c7cb992020a
3
+ size 4812966096
model-00043-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80937e6e6eec51baa00ed237258224b63a883f5f85160d26b10070e4336a96b3
3
+ size 4812966096
model-00044-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81366ad9bfcb94839dcd0fc79f5144258a80b46846667548a8dbc0d447245017
3
+ size 4812966096
model-00045-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d69f6ed27a62b3920ccbbc4d4caffc57e3b9b84cf34218d42a60311e0269276b
3
+ size 4812966096
model-00046-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e98b50336ad9a09d1f9f5ef941accccd4764f3a3d0bf39b23a4904407b29df8
3
+ size 4909186792
model-00047-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa4991a5e0e3376a08e49facfe2823d723f80660027b96fd0ddb19312306e757
3
+ size 4949486464
model-00048-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7338efb4ab490e6776dec1fd3300b15ada4ec4b77482813a0744949a2721616
3
+ size 4812966096
model-00049-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:056e95d5119231de8d5bdfbcb832a2cb7c763e19f80ae25e9b4ae49d2de47147
3
+ size 4812966096