Update models

Files changed (15) hide show

.gitattributes CHANGED Viewed

@@ -33,3 +33,16 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-14B-Instruct-1M-f16.gguf filter=lfs diff=lfs merge=lfs -text

Qwen2.5-14B-Instruct-1M-Q2_K.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:1ecb0f51445c2a92d2857d166b894ceb96f779be394c907be47788ebb4afded7
+size 5770497824

Qwen2.5-14B-Instruct-1M-Q3_K_L.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a19dbdbbbece500f620ae0c0bd94aabc3247608233a9f8e3015044eff2d0b89
+size 7924768544

Qwen2.5-14B-Instruct-1M-Q3_K_M.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3d52bced57c5c252b917aac1de083939a32ece2b391cdbdf2441738e83379a40
+size 7339204384

Qwen2.5-14B-Instruct-1M-Q3_K_S.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d5988708812e690353cc37019ef3b9cd9c28cec5bde948acc7677e8819af615
+size 6659596064

Qwen2.5-14B-Instruct-1M-Q4_0.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:d7d336999c544ebecc0494145bc5b04ebc6740fc6c9013bf7512dfca5c7b05ed
+size 8517725984

Qwen2.5-14B-Instruct-1M-Q4_K_M.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:246ce41732d3a6f242bba466b37eff8c011b19b26ff6d6e4c4e997b87f551ab0
+size 8988110624

Qwen2.5-14B-Instruct-1M-Q4_K_S.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:45ad3e1d470d287b064a509535c6f60241887db66cd792c38e74096c2c8fc978
+size 8573431584

Qwen2.5-14B-Instruct-1M-Q5_0.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6fff6fd41569527fa7b260b6434b5622bbaef06d132e36be8a4d4083fc7c777f
+size 10266554144

Qwen2.5-14B-Instruct-1M-Q5_K_M.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:b882d8fbe72559c42bc452273bdcd551f564463227a6d87dc84c1f0017aa18de
+size 10508873504

Qwen2.5-14B-Instruct-1M-Q5_K_S.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:2f7011372585fb13e450ec30a229cc2681a2955852ff4c1beb58d97115e825fe
+size 10266554144

Qwen2.5-14B-Instruct-1M-Q6_K.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:df3ede3de849f4482580f124582d784a789fa375d000c63c23d8da7f63cc6dda
+size 12124684064

Qwen2.5-14B-Instruct-1M-Q8_0.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:ea3e3b82f5fd9305a98e325da2522a4e4e2fc9d2128a26b65b7bb9a130a71229
+size 15701597984

Qwen2.5-14B-Instruct-1M-f16.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:00517c6fabea6f9f19bdf59af62f3884127c80f7e03bb78b5e96bf060d8e6eb4
+size 29547716384

config.json ADDED Viewed

+{
+  "architectures": [
+    "Qwen2ForCausalLM"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 151643,
+  "eos_token_id": 151645,
+  "hidden_act": "silu",
+  "hidden_size": 5120,
+  "initializer_range": 0.02,
+  "intermediate_size": 13824,
+  "max_position_embeddings": 1010000,
+  "max_window_layers": 48,
+  "model_type": "qwen2",
+  "num_attention_heads": 40,
+  "num_hidden_layers": 48,
+  "num_key_value_heads": 8,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 10000000.0,
+  "sliding_window": 1010000,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.45.2",
+  "use_cache": true,
+  "use_sliding_window": false,
+  "vocab_size": 152064,
+  "dual_chunk_attention_config": {
+    "chunk_size": 262144,
+    "local_size": 8192,
+    "original_max_position_embeddings": 262144
+  }
+}