Upload DeepSeekV2Lite DenseMixer model
Browse files
DeepSeekV2Lite model with DenseMixer architecture
download_original.py
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
#!/usr/bin/env python3
"""
Download original DeepSeek-V2-Lite model and copy to our directory

Only the weight shards and their index file are copied; every other file in
the target directory is left untouched so local custom files are kept.

Run as a script. The process exits with status 1 when at least one of the
expected files was not present in the downloaded snapshot.
"""

import os
import shutil

# Hugging Face repository that holds the original weights.
repo_id = "deepseek-ai/DeepSeek-V2-Lite"

# Cache location handed to snapshot_download.
cache_dir = "/tmp/deepseek_download"

# Target directory
target_dir = "/mnt/weka/home/shibo.hao/feng/code/junxia/deepseekv2lite"

# Files to copy (only model weights, keep our custom files)
files_to_copy = [
    "model-00001-of-000004.safetensors",
    "model-00002-of-000004.safetensors",
    "model-00003-of-000004.safetensors",
    "model-00004-of-000004.safetensors",
    "model.safetensors.index.json",
]


def copy_weight_files(source_dir, destination_dir, filenames):
    """Copy each named file from *source_dir* into *destination_dir*.

    Args:
        source_dir: Directory that is expected to contain the files.
        destination_dir: Directory to copy into; created if it does not exist.
        filenames: Names of the files to copy, relative to *source_dir*.

    Returns:
        The list of names that were not found in *source_dir* (empty when
        everything was copied).
    """
    # Without this, shutil.copy2 fails on the first file when the target
    # directory has not been created yet.
    os.makedirs(destination_dir, exist_ok=True)

    missing = []
    for filename in filenames:
        src = os.path.join(source_dir, filename)
        dst = os.path.join(destination_dir, filename)

        if not os.path.exists(src):
            # Keep going so every available file is still copied; the caller
            # decides what to do with the names that were skipped.
            print(f"Warning: {filename} not found in original model")
            missing.append(filename)
            continue

        print(f"Copying {filename}...")
        shutil.copy2(src, dst)
        # Check file size
        size = os.path.getsize(dst)
        print(f" Size: {size / (1024**3):.2f} GB")

    return missing


def main():
    """Download the snapshot, copy the weight files, and return an exit status."""
    # Imported here so the copy helper stays importable on machines that do
    # not have huggingface_hub installed.
    from huggingface_hub import snapshot_download

    # Download original model
    print("Downloading original DeepSeek-V2-Lite model...")
    original_path = snapshot_download(
        repo_id=repo_id,
        cache_dir=cache_dir,
    )
    print(f"Downloaded to: {original_path}")

    # Copy files
    print("Copying model weight files...")
    missing = copy_weight_files(original_path, target_dir, files_to_copy)

    if missing:
        # Do not claim success when some files were skipped.
        print(f"Done, but {len(missing)} file(s) were not copied: {', '.join(missing)}")
        return 1

    print("Done! Model weights copied successfully.")
    return 0


if __name__ == "__main__":
    raise SystemExit(main())
|
model-00001-of-000004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d7e9f39bde40111a4c0f390b87497dce4565cf578d916395e6b2c7851f1e8da
|
3 |
+
size 8594887408
|
model-00002-of-000004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0656832b0d594b4a64cad40ff8465231de6ed44c854f74f6b217797660aa4bb
|
3 |
+
size 8591757448
|
model-00003-of-000004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:843ec689624f3a520526e040f0326c4dc9865e8172942ca98a084fe136fdb21a
|
3 |
+
size 8590718520
|
model-00004-of-000004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfb51658f67cedfbbc4d62ad14187830ceec8ee82c788c5f718feea98905ef31
|
3 |
+
size 5636263200
|