autoprogrammer committed on
Commit
f10caa3
·
verified ·
1 Parent(s): f5ab0b8

Upload DeepSeekV2Lite DenseMixer model

Browse files

DeepSeekV2Lite model with DenseMixer architecture

download_original.py ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
#!/usr/bin/env python3
"""
Download original DeepSeek-V2-Lite model and copy to our directory
"""

import argparse
import os
import shutil
import sys

# Defaults reproduce the locations the script has always used; both
# directories can be overridden on the command line.
REPO_ID = "deepseek-ai/DeepSeek-V2-Lite"
DEFAULT_CACHE_DIR = "/tmp/deepseek_download"
DEFAULT_TARGET_DIR = "/mnt/weka/home/shibo.hao/feng/code/junxia/deepseekv2lite"

# Files to copy (only model weights, keep our custom files)
FILES_TO_COPY = (
    "model-00001-of-000004.safetensors",
    "model-00002-of-000004.safetensors",
    "model-00003-of-000004.safetensors",
    "model-00004-of-000004.safetensors",
    "model.safetensors.index.json",
)


def copy_weight_files(source_dir, target_dir, filenames=FILES_TO_COPY):
    """Copy the named files from *source_dir* into *target_dir*.

    The target directory is created when it does not exist yet. A file that
    is absent from *source_dir* is reported with a warning and skipped, so
    the remaining files are still copied.

    Args:
        source_dir: Directory holding the downloaded model snapshot.
        target_dir: Directory that receives the copies.
        filenames: Names (relative to both directories) of the files to copy.

    Returns:
        The list of file names that were not found in *source_dir*, in the
        order they were requested. Empty when every file was copied.
    """
    # shutil.copy2 does not create parent directories, so make sure the
    # destination exists before the first copy.
    os.makedirs(target_dir, exist_ok=True)

    missing = []
    for filename in filenames:
        src = os.path.join(source_dir, filename)
        dst = os.path.join(target_dir, filename)

        if not os.path.exists(src):
            print(f"Warning: {filename} not found in original model")
            missing.append(filename)
            continue

        print(f"Copying {filename}...")
        shutil.copy2(src, dst)
        # Report the size of the copy as a quick sanity check.
        size = os.path.getsize(dst)
        print(f" Size: {size / (1024**3):.2f} GB")

    return missing


def main(argv=None):
    """Download the original model snapshot and copy its weight files.

    Args:
        argv: Command-line arguments (defaults to ``sys.argv[1:]``).

    Returns:
        Process exit status: 0 when every weight file was copied, 1 when at
        least one expected file was missing from the downloaded snapshot.
    """
    parser = argparse.ArgumentParser(
        description="Download original DeepSeek-V2-Lite model and copy to our directory"
    )
    parser.add_argument(
        "--cache-dir",
        default=DEFAULT_CACHE_DIR,
        help="directory used as the Hugging Face download cache",
    )
    parser.add_argument(
        "--target-dir",
        default=DEFAULT_TARGET_DIR,
        help="directory that receives the model weight files",
    )
    args = parser.parse_args(argv)

    # Imported here rather than at module level so that copy_weight_files
    # stays usable without huggingface_hub installed.
    from huggingface_hub import snapshot_download

    # Download original model
    print("Downloading original DeepSeek-V2-Lite model...")
    original_path = snapshot_download(
        repo_id=REPO_ID,
        cache_dir=args.cache_dir,
    )
    print(f"Downloaded to: {original_path}")

    # Copy files
    print("Copying model weight files...")
    missing = copy_weight_files(original_path, args.target_dir)

    if missing:
        # Do not claim success when part of the checkpoint is absent.
        print(f"Error: {len(missing)} file(s) were not copied: {', '.join(missing)}")
        return 1

    print("Done! Model weights copied successfully.")
    return 0


if __name__ == "__main__":
    sys.exit(main())
model-00001-of-000004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:258811fe017b955eb542325c73f8cd8fc2f77f7c5c27dc1721877212182bffe4
3
- size 135
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d7e9f39bde40111a4c0f390b87497dce4565cf578d916395e6b2c7851f1e8da
3
+ size 8594887408
model-00002-of-000004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46264772a9631656d6f8ff201943336f45d298e2dade91cbf3bf87f61dbc10eb
3
- size 135
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0656832b0d594b4a64cad40ff8465231de6ed44c854f74f6b217797660aa4bb
3
+ size 8591757448
model-00003-of-000004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5c3a29ec4c6a815eaf1fbff20ca641ce9f3dc030fd7f7d5ea6d4962605322f7
3
- size 135
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:843ec689624f3a520526e040f0326c4dc9865e8172942ca98a084fe136fdb21a
3
+ size 8590718520
model-00004-of-000004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:900e5ae475e2105613495a483a4aca219d3de2c07757e01d6db3ea4abe682790
3
- size 135
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfb51658f67cedfbbc4d62ad14187830ceec8ee82c788c5f718feea98905ef31
3
+ size 5636263200