Upload DeepSeekV2Lite DenseMixer model
Browse files
DeepSeekV2Lite model with DenseMixer architecture
download_original.py
ADDED
|
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#!/usr/bin/env python3
"""
Download original DeepSeek-V2-Lite model and copy to our directory.

Fetches a snapshot of the ``deepseek-ai/DeepSeek-V2-Lite`` repository into a
local cache and copies only the weight shards (plus their index file) into
``target_dir``, leaving any other files already in that directory untouched.

The script exits with status 1 if any expected weight file is absent from the
downloaded snapshot, so a partial copy is never reported as a success.
"""

import os
import shutil
import sys
from typing import Iterable, List

# Source repository and local download cache
repo_id = "deepseek-ai/DeepSeek-V2-Lite"
cache_dir = "/tmp/deepseek_download"

# Target directory
target_dir = "/mnt/weka/home/shibo.hao/feng/code/junxia/deepseekv2lite"

# Files to copy (only model weights, keep our custom files)
files_to_copy = [
    "model-00001-of-000004.safetensors",
    "model-00002-of-000004.safetensors",
    "model-00003-of-000004.safetensors",
    "model-00004-of-000004.safetensors",
    "model.safetensors.index.json",
]


def download_original_model() -> str:
    """Download the original model snapshot and return its local path."""
    # Imported here rather than at module level so that the pure-filesystem
    # helper below stays importable when huggingface_hub is not installed.
    from huggingface_hub import snapshot_download

    return snapshot_download(repo_id=repo_id, cache_dir=cache_dir)


def copy_weight_files(
    source_dir: str, dest_dir: str, filenames: Iterable[str]
) -> List[str]:
    """Copy each of *filenames* from *source_dir* into *dest_dir*.

    *dest_dir* is created if it does not exist yet. A file that is absent
    from *source_dir* is reported with a warning and skipped; copying
    continues with the remaining files.

    Returns:
        The names that were not found in *source_dir*, in input order
        (empty when everything was copied).
    """
    # copy2 does not create parent directories, so make sure the target exists.
    os.makedirs(dest_dir, exist_ok=True)

    missing = []
    for filename in filenames:
        src = os.path.join(source_dir, filename)
        dst = os.path.join(dest_dir, filename)

        if not os.path.exists(src):
            print(f"Warning: {filename} not found in original model")
            missing.append(filename)
            continue

        print(f"Copying {filename}...")
        shutil.copy2(src, dst)
        # Check file size
        size = os.path.getsize(dst)
        print(f" Size: {size / (1024**3):.2f} GB")

    return missing


def main() -> int:
    """Download the model, copy the weights, and return a process exit code."""
    # Download original model
    print("Downloading original DeepSeek-V2-Lite model...")
    original_path = download_original_model()

    print(f"Downloaded to: {original_path}")

    # Copy files
    print("Copying model weight files...")
    missing = copy_weight_files(original_path, target_dir, files_to_copy)

    if missing:
        # Do not claim success when the copied weight set is incomplete.
        print(
            f"Error: {len(missing)} file(s) were not copied: {', '.join(missing)}",
            file=sys.stderr,
        )
        return 1

    print("Done! Model weights copied successfully.")
    return 0


if __name__ == "__main__":
    sys.exit(main())
|
model-00001-of-000004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d7e9f39bde40111a4c0f390b87497dce4565cf578d916395e6b2c7851f1e8da
|
| 3 |
+
size 8594887408
|
model-00002-of-000004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0656832b0d594b4a64cad40ff8465231de6ed44c854f74f6b217797660aa4bb
|
| 3 |
+
size 8591757448
|
model-00003-of-000004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:843ec689624f3a520526e040f0326c4dc9865e8172942ca98a084fe136fdb21a
|
| 3 |
+
size 8590718520
|
model-00004-of-000004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfb51658f67cedfbbc4d62ad14187830ceec8ee82c788c5f718feea98905ef31
|
| 3 |
+
size 5636263200
|