AlexCheema committed on
Commit
d462d2d
·
verified ·
1 Parent(s): 37a0e22

Add files using upload-large-folder tool

Browse files
Files changed (50) hide show
  1. README.md +37 -0
  2. config.json +66 -0
  3. generation_config.json +9 -0
  4. model-00003-of-00175.safetensors +3 -0
  5. model-00006-of-00175.safetensors +3 -0
  6. model-00009-of-00175.safetensors +3 -0
  7. model-00020-of-00175.safetensors +3 -0
  8. model-00023-of-00175.safetensors +3 -0
  9. model-00031-of-00175.safetensors +3 -0
  10. model-00032-of-00175.safetensors +3 -0
  11. model-00034-of-00175.safetensors +3 -0
  12. model-00038-of-00175.safetensors +3 -0
  13. model-00041-of-00175.safetensors +3 -0
  14. model-00042-of-00175.safetensors +3 -0
  15. model-00044-of-00175.safetensors +3 -0
  16. model-00047-of-00175.safetensors +3 -0
  17. model-00048-of-00175.safetensors +3 -0
  18. model-00059-of-00175.safetensors +3 -0
  19. model-00062-of-00175.safetensors +3 -0
  20. model-00067-of-00175.safetensors +3 -0
  21. model-00070-of-00175.safetensors +3 -0
  22. model-00075-of-00175.safetensors +3 -0
  23. model-00080-of-00175.safetensors +3 -0
  24. model-00083-of-00175.safetensors +3 -0
  25. model-00086-of-00175.safetensors +3 -0
  26. model-00089-of-00175.safetensors +3 -0
  27. model-00091-of-00175.safetensors +3 -0
  28. model-00101-of-00175.safetensors +3 -0
  29. model-00102-of-00175.safetensors +3 -0
  30. model-00110-of-00175.safetensors +3 -0
  31. model-00115-of-00175.safetensors +3 -0
  32. model-00116-of-00175.safetensors +3 -0
  33. model-00119-of-00175.safetensors +3 -0
  34. model-00122-of-00175.safetensors +3 -0
  35. model-00127-of-00175.safetensors +3 -0
  36. model-00128-of-00175.safetensors +3 -0
  37. model-00130-of-00175.safetensors +3 -0
  38. model-00140-of-00175.safetensors +3 -0
  39. model-00151-of-00175.safetensors +3 -0
  40. model-00152-of-00175.safetensors +3 -0
  41. model-00154-of-00175.safetensors +3 -0
  42. model-00158-of-00175.safetensors +3 -0
  43. model-00163-of-00175.safetensors +3 -0
  44. model-00165-of-00175.safetensors +3 -0
  45. model-00166-of-00175.safetensors +3 -0
  46. model-00169-of-00175.safetensors +3 -0
  47. model.safetensors.index.json +0 -0
  48. special_tokens_map.json +23 -0
  49. tokenizer.json +0 -0
  50. tokenizer_config.json +0 -0
README.md ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ library_name: mlx
4
+ base_model: deepseek-ai/DeepSeek-V3.2
5
+ base_model_relation: finetune
6
+ pipeline_tag: text-generation
7
+ tags:
8
+ - mlx
9
+ ---
10
+
11
+ # mlx-community/DeepSeek-V3.2-8bit
12
+
13
+ This model [mlx-community/DeepSeek-V3.2-8bit](https://huggingface.co/mlx-community/DeepSeek-V3.2-8bit) was
14
+ converted to MLX format from [deepseek-ai/DeepSeek-V3.2](https://huggingface.co/deepseek-ai/DeepSeek-V3.2)
15
+ using mlx-lm version **0.28.4**.
16
+
17
+ ## Use with mlx
18
+
19
+ ```bash
20
+ pip install mlx-lm
21
+ ```
22
+
23
+ ```python
24
+ from mlx_lm import load, generate
25
+
26
+ model, tokenizer = load("mlx-community/DeepSeek-V3.2-8bit")
27
+
28
+ prompt = "hello"
29
+
30
+ if tokenizer.chat_template is not None:
31
+     messages = [{"role": "user", "content": prompt}]
32
+     prompt = tokenizer.apply_chat_template(
33
+         messages, add_generation_prompt=True
34
+     )
35
+
36
+ response = generate(model, tokenizer, prompt=prompt, verbose=True)
37
+ ```
config.json ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "DeepseekV32ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 0,
8
+ "eos_token_id": 1,
9
+ "ep_size": 1,
10
+ "first_k_dense_replace": 3,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 7168,
13
+ "index_head_dim": 128,
14
+ "index_n_heads": 64,
15
+ "index_topk": 2048,
16
+ "initializer_range": 0.02,
17
+ "intermediate_size": 18432,
18
+ "kv_lora_rank": 512,
19
+ "max_position_embeddings": 163840,
20
+ "model_type": "deepseek_v32",
21
+ "moe_intermediate_size": 2048,
22
+ "moe_layer_freq": 1,
23
+ "n_group": 8,
24
+ "n_routed_experts": 256,
25
+ "n_shared_experts": 1,
26
+ "norm_topk_prob": true,
27
+ "num_attention_heads": 128,
28
+ "num_experts_per_tok": 8,
29
+ "num_hidden_layers": 61,
30
+ "num_key_value_heads": 128,
31
+ "num_nextn_predict_layers": 1,
32
+ "q_lora_rank": 1536,
33
+ "qk_nope_head_dim": 128,
34
+ "qk_rope_head_dim": 64,
35
+ "quantization": {
36
+ "group_size": 32,
37
+ "bits": 8,
38
+ "mode": "affine"
39
+ },
40
+ "quantization_config": {
41
+ "group_size": 32,
42
+ "bits": 8,
43
+ "mode": "affine"
44
+ },
45
+ "rms_norm_eps": 1e-06,
46
+ "rope_scaling": {
47
+ "beta_fast": 32,
48
+ "beta_slow": 1,
49
+ "factor": 40,
50
+ "mscale": 1.0,
51
+ "mscale_all_dim": 1.0,
52
+ "original_max_position_embeddings": 4096,
53
+ "type": "yarn"
54
+ },
55
+ "rope_theta": 10000,
56
+ "routed_scaling_factor": 2.5,
57
+ "scoring_func": "sigmoid",
58
+ "tie_word_embeddings": false,
59
+ "topk_group": 4,
60
+ "topk_method": "noaux_tc",
61
+ "torch_dtype": "bfloat16",
62
+ "transformers_version": "4.44.2",
63
+ "use_cache": true,
64
+ "v_head_dim": 128,
65
+ "vocab_size": 129280
66
+ }
generation_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 0,
4
+ "eos_token_id": 1,
5
+ "do_sample": true,
6
+ "temperature": 1.0,
7
+ "top_p": 0.95,
8
+ "transformers_version": "4.46.3"
9
+ }
model-00003-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b4b54bf32fe51509b459621399e8426887f8755dd01749ec96ea09671d85d80
3
+ size 4227858838
model-00006-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2b6576a543fa98d98f2495c85094034a774bcf9a1c0258a127ab047a292b7a2
3
+ size 4227858838
model-00009-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08bbab654988f2d9a9992a787f4fdbcacb68ceb0c934d4aa40d0cd5f82cef253
3
+ size 4227858838
model-00020-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21b87512f897851a64ece5a52559e17cb72faed9f4062c1b87b6b4e86ded18dd
3
+ size 4227858844
model-00023-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b9e21fddb8453766b1b41f56cd637a67986e8359b9add7a09cb7062094f5bca
3
+ size 4227858847
model-00031-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06dae087412af0fe8c5f0273ff2bc94a96fe5cfa941ed6f2036d1cc1d4dbd9aa
3
+ size 4507310818
model-00032-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2326b2714e92b141093d1fe1122a6776cacb03c7449286b071085b06a2a3ddbf
3
+ size 4227858847
model-00034-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a597f6d699916f4ac27a728389e29445fb399f30a04fbe4906b12d30f9e5de3
3
+ size 4507310800
model-00038-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d1c0699350d71754cc9e7727b31252116652e37ab793038ceef387c36497374
3
+ size 4227858847
model-00041-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4347d9cfec14593d2a3e2cd2ea2b016c77cefff132dbe06c0f8a898ba0896b8b
3
+ size 4227858847
model-00042-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23eb0c591e5aa48304e04563219b3ab6da7fe6d49c5cdb21fdef5a96ac007188
3
+ size 4227858841
model-00044-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4a0be5beb51d6db179329289012da9946bf28cbc46d3f6238394fa0b42d0323
3
+ size 4227858847
model-00047-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e60abc9f6fdc61408bddc2b8214c30b3d3236da32e728c9cfadb1e8242a0aeb
3
+ size 4227858847
model-00048-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0b0d47e46e1369301f57278eb46f69480a77a5897447881341cad5fa599ccb4
3
+ size 4227858841
model-00059-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9abda0f573eae2311f13190b6a6ee66a771796f51ad414f334dd57353771bca6
3
+ size 4227858847
model-00062-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe927565d50dbda46581cd5b099177d0f7402adec46549f439b7cc5dbf5ede64
3
+ size 4227858847
model-00067-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fc725ee64992be6eea8aa620053d8c84b64c77a6157e596a86cd7157f33e7fb
3
+ size 4507310792
model-00070-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d126ef0714454fc76e4c27e863f9ddcb71771f1cc393de1202c17620d13e6df
3
+ size 4507310798
model-00075-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33d83ab8f668c0bb87ac90bbb338b7df11303d991ca0b5a2b77b0aa09188b063
3
+ size 4227858841
model-00080-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e066541be5390342d35599d80ea96f444ea9935d6fa4e15f00c4f3ed3a778363
3
+ size 4227858847
model-00083-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:902aff9580a24bc75b64105a6d1e3ff56599dd9e8629ebc77f5365d114b4d193
3
+ size 4227858847
model-00086-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5415141fc5ce7cc025904511886bc8bfe0f8f457ca08f2e3b8f187b137c0dec
3
+ size 4227858847
model-00089-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c9a6de0993908451a8f163a843bb4d71d6a572f39264f150295f292aa44d636
3
+ size 4227858847
model-00091-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9150cf5f40621ef657ebf81af778d1594e5afe63a6cc3eda8c5b20f918a7c940
3
+ size 4507310770
model-00101-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fc64b14bf4ad32eba845be6f8c2146fc59104f5e165ffc1059f47aff91c3d13
3
+ size 4227858847
model-00102-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:590c24d4f69b2c198f91eb260ffed4378275b38524c127a1c39bfab9a504181c
3
+ size 4227858841
model-00110-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c60575cf478cc19bca68cad1007503c5899538e16d75504e3fcc92ee25b2501
3
+ size 4227858847
model-00115-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3011f19399d207ec21dac5a670d1210f71ed3cc74efab82343f939625e22dc4e
3
+ size 4507310768
model-00116-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23db45dca16e0bbc1cd663d89003d9befc826a7706402778b03b4d6a7800ebfc
3
+ size 4227858847
model-00119-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37be721fb1f3015c0d47411844526083d7480f0d2b99ed9ec00abd803177c7ec
3
+ size 4227858847
model-00122-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:326545e47248795ec2d3c0950a6adbbc899310f0e16917ff0571f14b2e806b57
3
+ size 4227858847
model-00127-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a56b66a5c06146852fe68528771336a24779445970a23549efa135d233594a90
3
+ size 4507310784
model-00128-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52f90c778b5b7651082b67af236da8262d5c3f86fe7c170ca701bf15d67df62a
3
+ size 4227858847
model-00130-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aad64252113b6f2ba2e090b818504bb94819eb0470ea9747d60980af7090e7bf
3
+ size 4507310812
model-00140-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:795a789892283d8f47a71c326611ba9f57eca73895b10e3b0e2e19e764bbc751
3
+ size 4227858847
model-00151-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddc54cf09a0c50a215fc9a8a325be738a9a490dcf256fbe2d1362cc30676cfd0
3
+ size 4507310740
model-00152-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09eff982a07f747e43113d889861195bd5dbd50bca2d71ed1d672869bbaaeea5
3
+ size 4227858847
model-00154-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:637550d5b3f8a1908f95679c9ffad19ef84e5d22d9c6645055a1e16d0c164377
3
+ size 4507310762
model-00158-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0456daea5ba66aaa271f3d81bf33010a77fad664a8a602d23dbc1fe22f7de2bb
3
+ size 4227858847
model-00163-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f41a27c621bc123a080605b19cafd95a5e82cb7262b28d3bd1c8c3f649d91d9
3
+ size 4507310776
model-00165-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97a4ae4148bf3e46396d03ec08b3b7dd9117453d57e3ac6b947df40f3460c55c
3
+ size 4227858841
model-00166-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f645bc315e9975ac849d001e8a7ba0fa7a0a73223f452b628ac8bc62de687bc0
3
+ size 4507310778
model-00169-of-00175.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:509db5a32339d18a6ef94f0e8a87067f3299878ced1f7d203f9c8c571d6180e1
3
+ size 4507310800
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|begin▁of▁sentence|>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|end▁of▁sentence|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<|end▁of▁sentence|>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff