Add files using upload-large-folder tool
Browse files
- README.md +37 -0
- config.json +66 -0
- generation_config.json +9 -0
- model-00003-of-00175.safetensors +3 -0
- model-00006-of-00175.safetensors +3 -0
- model-00009-of-00175.safetensors +3 -0
- model-00020-of-00175.safetensors +3 -0
- model-00023-of-00175.safetensors +3 -0
- model-00031-of-00175.safetensors +3 -0
- model-00032-of-00175.safetensors +3 -0
- model-00034-of-00175.safetensors +3 -0
- model-00038-of-00175.safetensors +3 -0
- model-00041-of-00175.safetensors +3 -0
- model-00042-of-00175.safetensors +3 -0
- model-00044-of-00175.safetensors +3 -0
- model-00047-of-00175.safetensors +3 -0
- model-00048-of-00175.safetensors +3 -0
- model-00059-of-00175.safetensors +3 -0
- model-00062-of-00175.safetensors +3 -0
- model-00067-of-00175.safetensors +3 -0
- model-00070-of-00175.safetensors +3 -0
- model-00075-of-00175.safetensors +3 -0
- model-00080-of-00175.safetensors +3 -0
- model-00083-of-00175.safetensors +3 -0
- model-00086-of-00175.safetensors +3 -0
- model-00089-of-00175.safetensors +3 -0
- model-00091-of-00175.safetensors +3 -0
- model-00101-of-00175.safetensors +3 -0
- model-00102-of-00175.safetensors +3 -0
- model-00110-of-00175.safetensors +3 -0
- model-00115-of-00175.safetensors +3 -0
- model-00116-of-00175.safetensors +3 -0
- model-00119-of-00175.safetensors +3 -0
- model-00122-of-00175.safetensors +3 -0
- model-00127-of-00175.safetensors +3 -0
- model-00128-of-00175.safetensors +3 -0
- model-00130-of-00175.safetensors +3 -0
- model-00140-of-00175.safetensors +3 -0
- model-00151-of-00175.safetensors +3 -0
- model-00152-of-00175.safetensors +3 -0
- model-00154-of-00175.safetensors +3 -0
- model-00158-of-00175.safetensors +3 -0
- model-00163-of-00175.safetensors +3 -0
- model-00165-of-00175.safetensors +3 -0
- model-00166-of-00175.safetensors +3 -0
- model-00169-of-00175.safetensors +3 -0
- model.safetensors.index.json +0 -0
- special_tokens_map.json +23 -0
- tokenizer.json +0 -0
- tokenizer_config.json +0 -0
README.md
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
license: mit
|
| 3 |
+
library_name: mlx
|
| 4 |
+
base_model: deepseek-ai/DeepSeek-V3.2
|
| 5 |
+
base_model_relation: quantized
|
| 6 |
+
pipeline_tag: text-generation
|
| 7 |
+
tags:
|
| 8 |
+
- mlx
|
| 9 |
+
---
|
| 10 |
+
|
| 11 |
+
# mlx-community/DeepSeek-V3.2-8bit
|
| 12 |
+
|
| 13 |
+
This model [mlx-community/DeepSeek-V3.2-8bit](https://huggingface.co/mlx-community/DeepSeek-V3.2-8bit) was
|
| 14 |
+
converted to MLX format from [deepseek-ai/DeepSeek-V3.2](https://huggingface.co/deepseek-ai/DeepSeek-V3.2)
|
| 15 |
+
using mlx-lm version **0.28.4**.
|
| 16 |
+
|
| 17 |
+
## Use with mlx
|
| 18 |
+
|
| 19 |
+
```bash
|
| 20 |
+
pip install mlx-lm
|
| 21 |
+
```
|
| 22 |
+
|
| 23 |
+
```python
|
| 24 |
+
from mlx_lm import load, generate
|
| 25 |
+
|
| 26 |
+
model, tokenizer = load("mlx-community/DeepSeek-V3.2-8bit")
|
| 27 |
+
|
| 28 |
+
prompt = "hello"
|
| 29 |
+
|
| 30 |
+
if tokenizer.chat_template is not None:
|
| 31 |
+
    messages = [{"role": "user", "content": prompt}]
|
| 32 |
+
    prompt = tokenizer.apply_chat_template(
|
| 33 |
+
        messages, add_generation_prompt=True
|
| 34 |
+
    )
|
| 35 |
+
|
| 36 |
+
response = generate(model, tokenizer, prompt=prompt, verbose=True)
|
| 37 |
+
```
|
config.json
ADDED
|
@@ -0,0 +1,66 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"DeepseekV32ForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"attention_bias": false,
|
| 6 |
+
"attention_dropout": 0.0,
|
| 7 |
+
"bos_token_id": 0,
|
| 8 |
+
"eos_token_id": 1,
|
| 9 |
+
"ep_size": 1,
|
| 10 |
+
"first_k_dense_replace": 3,
|
| 11 |
+
"hidden_act": "silu",
|
| 12 |
+
"hidden_size": 7168,
|
| 13 |
+
"index_head_dim": 128,
|
| 14 |
+
"index_n_heads": 64,
|
| 15 |
+
"index_topk": 2048,
|
| 16 |
+
"initializer_range": 0.02,
|
| 17 |
+
"intermediate_size": 18432,
|
| 18 |
+
"kv_lora_rank": 512,
|
| 19 |
+
"max_position_embeddings": 163840,
|
| 20 |
+
"model_type": "deepseek_v32",
|
| 21 |
+
"moe_intermediate_size": 2048,
|
| 22 |
+
"moe_layer_freq": 1,
|
| 23 |
+
"n_group": 8,
|
| 24 |
+
"n_routed_experts": 256,
|
| 25 |
+
"n_shared_experts": 1,
|
| 26 |
+
"norm_topk_prob": true,
|
| 27 |
+
"num_attention_heads": 128,
|
| 28 |
+
"num_experts_per_tok": 8,
|
| 29 |
+
"num_hidden_layers": 61,
|
| 30 |
+
"num_key_value_heads": 128,
|
| 31 |
+
"num_nextn_predict_layers": 1,
|
| 32 |
+
"q_lora_rank": 1536,
|
| 33 |
+
"qk_nope_head_dim": 128,
|
| 34 |
+
"qk_rope_head_dim": 64,
|
| 35 |
+
"quantization": {
|
| 36 |
+
"group_size": 32,
|
| 37 |
+
"bits": 8,
|
| 38 |
+
"mode": "affine"
|
| 39 |
+
},
|
| 40 |
+
"quantization_config": {
|
| 41 |
+
"group_size": 32,
|
| 42 |
+
"bits": 8,
|
| 43 |
+
"mode": "affine"
|
| 44 |
+
},
|
| 45 |
+
"rms_norm_eps": 1e-06,
|
| 46 |
+
"rope_scaling": {
|
| 47 |
+
"beta_fast": 32,
|
| 48 |
+
"beta_slow": 1,
|
| 49 |
+
"factor": 40,
|
| 50 |
+
"mscale": 1.0,
|
| 51 |
+
"mscale_all_dim": 1.0,
|
| 52 |
+
"original_max_position_embeddings": 4096,
|
| 53 |
+
"type": "yarn"
|
| 54 |
+
},
|
| 55 |
+
"rope_theta": 10000,
|
| 56 |
+
"routed_scaling_factor": 2.5,
|
| 57 |
+
"scoring_func": "sigmoid",
|
| 58 |
+
"tie_word_embeddings": false,
|
| 59 |
+
"topk_group": 4,
|
| 60 |
+
"topk_method": "noaux_tc",
|
| 61 |
+
"torch_dtype": "bfloat16",
|
| 62 |
+
"transformers_version": "4.44.2",
|
| 63 |
+
"use_cache": true,
|
| 64 |
+
"v_head_dim": 128,
|
| 65 |
+
"vocab_size": 129280
|
| 66 |
+
}
|
generation_config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_from_model_config": true,
|
| 3 |
+
"bos_token_id": 0,
|
| 4 |
+
"eos_token_id": 1,
|
| 5 |
+
"do_sample": true,
|
| 6 |
+
"temperature": 1.0,
|
| 7 |
+
"top_p": 0.95,
|
| 8 |
+
"transformers_version": "4.46.3"
|
| 9 |
+
}
|
model-00003-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b4b54bf32fe51509b459621399e8426887f8755dd01749ec96ea09671d85d80
|
| 3 |
+
size 4227858838
|
model-00006-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2b6576a543fa98d98f2495c85094034a774bcf9a1c0258a127ab047a292b7a2
|
| 3 |
+
size 4227858838
|
model-00009-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08bbab654988f2d9a9992a787f4fdbcacb68ceb0c934d4aa40d0cd5f82cef253
|
| 3 |
+
size 4227858838
|
model-00020-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:21b87512f897851a64ece5a52559e17cb72faed9f4062c1b87b6b4e86ded18dd
|
| 3 |
+
size 4227858844
|
model-00023-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b9e21fddb8453766b1b41f56cd637a67986e8359b9add7a09cb7062094f5bca
|
| 3 |
+
size 4227858847
|
model-00031-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06dae087412af0fe8c5f0273ff2bc94a96fe5cfa941ed6f2036d1cc1d4dbd9aa
|
| 3 |
+
size 4507310818
|
model-00032-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2326b2714e92b141093d1fe1122a6776cacb03c7449286b071085b06a2a3ddbf
|
| 3 |
+
size 4227858847
|
model-00034-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4a597f6d699916f4ac27a728389e29445fb399f30a04fbe4906b12d30f9e5de3
|
| 3 |
+
size 4507310800
|
model-00038-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d1c0699350d71754cc9e7727b31252116652e37ab793038ceef387c36497374
|
| 3 |
+
size 4227858847
|
model-00041-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4347d9cfec14593d2a3e2cd2ea2b016c77cefff132dbe06c0f8a898ba0896b8b
|
| 3 |
+
size 4227858847
|
model-00042-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23eb0c591e5aa48304e04563219b3ab6da7fe6d49c5cdb21fdef5a96ac007188
|
| 3 |
+
size 4227858841
|
model-00044-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4a0be5beb51d6db179329289012da9946bf28cbc46d3f6238394fa0b42d0323
|
| 3 |
+
size 4227858847
|
model-00047-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e60abc9f6fdc61408bddc2b8214c30b3d3236da32e728c9cfadb1e8242a0aeb
|
| 3 |
+
size 4227858847
|
model-00048-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d0b0d47e46e1369301f57278eb46f69480a77a5897447881341cad5fa599ccb4
|
| 3 |
+
size 4227858841
|
model-00059-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9abda0f573eae2311f13190b6a6ee66a771796f51ad414f334dd57353771bca6
|
| 3 |
+
size 4227858847
|
model-00062-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe927565d50dbda46581cd5b099177d0f7402adec46549f439b7cc5dbf5ede64
|
| 3 |
+
size 4227858847
|
model-00067-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2fc725ee64992be6eea8aa620053d8c84b64c77a6157e596a86cd7157f33e7fb
|
| 3 |
+
size 4507310792
|
model-00070-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d126ef0714454fc76e4c27e863f9ddcb71771f1cc393de1202c17620d13e6df
|
| 3 |
+
size 4507310798
|
model-00075-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33d83ab8f668c0bb87ac90bbb338b7df11303d991ca0b5a2b77b0aa09188b063
|
| 3 |
+
size 4227858841
|
model-00080-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e066541be5390342d35599d80ea96f444ea9935d6fa4e15f00c4f3ed3a778363
|
| 3 |
+
size 4227858847
|
model-00083-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:902aff9580a24bc75b64105a6d1e3ff56599dd9e8629ebc77f5365d114b4d193
|
| 3 |
+
size 4227858847
|
model-00086-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b5415141fc5ce7cc025904511886bc8bfe0f8f457ca08f2e3b8f187b137c0dec
|
| 3 |
+
size 4227858847
|
model-00089-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c9a6de0993908451a8f163a843bb4d71d6a572f39264f150295f292aa44d636
|
| 3 |
+
size 4227858847
|
model-00091-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9150cf5f40621ef657ebf81af778d1594e5afe63a6cc3eda8c5b20f918a7c940
|
| 3 |
+
size 4507310770
|
model-00101-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2fc64b14bf4ad32eba845be6f8c2146fc59104f5e165ffc1059f47aff91c3d13
|
| 3 |
+
size 4227858847
|
model-00102-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:590c24d4f69b2c198f91eb260ffed4378275b38524c127a1c39bfab9a504181c
|
| 3 |
+
size 4227858841
|
model-00110-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3c60575cf478cc19bca68cad1007503c5899538e16d75504e3fcc92ee25b2501
|
| 3 |
+
size 4227858847
|
model-00115-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3011f19399d207ec21dac5a670d1210f71ed3cc74efab82343f939625e22dc4e
|
| 3 |
+
size 4507310768
|
model-00116-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23db45dca16e0bbc1cd663d89003d9befc826a7706402778b03b4d6a7800ebfc
|
| 3 |
+
size 4227858847
|
model-00119-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37be721fb1f3015c0d47411844526083d7480f0d2b99ed9ec00abd803177c7ec
|
| 3 |
+
size 4227858847
|
model-00122-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:326545e47248795ec2d3c0950a6adbbc899310f0e16917ff0571f14b2e806b57
|
| 3 |
+
size 4227858847
|
model-00127-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a56b66a5c06146852fe68528771336a24779445970a23549efa135d233594a90
|
| 3 |
+
size 4507310784
|
model-00128-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:52f90c778b5b7651082b67af236da8262d5c3f86fe7c170ca701bf15d67df62a
|
| 3 |
+
size 4227858847
|
model-00130-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aad64252113b6f2ba2e090b818504bb94819eb0470ea9747d60980af7090e7bf
|
| 3 |
+
size 4507310812
|
model-00140-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:795a789892283d8f47a71c326611ba9f57eca73895b10e3b0e2e19e764bbc751
|
| 3 |
+
size 4227858847
|
model-00151-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ddc54cf09a0c50a215fc9a8a325be738a9a490dcf256fbe2d1362cc30676cfd0
|
| 3 |
+
size 4507310740
|
model-00152-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09eff982a07f747e43113d889861195bd5dbd50bca2d71ed1d672869bbaaeea5
|
| 3 |
+
size 4227858847
|
model-00154-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:637550d5b3f8a1908f95679c9ffad19ef84e5d22d9c6645055a1e16d0c164377
|
| 3 |
+
size 4507310762
|
model-00158-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0456daea5ba66aaa271f3d81bf33010a77fad664a8a602d23dbc1fe22f7de2bb
|
| 3 |
+
size 4227858847
|
model-00163-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f41a27c621bc123a080605b19cafd95a5e82cb7262b28d3bd1c8c3f649d91d9
|
| 3 |
+
size 4507310776
|
model-00165-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97a4ae4148bf3e46396d03ec08b3b7dd9117453d57e3ac6b947df40f3460c55c
|
| 3 |
+
size 4227858841
|
model-00166-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f645bc315e9975ac849d001e8a7ba0fa7a0a73223f452b628ac8bc62de687bc0
|
| 3 |
+
size 4507310778
|
model-00169-of-00175.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:509db5a32339d18a6ef94f0e8a87067f3299878ced1f7d203f9c8c571d6180e1
|
| 3 |
+
size 4507310800
|
model.safetensors.index.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<|begin▁of▁sentence|>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"eos_token": {
|
| 10 |
+
"content": "<|end▁of▁sentence|>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "<|end▁of▁sentence|>",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
}
|
| 23 |
+
}
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|