Update app.py
Browse files
app.py
CHANGED
|
@@ -120,7 +120,7 @@ import transformers
|
|
| 120 |
# model.half()
|
| 121 |
|
| 122 |
MODEL_ID = "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B"
|
| 123 |
-
MODEL_ID = "microsoft/phi-4"
|
| 124 |
|
| 125 |
CHAT_TEMPLATE = "َAuto"
|
| 126 |
MODEL_NAME = MODEL_ID.split("/")[-1]
|
|
@@ -133,7 +133,7 @@ quantization_config = BitsAndBytesConfig(
|
|
| 133 |
bnb_4bit_compute_dtype=torch.bfloat16
|
| 134 |
)
|
| 135 |
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
|
| 136 |
-
model =
|
| 137 |
MODEL_ID,
|
| 138 |
device_map="auto",
|
| 139 |
low_cpu_mem_usage=True,
|
|
|
|
| 120 |
# model.half()
|
| 121 |
|
| 122 |
MODEL_ID = "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B"
|
| 123 |
+
# MODEL_ID = "microsoft/phi-4"
|
| 124 |
|
| 125 |
CHAT_TEMPLATE = "َAuto"
|
| 126 |
MODEL_NAME = MODEL_ID.split("/")[-1]
|
|
|
|
| 133 |
bnb_4bit_compute_dtype=torch.bfloat16
|
| 134 |
)
|
| 135 |
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
|
| 136 |
+
model = AutoModel.from_pretrained(
|
| 137 |
MODEL_ID,
|
| 138 |
device_map="auto",
|
| 139 |
low_cpu_mem_usage=True,
|