Commit
·
3187f15
1
Parent(s):
466ab94
test
Browse files
- app.py +1 -1
- requirements.txt +2 -2
app.py
CHANGED
|
@@ -38,7 +38,7 @@ class MyModel:
|
|
| 38 |
# )
|
| 39 |
# FastLanguageModel.for_inference(client) # Enable native 2x faster inference
|
| 40 |
tokenizer = AutoTokenizer.from_pretrained(model)
|
| 41 |
-
client = AutoPeftModelForCausalLM.from_pretrained(model
|
| 42 |
|
| 43 |
self.client = client
|
| 44 |
self.tokenizer = tokenizer
|
|
|
|
| 38 |
# )
|
| 39 |
# FastLanguageModel.for_inference(client) # Enable native 2x faster inference
|
| 40 |
tokenizer = AutoTokenizer.from_pretrained(model)
|
| 41 |
+
client = AutoPeftModelForCausalLM.from_pretrained(model, load_in_4bit=True)
|
| 42 |
|
| 43 |
self.client = client
|
| 44 |
self.tokenizer = tokenizer
|
requirements.txt
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
huggingface_hub==0.25.2
|
| 2 |
transformers>=4.45.1
|
| 3 |
-
torch
|
| 4 |
peft
|
| 5 |
-
|
|
|
|
|
|
| 1 |
huggingface_hub==0.25.2
|
| 2 |
transformers>=4.45.1
|
|
|
|
| 3 |
peft
|
| 4 |
+
torch
|
| 5 |
+
#https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release_multi-backend-refactor/bitsandbytes-0.44.1.dev0-py3-none-manylinux_2_24_x86_64.whl
|