Update app.py
Browse files
app.py
CHANGED
|
@@ -38,7 +38,7 @@ class MyModel:
|
|
| 38 |
# )
|
| 39 |
# FastLanguageModel.for_inference(client) # Enable native 2x faster inference
|
| 40 |
tokenizer = AutoTokenizer.from_pretrained(model)
|
| 41 |
-
client = AutoPeftModelForCausalLM.from_pretrained(model
|
| 42 |
|
| 43 |
self.client = client
|
| 44 |
self.tokenizer = tokenizer
|
|
|
|
| 38 |
# )
|
| 39 |
# FastLanguageModel.for_inference(client) # Enable native 2x faster inference
|
| 40 |
tokenizer = AutoTokenizer.from_pretrained(model)
|
| 41 |
+
client = AutoPeftModelForCausalLM.from_pretrained(model) #, load_in_4bit=True)
|
| 42 |
|
| 43 |
self.client = client
|
| 44 |
self.tokenizer = tokenizer
|