Spaces:
Runtime error
Runtime error
Feature(MInference): add dtype
Browse files
app.py
CHANGED
|
@@ -57,7 +57,7 @@ h1 {
|
|
| 57 |
# Load the tokenizer and model
|
| 58 |
model_name = "gradientai/Llama-3-8B-Instruct-262k"
|
| 59 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 60 |
-
model = AutoModelForCausalLM.from_pretrained(model_name, device_map="auto") # to("cuda:0")
|
| 61 |
|
| 62 |
from minference import MInference
|
| 63 |
minference_patch = MInference("minference", model_name)
|
|
|
|
| 57 |
# Load the tokenizer and model
|
| 58 |
model_name = "gradientai/Llama-3-8B-Instruct-262k"
|
| 59 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 60 |
+
model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto", device_map="auto") # to("cuda:0")
|
| 61 |
|
| 62 |
from minference import MInference
|
| 63 |
minference_patch = MInference("minference", model_name)
|