Spaces:
Running
on
Zero
Running
on
Zero
Update app_quant_latent.py
Browse files
- app_quant_latent.py +1 -0
app_quant_latent.py
CHANGED
@@ -232,6 +232,7 @@ try:
  transformer=transformer,
  text_encoder=text_encoder,
  torch_dtype=torch_dtype,
+ attn_implementation="kernels-community/vllm-flash-attn3",
  )
  pipe.to(device)
  log("✅ Pipeline built successfully.")