multimodalart HF Staff committed on
Commit
4a89237
·
verified ·
1 Parent(s): e17facd

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -0
app.py CHANGED
@@ -2,6 +2,7 @@ import torch
2
  import spaces
3
  import gradio as gr
4
  from diffusers import DiffusionPipeline
 
5
 
6
  # Load the pipeline once at startup
7
  print("Loading Z-Image-Turbo pipeline...")
@@ -11,6 +12,16 @@ pipe = DiffusionPipeline.from_pretrained(
11
  low_cpu_mem_usage=False,
12
  )
13
  pipe.to("cuda")
 
 
 
 
 
 
 
 
 
 
14
  print("Pipeline loaded!")
15
 
16
  @spaces.GPU
 
2
  import spaces
3
  import gradio as gr
4
  from diffusers import DiffusionPipeline
5
+ from optimization import optimize_pipeline_
6
 
7
  # Load the pipeline once at startup
8
  print("Loading Z-Image-Turbo pipeline...")
 
12
  low_cpu_mem_usage=False,
13
  )
14
  pipe.to("cuda")
15
+ pipe.transformer.set_attention_backend("_flash_3_hub")
16
+
17
+ #warmup
18
+ optimize_pipeline_(
19
+ pipe,
20
+ prompt="prompt",
21
+ num_inference_steps=1,
22
+ guidance_scale=0.0
23
+ )
24
+
25
  print("Pipeline loaded!")
26
 
27
  @spaces.GPU