multimodalart HF Staff committed on
Commit
eee0c8d
·
verified ·
1 Parent(s): e17facd

Performance enhancements (#2)

Browse files

- Update app.py (4a892379d783a3ac642585be81313dcee9a6262f)
- Update requirements.txt (aa854da254c1ff82bda2ea19115b837e4bf2954e)
- Create optimization.py (579120fd169946f14aeeb643af8be59976f32748)
- Update app.py (b619a3366181b6ef0a418ea1e4594f4eefb7a101)
- Update app.py (98b5ab5e7f8ecaeda306170041fa982d65679d49)
- Delete optimization.py (0866e2dbdce41ed5aaaf637c53f2cf7786b259e8)
- Update app.py (35a8941a336a4943855807004d4cdf43cfec017d)

Files changed (2) hide show
  1. app.py +6 -1
  2. requirements.txt +2 -1
app.py CHANGED
@@ -11,10 +11,15 @@ pipe = DiffusionPipeline.from_pretrained(
11
  low_cpu_mem_usage=False,
12
  )
13
  pipe.to("cuda")
 
 
 
 
 
14
  print("Pipeline loaded!")
15
 
16
  @spaces.GPU
17
- def generate_image(prompt, height, width, num_inference_steps, seed, randomize_seed):
18
  """Generate an image from the given prompt."""
19
  if randomize_seed:
20
  seed = torch.randint(0, 2**32 - 1, (1,)).item()
 
11
  low_cpu_mem_usage=False,
12
  )
13
  pipe.to("cuda")
14
+
15
+ # ======== AoTI compilation + FA3 ========
16
+ pipe.transformer.layers._repeated_blocks = ["ZImageTransformerBlock"]
17
+ spaces.aoti_blocks_load(pipe.transformer.layers, "zerogpu-aoti/Z-Image", variant="fa3")
18
+
19
  print("Pipeline loaded!")
20
 
21
  @spaces.GPU
22
+ def generate_image(prompt, height, width, num_inference_steps, seed, randomize_seed, progress=gr.Progress(track_tqdm=True)):
23
  """Generate an image from the given prompt."""
24
  if randomize_seed:
25
  seed = torch.randint(0, 2**32 - 1, (1,)).item()
requirements.txt CHANGED
@@ -1,3 +1,4 @@
1
  gradio
2
  git+https://github.com/huggingface/diffusers
3
- transformers
 
 
1
  gradio
2
  git+https://github.com/huggingface/diffusers
3
+ transformers
4
+ kernels