giannisdaras
/

ambient-o

ambient diffusion

low-quality data

Model card · Files and versions

adrianrm committed on Aug 16

Commit

66c7512

·

verified ·

1 Parent(s): c936d1f

Update README.md

Files changed (1) hide show

README.md +23 -13

README.md CHANGED Viewed

@@ -51,36 +51,46 @@ At low diffusion times, the model exploits locality properties of natural images
 ## Usage
 ```python
-from micro_diffusion.models.model import create_latent_diffusion
 import torch
 params = {
     'latent_res': 64,
     'in_channels': 4,
     'pos_interp_scale': 2.0,
 }
 model = create_latent_diffusion(**params).to('cuda')
-checkpoint = torch.load(ckpt_path, map_location='cuda', weights_only=False)
-model_dict = checkpoint['state']['model']
-# Convert parameters to float32
 float_model_params = {
-    k.replace('dit.', ''): v.to(torch.float32) for k, v in model_dict.items() if 'dit' in k
 }
 model.dit.load_state_dict(float_model_params)
 prompts = [
     "Pirate ship trapped in a cosmic maelstrom nebula, rendered in cosmic beach whirlpool engine, volumet",
     "A illustration from a graphic novel. A bustling city street under the shine of a full moon.",
 ]
-model = model.eval()
-gen_images = model.generate(prompt=prompts, num_inference_steps=30,
-                           guidance_scale=5.0, seed=42)
 ```
 ## Citation

 ## Usage
 ```python
 import torch
+from micro_diffusion.models.model import create_latent_diffusion
+from huggingface_hub import hf_hub_download
+from safetensors import safe_open
+# Init model
 params = {
     'latent_res': 64,
     'in_channels': 4,
     'pos_interp_scale': 2.0,
 }
 model = create_latent_diffusion(**params).to('cuda')
+# Download weights from HF
+model_dict_path = hf_hub_download(repo_id="giannisdaras/ambient-o", filename="model.safetensors")
+model_dict = {}
+with safe_open(model_dict_path, framework="pt", device="cpu") as f:
+   for key in f.keys():
+       model_dict[key] = f.get_tensor(key)
+# Convert parameters to float32 + load
 float_model_params = {
+    k: v.to(torch.float32) for k, v in model_dict.items()
 }
 model.dit.load_state_dict(float_model_params)
+# Eval mode
+model = model.eval()
+# Generate images
 prompts = [
     "Pirate ship trapped in a cosmic maelstrom nebula, rendered in cosmic beach whirlpool engine, volumet",
     "A illustration from a graphic novel. A bustling city street under the shine of a full moon.",
+    "A giant cobra snake made from corn",
+    "A fierce garden gnome warrior, clad in armor crafted from leaves and bark, brandishes a tiny sword.",
+    "A capybara made of lego sitting in a realistic, natural field",
+    "a close-up of a fire spitting dragon, cinematic shot.",
+    "Panda mad scientist mixing sparkling chemicals, artstation"
 ]
+images = model.generate(prompt=prompts, num_inference_steps=30, guidance_scale=5.0, seed=42)
 ```
 ## Citation