Spaces:

primerz
/

face-to-pixel-art

Running on Zero

App Files Community

primerz committed 26 days ago

Commit

ea17e03

verified ·

1 Parent(s): 8d98c0c

Update model.py

Browse files

Files changed (1) hide show

model.py +28 -92

model.py CHANGED Viewed

@@ -6,7 +6,7 @@ from config import Config
 from diffusers import (
     ControlNetModel,
-    TCDScheduler,
 )
 from diffusers.models.controlnets.multicontrolnet import MultiControlNetModel
@@ -15,17 +15,15 @@ from pipeline_stable_diffusion_xl_instantid_img2img import StableDiffusionXLInst
 from huggingface_hub import snapshot_download, hf_hub_download
 from insightface.app import FaceAnalysis
-from controlnet_aux import LeresDetector, LineartAnimeDetector, CannyDetector
 class ModelHandler:
     def __init__(self):
         self.pipeline = None
-        self.app = None  # InsightFace
         self.leres_detector = None
         self.lineart_anime_detector = None
-        self.canny_detector = None
         self.face_analysis_loaded = False
-        self.edge_type = Config.DEFAULT_EDGE_TYPE
     def load_face_analysis(self):
         """
@@ -41,7 +39,7 @@ class ModelHandler:
             try:
                 snapshot_download(
                     repo_id=Config.ANTELOPEV2_REPO,
-                    local_dir=model_path,
                 )
             except Exception as e:
                 print(f"  [ERROR] Failed to download AntelopeV2 models: {e}")
@@ -61,65 +59,25 @@ class ModelHandler:
             print(f"  [WARNING] Face detection system failed to initialize: {e}")
             return False
-    def load_models(self, edge_type="canny"):
-        """
-        Load all models with support for different edge detection types.
-        Args:
-            edge_type: "canny", "lineart", or "both"
-        """
-        self.edge_type = edge_type
         # 1. Load Face Analysis
         self.face_analysis_loaded = self.load_face_analysis()
-        # 2. Load ControlNets based on edge_type
-        print(f"Loading ControlNets (InstantID, Zoe, {edge_type.upper()})...")
         cn_instantid = ControlNetModel.from_pretrained(
             Config.INSTANTID_REPO,
             subfolder="ControlNetModel",
             torch_dtype=Config.DTYPE
         )
-        cn_zoe = ControlNetModel.from_pretrained(
-            Config.CN_ZOE_REPO,
-            torch_dtype=Config.DTYPE
-        )
-        # Load edge ControlNet(s)
-        controlnet_list = [cn_instantid, cn_zoe]
-        if edge_type == "canny":
-            cn_canny = ControlNetModel.from_pretrained(
-                Config.CN_CANNY_REPO,
-                torch_dtype=Config.DTYPE
-            )
-            controlnet_list.append(cn_canny)
-            print("  [OK] Loaded Canny ControlNet")
-        elif edge_type == "lineart":
-            cn_lineart = ControlNetModel.from_pretrained(
-                Config.CN_LINEART_REPO,
-                torch_dtype=Config.DTYPE
-            )
-            controlnet_list.append(cn_lineart)
-            print("  [OK] Loaded LineArt ControlNet")
-        elif edge_type == "both":
-            cn_canny = ControlNetModel.from_pretrained(
-                Config.CN_CANNY_REPO,
-                torch_dtype=Config.DTYPE
-            )
-            cn_lineart = ControlNetModel.from_pretrained(
-                Config.CN_LINEART_REPO,
-                torch_dtype=Config.DTYPE
-            )
-            controlnet_list.extend([cn_canny, cn_lineart])
-            print("  [OK] Loaded both Canny and LineArt ControlNets")
         print("Wrapping ControlNets in MultiControlNetModel...")
         controlnet = MultiControlNetModel(controlnet_list)
-        # 3. Load SDXL Pipeline
         print(f"Loading SDXL Pipeline ({Config.CHECKPOINT_FILENAME})...")
         checkpoint_local_path = os.path.join("./models", Config.CHECKPOINT_FILENAME)
@@ -148,15 +106,18 @@ class ModelHandler:
         except Exception as e:
             print(f"  [WARNING] Failed to enable xFormers: {e}")
-        # 4. Set TCD Scheduler
-        print("Configuring TCDScheduler...")
-        self.pipeline.scheduler = TCDScheduler.from_config(self.pipeline.scheduler.config)
-        print("  [OK] TCDScheduler loaded.")
         # 5. Load Adapters
         print("Loading Adapters...")
-        # 5a. Load and Fuse Style LoRA
         print(f"Loading and Fusing Style LoRA ({Config.LORA_FILENAME})...")
         style_lora_path = os.path.join("./models", Config.LORA_FILENAME)
         if not os.path.exists(style_lora_path):
@@ -170,7 +131,7 @@ class ModelHandler:
         self.pipeline.fuse_lora(lora_scale=Config.LORA_STRENGTH)
         print("  [OK] Style LoRA fused.")
-        # 5b. Load IP-Adapter for InstantID
         ip_adapter_filename = "ip-adapter.bin"
         ip_adapter_local_path = os.path.join("./models", ip_adapter_filename)
         if not os.path.exists(ip_adapter_local_path):
@@ -181,19 +142,14 @@ class ModelHandler:
                 local_dir_use_symlinks=False
             )
         self.pipeline.load_ip_adapter_instantid(ip_adapter_local_path)
-        print("  [OK] InstantID IP-Adapter loaded.")
-        # 6. Load Preprocessors
-        print("Loading Preprocessors...")
         self.leres_detector = LeresDetector.from_pretrained(Config.ANNOTATOR_REPO)
-        if edge_type in ["canny", "both"]:
-            self.canny_detector = CannyDetector()
-            print("  [OK] Canny detector loaded")
-        if edge_type in ["lineart", "both"]:
-            self.lineart_anime_detector = LineartAnimeDetector.from_pretrained(Config.ANNOTATOR_REPO)
-            print("  [OK] LineArt detector loaded")
         print("--- All models loaded successfully ---")
@@ -206,28 +162,8 @@ class ModelHandler:
             faces = self.app.get(cv2_img)
             if len(faces) == 0:
                 return None
-            faces = sorted(
-                faces,
-                key=lambda x: (x['bbox'][2]-x['bbox'][0])*(x['bbox'][3]-x['bbox'][1]),
-                reverse=True
-            )
             return faces[0]
         except Exception as e:
             print(f"Face embedding extraction failed: {e}")
-            return None
-    def extract_depth(self, image):
-        """Extract depth map using LeReS detector"""
-        return self.leres_detector(image)
-    def extract_canny(self, image, low_threshold=100, high_threshold=200):
-        """Extract Canny edges"""
-        if self.canny_detector is None:
-            raise ValueError("Canny detector not loaded. Initialize with edge_type='canny' or 'both'")
-        return self.canny_detector(image, low_threshold=low_threshold, high_threshold=high_threshold)
-    def extract_lineart(self, image):
-        """Extract LineArt edges"""
-        if self.lineart_anime_detector is None:
-            raise ValueError("LineArt detector not loaded. Initialize with edge_type='lineart' or 'both'")
-        return self.lineart_anime_detector(image)

 from diffusers import (
     ControlNetModel,
+    DPMSolverMultistepScheduler,
 )
 from diffusers.models.controlnets.multicontrolnet import MultiControlNetModel
 from huggingface_hub import snapshot_download, hf_hub_download
 from insightface.app import FaceAnalysis
+from controlnet_aux import LeresDetector, LineartAnimeDetector
 class ModelHandler:
     def __init__(self):
         self.pipeline = None
+        self.app = None # InsightFace
         self.leres_detector = None
         self.lineart_anime_detector = None
         self.face_analysis_loaded = False
     def load_face_analysis(self):
         """
             try:
                 snapshot_download(
                     repo_id=Config.ANTELOPEV2_REPO,
+                    local_dir=model_path, # Download to the correct expected path
                 )
             except Exception as e:
                 print(f"  [ERROR] Failed to download AntelopeV2 models: {e}")
             print(f"  [WARNING] Face detection system failed to initialize: {e}")
             return False
+    def load_models(self):
         # 1. Load Face Analysis
         self.face_analysis_loaded = self.load_face_analysis()
+        # 2. Load ControlNets
+        print("Loading ControlNets (InstantID, Zoe, LineArt)...")
         cn_instantid = ControlNetModel.from_pretrained(
             Config.INSTANTID_REPO,
             subfolder="ControlNetModel",
             torch_dtype=Config.DTYPE
         )
+        cn_zoe = ControlNetModel.from_pretrained(Config.CN_ZOE_REPO, torch_dtype=Config.DTYPE)
+        cn_lineart = ControlNetModel.from_pretrained(Config.CN_LINEART_REPO, torch_dtype=Config.DTYPE)
         print("Wrapping ControlNets in MultiControlNetModel...")
+        controlnet_list = [cn_instantid, cn_zoe, cn_lineart]
         controlnet = MultiControlNetModel(controlnet_list)
+        # 3. Load SDXL Pipeline (Now from 'reality.safetensors')
         print(f"Loading SDXL Pipeline ({Config.CHECKPOINT_FILENAME})...")
         checkpoint_local_path = os.path.join("./models", Config.CHECKPOINT_FILENAME)
         except Exception as e:
             print(f"  [WARNING] Failed to enable xFormers: {e}")
+        # 4. Set DPMSolver++ Scheduler with Karras sigmas
+        print("Configuring DPMSolverMultistepScheduler...")
+        self.pipeline.scheduler = DPMSolverMultistepScheduler.from_config(
+            self.pipeline.scheduler.config,
+            use_karras_sigmas=True
+        )
+        print("  [OK] DPMSolverMultistepScheduler loaded with Karras sigmas.")
         # 5. Load Adapters
         print("Loading Adapters...")
+        # 5b. Load and Fuse Style LoRA (lucasart)
         print(f"Loading and Fusing Style LoRA ({Config.LORA_FILENAME})...")
         style_lora_path = os.path.join("./models", Config.LORA_FILENAME)
         if not os.path.exists(style_lora_path):
         self.pipeline.fuse_lora(lora_scale=Config.LORA_STRENGTH)
         print("  [OK] Style LoRA fused.")
+        # 5c. Load IP-Adapter (for InstantID) - *Must be loaded AFTER fusing*
         ip_adapter_filename = "ip-adapter.bin"
         ip_adapter_local_path = os.path.join("./models", ip_adapter_filename)
         if not os.path.exists(ip_adapter_local_path):
                 local_dir_use_symlinks=False
             )
         self.pipeline.load_ip_adapter_instantid(ip_adapter_local_path)
+        print("  [OK] IP-Adapter loaded.")
+        # --- END FIX ---
+        # 7. Load Preprocessors
+        print("Loading Preprocessors (LeReS, LineArtAnime)...")
         self.leres_detector = LeresDetector.from_pretrained(Config.ANNOTATOR_REPO)
+        self.lineart_anime_detector = LineartAnimeDetector.from_pretrained(Config.ANNOTATOR_REPO)
         print("--- All models loaded successfully ---")
             faces = self.app.get(cv2_img)
             if len(faces) == 0:
                 return None
+            faces = sorted(faces, key=lambda x: (x['bbox'][2]-x['bbox'][0])*(x['bbox'][3]-x['bbox'][1]), reverse=True)
             return faces[0]
         except Exception as e:
             print(f"Face embedding extraction failed: {e}")
+            return None