Spaces:

doinglean
/

yolov8

Runtime error

App Files Files Community

doinglean commited on Sep 4

Commit

b65ef32

verified ·

1 Parent(s): c7ca595

Update app.py

Browse files

Files changed (1) hide show

app.py +33 -55

app.py CHANGED Viewed

@@ -2,77 +2,55 @@ import gradio as gr
 import cv2
 import numpy as np
 from ultralytics import YOLO
-import easyocr
 # Lade YOLOv8-Modell
-model = YOLO("yolov8n.pt", weights_only=False)  # Nano-Modell, weights_only=False für einfaches Laden
-# Lade EasyOCR
-reader = easyocr.Reader(['en'], gpu=False)  # Englisch, CPU für Free Tier
 def analyze_image(image, prompt):
     # Konvertiere PIL-Bild zu numpy-Format
     image_np = np.array(image)
     image_cv = cv2.cvtColor(image_np, cv2.COLOR_RGB2BGR)
-    # Allgemeine Bildbeschreibung
-    if "what do you see" in prompt.lower() or "was siehst du" in prompt.lower():
-        return "Ein Candlestick-Chart mit grünen und roten Kerzen, Preisen auf der y-Achse und weißem Hintergrund."
-    # Kerzen-Analyse
-    elif "last 8 candles" in prompt.lower() or "letzte 8 kerzen" in prompt.lower():
-        # YOLOv8 für Kerzen-Erkennung
-        results = model.predict(source=image_np, conf=0.3, iou=0.5)
-        detections = []
-        for r in results:
-            boxes = r.boxes.xyxy.cpu().numpy()
-            for box in boxes:
-                # Filter für Kerzen (schmal und hoch)
-                xmin, ymin, xmax, ymax = map(int, box)
-                if (ymax - ymin) / (xmax - xmin) > 2:  # Verhältnis für Kerzen
-                    candle_roi = image_cv[ymin:ymax, xmin:xmax]
-                    if candle_roi.size == 0:
-                        continue
-                    mean_color = np.mean(candle_roi, axis=(0, 1)).astype(int)
-                    color_rgb = f"RGB({mean_color[2]},{mean_color[1]},{mean_color[0]})"
-                    # OCR für Preise
-                    price_roi = image_cv[max(0, ymin-200):min(image_np.shape[0], ymax+200),
-                                        max(0, xmin-200):min(image_np.shape[1], xmax+200)]
-                    ocr_results = reader.readtext(price_roi, detail=0)
-                    prices = " ".join(ocr_results) if ocr_results else "Kein Preis erkannt"
-                    detections.append({
-                        "Kerze": f"Farbe: {color_rgb}, Preise: {prices}",
-                        "x_center": (xmin + xmax) / 2
-                    })
-        # Sortiere nach x-Position (rechts nach links = neueste Kerzen)
-        detections = sorted(detections, key=lambda x: x["x_center"], reverse=True)[:8]
-        if not detections:
-            return "Keine Kerzen erkannt. Bitte lade ein klares Bild mit sichtbaren Kerzen und Preisen hoch."
-        # Textantwort erstellen
-        response = "Letzte 8 Kerzen:\n"
-        for i, detection in enumerate(detections, 1):
-            response += f"Kerze {i}: {detection['Kerze']}\n"
-        return response
-    else:
-        return "Nicht unterstützter Prompt. Verwende 'Was siehst du auf dem Bild?' oder 'List last 8 candles with their colors'."
 # Erstelle Gradio-Schnittstelle
 iface = gr.Interface(
     fn=analyze_image,
     inputs=[
         gr.Image(type="pil", label="Bild hochladen"),
-        gr.Textbox(label="Prompt", placeholder="z. B. 'Was siehst du auf dem Bild?' oder 'List last 8 candles with their colors'")
     ],
     outputs="text",
-    title="Einfache Chart-Analyse mit YOLOv8",
-    description="Lade einen TradingView-Screenshot hoch, um Kerzen zu analysieren oder eine Beschreibung zu erhalten."
 )
 iface.launch()

 import cv2
 import numpy as np
 from ultralytics import YOLO
 # Lade YOLOv8-Modell
+model = YOLO("yolov8n.pt")  # Nano-Modell, Standard-Laden
 def analyze_image(image, prompt):
+    # Prüfe Prompt
+    if "what do you see" not in prompt.lower() and "was siehst du" not in prompt.lower():
+        return "Nicht unterstützter Prompt. Verwende 'Was siehst du auf dem Bild?'"
     # Konvertiere PIL-Bild zu numpy-Format
     image_np = np.array(image)
     image_cv = cv2.cvtColor(image_np, cv2.COLOR_RGB2BGR)
+    # YOLOv8 für Objekterkennung
+    results = model.predict(source=image_np, conf=0.3, iou=0.5)
+    objects = []
+    for r in results:
+        boxes = r.boxes.xyxy.cpu().numpy()
+        labels = r.boxes.cls.cpu().numpy()
+        class_names = model.names  # Klassen-Namen aus dem Modell
+        for box, label in zip(boxes, labels):
+            class_name = class_names[int(label)]
+            objects.append(class_name)
+    # Erstelle Textbeschreibung
+    if not objects:
+        return "Keine Objekte erkannt. Es sieht aus wie ein Chart oder ein anderes Bild ohne klar erkennbare Objekte."
+    object_count = {}
+    for obj in objects:
+        object_count[obj] = object_count.get(obj, 0) + 1
+    response = "Ich sehe folgende Objekte im Bild:\n"
+    for obj, count in object_count.items():
+        response += f"- {obj} ({count}x)\n"
+    return response
 # Erstelle Gradio-Schnittstelle
 iface = gr.Interface(
     fn=analyze_image,
     inputs=[
         gr.Image(type="pil", label="Bild hochladen"),
+        gr.Textbox(label="Prompt", placeholder="z. B. 'Was siehst du auf dem Bild?'")
     ],
     outputs="text",
+    title="Einfache Bildanalyse mit YOLOv8",
+    description="Lade ein Bild hoch und frage 'Was siehst du auf dem Bild?' für eine Beschreibung."
 )
 iface.launch()