Spaces:

LLDDWW
/

MedCard

Running

LLDDWW committed on Oct 13

Commit

2879fbc

1 Parent(s): ea3177c

Handle new PaddleOCR output format

Files changed (1) hide show

app.py CHANGED Viewed

@@ -90,15 +90,32 @@ def analyze_medication_image(image: Image.Image) -> Tuple[str, str]:
         # Step 1: OCR - PaddleOCR로 한글 텍스트 추출
         start_time = time.time()
         img_array = np.array(image)
-        ocr_results = OCR_READER.ocr(img_array, cls=True)
         ocr_time = time.time() - start_time
         print(f"⏱️ OCR took {ocr_time:.2f}s")
-        if not ocr_results or not ocr_results[0]:
             return "텍스트를 찾을 수 없습니다.", ""
         # 텍스트 추출
-        texts = [line[1][0] for line in ocr_results[0]]
         ocr_text = "\n".join(texts)
         # Step 2: 약 정보 분석 - MedGemma로 의료 정보 제공

         # Step 1: OCR - PaddleOCR로 한글 텍스트 추출
         start_time = time.time()
         img_array = np.array(image)
+        ocr_results = OCR_READER.ocr(img_array)
         ocr_time = time.time() - start_time
         print(f"⏱️ OCR took {ocr_time:.2f}s")
+        if not ocr_results:
             return "텍스트를 찾을 수 없습니다.", ""
         # 텍스트 추출
+        texts: List[str] = []
+        first_entry = ocr_results[0]
+        if isinstance(first_entry, list):
+            texts = [line[1][0] for line in first_entry if len(line) > 1 and line[1]]
+        elif isinstance(first_entry, dict):
+            rec_results = first_entry.get("text_recognition") or first_entry.get("rec_results")
+            if isinstance(rec_results, list):
+                for rec in rec_results:
+                    if isinstance(rec, dict) and rec.get("text"):
+                        texts.append(rec["text"])
+            if not texts and isinstance(first_entry.get("text"), str):
+                texts.append(first_entry["text"])
+        if not texts:
+            return "텍스트를 찾을 수 없습니다.", ""
         ocr_text = "\n".join(texts)
         # Step 2: 약 정보 분석 - MedGemma로 의료 정보 제공