Spaces:

gkdud00
/

project-tdm

Running

App Files Files Community

hy committed 20 days ago

Commit

61d0a1d

1 Parent(s): 1ae484c

e

Browse files

Files changed (1) hide show

aggro_model.py +82 -19

aggro_model.py CHANGED Viewed

@@ -152,48 +152,111 @@ except Exception as e:
 # 3. 메인 함수
 # =============================================================================
 def get_aggro_score(title: str) -> dict:
     # 1. 규칙 기반 점수
     rule_score = 0.0
     rule_pattern = "분석 불가"
-    if rule_scorer:
-        try:
-            res = rule_scorer.get_score(title)
-            rule_score = res['score']
-            rule_pattern = res.get('pattern_name', '알 수 없음')
-        except Exception as e:
-            print(f"규칙 계산 에러: {e}")
-            rule_score = 50.0
     # 2. KoBERT 점수
     bert_score = 0.0
     if aggro_model and tokenizer:
         try:
             inputs = tokenizer(
-                title, return_tensors='pt', padding="max_length", truncation=True, max_length=64
             )
             input_ids = inputs['input_ids'].to(device)
             mask = inputs['attention_mask'].to(device)
             with torch.no_grad():
                 outputs = aggro_model(input_ids, mask)
-                probs = F.softmax(outputs / 2.0, dim=1)
                 bert_score = probs[0][1].item() * 100
-        except:
             bert_score = 50.0
-     # Safety Net 적용 (규칙 점수가 낮으면 AI 점수도 깎음)
     if rule_score < 5:
-        bert_score *= 0.3 # 규칙 점수가 거의 없으면 AI 점수 70% 삭감
     elif rule_score < 20:
-        bert_score *= 0.8 # 규칙 점수가 낮으면 AI 점수 20% 삭감
-    #3. 합산
-    w_rule = 0.0
-    w_bert = 1.0
     final_score = (rule_score * w_rule) + (bert_score * w_bert)
     # 4. 결과
     normalized_score = min(final_score / 100.0, 1.0)

 # 3. 메인 함수
 # =============================================================================
 def get_aggro_score(title: str) -> dict:
+    print(f"\n[DEBUG] 분석할 제목: {title}") # 1. 제목이 잘 들어왔나 확인
     # 1. 규칙 기반 점수
     rule_score = 0.0
     rule_pattern = "분석 불가"
+    try:
+        res = rule_scorer.get_score(title)
+        rule_score = res['score'] # 0~100점
+        rule_pattern = res.get('pattern_name', '알 수 없음')
+    except Exception as e:
+        print(f"[DEBUG] 규칙 계산 에러: {e}")
+        rule_score = 0.0
+    print(f"[DEBUG] 1. 규칙 점수: {rule_score}") # 2. 규칙 점수 확인
     # 2. KoBERT 점수
     bert_score = 0.0
     if aggro_model and tokenizer:
         try:
             inputs = tokenizer(
+                title,
+                return_tensors='pt',
+                padding="max_length",
+                truncation=True,
+                max_length=64
             )
             input_ids = inputs['input_ids'].to(device)
             mask = inputs['attention_mask'].to(device)
+            # 토큰화 결과 확인 (제대로 잘렸는지)
+            # print(f"[DEBUG] 토큰화 결과: {inputs['input_ids'][0][:10]}")
             with torch.no_grad():
                 outputs = aggro_model(input_ids, mask)
+                # 🚨 원본 로직 (Logits 값 확인)
+                print(f"[DEBUG] 모델 출력값(Logits): {outputs}")
+                # Temperature Scaling 적용 전/후 비교
+                probs = F.softmax(outputs / 2.0, dim=1)
                 bert_score = probs[0][1].item() * 100
+            print(f"[DEBUG] 2. BERT 원본 점수: {bert_score}") # 3. AI 점수 확인
+        except Exception as e:
+            print(f"[Aggro] KoBERT 예측 오류: {e}")
             bert_score = 50.0
+    # 3. Safety Net (점수 깎기)
     if rule_score < 5:
+        print("[DEBUG] Safety Net 발동! (규칙 점수 미달 -> AI 점수 70% 삭감)")
+        bert_score *= 0.3
     elif rule_score < 20:
+        print("[DEBUG] Safety Net 발동! (규칙 점수 낮음 -> AI 점수 20% 삭감)")
+        bert_score *= 0.8
+    print(f"[DEBUG] 3. 보정된 BERT 점수: {bert_score}") # 4. 깎인 점수 확인
+    # 4. 최종 합산
+    w_rule = 0.4
+    w_bert = 0.6
     final_score = (rule_score * w_rule) + (bert_score * w_bert)
+    print(f"[DEBUG] 4. 최종 합산 점수: {final_score}")
+    # # 1. 규칙 기반 점수
+    # rule_score = 0.0
+    # rule_pattern = "분석 불가"
+    # if rule_scorer:
+    #     try:
+    #         res = rule_scorer.get_score(title)
+    #         rule_score = res['score']
+    #         rule_pattern = res.get('pattern_name', '알 수 없음')
+    #     except Exception as e:
+    #         print(f"규칙 계산 에러: {e}")
+    #         rule_score = 50.0
+    # # 2. KoBERT 점수
+    # bert_score = 0.0
+    # if aggro_model and tokenizer:
+    #     try:
+    #         inputs = tokenizer(
+    #             title, return_tensors='pt', padding="max_length", truncation=True, max_length=64
+    #         )
+    #         input_ids = inputs['input_ids'].to(device)
+    #         mask = inputs['attention_mask'].to(device)
+    #         with torch.no_grad():
+    #             outputs = aggro_model(input_ids, mask)
+    #             probs = F.softmax(outputs / 2.0, dim=1)
+    #             bert_score = probs[0][1].item() * 100
+    #     except:
+    #         bert_score = 50.0
+    #  # Safety Net 적용 (규칙 점수가 낮으면 AI 점수도 깎음)
+    # if rule_score < 5:
+    #     bert_score *= 0.3 # 규칙 점수가 거의 없으면 AI 점수 70% 삭감
+    # elif rule_score < 20:
+    #     bert_score *= 0.8 # 규칙 점수가 낮으면 AI 점수 20% 삭감
+    # #3. 합산
+    # w_rule = 0.0
+    # w_bert = 1.0
+    # final_score = (rule_score * w_rule) + (bert_score * w_bert)
     # 4. 결과
     normalized_score = min(final_score / 100.0, 1.0)