Spaces:

davidtran999
/

hue-portal-backend-v2

Sleeping

Davidtran99 committed on 19 days ago

Commit

9bb60b8

1 Parent(s): 0c2f39a

Fix: Frontend không nhận được response - Thêm validation và error handling

- Fix logic ép intent: Không ép greeting thành search_legal
- Tối ưu LLM: Tăng threads từ 4→8, giảm context từ 8192→4096
- Rút gọn prompts: Giảm tokens để tăng tốc độ
- Thêm response validation: Đảm bảo luôn có message/clarification
- Cải thiện error handling: Đảm bảo response luôn hợp lệ

Files changed (3) hide show

backend/hue_portal/chatbot/chatbot.py +83 -23
backend/hue_portal/chatbot/llm_integration.py +12 -28
backend/hue_portal/chatbot/views.py +26 -0

backend/hue_portal/chatbot/chatbot.py CHANGED Viewed

@@ -111,12 +111,32 @@ class Chatbot(CoreChatbot):
             intent = route_decision.forced_intent
         # Nếu session đã có selected_document_code (user đã chọn văn bản ở wizard)
-        # thì luôn ép intent về search_legal và route sang SEARCH,
-        # tránh bị kẹt ở nhánh small-talk/off-topic do nội dung câu hỏi ban đầu.
-        if selected_doc_code:
-            intent = "search_legal"
-            route_decision.route = IntentRoute.SEARCH
-            route_decision.forced_intent = "search_legal"
         # Map tất cả intent tra cứu nội dung về search_legal
         domain_search_intents = {
@@ -217,19 +237,31 @@ class Chatbot(CoreChatbot):
         if intent == "search_legal" and not selected_doc_code and not has_doc_code_in_query:
             print("[WIZARD] ✅ Stage 1: Using direct semantic search from slow_path_handler")
             # Delegate to slow_path_handler which uses direct semantic search (no query rewrite)
-            slow_handler = SlowPathHandler()
-            response = slow_handler.handle(
-                query=query,
-                intent=intent,
-                session_id=session_id,
-                selected_document_code=None,  # No document selected yet
-            )
-            # Ensure response has wizard metadata
-            if response:
                 response.setdefault("wizard_stage", "choose_document")
                 response.setdefault("routing", "legal_wizard")
                 response.setdefault("type", "options")
                 # Update session metadata
                 if session_id:
@@ -248,20 +280,48 @@ class Chatbot(CoreChatbot):
                 if session_id:
                     try:
                         bot_message = response.get("message") or response.get("clarification", {}).get("message", "")
-                        ConversationContext.add_message(
-                            session_id=session_id,
-                            role="bot",
-                            content=bot_message,
-                            intent=intent,
-                        )
                     except Exception as e:
                         print(f"⚠️ Failed to save wizard bot message: {e}")
-            return response if response else {
-                "message": "Xin lỗi, có lỗi xảy ra khi tìm kiếm văn bản.",
                 "intent": intent,
                 "results": [],
                 "count": 0,
             }
         # Stage 2: Choose topic/section (if document selected but no topic yet)

             intent = route_decision.forced_intent
         # Nếu session đã có selected_document_code (user đã chọn văn bản ở wizard)
+        # thì ép intent về search_legal CHỈ KHI query không phải greeting/small_talk
+        # Tránh ép greeting thành search_legal (gây chậm và sai logic)
+        if selected_doc_code and route_decision.route != IntentRoute.GREETING:
+            # Chỉ ép intent nếu không phải greeting đơn giản
+            query_lower = query.lower().strip()
+            is_simple_greeting = (
+                len(query_lower.split()) <= 3 and
+                any(greeting in query_lower for greeting in ["xin chào", "xin chao", "chào", "chao", "hello", "hi", "hey"]) and
+                not any(kw in query_lower for kw in ["phạt", "mức phạt", "vi phạm", "thủ tục", "hồ sơ", "địa chỉ", "công an", "cảnh báo", "kỷ luật", "đảng"])
+            )
+            if not is_simple_greeting:
+                intent = "search_legal"
+                route_decision.route = IntentRoute.SEARCH
+                route_decision.forced_intent = "search_legal"
+            else:
+                # Reset selected_doc_code nếu user gửi greeting mới
+                if session_id:
+                    try:
+                        ConversationContext.update_session_metadata(
+                            session_id,
+                            {"selected_document_code": None, "selected_topic": None, "wizard_stage": None}
+                        )
+                        selected_doc_code = None
+                        logger.info("[WIZARD] Reset selected_doc_code for new greeting")
+                    except Exception:
+                        pass
         # Map tất cả intent tra cứu nội dung về search_legal
         domain_search_intents = {
         if intent == "search_legal" and not selected_doc_code and not has_doc_code_in_query:
             print("[WIZARD] ✅ Stage 1: Using direct semantic search from slow_path_handler")
             # Delegate to slow_path_handler which uses direct semantic search (no query rewrite)
+            try:
+                slow_handler = SlowPathHandler()
+                response = slow_handler.handle(
+                    query=query,
+                    intent=intent,
+                    session_id=session_id,
+                    selected_document_code=None,  # No document selected yet
+                )
+            except Exception as e:
+                logger.error("[WIZARD] Error in slow_path_handler: %s", e, exc_info=True)
+                print(f"⚠️ [WIZARD] Error in slow_path_handler: {e}")
+                response = None
+            # Ensure response has wizard metadata and required fields
+            if response and isinstance(response, dict):
+                # Ensure message field exists
+                if not response.get("message") and not response.get("clarification"):
+                    response["message"] = "Tôi đã tìm thấy các văn bản pháp luật liên quan. Bạn hãy chọn văn bản muốn tra cứu:"
                 response.setdefault("wizard_stage", "choose_document")
                 response.setdefault("routing", "legal_wizard")
                 response.setdefault("type", "options")
+                response.setdefault("intent", intent)
+                response.setdefault("results", [])
+                response.setdefault("count", 0)
                 # Update session metadata
                 if session_id:
                 if session_id:
                     try:
                         bot_message = response.get("message") or response.get("clarification", {}).get("message", "")
+                        if bot_message:
+                            ConversationContext.add_message(
+                                session_id=session_id,
+                                role="bot",
+                                content=bot_message,
+                                intent=intent,
+                            )
                     except Exception as e:
                         print(f"⚠️ Failed to save wizard bot message: {e}")
+                return response
+            # Fallback response if slow_handler failed or returned invalid response
+            logger.warning("[WIZARD] slow_path_handler returned invalid response, using fallback")
+            return {
+                "message": "Tôi đã tìm thấy các văn bản pháp luật liên quan. Bạn hãy chọn văn bản muốn tra cứu:",
                 "intent": intent,
                 "results": [],
                 "count": 0,
+                "type": "options",
+                "wizard_stage": "choose_document",
+                "routing": "legal_wizard",
+                "clarification": {
+                    "message": "Tôi đã tìm thấy các văn bản pháp luật liên quan. Bạn hãy chọn văn bản muốn tra cứu:",
+                    "options": [
+                        {
+                            "code": "264-QD-TW",
+                            "title": "Quyết định 264-QĐ/TW về kỷ luật đảng viên",
+                            "reason": "Quy định chung về xử lý kỷ luật đối với đảng viên vi phạm.",
+                        },
+                        {
+                            "code": "QD-69-TW",
+                            "title": "Quy định 69-QĐ/TW về kỷ luật tổ chức đảng, đảng viên",
+                            "reason": "Quy định chi tiết về các hành vi vi phạm và hình thức kỷ luật.",
+                        },
+                        {
+                            "code": "TT-02-CAND",
+                            "title": "Thông tư 02/2021/TT-BCA về điều lệnh CAND",
+                            "reason": "Quy định về điều lệnh, lễ tiết, tác phong trong CAND.",
+                        },
+                    ],
+                },
             }
         # Stage 2: Choose topic/section (if document selected but no topic yet)

backend/hue_portal/chatbot/llm_integration.py CHANGED Viewed

@@ -465,9 +465,10 @@ class LLMGenerator:
             return
         # CPU-friendly defaults: smaller context/batch to reduce latency/RAM
-        n_ctx = int(os.environ.get("LLAMA_CPP_CONTEXT", "8192"))
-        n_threads = int(os.environ.get("LLAMA_CPP_THREADS", "4"))
-        n_batch = int(os.environ.get("LLAMA_CPP_BATCH", "1024"))
         n_gpu_layers = int(os.environ.get("LLAMA_CPP_GPU_LAYERS", "0"))
         use_mmap = os.environ.get("LLAMA_CPP_USE_MMAP", "true").lower() == "true"
         use_mlock = os.environ.get("LLAMA_CPP_USE_MLOCK", "true").lower() == "true"
@@ -859,24 +860,11 @@ class LLMGenerator:
                 f"Lịch sử hội thoại gần đây:\n{context_summary}\n\n"
             )
         prompt += (
-            "Đây là các điều khoản/chủ đề trong văn bản có thể liên quan:\n"
-            f"{os.linesep.join(candidate_lines)}\n\n"
-            f"Hãy chọn tối đa {max_options} chủ đề/điều khoản quan trọng nhất cần người dùng xác nhận.\n"
-            "Yêu cầu trả về JSON với dạng:\n"
-            "{\n"
-            '  "message": "Câu nhắc người dùng bằng tiếng Việt",\n'
-            '  "options": [\n'
-            '    {"title": "Tên chủ đề/điều khoản", "article": "Điều X", "reason": "Lý do gợi ý", "keywords": ["từ", "khóa", "tìm", "kiếm"]},\n'
-            "    ...\n"
-            "  ],\n"
-            '  "search_keywords": ["từ", "khóa", "chính", "để", "tìm", "kiếm"]\n'
-            "}\n"
-            "Trong đó:\n"
-            "- options: Danh sách chủ đề/điều khoản để người dùng chọn\n"
-            "- search_keywords: Danh sách từ khóa quan trọng để tìm kiếm thông tin liên quan\n"
-            "- Mỗi option nên có keywords riêng để tìm kiếm chính xác hơn\n"
-            "Chỉ in JSON, không thêm lời giải thích khác."
         )
         raw = self._generate_from_prompt(prompt)
@@ -1053,15 +1041,11 @@ class LLMGenerator:
             ]
             context_text += " " + " ".join(recent_user_messages)
         prompt = (
-            "Bạn là trợ lý pháp luật. Tôi cần bạn trích xuất các từ khóa quan trọng để tìm kiếm thông tin.\n\n"
-            f"Ngữ cảnh: {context_text[:500]}\n\n"
-            "Hãy trích xuất 5-10 từ khóa quan trọng nhất (tiếng Việt) để tìm kiếm.\n"
-            "Yêu cầu trả về JSON với dạng:\n"
-            "{\n"
-            '  "keywords": ["từ", "khóa", "quan", "trọng"]\n'
-            "}\n"
-            "Chỉ in JSON, không thêm lời giải thích khác."
         )
         raw = self._generate_from_prompt(prompt)

             return
         # CPU-friendly defaults: smaller context/batch to reduce latency/RAM
+        # Tăng threads để tăng tốc độ trên CPU (HF Spaces có nhiều cores)
+        n_ctx = int(os.environ.get("LLAMA_CPP_CONTEXT", "4096"))  # Giảm context để nhanh hơn
+        n_threads = int(os.environ.get("LLAMA_CPP_THREADS", "8"))  # Tăng từ 4 lên 8 threads
+        n_batch = int(os.environ.get("LLAMA_CPP_BATCH", "512"))  # Giảm batch để giảm RAM
         n_gpu_layers = int(os.environ.get("LLAMA_CPP_GPU_LAYERS", "0"))
         use_mmap = os.environ.get("LLAMA_CPP_USE_MMAP", "true").lower() == "true"
         use_mlock = os.environ.get("LLAMA_CPP_USE_MLOCK", "true").lower() == "true"
                 f"Lịch sử hội thoại gần đây:\n{context_summary}\n\n"
             )
+        # Tối ưu prompt: rút gọn để giảm tokens và tăng tốc độ
         prompt += (
+            f"Các điều khoản liên quan:\n{os.linesep.join(candidate_lines[:5])}\n\n"
+            f"Chọn {max_options} chủ đề quan trọng nhất. JSON:\n"
+            "{\"message\": \"Câu nhắc\", \"options\": [{\"title\": \"...\", \"article\": \"...\", \"reason\": \"...\", \"keywords\": [...]}], \"search_keywords\": [...]}"
         )
         raw = self._generate_from_prompt(prompt)
             ]
             context_text += " " + " ".join(recent_user_messages)
+        # Tối ưu prompt: ngắn gọn hơn để giảm tokens và tăng tốc độ
         prompt = (
+            "Trích xuất 5-8 từ khóa quan trọng từ:\n"
+            f"{context_text[:300]}\n\n"
+            "JSON: {\"keywords\": [\"từ\", \"khóa\"]}"
         )
         raw = self._generate_from_prompt(prompt)

backend/hue_portal/chatbot/views.py CHANGED Viewed

@@ -228,10 +228,36 @@ def chat(request: Request) -> Response:
         chatbot = get_chatbot()
         response = chatbot.generate_response(message, session_id=session_id)
         # Ensure session_id is in response
         if "session_id" not in response:
             response["session_id"] = session_id
         # Enhanced logging for search_legal queries
         intent = response.get("intent", "unknown")
         if intent == "search_legal":

         chatbot = get_chatbot()
         response = chatbot.generate_response(message, session_id=session_id)
+        # Validate response - ensure it's a dict with required fields
+        if not response or not isinstance(response, dict):
+            logger.error("[CHAT] ❌ Invalid response from chatbot.generate_response: %s", type(response))
+            response = {
+                "message": "Xin lỗi, có lỗi xảy ra khi xử lý câu hỏi của bạn. Vui lòng thử lại.",
+                "intent": "error",
+                "results": [],
+                "count": 0,
+                "session_id": session_id,
+            }
+        # Ensure required fields exist
+        if "message" not in response and "clarification" not in response:
+            logger.warning("[CHAT] ⚠️ Response missing 'message' field, adding default")
+            response["message"] = "Xin lỗi, không thể tìm thấy thông tin."
         # Ensure session_id is in response
         if "session_id" not in response:
             response["session_id"] = session_id
+        # Ensure intent exists
+        if "intent" not in response:
+            response["intent"] = "unknown"
+        # Ensure results and count exist
+        if "results" not in response:
+            response["results"] = []
+        if "count" not in response:
+            response["count"] = len(response.get("results", []))
         # Enhanced logging for search_legal queries
         intent = response.get("intent", "unknown")
         if intent == "search_legal":

Fix: Frontend không nhận được response - Thêm validation và error handling

Fix: Frontend không nhận được response - Thêm validation và error handling