Xu ly SSO

This commit is contained in:
2026-05-09 10:31:28 +00:00
parent 9d04e7484c
commit f937d1a98e
21 changed files with 2515 additions and 271 deletions

View File

@@ -5,37 +5,46 @@ from .llm_factory import LLMFactory
logger = logging.getLogger("RAGEngine")
class RAGEngine:
def __init__(self):
    """Create the retriever and LLM provider that the engine works with.

    Instantiates ``SearchRetriever`` and asks ``LLMFactory.get_provider()``
    for the provider object, storing them on ``self.retriever`` and
    ``self.llm`` respectively.
    """
    self.retriever = SearchRetriever()
    self.llm = LLMFactory.get_provider()
    # Log the concrete provider class once so the selected backend is
    # visible in the logs.
    logger.info(f"RAG Engine ready with LLM Provider: {type(self.llm).__name__}")
def chat(self, user_query: str, history: List[Dict[str, str]] = None) -> Dict:
def chat(self, user_query: str, history: List[Dict[str, str]] = None, user_email: str = None, is_admin: bool = False) -> Dict:
"""
Quy trình RAG hoàn chỉnh: Search -> Augment -> Generate
Quy trình RAG: Search -> Augment -> Generate
Args:
user_query: Câu hỏi
history: Lịch sử chat
user_email: Email user để filter quyền
is_admin: True = bypass ACL
"""
# 1. RETRIEVAL: Tìm kiếm ngữ cảnh liên quan
relevant_chunks = self.retriever.retrieve(user_query, top_k=5)
logger.info(f"Search query: {user_query[:100]} (user={user_email or 'none'}, admin={is_admin})")
relevant_chunks = self.retriever.retrieve(user_query, top_k=5, user_email=user_email, is_admin=is_admin)
if not relevant_chunks:
context_text = "Không tìm thấy thông tin liên quan trong cơ sở dữ liệu nội bộ."
logger.info("Search result: 0 chunks found")
else:
# Gộp text từ các chunks lại thành 1 khối context
context_text = "\n---\n".join([
f"[Nguồn: {c.file_name}, Trang: {c.page_from}]\nNội dung: {c.text}"
for c in relevant_chunks
])
logger.info(f"Search result: {len(relevant_chunks)} chunks from {len(set(c.file_name for c in relevant_chunks))} files")
# 2. GENERATION: Gửi sang LLM để trả lời
logger.info("Đang yêu cầu LLM tổng hợp câu trả lời...")
# 2. GENERATION
logger.info("Requesting LLM to generate answer...")
answer = self.llm.generate_response(
prompt=user_query,
context=context_text,
history=history
)
logger.info(f"LLM response length: {len(answer)} chars")
# 3. Trả về kết quả kèm theo nguồn trích dẫn (Citations)
# 3. Return with citations
return {
"answer": answer,
"context_used": context_text,
@@ -43,7 +52,8 @@ class RAGEngine:
{
"file_name": c.file_name,
"page": c.page_from,
"url": c.source_url
"url": c.source_url,
"download_url": c.download_url
} for c in relevant_chunks
]
}