Spaces:

Dongjin1203
/

RFP_summary_chatbot

Paused

File size: 12,733 Bytes

03c7f28

from langchain_openai import ChatOpenAI
from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
from langchain_core.output_parsers import StrOutputParser
from langchain_core.runnables import RunnablePassthrough, RunnableLambda
from langchain_core.messages import HumanMessage, AIMessage
from langsmith import traceable
import time
from typing import List, Dict

from src.utils.config import RAGConfig
from src.retriever.retriever import RAGRetriever


class RAGPipeline:
    """대화형 RAG 파이프라인 - LangChain Chain 기반"""

    def __init__(self, config: RAGConfig = None, model: str = None, top_k: int = None):
        """초기화"""
        self.config = config or RAGConfig()
        self.model = model or self.config.LLM_MODEL_NAME
        self.top_k = top_k or self.config.DEFAULT_TOP_K
        
        # 검색 설정
        self.search_mode = self.config.DEFAULT_SEARCH_MODE
        self.alpha = self.config.DEFAULT_ALPHA

        # LLM 초기화 (LangChain ChatOpenAI)
        self.llm = ChatOpenAI(
            model=self.model,
            openai_api_key=self.config.OPENAI_API_KEY,
            timeout=60.0,
            max_retries=3
        )

        # Retriever 초기화
        self.retriever = RAGRetriever(config=self.config)
        
        # 대화 히스토리
        self.chat_history: List[Dict] = []
        
        # 마지막 검색 결과 저장 (sources 반환용)
        self._last_retrieved_docs = []

        # 프롬프트 템플릿 (대화 히스토리 포함)
        self.prompt = ChatPromptTemplate.from_messages([
            ("system", """당신은 공공입찰 RFP를 분석하는 입찰메이트 사내 분석가입니다. 제공된 컨텍스트만으로 요구사항·예산·대상 기관·제출 방식 등을 구조화해 의사결정을 지원하세요.

            # 규칙
            - 답변은 한국어로 작성합니다.
            - 컨텍스트 밖 내용을 추측하지 않습니다.
            - 정보가 없으면 "문서에서 해당 정보를 찾을 수 없습니다."라고 밝힙니다.
            - 여러 문서를 비교할 때는 문서별 차이를 표 또는 목록으로 정리합니다.
            - 숫자에는 가능한 단위를 포함합니다.
            - 직전 대화 맥락을 반영합니다.

            # 답변 형식
            1. 한 줄 요약: 질문 핵심을 한두 문장으로 작성합니다.
            2. 상세 답변: [요구사항], [대상 기관], [예산], [제출 형식/방법], [평가 기준] 등 문서에서 확인된 항목만 정리합니다.
            3. 근거 정보: 위 답변의 근거가 된 문장이나 문단을 요약합니다.
            4. 부족한 정보: 문서에서 찾을 수 없는 항목은 "문서에서 확인 불가"로 표기합니다."""),
                        
                        # 대화 히스토리
                        MessagesPlaceholder(variable_name="chat_history"),
                        
                        # 현재 질문과 컨텍스트
                        ("user", """# 컨텍스트
            {context}

            # 질문
            {question}

            위 규칙에 따라 답변하세요.""")
        ])

        # Chain 구성
        self.chain = (
            {
                "context": RunnableLambda(self._retrieve_and_format),
                "question": RunnablePassthrough(),
                "chat_history": RunnableLambda(lambda x: self._get_chat_history())
            }
            | self.prompt
            | self.llm
            | StrOutputParser()
        )

        print(f"✅ RAG 파이프라인 초기화 완료")
        print(f"   - 모델: {self.model}")
        print(f"   - 기본 top_k: {self.top_k}")
        print(f"   - 검색 모드: {self.search_mode}")

    def _get_chat_history(self) -> List:
        """대화 히스토리를 LangChain 메시지 형식으로 변환"""
        messages = []
        for msg in self.chat_history:
            if msg["role"] == "user":
                messages.append(HumanMessage(content=msg["content"]))
            else:
                messages.append(AIMessage(content=msg["content"]))
        return messages

    def _retrieve_and_format(self, query: str) -> str:
        """검색 수행 및 컨텍스트 포맷팅"""
        # 검색 모드에 따라 문서 검색
        if self.search_mode == "embedding":
            docs = self.retriever.search(query, top_k=self.top_k)
        elif self.search_mode == "hybrid":
            docs = self.retriever.hybrid_search(query, top_k=self.top_k, alpha=self.alpha)
        elif self.search_mode == "hybrid_rerank":
            docs = self.retriever.hybrid_search_with_rerank(
                query, top_k=self.top_k, alpha=self.alpha
            )
        else:
            docs = self.retriever.search(query, top_k=self.top_k)
        
        # 마지막 검색 결과 저장
        self._last_retrieved_docs = docs
        
        # 컨텍스트 포맷팅
        return self._format_context(docs)

    def _format_context(self, retrieved_docs: list) -> str:
        """검색된 문서를 컨텍스트로 변환"""
        if not retrieved_docs:
            return "관련 문서를 찾을 수 없습니다."
        
        context_parts = []
        for i, doc in enumerate(retrieved_docs, 1):
            context_parts.append(f"[문서 {i}]\n{doc['content']}\n")
        return "\n".join(context_parts)

    def _format_sources(self, retrieved_docs: list) -> list:
        """검색된 문서를 sources 형식으로 변환"""
        sources = []
        for doc in retrieved_docs:
            source_info = {
                'content': doc['content'],
                'metadata': doc['metadata'],
                'filename': doc.get('filename', 'N/A'),
                'organization': doc.get('organization', 'N/A')
            }
            
            # 검색 모드에 따라 점수 필드가 다름
            if 'rerank_score' in doc:
                source_info['score'] = doc['rerank_score']
                source_info['score_type'] = 'rerank'
            elif 'hybrid_score' in doc:
                source_info['score'] = doc['hybrid_score']
                source_info['score_type'] = 'hybrid'
            elif 'relevance_score' in doc:
                source_info['score'] = doc['relevance_score']
                source_info['score_type'] = 'embedding'
            else:
                source_info['score'] = 0
                source_info['score_type'] = 'unknown'
            
            sources.append(source_info)
        return sources

    @traceable(
        name="RAG_Generate_Answer",
        metadata={"component": "generator", "version": "2.0"}
    )
    def generate_answer(
        self, 
        query: str, 
        top_k: int = None,
        search_mode: str = None,
        alpha: float = None
    ) -> dict:
        """
        답변 생성 (Chain 기반)
        
        Args:
            query: 질문
            top_k: 검색할 문서 수
            search_mode: 검색 모드 ("embedding", "hybrid", "hybrid_rerank")
            alpha: 임베딩 가중치 (0~1)
        
        Returns:
            dict: answer, sources, search_mode, usage
        """
        try:
            start_time = time.time()
            
            # 파라미터 설정
            if top_k is not None:
                self.top_k = top_k
            if search_mode is not None:
                self.search_mode = search_mode
            if alpha is not None:
                self.alpha = alpha
            
            # Chain 실행
            answer = self.chain.invoke(query)
            
            elapsed_time = time.time() - start_time
            
            # 대화 히스토리에 추가
            self.chat_history.append({"role": "user", "content": query})
            self.chat_history.append({"role": "assistant", "content": answer})
            
            # 토큰 사용량 추정 (LangChain에서는 직접 접근 어려움)
            estimated_tokens = len(query.split()) + len(answer.split()) * 2
            
            return {
                'answer': answer,
                'sources': self._format_sources(self._last_retrieved_docs),
                'search_mode': self.search_mode,
                'elapsed_time': elapsed_time,
                'usage': {
                    'total_tokens': estimated_tokens,
                    'prompt_tokens': 0,
                    'completion_tokens': 0
                }
            }
        
        except Exception as e:
            print(f"❌ 답변 생성 실패: {e}")
            import traceback
            traceback.print_exc()
            raise RuntimeError(f"답변 생성 실패: {str(e)}") from e

    def chat(self, query: str) -> str:
        """
        간단한 대화 인터페이스
        
        Args:
            query: 질문
        
        Returns:
            str: 답변 텍스트만 반환
        """
        result = self.generate_answer(query)
        return result['answer']

    def clear_history(self):
        """대화 히스토리 초기화"""
        self.chat_history = []
        print("🗑️ 대화 히스토리가 초기화되었습니다.")

    def get_history(self) -> List[Dict]:
        """대화 히스토리 반환"""
        return self.chat_history.copy()

    def set_search_config(self, search_mode: str = None, top_k: int = None, alpha: float = None):
        """검색 설정 변경"""
        if search_mode is not None:
            self.search_mode = search_mode
        if top_k is not None:
            self.top_k = top_k
        if alpha is not None:
            self.alpha = alpha
        
        print(f"🔧 검색 설정 변경: mode={self.search_mode}, top_k={self.top_k}, alpha={self.alpha}")

    def print_result(self, result: dict, query: str = None):
        """결과 출력"""
        print("\n" + "="*60)
        if query:
            print(f"질문: {query}")
        print(f"검색 모드: {result.get('search_mode', 'N/A')}")
        if 'elapsed_time' in result:
            print(f"소요 시간: {result['elapsed_time']:.2f}초")
        print("="*60)
        print(f"\n💬 답변:\n{result['answer']}")
        print(f"\n📚 참고 문서 ({len(result['sources'])}개):")
        for i, source in enumerate(result['sources'], 1):
            score = source.get('score', 0)
            score_type = source.get('score_type', '')
            print(f"  [{i}] {source['filename']}")
            print(f"      점수: {score:.3f} ({score_type})")
        print("="*60)


# 대화형 실행
def interactive_mode():
    """대화형 모드 실행"""
    print("=" * 60)
    print("대화형 RAG 시스템 초기화 중...")
    print("=" * 60)
    
    config = RAGConfig()
    pipeline = RAGPipeline(config=config)
    
    print("\n" + "=" * 60)
    print("대화형 모드 시작")
    print("명령어: 'quit' (종료), 'clear' (히스토리 초기화), 'mode' (검색모드 변경)")
    print("=" * 60)
    
    while True:
        user_query = input("\n질문: ").strip()
        
        if not user_query:
            continue
        
        if user_query.lower() in ['quit', 'exit', '종료', 'q']:
            print("시스템을 종료합니다.")
            break
        
        if user_query.lower() == 'clear':
            pipeline.clear_history()
            continue
        
        if user_query.lower() == 'mode':
            print("\n검색 모드 선택:")
            print("1. embedding - 임베딩 검색")
            print("2. hybrid - BM25 + 임베딩")
            print("3. hybrid_rerank - Hybrid + Re-ranker (권장)")
            choice = input("선택 (1/2/3): ").strip()
            modes = {'1': 'embedding', '2': 'hybrid', '3': 'hybrid_rerank'}
            if choice in modes:
                pipeline.set_search_config(search_mode=modes[choice])
            continue
        
        try:
            result = pipeline.generate_answer(query=user_query)
            pipeline.print_result(result, user_query)
            
            # 소스 출력 여부
            show_source = input("\n참조 문서 상세 보기? (y/n): ").strip().lower()
            if show_source == 'y':
                for i, source in enumerate(result['sources'], 1):
                    print(f"\n{'='*40}")
                    print(f"[문서 {i}] {source['filename']}")
                    print(f"발주기관: {source['organization']}")
                    print(f"내용:\n{source['content'][:500]}...")
        
        except Exception as e:
            print(f"❌ 오류 발생: {e}")


# 사용 예시
if __name__ == "__main__":
    interactive_mode()