File size: 5,202 Bytes
24510a0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
import os
import gradio as gr
from langchain_community.document_loaders import TextLoader
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain_community.embeddings import HuggingFaceEmbeddings
from langchain_community.vectorstores import Chroma
from langchain_community.llms import HuggingFacePipeline
from langchain.chains import ConversationalRetrievalChain
from langchain.memory import ConversationBufferMemory
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline

# -------------------------------------------------------------------
# Constants
DB_DIR = "chroma_db"
MODEL_NAME_EMBEDDINGS = "sentence-transformers/all-MiniLM-L6-v2"
MODEL_ID_LLM = "google/flan-t5-base"
DOC_PATH = "temp_docs/samsung_manual.txt"  # fixed document path

# Globals
conversation_chain = None
chat_history = []  # [{"role": "user/assistant", "content": "..."}]

# -------------------------------------------------------------------
def load_and_process_document():
    """Load the Samsung manual, split it, embed it, and create vectorstore."""
    if not os.path.exists(DOC_PATH):
        raise FileNotFoundError(f"❌ Document not found at: {DOC_PATH}")

    print("📄 Loading document...")
    # Force UTF-8 encoding to handle special characters
    loader = TextLoader(DOC_PATH, encoding="utf-8")
    docs = loader.load()

    print("✂️ Splitting document into chunks...")
    text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
    texts = text_splitter.split_documents(docs)

    print("🧠 Creating embeddings...")
    embeddings = HuggingFaceEmbeddings(model_name=MODEL_NAME_EMBEDDINGS)

    print("💾 Building Chroma vectorstore...")
    vectorstore = Chroma.from_documents(
        documents=texts,
        embedding=embeddings,
        persist_directory=DB_DIR
    )
    return vectorstore, len(texts)  # return number of chunks


def get_conversational_chain(vectorstore):
    """Create the conversational retrieval chain."""
    tokenizer = AutoTokenizer.from_pretrained(MODEL_ID_LLM)
    model = AutoModelForSeq2SeqLM.from_pretrained(MODEL_ID_LLM)
    pipe = pipeline(
        "text2text-generation",
        model=model,
        tokenizer=tokenizer,
        max_length=512,
        temperature=0.1,
        top_p=0.95,
        repetition_penalty=1.2
    )
    llm = HuggingFacePipeline(pipeline=pipe)

    memory = ConversationBufferMemory(
        memory_key="chat_history",
        return_messages=True
    )

    chain = ConversationalRetrievalChain.from_llm(
        llm=llm,
        retriever=vectorstore.as_retriever(search_kwargs={"k": 2}),
        memory=memory
    )
    return chain

def chatbot_response(user_input):
    """Generate chatbot response from conversation chain."""
    global conversation_chain, chat_history

    if conversation_chain is None:
        chat_history.append({
            "role": "assistant",
            "content": "⚠️ The chatbot is not ready. Please check the server logs."
        })
        return chat_history

    chat_history.append({"role": "user", "content": user_input})
    response = conversation_chain({"question": user_input})
    ai_answer = response["answer"]
    chat_history.append({"role": "assistant", "content": ai_answer})
    return chat_history

# -------------------------------------------------------------------
# Gradio Interface
with gr.Blocks() as demo:
    gr.Markdown("## 🤖 Chat with Samsung Manual")
    gr.Markdown("Ask questions about the **Samsung Manual** document below:")

    # Status info
    status_md = gr.Markdown("⏳ Initializing chatbot...")

    # Chat interface
    chatbot = gr.Chatbot(label="Conversation", type="messages")
    user_input = gr.Textbox(
        label="Type your question here…",
        placeholder="Ask me about the Samsung manual..."
    )
    submit_btn = gr.Button("Ask")

    # -------------------------------------------------------------------
    # Initialization function to show status
    def init_chatbot():
        global conversation_chain
        try:
            if not os.path.exists(DB_DIR) or not os.listdir(DB_DIR):
                # Rebuild vectorstore
                vectorstore, chunks = load_and_process_document()
                msg = f"✅ Manual processed and stored! Total chunks: {chunks}"
            else:
                embeddings = HuggingFaceEmbeddings(model_name=MODEL_NAME_EMBEDDINGS)
                vectorstore = Chroma(persist_directory=DB_DIR, embedding_function=embeddings)
                chunks = len(vectorstore._collection.get()["metadatas"])
                msg = f"✅ Chroma DB loaded! Total chunks: {chunks}"

            conversation_chain = get_conversational_chain(vectorstore)
            return msg
        except Exception as e:
            import traceback
            traceback.print_exc()
            return f"❌ Failed to initialize chatbot: {e}"

    # Initialize on startup
    status_md.value = init_chatbot()

    submit_btn.click(
        fn=chatbot_response,
        inputs=user_input,
        outputs=chatbot
    )

# -------------------------------------------------------------------
if __name__ == "__main__":
    demo.launch()