File size: 788 Bytes
b5c43cc
 
 
9411030
b5c43cc
85ba3c4
 
 
 
 
 
 
c4fa4f1
 
85ba3c4
b5c43cc
c4fa4f1
b5c43cc
85ba3c4
 
b5c43cc
 
85ba3c4
b5c43cc
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
# Chat agent using LlamaIndex SimpleChatEngine + Gradio
from llama_index.core.chat_engine import SimpleChatEngine
from llama_index.core.memory import ChatMemoryBuffer
from llama_index.llms.huggingface_api import HuggingFaceInferenceAPI
import gradio as gr
import os
from dotenv import load_dotenv

# Load variables from a local .env file (when one exists) before reading them.
load_dotenv()

# Hugging Face access token; None when HF_TOKEN is not defined.
hf_token = os.environ.get("HF_TOKEN")

# Hosted-inference LLM client used for every chat turn.
llm = HuggingFaceInferenceAPI(
    token=hf_token,
    provider="auto",
    model_name="Qwen/Qwen2.5-Coder-32B-Instruct",
    max_tokens=1024,
    temperature=0.7,
)

# Conversation buffer configured with a 3000-token limit, and the chat engine
# that ties the buffer to the LLM above.
memory = ChatMemoryBuffer.from_defaults(token_limit=3000)
chat_engine = SimpleChatEngine.from_defaults(memory=memory, llm=llm)


def _history_to_chat_messages(history):
    """Convert a Gradio chat history into a list of LlamaIndex ChatMessage objects.

    Two history layouts are recognised:

    * a list of ``{"role": ..., "content": ...}`` dicts, and
    * a list of ``[user_text, assistant_text]`` pairs.

    Only "user" and "assistant" turns with non-empty text are kept. Entries in
    any other shape (for example file uploads) are skipped rather than raising.

    Args:
        history: The history object Gradio passes to the chat callback, or
            None.

    Returns:
        A list of ChatMessage objects in conversation order (possibly empty).
    """
    # Function-scope import keeps this block self-contained; the package is
    # already a dependency of this file.
    from llama_index.core.llms import ChatMessage

    def _as_text(content):
        # Plain string content is used as-is.
        if isinstance(content, str):
            return content
        # NOTE(review): some Gradio versions appear to deliver content as a
        # list of typed blocks such as {"type": "text", "text": ...}; only the
        # text parts are collected here. Confirm against the installed version.
        if isinstance(content, (list, tuple)):
            parts = [
                part["text"]
                for part in content
                if isinstance(part, dict) and isinstance(part.get("text"), str)
            ]
            return "\n".join(parts) if parts else None
        return None

    messages = []
    for entry in history or []:
        if isinstance(entry, dict):
            turns = [(entry.get("role"), entry.get("content"))]
        elif isinstance(entry, (list, tuple)) and len(entry) == 2:
            turns = [("user", entry[0]), ("assistant", entry[1])]
        else:
            continue
        for role, content in turns:
            text = _as_text(content)
            if role in ("user", "assistant") and text:
                messages.append(ChatMessage(role=role, content=text))
    return messages


def respond(message, history):
    """Answer one chat turn using the conversation shown in the caller's UI.

    The module-level ``chat_engine`` owns a single memory buffer. Without
    passing the history explicitly, every browser session would read and write
    that same buffer, and clearing the chat in the UI would not clear what the
    engine remembers. Supplying ``chat_history`` makes the engine start each
    turn from the history Gradio hands in for this particular conversation.

    Args:
        message: The user's new message text.
        history: Previous turns of this conversation as provided by Gradio.

    Returns:
        The assistant's reply as a string.
    """
    past_messages = _history_to_chat_messages(history)

    if history and not past_messages:
        # History exists but none of it could be interpreted: fall back to the
        # engine's own memory instead of silently dropping all context.
        response = chat_engine.chat(message)
    else:
        # An empty list is passed on purpose for a fresh or cleared chat so the
        # engine does not carry over turns from another conversation.
        # NOTE(review): the engine is still one shared object, so this relies
        # on calls not overlapping -- confirm the app's concurrency settings.
        response = chat_engine.chat(message, chat_history=past_messages)

    return str(response)


# Build the Gradio chat UI around `respond`, then start serving it.
demo = gr.ChatInterface(fn=respond)
demo.launch()