# Chat agent using LlamaIndex SimpleChatEngine + Gradio
from llama_index.core.chat_engine import SimpleChatEngine
from llama_index.core.memory import ChatMemoryBuffer
from llama_index.llms.huggingface_api import HuggingFaceInferenceAPI
import gradio as gr
import os
from dotenv import load_dotenv
# Load variables from a .env file (if one is present) before reading the token.
load_dotenv()
hf_token = os.environ.get("HF_TOKEN")  # None when HF_TOKEN is not set

# LLM client for the Hugging Face Inference API.
llm = HuggingFaceInferenceAPI(
    model_name="Qwen/Qwen2.5-Coder-32B-Instruct",
    temperature=0.7,
    max_tokens=1024,
    token=hf_token,
    provider="auto",
)

# Conversation memory created with a 3000-token limit, attached to the single
# module-level chat engine that `respond` calls.
memory = ChatMemoryBuffer.from_defaults(token_limit=3000)
chat_engine = SimpleChatEngine.from_defaults(llm=llm, memory=memory)
def respond(message, history) -> str:
    """Return the chat engine's reply to ``message`` as plain text.

    Args:
        message: The latest user message; forwarded unchanged to
            ``chat_engine.chat``.
        history: Prior conversation supplied by the caller. It is not read
            here.
            NOTE(review): context comes from the module-level ``chat_engine``
            memory instead, which presumably is shared by every browser
            session -- confirm this is intended.

    Returns:
        ``str()`` of the object returned by ``chat_engine.chat``.
    """
    return str(chat_engine.chat(message))
# Wrap `respond` in a Gradio chat interface and start serving it.
demo = gr.ChatInterface(respond)
demo.launch()