# Pixal1.0 / app.py
# peterpeter8585's picture
# Update app.py
# fb3ffb2 verified
# raw
# history blame
# 9.82 kB
# app_pixal_chat.py
import os, re, json, gradio as gr, requests
from typing import Optional, List, Dict, Any
from requests.adapters import HTTPAdapter, Retry
from langchain.llms.base import LLM
from langchain.memory import ConversationBufferMemory
from langchain.agents import initialize_agent, AgentType, load_tools
from langchain.tools import Tool
from langchain_experimental.tools.python.tool import PythonREPLTool
from langchain_community.retrievers import WikipediaRetriever
import datetime
# ──────────────────────────────
# ✅ GitHubModelLLM (kept as-is)
# ──────────────────────────────
from typing import Optional, List, Dict, Any
from langchain.llms.base import LLM
import requests, os, json
from requests.adapters import HTTPAdapter, Retry
# NOTE: an older copy of GitHubModelLLM used to be kept here inside a
# triple-quoted string. It was never executed, duplicated the class defined
# below, and embedded a literal access token, so it has been removed.
# Any token that was ever committed in this file must be treated as leaked
# and revoked.
class GitHubModelLLM(LLM):
    """LangChain ``LLM`` that forwards prompts to a chat-completions endpoint.

    Each call POSTs ``{"model": ..., "messages": [...]}`` to
    ``{endpoint}/chat/completions`` and returns the first choice's message
    content.
    """

    # Model identifier sent in the request body.
    model: str = "openai/gpt-4.1"
    # Base URL; "/chat/completions" is appended per request.
    endpoint: str = "https://models.github.ai/inference"
    # Read once when the class is defined; _post_chat re-checks the
    # environment at call time if this is empty.
    token: Optional[str] = os.environ.get("token")
    # Sent as the first ("system") message when non-empty.
    system_prompt: Optional[str] = (
        "너는 PIXAL(Primary Interactive X-ternal Assistant with multi Language)이야. "
        "너의 개발자는 정성윤 이라는 6학년 파이썬 프로그래머야."
    )
    # Per-request timeout in seconds, passed to requests.
    request_timeout: float = 30.0
    # Retry budget and backoff used for the HTTP adapter.
    max_retries: int = 2
    backoff_factor: float = 0.3

    @property
    def _llm_type(self) -> str:
        """Return the identifier LangChain uses for this LLM type."""
        return "github_models_api"

    def _post_chat(self, body: Dict[str, Any]) -> Dict[str, Any]:
        """POST ``body`` to the chat-completions endpoint and return the JSON.

        Args:
            body: Request payload (model, messages, optional stop list).

        Returns:
            The decoded JSON response.

        Raises:
            ValueError: If no token is configured on the instance or in the
                ``GITHUB_TOKEN`` / ``token`` environment variables.
            requests.HTTPError: If the final response has an error status.
        """
        token = self.token or os.getenv("GITHUB_TOKEN") or os.getenv("token")
        if not token:
            raise ValueError("❌ GitHub token이 설정되지 않았습니다.")

        retries = Retry(
            total=self.max_retries,
            backoff_factor=self.backoff_factor,
            status_forcelist=[429, 500, 502, 503, 504],
            # urllib3 only retries idempotent methods by default, so POST has
            # to be allowed explicitly for status_forcelist to take effect.
            allowed_methods=frozenset({"POST"}),
        )
        # The context manager closes the session's connection pool.
        with requests.Session() as session:
            session.mount("https://", HTTPAdapter(max_retries=retries))
            session.headers.update({
                "Content-Type": "application/json",
                # Use the token resolved above; never embed a credential
                # literal in source.
                "Authorization": f"Bearer {token}",
            })
            resp = session.post(
                f"{self.endpoint}/chat/completions",
                json=body,
                timeout=self.request_timeout,
            )
            resp.raise_for_status()
            return resp.json()

    def _call(self, prompt: str, stop: Optional[List[str]] = None, **kwargs) -> str:
        """Build the message list, call the API and return the reply text.

        Args:
            prompt: Text sent as the final "user" message.
            stop: Optional stop sequences, forwarded as ``body["stop"]``.
            **kwargs: If a ``memory`` object with a ``chat_memory.messages``
                list is supplied, its "human"/"ai" messages are replayed
                before the prompt.
                NOTE(review): nothing in this file passes ``memory`` here —
                confirm whether any caller does.

        Returns:
            The first choice's message content, or the JSON-encoded
            ``function_call`` (``"{}"`` when absent) if content is empty.
        """
        memory = kwargs.get("memory")
        messages: List[Dict[str, Any]] = []

        # 1) System prompt
        if self.system_prompt:
            messages.append({"role": "system", "content": self.system_prompt})

        # 2) Earlier turns held in memory; other message types are skipped.
        if memory and hasattr(memory, "chat_memory"):
            role_by_type = {"human": "user", "ai": "assistant"}
            for past in memory.chat_memory.messages:
                role = role_by_type.get(getattr(past, "type", None))
                if role:
                    messages.append({"role": role, "content": past.content})

        # 3) Current user input
        messages.append({"role": "user", "content": prompt})

        body: Dict[str, Any] = {"model": self.model, "messages": messages}
        if stop:
            body["stop"] = stop

        res = self._post_chat(body)
        # Tolerate a missing or empty "choices" list instead of raising
        # IndexError on [0].
        choices = res.get("choices") or [{}]
        msg = choices[0].get("message") or {}
        return msg.get("content") or json.dumps(msg.get("function_call") or {})
# ──────────────────────────────
# LangChain tools & agent setup
# ──────────────────────────────
llm = GitHubModelLLM()

# SECURITY NOTE(review): `allow_dangerous_tools=True` (arbitrary HTTP requests)
# and the Python REPL tool below let the model run code and make requests on
# this host. The app is launched on 0.0.0.0, so any visitor can steer them via
# prompts — confirm this exposure is intended or sandbox these tools.
tools = load_tools(
    ["ddg-search", "requests_all", "llm-math"],
    llm=llm,
    allow_dangerous_tools=True,
)
tools.append(
    Tool(
        name="python_repl",
        func=PythonREPLTool().run,
        description="Python 코드 실행 도구",
    )
)

retriever = WikipediaRetriever(lang="ko")
tools.append(
    Tool(
        name="wiki",
        func=retriever.get_relevant_documents,
        description="위키백과 검색",
    )
)

# Korea Standard Time is a fixed UTC+9 offset, so the standard-library
# timezone is enough. Without it, datetime.now() reports the server's local
# time while the tool output is labelled "(Asia/Seoul)".
_KST = datetime.timezone(datetime.timedelta(hours=9), "Asia/Seoul")


def _current_time_kst(_query=None):
    """Return the current Seoul time as text; the tool input is ignored."""
    now = datetime.datetime.now(_KST)
    return f"현재 시각: {now.strftime('%Y-%m-%d %H:%M:%S')} (Asia/Seoul)"


tools.append(
    Tool(
        name="time_now",
        func=_current_time_kst,
        description="현재 시간을 반환합니다.",
    )
)

# Conversation memory shared by the agent
memory = ConversationBufferMemory(memory_key="chat_history", return_messages=True)

# Agent wired to the memory above.
# `initialize_agent` selects the agent implementation through its `agent`
# parameter; the previous `agent_type=` keyword is not a parameter of that
# function, so the structured-chat agent was never actually requested.
agent = initialize_agent(
    tools,
    llm,
    agent=AgentType.STRUCTURED_CHAT_ZERO_SHOT_REACT_DESCRIPTION,
    memory=memory,
    verbose=True,
)
# ──────────────────────────────
# Chat handler (keeps conversation memory)
# ──────────────────────────────
def chat(message, history):
    """Run one chat turn through the agent and update the Gradio history.

    Args:
        message: Text the user typed.
        history: Current chatbot value, a list of (user, assistant) pairs;
            ``None`` is treated as an empty history.

    Returns:
        A ``(history, history, "")`` tuple: the updated history twice plus an
        empty string, matching the ``[chatbot, chatbot, msg]`` outputs this
        handler is wired to (the empty string clears the input box).

    Raises:
        Whatever ``agent.run`` raises (e.g. HTTP errors from the model call);
        these are left to propagate to the caller.
    """
    history = list(history or [])

    # Do not spend an agent/API call on an empty submission.
    if not message or not message.strip():
        return history, history, ""

    # The agent executor is built with `memory=memory`, so it records the
    # user input and its output itself after each run. Adding them to
    # `memory` again here would store every turn twice.
    raw = agent.run(message)
    text = str(raw)

    # The agent sometimes answers with a JSON action blob; if so, pull the
    # human-readable answer out of it. The pattern is greedy: it spans from
    # the first "{" to the last "}" in the reply.
    match = re.search(r"\{.*\}", text, re.DOTALL)
    if match:
        try:
            obj = json.loads(match.group(0))
        except ValueError:
            # Braces that are not JSON (e.g. code in the answer): keep text.
            obj = None
        if isinstance(obj, dict):
            answer = (
                obj.get("action_input")
                or obj.get("Final Answer")
                or obj.get("content")
            )
            if isinstance(answer, str):
                text = answer
            elif answer:
                # Structured payloads are rendered as JSON so the chat
                # history only ever contains strings.
                text = json.dumps(answer, ensure_ascii=False)

    history.append((message, text))
    return history, history, ""
# ──────────────────────────────
# Gradio UI (ChatGPT-style layout)
# ──────────────────────────────
def _reset_conversation():
    """Clear the agent's stored conversation and empty the chat window.

    Clearing only the widget would leave the earlier turns in the LangChain
    memory, so the agent would still "remember" a conversation the user
    had reset.
    """
    memory.clear()
    return []


# NOTE(review): `memory` is a single module-level object, so every browser
# session talking to this process shares (and resets) the same conversation.
with gr.Blocks(theme=gr.themes.Soft(), title="PIXAL Assistant") as demo:
    # Header bar
    gr.HTML(
        "\n"
        '<div style="background:#f1f5f9;padding:12px;border-bottom:1px solid #d1d5db;\n'
        'display:flex;align-items:center;justify-content:space-between;">\n'
        '<h2 style="margin:0;">🤖 PIXAL Assistant</h2>\n'
        '<span style="font-size:0.9em;color:#555;">LangChain + GitHub LLM</span>\n'
        "</div>\n"
    )

    chatbot = gr.Chatbot(
        label=None,
        height=720,
        bubble_full_width=False,
        render_markdown=True,
        avatar_images=("https://avatars.githubusercontent.com/u/9919?s=280&v=4", None),
    )

    with gr.Row():
        msg = gr.Textbox(placeholder="메시지를 입력하세요...", show_label=False, scale=8)
        send = gr.Button("전송", variant="primary", scale=1)
        clear = gr.Button("🧹 초기화", scale=1)

    # `chat` returns (history, history, ""), hence three outputs: the chatbot
    # twice and the textbox (which is cleared).
    msg.submit(chat, [msg, chatbot], [chatbot, chatbot, msg])
    send.click(chat, [msg, chatbot], [chatbot, chatbot, msg])
    clear.click(_reset_conversation, None, chatbot, queue=False)

    # Footer
    gr.Markdown(
        "\n"
        '<div style="text-align:center;color:#777;font-size:0.85em;margin-top:8px;">\n'
        "💡 대화 기록은 세션 동안 유지됩니다.\n"
        "Made with ❤️ by PIXAL\n"
        "</div>\n"
    )

if __name__ == "__main__":
    demo.launch(server_name="0.0.0.0", server_port=7860)