Spaces:

K00B404
/

diffusion_try

Runtime error

K00B404 committed on Sep 29, 2024

Commit

cd218c1

verified ·

1 Parent(s): 1ce4091

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,3 +1,39 @@
 import torch
 from diffusers import (
     DDIMScheduler,

+import gradio as gr
+from gradio_client import Client
+from langchain.llms import HuggingFaceTextGenInference
+from langchain.chains import LLMChain
+from langchain.prompts import PromptTemplate
+# Initialize the Qwen client
+qwen_client = Client("Qwen/Qwen2-0.5B")
+# Create a custom LLM class to use with LangChain
+class QwenLLM(HuggingFaceTextGenInference):  # LLM subclass whose _call sends the prompt through the module-level qwen_client
+    def _call(self, prompt, stop=None):  # NOTE: `stop` is accepted but never used in this body
+        result = qwen_client.predict(
+            query=prompt,
+            history=[],  # every call starts from an empty history
+            system="You are a helpful assistant.",  # fixed system message for every call
+            api_name="/model_chat"
+        )
+        return result[0][1]  # Extract the assistant's response; assumes result[0] is a (user, assistant) pair -- TODO confirm against the endpoint's return schema
+# Initialize the LLM. NOTE(review): QwenLLM._call, as shown, does not read any of these settings -- confirm they have an effect.
+llm = QwenLLM(
+    inference_server_url="https://your-inference-server-url",  # This is a placeholder
+    max_new_tokens=512,
+    top_k=10,
+    top_p=0.95,
+    typical_p=0.95,
+    temperature=0.1,
+    repetition_penalty=1.03
+)
+# Create the LCEL chain
+template = """You are a helpful AI assistant. Please respond to the following user input:
+User: {user_input}"""
 import torch
 from diffusers import (
     DDIMScheduler,