Create app.py

app.py CHANGED
@@ -39,7 +39,6 @@ llm = Llama(
     n_threads=CPU_THREADS,
     n_batch=512,
     use_mmap=True,
-    use_mlock=False,
     verbose=False
 )
 
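The dropped use_mlock=False was redundant: False is already llama-cpp-python's default, and the model file is still memory-mapped via use_mmap=True. For context, a minimal sketch of the loader this hunk edits; the model path, context size, and the CPU_THREADS constant are assumptions, since the diff only shows the tail of the constructor call:

import os
from llama_cpp import Llama

CPU_THREADS = os.cpu_count() or 4  # assumed; defined above the visible hunk

llm = Llama(
    model_path="deepseek-coder-1.3b-instruct.Q4_K_M.gguf",  # assumed filename
    n_ctx=4096,              # assumed context window
    n_threads=CPU_THREADS,
    n_batch=512,
    use_mmap=True,           # map the GGUF from disk instead of copying it into RAM
    verbose=False,
)

print("Model loaded successfully.")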
@@ -47,39 +46,36 @@ print("Model loaded successfully.")
 
 
 # ============================
-# Prompt
+# Prompt Builder
 # ============================
 
 SYSTEM_PROMPT = """You are DeepSeek Coder, an expert programming assistant.
-
-Only explain
+Write clean and efficient code.
+Only explain when asked.
 """
 
 
-def build_prompt(
+def build_prompt(message, history):
 
     prompt = SYSTEM_PROMPT + "\n\n"
 
-    for msg in history:
-        if msg["role"] == "user":
-            prompt += f"User: {msg['content']}\n"
-        elif msg["role"] == "assistant":
-            prompt += f"Assistant: {msg['content']}\n"
+    for user_msg, assistant_msg in history:
+        prompt += f"User: {user_msg}\nAssistant: {assistant_msg}\n"
 
-    prompt += "
+    prompt += f"User: {message}\nAssistant:"
 
     return prompt
 
 
 # ============================
-#
+# Generate Response
 # ============================
 
-def generate_response(message, history):
+def chat(message, history):
 
-
+    history = history or []
 
-    prompt = build_prompt(
+    prompt = build_prompt(message, history)
 
     output = ""
 
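The rewritten build_prompt unpacks history as (user, assistant) pairs, matching the pair-based history that gr.ChatInterface passes once type="messages" is dropped in the last hunk. A quick usage sketch of the new function, with a made-up history entry:

SYSTEM_PROMPT = """You are DeepSeek Coder, an expert programming assistant.
Write clean and efficient code.
Only explain when asked.
"""

def build_prompt(message, history):
    prompt = SYSTEM_PROMPT + "\n\n"
    for user_msg, assistant_msg in history:
        prompt += f"User: {user_msg}\nAssistant: {assistant_msg}\n"
    prompt += f"User: {message}\nAssistant:"
    return prompt

# Hypothetical one-turn history, in the pair format:
history = [("Write hello world in C.", "#include <stdio.h> ...")]
print(build_prompt("Now in Rust.", history))
# Prints the system prompt, the earlier turn, then "User: Now in Rust.\nAssistant:"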
@@ -90,38 +86,18 @@ def generate_response(message, history):
         top_p=0.95,
         stream=True
     ):
-
-        output += text
+        output += token["choices"][0]["text"]
         yield output
 
 
 # ============================
-# Gradio
-# ============================
-
-def chat(message, history):
-
-    history = history or []
-
-    assistant_response = ""
-
-    for partial in generate_response(message, history):
-        assistant_response = partial
-        yield history + [
-            {"role": "user", "content": message},
-            {"role": "assistant", "content": assistant_response},
-        ]
-
-
-# ============================
-# Launch UI
+# Launch Gradio ChatInterface
 # ============================
 
 demo = gr.ChatInterface(
     fn=chat,
     title="DeepSeek Coder 1.3B",
-    description="Production GGUF model running on llama.cpp",
-    type="messages"
+    description="Production GGUF model running on llama.cpp"
 )
 
 demo.launch(
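The one-line change in the streaming loop fixes how tokens are read: with stream=True, llama-cpp-python yields completion-shaped dicts rather than plain strings, so the text must be taken from choices[0]["text"]. A sketch of the full loop inside the new chat generator; max_tokens and temperature are assumed values, as the diff only shows top_p and stream:

def chat(message, history):
    history = history or []
    prompt = build_prompt(message, history)
    output = ""
    for token in llm(
        prompt,
        max_tokens=512,      # assumed; not visible in the hunk
        temperature=0.2,     # assumed; not visible in the hunk
        top_p=0.95,
        stream=True,
    ):
        # Each streamed chunk looks like {"choices": [{"text": "..."}], ...}
        output += token["choices"][0]["text"]
        yield output         # Gradio renders the growing string incrementally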
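With type="messages" removed, gr.ChatInterface falls back to its older pair-based history format, which is what the new build_prompt expects; because chat is a generator, the UI streams partial answers as they arrive. The diff is cut off at demo.launch(, so a plain call with default arguments is assumed in this sketch:

import gradio as gr

demo = gr.ChatInterface(
    fn=chat,  # the streaming generator from the previous hunk
    title="DeepSeek Coder 1.3B",
    description="Production GGUF model running on llama.cpp",
)

demo.launch()  # assumed bare call; the original launch arguments are not shown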