Spaces:

sarekuwa
/

livecoder

Sleeping

App Files Files Community

Vladislav Krasnov committed on Jan 6

Commit

3c7b473

1 Parent(s): 57e83fb

Update space 7

Browse files

Files changed (1) hide show

app.py +18 -18

app.py CHANGED Viewed

@@ -2,6 +2,13 @@ import gradio as gr
 from transformers import AutoModelForCausalLM, AutoTokenizer
 import torch
 # Load model and tokenizer
 model_name = "microsoft/phi-2"
 tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
@@ -15,16 +22,17 @@ model = AutoModelForCausalLM.from_pretrained(
 )
 def generate_response(message):
-    """API function - takes text, returns response"""
     prompt = f"### Instruction: {message}\n### Response:"
     inputs = tokenizer(prompt, return_tensors="pt", truncation=True, max_length=512)
-    attention_mask = inputs.get('attention_mask', None)
     with torch.no_grad():
         outputs = model.generate(
             inputs.input_ids,
-            attention_mask=attention_mask,
             max_new_tokens=256,
             temperature=0.7,
             do_sample=True,
@@ -36,23 +44,15 @@ def generate_response(message):
     response = tokenizer.decode(outputs[0][inputs.input_ids.shape[1]:], skip_special_tokens=True)
     return response.strip()
-# Create Gradio Interface
 interface = gr.Interface(
     fn=generate_response,
-    inputs=gr.Textbox(
-        label="Programming question",
-        placeholder="Example: Write a binary search function in C++...",
-        lines=3
-    ),
-    outputs=gr.Textbox(label="Model response", lines=10),
-    title="LiveCoder LLM API",
-    description="Phi-2 model for programming assistance",
-    examples=[
-        ["Write a hello world program in C++"],
-        ["Explain the OOP principle"],
-        ["How does a pointer work in C++?"]
-    ]
 )
-# Launch the application
 interface.launch(server_name="0.0.0.0", server_port=7860, share=False)

 from transformers import AutoModelForCausalLM, AutoTokenizer
 import torch
+# Hardcode your space details here
+USERNAME = "sarekuwa"  # Replace with your actual username
+SPACE_NAME = "livecoder"    # Replace with your actual space name
+API_ENDPOINT = f"https://{USERNAME}-{SPACE_NAME}.hf.space/api/predict"
+print(f"API Endpoint: {API_ENDPOINT}")
 # Load model and tokenizer
 model_name = "microsoft/phi-2"
 tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
 )
 def generate_response(message):
+    """Process user input and generate response"""
+    if not message.strip():
+        return "Please enter a question."
     prompt = f"### Instruction: {message}\n### Response:"
     inputs = tokenizer(prompt, return_tensors="pt", truncation=True, max_length=512)
     with torch.no_grad():
         outputs = model.generate(
             inputs.input_ids,
             max_new_tokens=256,
             temperature=0.7,
             do_sample=True,
     response = tokenizer.decode(outputs[0][inputs.input_ids.shape[1]:], skip_special_tokens=True)
     return response.strip()
+# Create interface
 interface = gr.Interface(
     fn=generate_response,
+    inputs=gr.Textbox(label="Input", placeholder="Enter programming question...", lines=3),
+    outputs=gr.Textbox(label="Output", lines=10),
+    title="LiveCoder API",
+    description="LLM programming assistant",
+    allow_flagging="never"
 )
+# Launch application
 interface.launch(server_name="0.0.0.0", server_port=7860, share=False)