Update app.py
Browse files
app.py
CHANGED
|
@@ -1,5 +1,6 @@
|
|
| 1 |
import gradio as gr
|
| 2 |
from llama_cpp import Llama
|
|
|
|
| 3 |
import os
|
| 4 |
|
| 5 |
# Model configuration
|
|
@@ -10,35 +11,52 @@ MAX_TOKENS = 200
|
|
| 10 |
|
| 11 |
# Initialize model (loads once at startup)
|
| 12 |
def load_model():
|
|
|
|
| 13 |
os.makedirs(CACHE_DIR, exist_ok=True)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 14 |
return Llama(
|
| 15 |
-
model_path=
|
| 16 |
-
|
| 17 |
-
|
| 18 |
-
|
| 19 |
-
n_threads=4, # CPU threads
|
| 20 |
-
verbose=False # Disable debug logs
|
| 21 |
)
|
| 22 |
|
|
|
|
| 23 |
llm = load_model()
|
| 24 |
|
| 25 |
-
# Generation function
|
| 26 |
def generate_text(prompt, max_tokens=MAX_TOKENS, temp=0.7, top_p=0.95):
|
| 27 |
-
|
| 28 |
-
|
| 29 |
-
|
| 30 |
-
|
| 31 |
-
|
| 32 |
-
|
| 33 |
-
|
| 34 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 35 |
|
| 36 |
-
# UI
|
| 37 |
with gr.Blocks(theme="soft") as demo:
|
| 38 |
-
gr.Markdown("
|
|
|
|
|
|
|
|
|
|
| 39 |
|
| 40 |
with gr.Row():
|
| 41 |
with gr.Column():
|
|
|
|
| 42 |
prompt = gr.Textbox(
|
| 43 |
label="Input Prompt",
|
| 44 |
placeholder="Enter your prompt here...",
|
|
@@ -56,7 +74,7 @@ with gr.Blocks(theme="soft") as demo:
|
|
| 56 |
maximum=1.0,
|
| 57 |
value=0.7,
|
| 58 |
step=0.1,
|
| 59 |
-
label="Temperature"
|
| 60 |
)
|
| 61 |
top_p = gr.Slider(
|
| 62 |
minimum=0.1,
|
|
@@ -67,13 +85,16 @@ with gr.Blocks(theme="soft") as demo:
|
|
| 67 |
)
|
| 68 |
|
| 69 |
with gr.Column():
|
|
|
|
| 70 |
output = gr.Textbox(label="Generated Text", lines=10)
|
| 71 |
-
generate_btn = gr.Button("Generate", variant="primary")
|
| 72 |
|
|
|
|
| 73 |
generate_btn.click(
|
| 74 |
fn=generate_text,
|
| 75 |
inputs=[prompt, max_tokens, temp, top_p],
|
| 76 |
outputs=output
|
| 77 |
)
|
| 78 |
|
|
|
|
| 79 |
demo.launch()
|
|
|
|
| 1 |
import gradio as gr
|
| 2 |
from llama_cpp import Llama
|
| 3 |
+
from huggingface_hub import hf_hub_download
|
| 4 |
import os
|
| 5 |
|
| 6 |
# Model configuration
|
|
|
|
# Initialize model (loads once at startup)
def load_model():
    """Fetch the GGUF weights from the Hub and build a Llama instance.

    Reads the module-level MODEL_REPO / MODEL_FILE / CACHE_DIR settings.

    Returns:
        A ready-to-use ``llama_cpp.Llama`` object backed by the downloaded
        GGUF file.
    """
    # Ensure the local cache directory exists before downloading into it.
    os.makedirs(CACHE_DIR, exist_ok=True)

    # hf_hub_download returns the local file path; it only hits the network
    # when the file is not already present in the cache.
    weights_path = hf_hub_download(
        repo_id=MODEL_REPO,
        filename=MODEL_FILE,
        cache_dir=CACHE_DIR,
        force_download=False,  # Set to True to bypass cache
    )

    model = Llama(
        model_path=weights_path,  # Now a valid path string
        n_ctx=2048,               # Context window size
        n_threads=4,              # CPU threads for faster inference
        verbose=False,            # Disable debug logs
    )
    return model
# Load model at startup: a single module-level Llama instance is created
# once at import time and shared by every generation request.
llm = load_model()
# Generation function with parameters
def generate_text(prompt, max_tokens=MAX_TOKENS, temp=0.7, top_p=0.95):
    """Run the shared GGUF model on *prompt* and return the completion.

    Args:
        prompt: Text for the model to continue.
        max_tokens: Upper bound on the number of tokens to generate.
        temp: Sampling temperature (higher values are more random).
        top_p: Nucleus-sampling probability cutoff.

    Returns:
        The generated text, or an error-description string if generation
        fails (so the Gradio UI shows the problem instead of crashing).
    """
    try:
        result = llm(
            prompt=prompt,
            max_tokens=max_tokens,
            temperature=temp,
            top_p=top_p,
            echo=False,  # Don't repeat input in output
        )
        # llama-cpp-python returns an OpenAI-style completion dict.
        return result["choices"][0]["text"]
    except Exception as e:
        # Surface the failure as the textbox content rather than raising.
        return f"Error generating text: {str(e)}"
| 50 |
+
# UI Components
|
| 51 |
with gr.Blocks(theme="soft") as demo:
|
| 52 |
+
gr.Markdown("""
|
| 53 |
+
# 🧠 GPT2 Text Generator (GGUF Version)
|
| 54 |
+
Enter a prompt and adjust parameters to generate AI text using the quantized GPT2 model.
|
| 55 |
+
""")
|
| 56 |
|
| 57 |
with gr.Row():
|
| 58 |
with gr.Column():
|
| 59 |
+
# Input components
|
| 60 |
prompt = gr.Textbox(
|
| 61 |
label="Input Prompt",
|
| 62 |
placeholder="Enter your prompt here...",
|
|
|
|
| 74 |
maximum=1.0,
|
| 75 |
value=0.7,
|
| 76 |
step=0.1,
|
| 77 |
+
label="Creativity (Temperature)"
|
| 78 |
)
|
| 79 |
top_p = gr.Slider(
|
| 80 |
minimum=0.1,
|
|
|
|
| 85 |
)
|
| 86 |
|
| 87 |
with gr.Column():
|
| 88 |
+
# Output and button
|
| 89 |
output = gr.Textbox(label="Generated Text", lines=10)
|
| 90 |
+
generate_btn = gr.Button("🚀 Generate", variant="primary")
|
| 91 |
|
| 92 |
+
# Event handler
|
| 93 |
generate_btn.click(
|
| 94 |
fn=generate_text,
|
| 95 |
inputs=[prompt, max_tokens, temp, top_p],
|
| 96 |
outputs=output
|
| 97 |
)
|
| 98 |
|
| 99 |
+
# Launch app
|
| 100 |
demo.launch()
|