Spaces:

druvx13
/

Ztar

Sleeping

App Files Files Community

druvx13 committed on May 28, 2025

Commit

b0204a5

verified ·

1 Parent(s): 8181b3a

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -14

app.py CHANGED Viewed

@@ -9,12 +9,11 @@ MODEL_FILE = "gpt2-q4_k_m.gguf"
 CACHE_DIR = "./model_cache"
 MAX_TOKENS = 200
-# Initialize model (loads once at startup)
 def load_model():
     """Download and load GGUF model with proper path handling"""
     os.makedirs(CACHE_DIR, exist_ok=True)
-    # Download model if not cached
     model_path = hf_hub_download(
         repo_id=MODEL_REPO,
         filename=MODEL_FILE,
@@ -24,7 +23,7 @@ def load_model():
     return Llama(
         model_path=model_path,
-        n_ctx=2048,
         n_threads=4,
         verbose=False
     )
@@ -32,11 +31,14 @@ def load_model():
 # Load model at startup
 llm = load_model()
-# Generation function with anti-repetition
 def generate_text(prompt, max_tokens=MAX_TOKENS, temp=0.7, top_p=0.95):
-    """Generate text with repetition prevention and error handling"""
     if not prompt.strip():
-        return "Please enter a valid prompt."
     try:
         output = llm(
@@ -45,7 +47,6 @@ def generate_text(prompt, max_tokens=MAX_TOKENS, temp=0.7, top_p=0.95):
             temperature=temp,
             top_p=top_p,
             echo=False,
-            # Anti-repetition parameters
             repeat_penalty=1.2,
             no_repeat_ngram_size=3
         )
@@ -62,12 +63,10 @@ with gr.Blocks(theme="soft") as demo:
     with gr.Row():
         with gr.Column():
-            # Input components
             prompt = gr.Textbox(
                 label="Input Prompt",
-                placeholder="Enter your prompt here...",
-                lines=5,
-                min_length=10
             )
             max_tokens = gr.Slider(
                 minimum=50,
@@ -92,16 +91,13 @@ with gr.Blocks(theme="soft") as demo:
             )
         with gr.Column():
-            # Output and button
             output = gr.Textbox(label="Generated Text", lines=10)
             generate_btn = gr.Button("🚀 Generate", variant="primary")
-    # Event handler
     generate_btn.click(
         fn=generate_text,
         inputs=[prompt, max_tokens, temp, top_p],
         outputs=output
     )
-# Launch app
 demo.launch()

 CACHE_DIR = "./model_cache"
 MAX_TOKENS = 200
+# Initialize model
 def load_model():
     """Download and load GGUF model with proper path handling"""
     os.makedirs(CACHE_DIR, exist_ok=True)
     model_path = hf_hub_download(
         repo_id=MODEL_REPO,
         filename=MODEL_FILE,
     return Llama(
         model_path=model_path,
+        n_ctx=1024,       # Match model's training context length
         n_threads=4,
         verbose=False
     )
 # Load model at startup
 llm = load_model()
+# Generation function with validation
 def generate_text(prompt, max_tokens=MAX_TOKENS, temp=0.7, top_p=0.95):
+    """Generate text with repetition prevention and input validation"""
     if not prompt.strip():
+        return "⚠️ Please enter a valid prompt."
+    if len(prompt.split()) < 3:  # Minimum word count
+        return "⚠️ Please enter at least 3 words for better results."
     try:
         output = llm(
             temperature=temp,
             top_p=top_p,
             echo=False,
             repeat_penalty=1.2,
             no_repeat_ngram_size=3
         )
     with gr.Row():
         with gr.Column():
             prompt = gr.Textbox(
                 label="Input Prompt",
+                placeholder="Enter your prompt here... (at least 3 words)",
+                lines=5
             )
             max_tokens = gr.Slider(
                 minimum=50,
             )
         with gr.Column():
             output = gr.Textbox(label="Generated Text", lines=10)
             generate_btn = gr.Button("🚀 Generate", variant="primary")
     generate_btn.click(
         fn=generate_text,
         inputs=[prompt, max_tokens, temp, top_p],
         outputs=output
     )
 demo.launch()