jasvir-singh1021 committed on
Commit
7a6b61d
·
verified ·
1 Parent(s): bff4c38

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -3
app.py CHANGED
@@ -2,10 +2,13 @@ import gradio as gr
2
  from ctransformers import AutoModelForCausalLM
3
  import time
4
 
5
- # Load the quantized GGUF model (optimized for CPU)
 
 
 
6
  llm = AutoModelForCausalLM.from_pretrained(
7
- "TheBloke/WizardCoder-Python-13B-GGUF", # You can change to CodeLlama, Phind, etc.
8
- model_file="wizardcoder-python-13b.Q4_K_M.gguf", # Use Q4_K_M for 16GB RAM
9
  model_type="llama",
10
  config={
11
  "max_new_tokens": 512,
 
2
  from ctransformers import AutoModelForCausalLM
3
  import time
4
 
5
+ # Note: If this is a private or gated repo, you need to authenticate with your HF token.
6
+ # You can do this by setting the environment variable HF_TOKEN or passing token=... to from_pretrained. (HF_HOME only sets the cache directory, not authentication.)
7
+ # For public repos, no extra auth needed.
8
+
9
  llm = AutoModelForCausalLM.from_pretrained(
10
+ "TheBloke/WizardCoder-Python-7B-V1.0-GGUF", # Updated model name
11
+ model_file="wizardcoder-python-7b-v1.0.Q4_K_M.gguf", # Adjust the filename accordingly
12
  model_type="llama",
13
  config={
14
  "max_new_tokens": 512,