Spaces:

Sid26Roy
/

text2sql

Runtime error

App Files Files Community

Sid26Roy commited on Jun 25, 2025

Commit

c35bbf4

verified ·

1 Parent(s): a56d439

Update app.py

Browse files

Files changed (1) hide show

app.py +137 -61

app.py CHANGED Viewed

@@ -1,57 +1,93 @@
 import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM
 import sqlparse
-import gradio as gr
 model_name = "defog/llama-3-sqlcoder-8b"
-tokenizer = AutoTokenizer.from_pretrained(model_name)
-# Load model on CPU
-model = AutoModelForCausalLM.from_pretrained(
-    model_name,
-    trust_remote_code=True,
-    device_map={"": "cpu"},
-    torch_dtype=torch.float32
-)
-# SQL Prompt Template
-prompt = """<|begin_of_text|><|start_header_id|>user<|end_header_id|>
 Generate a SQL query to answer this question: `{question}`
 DDL statements:
 CREATE TABLE expenses (
-  id INTEGER PRIMARY KEY,
-  date DATE NOT NULL,
-  amount DECIMAL(10,2) NOT NULL,
-  category VARCHAR(50) NOT NULL,
-  description TEXT,
-  payment_method VARCHAR(20),
-  user_id INTEGER
 );
 CREATE TABLE categories (
-  id INTEGER PRIMARY KEY,
-  name VARCHAR(50) UNIQUE NOT NULL,
-  description TEXT
 );
 CREATE TABLE users (
-  id INTEGER PRIMARY KEY,
-  username VARCHAR(50) UNIQUE NOT NULL,
-  email VARCHAR(100) UNIQUE NOT NULL,
-  created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
 );
 CREATE TABLE budgets (
-  id INTEGER PRIMARY KEY,
-  user_id INTEGER,
-  category VARCHAR(50),
-  amount DECIMAL(10,2) NOT NULL,
-  period VARCHAR(20) DEFAULT 'monthly',
-  start_date DATE,
-  end_date DATE
 );
 -- expenses.user_id can be joined with users.id
@@ -63,38 +99,78 @@ The following SQL query best answers the question `{question}`:
 ```sql
 """
-# Main function
 def generate_query(question):
-    formatted_prompt = prompt.format(question=question)
-    inputs = tokenizer(formatted_prompt, return_tensors="pt").to("cpu")
-    generated_ids = model.generate(
-        **inputs,
-        num_return_sequences=1,
-        eos_token_id=tokenizer.eos_token_id,
-        pad_token_id=tokenizer.eos_token_id,
-        max_new_tokens=400,
-        do_sample=False,
-        num_beams=1,
-        temperature=0.0,
-        top_p=1,
-    )
-    output = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]
     try:
-        sql_code = output.split("```sql")[1].split("```")[0].strip()
-        return sqlparse.format(sql_code, reindent=True)
-    except Exception:
-        return "❌ SQL could not be parsed. Raw Output:\n\n" + output
-# Gradio UI
 iface = gr.Interface(
-    fn=generate_query,
-    inputs=gr.Textbox(lines=3, placeholder="Ask your SQL question..."),
-    outputs="text",
-    title="🦙 LLaMA 3 SQLCoder (CPU)",
-    description="Convert natural language into SQL queries based on the given schema. Running on CPU – may be slow.",
 )
 if __name__ == "__main__":
-    iface.launch()

+import gradio as gr
 import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM
 import sqlparse
+import psutil
+import os
+# Check available memory
+def get_available_memory():
+    return psutil.virtual_memory().available
 model_name = "defog/llama-3-sqlcoder-8b"
+# Initialize tokenizer
+tokenizer = AutoTokenizer.from_pretrained(model_name)
+# CPU-compatible model loading
+def load_model():
+    try:
+        available_memory = get_available_memory()
+        print(f"Available memory: {available_memory / 1e9:.1f} GB")
+        # For CPU deployment, we'll use float32 or float16 without quantization
+        if available_memory > 16e9:  # 16GB+ RAM
+            print("Loading model in float16...")
+            model = AutoModelForCausalLM.from_pretrained(
+                model_name,
+                trust_remote_code=True,
+                torch_dtype=torch.float16,
+                device_map="cpu",
+                use_cache=True,
+                low_cpu_mem_usage=True
+            )
+        else:
+            print("Loading model in float32 with low memory usage...")
+            model = AutoModelForCausalLM.from_pretrained(
+                model_name,
+                trust_remote_code=True,
+                device_map="cpu",
+                use_cache=True,
+                low_cpu_mem_usage=True,
+                torch_dtype=torch.float32
+            )
+        return model
+    except Exception as e:
+        print(f"Error loading model: {e}")
+        return None
+# Load model (this will take some time on first run)
+print("Loading model... This may take a few minutes on CPU.")
+model = load_model()
+prompt_template = """<|begin_of_text|><|start_header_id|>user<|end_header_id|>
 Generate a SQL query to answer this question: `{question}`
 DDL statements:
 CREATE TABLE expenses (
+  id INTEGER PRIMARY KEY, -- Unique ID for each expense
+  date DATE NOT NULL, -- Date when the expense occurred
+  amount DECIMAL(10,2) NOT NULL, -- Amount spent
+  category VARCHAR(50) NOT NULL, -- Category of expense (food, transport, utilities, etc.)
+  description TEXT, -- Optional description of the expense
+  payment_method VARCHAR(20), -- How the payment was made (cash, credit_card, debit_card, bank_transfer)
+  user_id INTEGER -- ID of the user who made the expense
 );
 CREATE TABLE categories (
+  id INTEGER PRIMARY KEY, -- Unique ID for each category
+  name VARCHAR(50) UNIQUE NOT NULL, -- Category name (food, transport, utilities, entertainment, etc.)
+  description TEXT -- Optional description of the category
 );
 CREATE TABLE users (
+  id INTEGER PRIMARY KEY, -- Unique ID for each user
+  username VARCHAR(50) UNIQUE NOT NULL, -- Username
+  email VARCHAR(100) UNIQUE NOT NULL, -- Email address
+  created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP -- When the user account was created
 );
 CREATE TABLE budgets (
+  id INTEGER PRIMARY KEY, -- Unique ID for each budget
+  user_id INTEGER, -- ID of the user who set the budget
+  category VARCHAR(50), -- Category for which budget is set
+  amount DECIMAL(10,2) NOT NULL, -- Budget amount
+  period VARCHAR(20) DEFAULT 'monthly', -- Budget period (daily, weekly, monthly, yearly)
+  start_date DATE, -- Budget start date
+  end_date DATE -- Budget end date
 );
 -- expenses.user_id can be joined with users.id
 ```sql
 """
 def generate_query(question):
+    if model is None:
+        return "Error: Model not loaded properly"
     try:
+        updated_prompt = prompt_template.format(question=question)
+        inputs = tokenizer(updated_prompt, return_tensors="pt")
+        # Generate on CPU
+        with torch.no_grad():
+            generated_ids = model.generate(
+                **inputs,
+                num_return_sequences=1,
+                eos_token_id=tokenizer.eos_token_id,
+                pad_token_id=tokenizer.eos_token_id,
+                max_new_tokens=400,
+                do_sample=False,
+                num_beams=1,
+                temperature=0.0,
+                top_p=1,
+            )
+        outputs = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)
+        # Extract SQL from output
+        if "```sql" in outputs[0]:
+            sql_part = outputs[0].split("```sql")[1].split("```")[0].strip()
+        else:
+            # Fallback extraction
+            sql_part = outputs[0].split("The following SQL query best answers the question")[1].strip()
+            if sql_part.startswith("`"):
+                sql_part = sql_part[1:]
+            if "```" in sql_part:
+                sql_part = sql_part.split("```")[0].strip()
+        # Clean up the SQL
+        if sql_part.endswith(";"):
+            sql_part = sql_part[:-1]
+        # Format the SQL
+        formatted_sql = sqlparse.format(sql_part, reindent=True, keyword_case='upper')
+        return formatted_sql
+    except Exception as e:
+        return f"Error generating query: {str(e)}"
+def gradio_interface(question):
+    if not question.strip():
+        return "Please enter a question."
+    return generate_query(question)
+# Create Gradio interface
 iface = gr.Interface(
+    fn=gradio_interface,
+    inputs=gr.Textbox(
+        label="Question",
+        placeholder="Enter your question (e.g., 'Show me all expenses for food category')",
+        lines=3
+    ),
+    outputs=gr.Code(label="Generated SQL Query", language="sql"),
+    title="SQL Query Generator",
+    description="Generate SQL queries from natural language questions about expense tracking database.",
+    examples=[
+        ["Show me all expenses for food category"],
+        ["What's the total amount spent on transport this month?"],
+        ["Insert a new expense of 50 dollars for groceries on 2024-01-15"],
+        ["Find users who spent more than 1000 dollars total"],
+        ["Show me the budget vs actual spending for each category"]
+    ],
+    cache_examples=False
 )
 if __name__ == "__main__":
+    iface.launch()