Spaces:

Really-Amazing
/

SimpleAI-259M

Sleeping

App Files Files Community

Really-Amazing committed on Mar 14

Commit

6534cf7

verified ·

1 Parent(s): cff6f6c

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -15

app.py CHANGED Viewed

@@ -1,35 +1,35 @@
 import gradio as gr
 import torch
 from nanochat.engine import Engine
 MODEL_PATH = "model_000971.pt"
 META_PATH = "meta_000971.json"
 print("Waking up the toddler (NanoChat-ClimbMix-D12)...")
-engine = Engine(model_path=MODEL_PATH, meta_path=META_PATH, device="cpu")
-def chat_fn(message):
-    response = engine.generate(message, max_new_tokens=300, temperature=0.85)  # higher temp = more fun/confident nonsense
     return response
 with gr.Blocks(theme=gr.themes.Soft(primary_hue="blue")) as demo:
     gr.Markdown("# 🧸 NanoChat-ClimbMix-D12 – The Confident Toddler LLM")
-    gr.Markdown("Inspired by Andrej Karpathy's nanochat. Currently in 'Preschool Phase': 100% confident spelling, 0% reliable facts. 😂")
-    gr.Markdown("**Coming soon:** D14 (Elementary), D16 (Middle School), D18 (High School), D20+ (University level) – less hallucinations, more wisdom!")
-    with gr.Accordion("⚠️ Hallucination Disclaimer", open=True):
-        gr.Markdown("This model boldly answers everything — even when wrong. Enjoy the comedy! Next versions will grow up fast.")
     gr.ChatInterface(
         fn=chat_fn,
-        examples=[
-            "Why is the sky blue?",
-            "How many planets are in the solar system?",
-            "Write Python code to say hello world",
-            "Explain photosynthesis in one sentence"
-        ],
         title="Chat with the Toddler",
-        description="Ask anything — it will reply with maximum confidence!"
     )
 if __name__ == "__main__":

 import gradio as gr
 import torch
 from nanochat.engine import Engine
+from nanochat.checkpoint_manager import load_model
+from nanochat.tokenizer import get_tokenizer
 MODEL_PATH = "model_000971.pt"
 META_PATH = "meta_000971.json"
 print("Waking up the toddler (NanoChat-ClimbMix-D12)...")
+# 1. Load the tokenizer and model first
+tokenizer = get_tokenizer(META_PATH)
+model, _ = load_model(MODEL_PATH, device="cpu")
+# 2. Pass the objects to the Engine
+engine = Engine(model=model, tokenizer=tokenizer)
+def chat_fn(message, history):
+    # TODO: confirm in engine.py whether generate() expects a string or a list of tokens.
+    # This call assumes generate() handles the string-to-token conversion itself.
+    response = engine.generate(message, max_tokens=300, temperature=0.85)
     return response
 with gr.Blocks(theme=gr.themes.Soft(primary_hue="blue")) as demo:
     gr.Markdown("# 🧸 NanoChat-ClimbMix-D12 – The Confident Toddler LLM")
+    gr.Markdown("Inspired by Andrej Karpathy's nanochat. Currently in 'Preschool Phase'!")
     gr.ChatInterface(
         fn=chat_fn,
         title="Chat with the Toddler",
+        examples=["Why is the sky blue?", "Tell me a joke."],
     )
 if __name__ == "__main__":