implemented model choice dropdown
app.py
CHANGED
@@ -7,21 +7,20 @@ from mingpt.model import GPT
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
 REPO_ID = "to0ony/final-thesis-plotgen"
 
-state = {"model": None, "enc": tiktoken.get_encoding("gpt2")}
+state = {"model": None, "model_name": None, "enc": tiktoken.get_encoding("gpt2")}
 
-def load_model():
-    if state["model"] is not None:
+def load_model(model_name):
+    if state["model"] is not None and state["model_name"] == model_name:
         return state["model"]
 
     cfg_path = hf_hub_download(repo_id=REPO_ID, filename="config.json")
-    mdl_path = hf_hub_download(repo_id=REPO_ID, filename=
+    mdl_path = hf_hub_download(repo_id=REPO_ID, filename=model_name)
 
     with open(cfg_path, "r", encoding="utf-8") as f:
         cfg = json.load(f)
 
     gcfg = GPT.get_default_config()
     gcfg.model_type = None
-
     gcfg.vocab_size = int(cfg["vocab_size"])
     gcfg.block_size = int(cfg["block_size"])
     gcfg.n_layer = int(cfg["n_layer"])
@@ -35,13 +34,14 @@ def load_model():
     model.eval()
 
     state["model"] = model
+    state["model_name"] = model_name
     return model
 
 
 @torch.inference_mode()
-def generate(prompt, max_new_tokens=200, temperature=0.7, top_k=50):
+def generate(prompt, model_choice, max_new_tokens=200, temperature=0.7, top_k=50):
     """Generate text from a prompt"""
-    model = load_model()
+    model = load_model(model_choice)
     enc = state["enc"]
 
     x = torch.tensor([enc.encode(prompt)], dtype=torch.long, device=DEVICE)
@@ -56,10 +56,16 @@ def generate(prompt, max_new_tokens=200, temperature=0.7, top_k=50):
 
     return enc.decode(y[0].tolist())
 
+
 # Gradio UI
 with gr.Blocks(title="🎬 Final Thesis Plot Generator") as demo:
     gr.Markdown("## 🎬 Film Plot Generator\nEnter a prompt and generate a film plot.")
 
+    model_choice = gr.Dropdown(
+        choices=["cmu-plots-model.pt", "cmu-plots-model-enchanced.pt"],
+        value="cmu-plots-model.pt",
+        label="Model"
+    )
     prompt = gr.Textbox(label="Prompt", lines=5, placeholder="E.g. A young detective arrives in a coastal town...")
     max_new_tokens = gr.Slider(32, 512, value=200, step=16, label="Max new tokens")
     temperature = gr.Slider(0.1, 1.5, value=0.7, step=0.1, label="Temperature")
@@ -67,7 +73,7 @@ with gr.Blocks(title="🎬 Final Thesis Plot Generator") as demo:
     btn = gr.Button("Generate")
     output = gr.Textbox(label="Output", lines=15)
 
-    btn.click(generate, [prompt, max_new_tokens, temperature, top_k], output)
+    btn.click(generate, [prompt, model_choice, max_new_tokens, temperature, top_k], output)
 
 if __name__ == "__main__":
     demo.launch()
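For a quick check of the new model-choice path outside the Gradio UI, the updated functions can be driven directly. This is a minimal sketch, not part of the commit: it assumes app.py from this diff is importable as a module exposing generate(), load_model(), and state, and it uses the two checkpoint filenames listed in the dropdown; the prompt and sampling settings are arbitrary.

# smoke_test.py - hypothetical helper, assumes app.py from this commit is on the path
from app import generate, load_model, state

if __name__ == "__main__":
    for name in ["cmu-plots-model.pt", "cmu-plots-model-enchanced.pt"]:
        load_model(name)                     # downloads (or reuses) the selected checkpoint
        assert state["model_name"] == name   # cache is keyed on the selected filename
        text = generate(
            "A young detective arrives in a coastal town",
            model_choice=name,
            max_new_tokens=64,
            temperature=0.7,
            top_k=50,
        )
        print(f"--- {name} ---\n{text}\n")

Because load_model() caches on state["model_name"], switching the dropdown between requests should trigger a reload only when the selected filename actually changes.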