Spaces:

Mlaana
/

Chatbot

Sleeping

Mlaana committed on Jun 11, 2025

Commit

d44c8ed

1 Parent(s): 8666fde

change id model from drive

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,10 +4,9 @@ import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM, TextStreamer
 import gradio as gr
-# ==== STEP 1: Download model (kalau belum ada) ====
 os.makedirs("model", exist_ok=True)
-MODEL_URL = "https://drive.google.com/uc?id=1I9cM5OlZ1oBTPaJUY1pRzdhEGpZCpaL5"  # <- Ganti file ID-nya
 MODEL_PATH = "model/model.safetensors"
 if not os.path.exists(MODEL_PATH):
@@ -16,18 +15,14 @@ if not os.path.exists(MODEL_PATH):
 else:
     print("✅ Model file already exists")
-# ==== STEP 2: Load tokenizer & model ====
 print("🔧 Loading model & tokenizer...")
 tokenizer = AutoTokenizer.from_pretrained("model")
 model = AutoModelForCausalLM.from_pretrained("model", torch_dtype=torch.float16)
-# Gunakan CUDA kalau tersedia
 device = "cuda" if torch.cuda.is_available() else "cpu"
 model.to(device)
-# Optional: streaming token
 streamer = TextStreamer(tokenizer, skip_prompt=True, skip_special_tokens=True)
-# ==== STEP 3: Define response logic ====
 def respond(message, history, max_tokens, temperature, top_p):
     input_ids = tokenizer.encode(message, return_tensors="pt").to(device)
     history_text = ""

 from transformers import AutoTokenizer, AutoModelForCausalLM, TextStreamer
 import gradio as gr
 os.makedirs("model", exist_ok=True)
+MODEL_URL = "https://drive.google.com/uc?id=1Kg8KSGIgjBopeOKSbYbFWEgUlYOcqyXX"  # <- Ganti file ID-nya
 MODEL_PATH = "model/model.safetensors"
 if not os.path.exists(MODEL_PATH):
 else:
     print("✅ Model file already exists")
 print("🔧 Loading model & tokenizer...")
 tokenizer = AutoTokenizer.from_pretrained("model")
 model = AutoModelForCausalLM.from_pretrained("model", torch_dtype=torch.float16)
 device = "cuda" if torch.cuda.is_available() else "cpu"
 model.to(device)
 streamer = TextStreamer(tokenizer, skip_prompt=True, skip_special_tokens=True)
 def respond(message, history, max_tokens, temperature, top_p):
     input_ids = tokenizer.encode(message, return_tensors="pt").to(device)
     history_text = ""