aryo100 committed on
Commit
7cd4b81
·
1 Parent(s): 1076f33

update app

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -9,7 +9,7 @@ app = FastAPI()
9
 
10
  # Load model & tokenizer sekali saat startup
11
  # MODEL_NAME = "Qwen/Qwen1.5-1.8B-Chat"
12
- MODEL_NAME = "Qwen/Qwen3-1.7B-FP8"
13
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, trust_remote_code=True)
14
  model = AutoModelForCausalLM.from_pretrained(
15
  MODEL_NAME,
@@ -53,6 +53,7 @@ def chat(req: ChatRequest):
53
  )
54
 
55
  response = tokenizer.decode(
 
56
  outputs[0][inputs["input_ids"].shape[1]:],
57
  skip_special_tokens=True
58
  )
 
9
 
10
  # Load model & tokenizer sekali saat startup
11
  # MODEL_NAME = "Qwen/Qwen1.5-1.8B-Chat"
12
+ MODEL_NAME = "Qwen/Qwen3Guard-Gen-0.6B"
13
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, trust_remote_code=True)
14
  model = AutoModelForCausalLM.from_pretrained(
15
  MODEL_NAME,
 
53
  )
54
 
55
  response = tokenizer.decode(
56
+ # outputs[0][inputs["input_ids"]:].tolist(),
57
  outputs[0][inputs["input_ids"].shape[1]:],
58
  skip_special_tokens=True
59
  )