aryo100 committed on
Commit
809867d
·
1 Parent(s): c83545d

update app

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -8,8 +8,8 @@ import uvicorn
8
  app = FastAPI()
9
 
10
  # Load model & tokenizer sekali saat startup
11
- MODEL_NAME = "Qwen/Qwen1.5-1.8B-Chat"
12
- # MODEL_NAME = "Qwen/Qwen-14B-Chat"
13
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, trust_remote_code=True)
14
  model = AutoModelForCausalLM.from_pretrained(
15
  MODEL_NAME,
 
8
  app = FastAPI()
9
 
10
  # Load model & tokenizer sekali saat startup
11
+ # MODEL_NAME = "Qwen/Qwen1.5-1.8B-Chat"
12
+ MODEL_NAME = "Qwen/Qwen3-0.6B-GPTQ-Int8"
13
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, trust_remote_code=True)
14
  model = AutoModelForCausalLM.from_pretrained(
15
  MODEL_NAME,