programci48 committed on
Commit
7af1417
·
verified ·
1 Parent(s): 3858edd

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +15 -3
app.py CHANGED
@@ -1,16 +1,28 @@
 
1
  import torch
2
  from fastapi import FastAPI, Request
3
  from transformers import AutoTokenizer, AutoModelForCausalLM
4
  from peft import PeftModel
5
 
 
 
 
 
6
  base_model_id = "google/gemma-1.1-2b-it"
7
  lora_model_id = "programci48/heytak-lora-v1"
8
 
9
- tokenizer = AutoTokenizer.from_pretrained(base_model_id)
10
- base_model = AutoModelForCausalLM.from_pretrained(base_model_id, torch_dtype=torch.float32, device_map=None)
11
- model = PeftModel.from_pretrained(base_model, lora_model_id)
 
 
 
 
 
 
12
  model.eval()
13
 
 
14
  app = FastAPI()
15
 
16
  @app.post("/run/predict")
 
1
+ import os
2
  import torch
3
  from fastapi import FastAPI, Request
4
  from transformers import AutoTokenizer, AutoModelForCausalLM
5
  from peft import PeftModel
6
 
7
+ # 🔐 Read the HF_TOKEN environment variable
8
+ hf_token = os.getenv("HF_TOKEN")
9
+
10
+ # 🔧 Model identifiers
11
  base_model_id = "google/gemma-1.1-2b-it"
12
  lora_model_id = "programci48/heytak-lora-v1"
13
 
14
+ # 📦 Load the tokenizer, base model, and LoRA adapter
15
+ tokenizer = AutoTokenizer.from_pretrained(base_model_id, token=hf_token)
16
+ base_model = AutoModelForCausalLM.from_pretrained(
17
+ base_model_id,
18
+ torch_dtype=torch.float32,
19
+ device_map=None,
20
+ token=hf_token
21
+ )
22
+ model = PeftModel.from_pretrained(base_model, lora_model_id, token=hf_token)
23
  model.eval()
24
 
25
+ # 🚀 FastAPI app
26
  app = FastAPI()
27
 
28
  @app.post("/run/predict")