KJ24 committed on
Commit
a2428a8
·
verified ·
1 Parent(s): 226d4c3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -2
app.py CHANGED
@@ -3,10 +3,14 @@ from pydantic import BaseModel
3
  from transformers import AutoTokenizer, AutoModel
4
  import torch
5
  import torch.nn.functional as F
 
 
 
 
6
 
7
  app = FastAPI()
8
 
9
- # Charger le modèle depuis HF sans passer par SentenceTransformer
10
  MODEL_NAME = "thenlper/gte-small"
11
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
12
  model = AutoModel.from_pretrained(MODEL_NAME)
@@ -21,4 +25,4 @@ async def embed_text(payload: EmbedInput):
21
  outputs = model(**inputs)
22
  embeddings = outputs.last_hidden_state[:, 0] # CLS token
23
  normalized = F.normalize(embeddings, p=2, dim=1)
24
- return {"embedding": normalized[0].tolist()}
 
3
  from transformers import AutoTokenizer, AutoModel
4
  import torch
5
  import torch.nn.functional as F
6
+ import os
7
+
8
+ # 💡 Correction ici
9
+ os.environ['HF_HOME'] = '/data'
10
 
11
  app = FastAPI()
12
 
13
+ # Charger le modèle
14
  MODEL_NAME = "thenlper/gte-small"
15
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
16
  model = AutoModel.from_pretrained(MODEL_NAME)
 
25
  outputs = model(**inputs)
26
  embeddings = outputs.last_hidden_state[:, 0] # CLS token
27
  normalized = F.normalize(embeddings, p=2, dim=1)
28
+ return {'embedding': normalized[0].tolist()}