Spaces:
Build error
Build error
File size: 1,662 Bytes
d12f28d | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 | from fastapi import FastAPI
from pydantic import BaseModel
from transformers import BertTokenizerFast, BertModel
import torch
import torch.nn as nn
import os
# Module-level configuration and shared objects. Everything below runs once,
# when this module is imported.

# Directory named "model" located next to this source file; both the tokenizer
# and the BERT encoder are loaded from it.
MODEL_PATH = os.path.join(os.path.dirname(__file__), "model")
# Fine-tuned weights (a state dict) stored inside the model directory.
WEIGHTS_PATH = os.path.join(MODEL_PATH, "bert-multilabel-model.pth")
# Width of the classifier's output layer, i.e. one logit per label.
# Adjust based on your dataset; it has to agree with the saved checkpoint,
# otherwise loading the state dict will report a size mismatch.
NUM_LABELS = 6
# Initialize FastAPI app; the route decorators further down register on it.
app = FastAPI()
# Load tokenizer from the local model directory (same path as the encoder).
tokenizer = BertTokenizerFast.from_pretrained(MODEL_PATH)
# Define the BERT-based multi-label classifier
class BertMultiLabelClassifier(nn.Module):
    """BERT encoder followed by one linear layer that emits a logit per label.

    The encoder is loaded from ``MODEL_PATH`` and the linear head maps the
    encoder's hidden size to ``NUM_LABELS`` outputs. The attribute names
    ``bert`` and ``classifier`` are the prefixes of the state-dict keys, so
    they must not be renamed without re-exporting the checkpoint.
    """

    def __init__(self):
        super().__init__()
        self.bert = BertModel.from_pretrained(MODEL_PATH)
        self.classifier = nn.Linear(self.bert.config.hidden_size, NUM_LABELS)

    def forward(self, input_ids, attention_mask, token_type_ids=None):
        """Compute raw (pre-sigmoid) logits for a batch of encoded texts.

        Args:
            input_ids: Token id tensor as produced by the tokenizer.
            attention_mask: Mask tensor as produced by the tokenizer.
            token_type_ids: Optional segment ids. BERT tokenizers return this
                key by default, so accepting it lets callers unpack the
                tokenizer output directly (``model(**inputs)``) instead of
                failing with an unexpected-keyword ``TypeError``. ``None``
                leaves the encoder on its own default.

        Returns:
            The output of the linear head applied to the hidden state at
            sequence position 0 of every batch item.
        """
        encoded = self.bert(
            input_ids=input_ids,
            attention_mask=attention_mask,
            token_type_ids=token_type_ids,
        )
        # Position 0 is the first token of each sequence (the [CLS] token
        # under standard BERT tokenization); it serves as the text summary.
        first_token_state = encoded.last_hidden_state[:, 0, :]
        return self.classifier(first_token_state)
# Build the classifier once at import time and load the fine-tuned weights.
model = BertMultiLabelClassifier()
# map_location="cpu" remaps the stored tensors onto the CPU while loading.
# NOTE(review): torch.load unpickles the file; this looks like a trusted local
# checkpoint, but consider weights_only=True if the installed torch version
# supports it -- TODO confirm.
model.load_state_dict(torch.load(WEIGHTS_PATH, map_location="cpu"))
# Switch the module to evaluation mode for inference.
model.eval()
# Request body accepted by the POST /predict route.
class PredictRequest(BaseModel):
    # The text to classify.
    text: str
# Root route: answers GET / with a fixed status message.
@app.get("/")
def read_root():
    status = {"message": "Multi-label BERT model is running!"}
    return status
@app.post("/predict")
def predict(request: PredictRequest):
    """Return one sigmoid probability per label for the submitted text.

    The text is tokenized (truncated to at most 512 tokens), run through the
    module-level ``model`` with gradients disabled, and each logit is passed
    through a sigmoid independently.

    Args:
        request: Parsed request body carrying the ``text`` to classify.

    Returns:
        ``{"probabilities": [...]}`` with one float per label.
    """
    encoding = tokenizer(
        request.text,
        return_tensors="pt",
        truncation=True,
        padding=True,
        max_length=512,
    )
    with torch.no_grad():
        # Pass only the tensors the classifier's forward() declares. BERT
        # tokenizers also return token_type_ids by default, and unpacking the
        # whole encoding would hand forward() a keyword it may not accept.
        logits = model(
            input_ids=encoding["input_ids"],
            attention_mask=encoding["attention_mask"],
        )
    # Drop only the batch dimension (size 1 here). A bare squeeze() would also
    # collapse the label dimension for a single-label model and yield a float
    # instead of a list.
    probs = torch.sigmoid(logits).squeeze(0).tolist()
    return {"probabilities": probs}
|