Spaces:

CLOUDYUL
/

AGaRiCleaner-Detector-FastAPI

Sleeping

App Files Files Community

CLOUDYUL committed on Jun 4, 2025

Commit

f4d60e7

0 Parent(s):

Remove nested .git from detector folder

Browse files

Files changed (6) hide show

.gitattributes +3 -0
.gitignore +3 -0
Dockerfile +23 -0
detector +1 -0
requirements.txt +4 -0
server.py +76 -0

.gitattributes ADDED Viewed

	@@ -0,0 +1,3 @@

+detector/*.safetensors filter=lfs diff=lfs merge=lfs -text
+detector/*.bin filter=lfs diff=lfs merge=lfs -text
+detector/*.json filter=lfs diff=lfs merge=lfs -text

.gitignore ADDED Viewed

	@@ -0,0 +1,3 @@

+__pycache__/
+*.pyc
+.env

Dockerfile ADDED Viewed

	@@ -0,0 +1,23 @@

+# Dockerfile
+# 1) Use the Python 3.10 slim base image.
+FROM python:3.10-slim
+# 2) Set the working directory to /app.
+WORKDIR /app
+# 3) (Optional) Install system build packages in case a dependency must be compiled; --no-install-recommends keeps the image small.
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    build-essential \
+ && rm -rf /var/lib/apt/lists/*
+# 4) Copy requirements.txt and install dependencies with pip (no pip cache is kept in the image layer).
+COPY requirements.txt .
+RUN pip install --no-cache-dir --upgrade pip \
+ && pip install --no-cache-dir -r requirements.txt
+# 5) Copy all remaining files (code + detector folder).
+COPY . .
+# 6) Run the FastAPI server with uvicorn on port 7860 when the container starts.
+CMD ["uvicorn", "server:app", "--host", "0.0.0.0", "--port", "7860"]

detector ADDED Viewed

	@@ -0,0 +1 @@


1	+ Subproject commit 6f96793357b0992617416e965fa0721310ee1e19

requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+fastapi
+uvicorn[standard]
+torch
+transformers

server.py ADDED Viewed

	@@ -0,0 +1,76 @@

+# server.py
+from typing import List
+from fastapi import FastAPI, HTTPException
+from pydantic import BaseModel
+import torch
+from transformers import AutoTokenizer, AutoModelForSequenceClassification
+# ── 1) Create the FastAPI application
+app = FastAPI(
+    title="AGaRiCleaner Toxicity Detector (FastAPI)",
+    description="FastAPI 기반 한국어 악플 탐지 모델 서버",
+    version="1.0.0"
+)
+# ── 2) Request schema (Pydantic model): the body carries a list of strings under "data"
+class TextsIn(BaseModel):
+    data: List[str]  # JSON example: { "data": ["sentence 1", "sentence 2", ...] }
+# ── 3) 모델 디렉터리 경로 (Space에서는 /app/detector 폴더가 된다)
+MODEL_DIR = "./detector"
+# ── 4) 디바이스 설정 (Mac MPS 지원 여부 확인)
+device = "mps" if torch.backends.mps.is_available() else "cpu"
+print(f"▶ 모델 추론 디바이스: {device}")
+# ── 5) 토크나이저와 모델 로드
+try:
+    tokenizer = AutoTokenizer.from_pretrained(MODEL_DIR)
+    model = AutoModelForSequenceClassification.from_pretrained(MODEL_DIR)
+    model.to(device)
+    model.eval()
+    print("✔ 모델 및 토크나이저 로드 완료")
+except Exception as e:
+    print("✖ 모델 로드 실패:", e)
+    raise e
+# ── 6) 악플 탐지 함수 정의
+def detect_toxic(texts: List[str]) -> List[dict]:
+    encoding = tokenizer(
+        texts,
+        padding=True,
+        truncation=True,
+        return_tensors="pt",
+        max_length=128
+    )
+    input_ids = encoding["input_ids"].to(device)
+    attention_mask = encoding["attention_mask"].to(device)
+    with torch.no_grad():
+        outputs = model(input_ids=input_ids, attention_mask=attention_mask)
+        logits = outputs.logits
+        probs = torch.softmax(logits, dim=-1).cpu().tolist()
+    results = []
+    for i, text in enumerate(texts):
+        score_1 = probs[i][1]
+        label = 1 if score_1 >= 0.5 else 0
+        results.append({
+            "text": text,
+            "label": label,
+            "score": round(score_1, 6)
+        })
+    return results
+# ── 7) POST /predict 엔드포인트 정의
+@app.post("/predict", summary="텍스트 목록을 입력받아 악플 여부(label, score) 반환")
+async def predict_endpoint(payload: TextsIn):
+    texts = payload.data
+    if not isinstance(texts, list) or len(texts) == 0:
+        raise HTTPException(status_code=400, detail="‘data’ 필드에 최소 1개 이상의 문자열이 있어야 합니다.")
+    try:
+        output = detect_toxic(texts)
+        return output
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=f"모델 추론 중 오류 발생: {e}")