File size: 1,331 Bytes
356b86e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8e2886d
0e62c8f
356b86e
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
import gradio as gr
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
import torch

MODEL_NAME = "angkor96/khmer-news-summarization"

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
model = AutoModelForSeq2SeqLM.from_pretrained(MODEL_NAME).to(device)
model.eval()

def summarize(text):
    try:
        inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=1024)
        inputs = {k: v.to(device) for k, v in inputs.items()}
        with torch.no_grad():
            summary_ids = model.generate(
                **inputs,
                max_length=150,
                num_beams=4,
                length_penalty=2.0,
                early_stopping=True
            )
        return tokenizer.decode(summary_ids[0], skip_special_tokens=True)
    except Exception as e:
        return f"αž˜αž·αž“αž’αžΆαž…αžŸαž„αŸ’αžαŸαž”αž”αžΆαž“αž‘αŸαŸ” ({e})"

iface = gr.Interface(
    fn=summarize,
    inputs=gr.Textbox(label="αž”αž‰αŸ’αž…αžΌαž›αž’αžαŸ’αžαž”αž‘"),
    outputs=gr.Textbox(label="αž’αžαŸ’αžαž”αž‘αžŸαž„αŸ’αžαŸαž”"),
    title="Khmer News Summarization API",
    description="API service powered by angkor96/khmer-news-summarization",
    api_name="predict",  # <-- this exposes /run/predict
)

iface.launch()