Adarsh921's picture
Upload app.py
b4fa544 verified
import gradio as gr
import torch
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
# Load from Hugging Face Hub
tokenizer = AutoTokenizer.from_pretrained("Adarsh921/flan-t5-english-summarizer")
model = AutoModelForSeq2SeqLM.from_pretrained("Adarsh921/flan-t5-english-summarizer")
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
model = model.to(device)
MAX_INPUT_LEN = 768
MAX_TARGET_LEN = 150
def summarize(text):
inputs = tokenizer(
text,
return_tensors="pt",
truncation=True,
max_length=MAX_INPUT_LEN
).to(device)
with torch.no_grad():
output = model.generate(
**inputs,
max_length=MAX_TARGET_LEN,
min_length=40,
num_beams=6,
no_repeat_ngram_size=3,
length_penalty=1.0,
early_stopping=True
)
return tokenizer.decode(output[0], skip_special_tokens=True).strip()
# Gradio UI
gr.Interface(
fn=summarize,
inputs=gr.Textbox(lines=10, label="Paste english Article"),
outputs=gr.Textbox(label="Generated Summary"),
title="English Article Summarizer",
description="Summarizer fine-tuned on ILSUM 2024 using Flan-T5"
).launch(share=True)