CoderHassan commited on
Commit
e54889e
·
verified ·
1 Parent(s): f0b4ecd

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -15
app.py CHANGED
@@ -1,31 +1,25 @@
1
  import streamlit as st
2
- from transformers import MarianMTModel, MarianTokenizer
3
 
4
- # Install SentencePiece if not already installed
5
- try:
6
- import sentencepiece
7
- except ImportError:
8
- st.error("The SentencePiece library is required but not installed. Please install it using `pip install sentencepiece` and restart the application.")
9
- st.stop()
10
-
11
- # Load the model and tokenizer
12
  @st.cache_resource
13
  def load_model():
14
- model_name = "Helsinki-NLP/opus-mt-en-ur"
15
- tokenizer = MarianTokenizer.from_pretrained(model_name)
16
- model = MarianMTModel.from_pretrained(model_name)
17
  return model, tokenizer
18
 
19
  model, tokenizer = load_model()
20
 
21
  def translate_text(text, model, tokenizer):
22
- inputs = tokenizer.encode(text, return_tensors="pt", truncation=True)
23
- outputs = model.generate(inputs, max_length=1024, num_beams=5, early_stopping=True)
 
24
  translated_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
25
  return translated_text
26
 
27
  # Streamlit UI
28
- st.title("English to Urdu Translation")
29
 
30
  # Input text from the user
31
  text_to_translate = st.text_area("Enter English text to translate:")
@@ -34,3 +28,5 @@ if text_to_translate.strip():
34
  with st.spinner("Translating..."):
35
  translated_text = translate_text(text_to_translate, model, tokenizer)
36
  st.markdown(f"### Translated Text:\n{translated_text}")
 
 
 
1
  import streamlit as st
2
+ from transformers import T5Tokenizer, T5ForConditionalGeneration
3
 
4
+ # Load the T5 model and tokenizer
 
 
 
 
 
 
 
5
  @st.cache_resource
6
  def load_model():
7
+ model_name = "t5-small"
8
+ tokenizer = T5Tokenizer.from_pretrained(model_name)
9
+ model = T5ForConditionalGeneration.from_pretrained(model_name)
10
  return model, tokenizer
11
 
12
  model, tokenizer = load_model()
13
 
14
  def translate_text(text, model, tokenizer):
15
+ input_text = f"translate English to Urdu: {text}"
16
+ inputs = tokenizer.encode(input_text, return_tensors="pt", truncation=True)
17
+ outputs = model.generate(inputs, max_length=512, num_beams=5, early_stopping=True)
18
  translated_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
19
  return translated_text
20
 
21
  # Streamlit UI
22
+ st.title("English to Urdu Translation with T5")
23
 
24
  # Input text from the user
25
  text_to_translate = st.text_area("Enter English text to translate:")
 
28
  with st.spinner("Translating..."):
29
  translated_text = translate_text(text_to_translate, model, tokenizer)
30
  st.markdown(f"### Translated Text:\n{translated_text}")
31
+
32
+