Spaces:

NetraVerse
/

IndicTrans

Sleeping

App Files Files Community

NetraVerse commited on Nov 13, 2025

Commit

60ffa1d

verified ·

1 Parent(s): 4aafe0f

Create the app.py

Browse files

Files changed (1) hide show

app.py +217 -0

app.py ADDED Viewed

	@@ -0,0 +1,217 @@

+import torch
+import os
+import gradio as gr
+from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
+from IndicTransToolkit.processor import IndicProcessor
+# Get token from environment variable
+token = os.getenv("HUGGINGFACE_HUB_TOKEN")
+# Device configuration
+DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
+# Model configuration - English to Kannada translation
+src_lang, tgt_lang = "eng_Latn", "kan_Knda"
+model_name = "ai4bharat/indictrans2-en-indic-dist-200M"
+# Global variables to store model and tokenizer
+model = None
+tokenizer = None
+ip = None
+def load_model():
+    """Load the translation model and tokenizer"""
+    global model, tokenizer, ip
+    try:
+        print(f"Loading model: {model_name}")
+        tokenizer = AutoTokenizer.from_pretrained(
+            model_name,
+            trust_remote_code=True,
+            token=token
+        )
+        model = AutoModelForSeq2SeqLM.from_pretrained(
+            model_name,
+            trust_remote_code=True,
+            dtype=torch.float16,
+            token=token
+        ).to(DEVICE)
+        ip = IndicProcessor(inference=True)
+        print(f"Model loaded successfully on {DEVICE}")
+        return True
+    except Exception as e:
+        print(f"Error loading model: {str(e)}")
+        return False
+def translate_text(input_text):
+    """
+    Translate input text using the loaded model
+    Args:
+        input_text: Single sentence to translate
+    Returns:
+        Translated text
+    """
+    if not model or not tokenizer or not ip:
+        return "❌ Model not loaded. Please check the model configuration."
+    if not input_text.strip():
+        return "Please enter some text to translate."
+    try:
+        # Single sentence translation
+        input_sentences = [input_text.strip()]
+        if not input_sentences:
+            return "No valid sentences found."
+        # Preprocess the input
+        batch = ip.preprocess_batch(
+            input_sentences,
+            src_lang=src_lang,
+            tgt_lang=tgt_lang,
+        )
+        # Tokenize the sentences
+        inputs = tokenizer(
+            batch,
+            truncation=True,
+            padding="longest",
+            return_tensors="pt",
+            return_attention_mask=True,
+        ).to(DEVICE)
+        # Generate translations
+        with torch.no_grad():
+            generated_tokens = model.generate(
+                **inputs,
+                use_cache=False,
+                min_length=0,
+                max_length=256,
+                num_beams=5,
+                num_return_sequences=1,
+            )
+        # Decode the generated tokens
+        generated_tokens = tokenizer.batch_decode(
+            generated_tokens,
+            skip_special_tokens=True,
+            clean_up_tokenization_spaces=True,
+        )
+        # Postprocess the translations
+        translations = ip.postprocess_batch(generated_tokens, lang=tgt_lang)
+        # Return single translation
+        return translations[0] if translations else "Translation failed."
+    except Exception as e:
+        return f"❌ Translation error: {str(e)}"
+def create_interface():
+    """Create and configure the Gradio interface"""
+    # Load model on startup
+    model_loaded = load_model()
+    if not model_loaded:
+        # Create a simple error interface
+        with gr.Blocks(title="Translation App - Error") as demo:
+            gr.Markdown("## ❌ Model Loading Error")
+            gr.Markdown("Failed to load the translation model. Please check:")
+            gr.Markdown("- Your Hugging Face token is set correctly")
+            gr.Markdown("- You have access to the gated model")
+            gr.Markdown("- Your internet connection is working")
+        return demo
+    # Create the main interface
+    with gr.Blocks(
+        title="AI4Bharat IndicTrans2 Translation",
+        theme=gr.themes.Soft(),
+    ) as demo:
+        gr.Markdown(
+            f"""
+            # 🌍 AI4Bharat IndicTrans2 Translation
+            **Current Configuration:**
+            - **Source Language:** {src_lang} (English)
+            - **Target Language:** {tgt_lang} (Kannada)
+            - **Model:** {model_name}
+            - **Device:** {DEVICE}
+            Enter text below to translate from English to Kannada.
+            """)
+        with gr.Row():
+            with gr.Column():
+                input_text = gr.Textbox(
+                    label=f"Input Text ({src_lang})",
+                    placeholder="Enter English text to translate...",
+                    lines=5,
+                    max_lines=10
+                )
+                with gr.Row():
+                    translate_btn = gr.Button("🔄 Translate", variant="primary")
+                    clear_btn = gr.Button("🗑️ Clear")
+            with gr.Column():
+                output_text = gr.Textbox(
+                    label=f"Translation ({tgt_lang})",
+                    lines=5,
+                    max_lines=10,
+                    interactive=False
+                )
+        # Example inputs
+        gr.Markdown("### 📝 Example Inputs:")
+        examples = [
+            ["Hello, how are you?"],
+            ["I am going to the market today."],
+            ["This is a very beautiful place."],
+            ["Can you help me?"],
+        ]
+        gr.Examples(
+            examples=examples,
+            inputs=[input_text],
+            outputs=[output_text],
+            fn=translate_text,
+            cache_examples=True
+        )
+        # Event handlers
+        translate_btn.click(
+            fn=translate_text,
+            inputs=[input_text],
+            outputs=[output_text]
+        )
+        clear_btn.click(
+            fn=lambda: ("", ""),
+            outputs=[input_text, output_text]
+        )
+        # Add footer
+        gr.Markdown("---")
+    return demo
+if __name__ == "__main__":
+    # Create and launch the interface
+    demo = create_interface()
+    # Launch the app
+    demo.launch(
+        server_name="0.0.0.0",  # Allow external connections
+        server_port=7860,       # Default Gradio port
+        share=False,            # Set to True if you want a public link
+        debug=True,
+        show_error=True
+    )