fix: Add API token input and improve file uploader
**API Token Support:**
- Add password-protected input field for HuggingFace API token
- Display clear instructions with link to get token
- Check token presence before translation attempts
- Support both user-provided tokens and Space secrets
- Better error messages for missing/invalid tokens
**File Uploader Improvements:**
- Add 20MB file size limit with validation
- Improve error handling with descriptive messages
- Add file extension preservation for temp files
- Auto-cleanup of temporary files after loading
- Better success/warning messages
**UX Enhancements:**
- Clear visual sections with dividers
- Emoji indicators for status
- Direct links to HF token settings
- Informative help text
This resolves the "api_key required" error and improves file upload reliability.
🤖 Generated with [Claude Code](https://claude.com/claude-code)
Co-Authored-By: Claude <noreply@anthropic.com>
- apertus_ui.py +82 -28
|
@@ -116,26 +116,66 @@ selected_lang = st.selectbox("Language / Langue / Idioma",
|
|
| 116 |
# Sidebar for Coptic tools
|
| 117 |
with st.sidebar:
|
| 118 |
st.header("Coptic Tools")
|
| 119 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 120 |
# Lexicon file uploader
|
| 121 |
-
|
| 122 |
-
|
| 123 |
-
|
|
|
|
|
|
|
|
|
|
| 124 |
|
| 125 |
# Load lexicon
|
| 126 |
if lexicon_file:
|
| 127 |
-
|
| 128 |
-
|
| 129 |
-
|
| 130 |
-
|
| 131 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 132 |
else:
|
| 133 |
# Try to load the comprehensive lexicon if available
|
| 134 |
comprehensive_lexicon_path = "Comprehensive_Coptic_Lexicon-v1.2-2020.xml"
|
| 135 |
if os.path.exists(comprehensive_lexicon_path):
|
| 136 |
coptic_lexicon = load_coptic_lexicon(comprehensive_lexicon_path)
|
| 137 |
if coptic_lexicon:
|
| 138 |
-
st.info(f"Loaded Comprehensive Coptic Lexicon: {len(coptic_lexicon)} entries")
|
| 139 |
else:
|
| 140 |
coptic_lexicon = {}
|
| 141 |
else:
|
|
@@ -231,20 +271,22 @@ with st.sidebar:
|
|
| 231 |
# This is much faster and doesn't require GPU
|
| 232 |
MODEL_NAME = "swiss-ai/Apertus-8B-Instruct-2509"
|
| 233 |
|
| 234 |
-
|
| 235 |
-
|
| 236 |
-
"""Initialize HuggingFace Inference API client"""
|
| 237 |
try:
|
| 238 |
-
|
| 239 |
-
|
| 240 |
-
|
| 241 |
-
|
| 242 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 243 |
except Exception as e:
|
| 244 |
-
st.
|
| 245 |
-
return
|
| 246 |
-
|
| 247 |
-
inference_client = get_inference_client()
|
| 248 |
|
| 249 |
# Chat interface
|
| 250 |
if "messages" not in st.session_state:
|
|
@@ -257,10 +299,22 @@ for message in st.session_state.messages:
|
|
| 257 |
|
| 258 |
# User input
|
| 259 |
if prompt := st.chat_input("Type your message..."):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 260 |
# Add Coptic-specific prompt prefix if applicable
|
| 261 |
if selected_lang in ['cop', 'cop-sa', 'cop-bo'] and 'analysis_type' in locals():
|
| 262 |
full_prompt = f"{COPTIC_PROMPTS[analysis_type]} {prompt}"
|
| 263 |
-
|
| 264 |
# Add lexicon context for lexicon lookup
|
| 265 |
if analysis_type == 'lexicon_lookup' and coptic_lexicon:
|
| 266 |
words_in_prompt = prompt.split()
|
|
@@ -268,17 +322,17 @@ if prompt := st.chat_input("Type your message..."):
|
|
| 268 |
for word in words_in_prompt:
|
| 269 |
if word in coptic_lexicon:
|
| 270 |
lexicon_matches.append(f"{word} = {coptic_lexicon[word]}")
|
| 271 |
-
|
| 272 |
if lexicon_matches:
|
| 273 |
full_prompt += f"\n\nLexicon entries found: {'; '.join(lexicon_matches)}"
|
| 274 |
else:
|
| 275 |
full_prompt = prompt
|
| 276 |
-
|
| 277 |
st.session_state.messages.append({"role": "user", "content": full_prompt})
|
| 278 |
-
|
| 279 |
with st.chat_message("user"):
|
| 280 |
st.markdown(full_prompt)
|
| 281 |
-
|
| 282 |
# Generate response using HuggingFace Inference API
|
| 283 |
with st.chat_message("assistant"):
|
| 284 |
try:
|
|
@@ -309,4 +363,4 @@ if prompt := st.chat_input("Type your message..."):
|
|
| 309 |
|
| 310 |
except Exception as e:
|
| 311 |
st.error(f"❌ Error generating response: {str(e)}")
|
| 312 |
-
st.info("💡
|
|
|
|
| 116 |
# Sidebar for Coptic tools
|
| 117 |
with st.sidebar:
|
| 118 |
st.header("Coptic Tools")
|
| 119 |
+
|
| 120 |
+
# HuggingFace API Token input
|
| 121 |
+
st.subheader("🔑 API Configuration")
|
| 122 |
+
hf_token_input = st.text_input(
|
| 123 |
+
"HuggingFace API Token",
|
| 124 |
+
type="password",
|
| 125 |
+
help="Required for Apertus-8B translation. Get your token at: https://huggingface.co/settings/tokens"
|
| 126 |
+
)
|
| 127 |
+
if hf_token_input:
|
| 128 |
+
st.success("✅ API token configured")
|
| 129 |
+
else:
|
| 130 |
+
st.warning("⚠️ Translation requires an API token")
|
| 131 |
+
st.markdown("[Get your free HF token →](https://huggingface.co/settings/tokens)")
|
| 132 |
+
|
| 133 |
+
st.divider()
|
| 134 |
+
|
| 135 |
# Lexicon file uploader
|
| 136 |
+
st.subheader("📚 Lexicon Upload")
|
| 137 |
+
lexicon_file = st.file_uploader(
|
| 138 |
+
"Upload Coptic Lexicon (optional)",
|
| 139 |
+
type=['txt', 'tsv', 'csv', 'xml'],
|
| 140 |
+
help="Supports: Text (TAB/pipe separated), XML (TEI format), CSV\nNote: Comprehensive lexicon is pre-loaded"
|
| 141 |
+
)
|
| 142 |
|
| 143 |
# Load lexicon
|
| 144 |
if lexicon_file:
|
| 145 |
+
try:
|
| 146 |
+
# Check file size (max 20MB)
|
| 147 |
+
file_size = len(lexicon_file.getvalue())
|
| 148 |
+
if file_size > 20 * 1024 * 1024:
|
| 149 |
+
st.error("❌ File too large (max 20MB)")
|
| 150 |
+
coptic_lexicon = {}
|
| 151 |
+
else:
|
| 152 |
+
# Save uploaded file temporarily
|
| 153 |
+
temp_path = f"temp_lexicon.{lexicon_file.name.split('.')[-1]}"
|
| 154 |
+
with open(temp_path, "wb") as f:
|
| 155 |
+
f.write(lexicon_file.getbuffer())
|
| 156 |
+
|
| 157 |
+
coptic_lexicon = load_coptic_lexicon(temp_path)
|
| 158 |
+
|
| 159 |
+
if coptic_lexicon:
|
| 160 |
+
st.success(f"✅ Loaded {len(coptic_lexicon)} lexicon entries from {lexicon_file.name}")
|
| 161 |
+
else:
|
| 162 |
+
st.warning("⚠️ File uploaded but no valid entries found")
|
| 163 |
+
coptic_lexicon = {}
|
| 164 |
+
|
| 165 |
+
# Clean up temp file
|
| 166 |
+
if os.path.exists(temp_path):
|
| 167 |
+
os.remove(temp_path)
|
| 168 |
+
except Exception as e:
|
| 169 |
+
st.error(f"❌ Error loading file: {str(e)}")
|
| 170 |
+
st.info("💡 Supported formats: Plain text (TAB/pipe separated), XML (TEI), CSV")
|
| 171 |
+
coptic_lexicon = {}
|
| 172 |
else:
|
| 173 |
# Try to load the comprehensive lexicon if available
|
| 174 |
comprehensive_lexicon_path = "Comprehensive_Coptic_Lexicon-v1.2-2020.xml"
|
| 175 |
if os.path.exists(comprehensive_lexicon_path):
|
| 176 |
coptic_lexicon = load_coptic_lexicon(comprehensive_lexicon_path)
|
| 177 |
if coptic_lexicon:
|
| 178 |
+
st.info(f"📚 Loaded Comprehensive Coptic Lexicon: {len(coptic_lexicon)} entries")
|
| 179 |
else:
|
| 180 |
coptic_lexicon = {}
|
| 181 |
else:
|
|
|
|
| 271 |
# This is much faster and doesn't require GPU
|
| 272 |
MODEL_NAME = "swiss-ai/Apertus-8B-Instruct-2509"
|
| 273 |
|
| 274 |
+
def get_inference_client(token=None):
|
| 275 |
+
"""Initialize HuggingFace Inference API client with provided token"""
|
|
|
|
| 276 |
try:
|
| 277 |
+
if token:
|
| 278 |
+
client = InferenceClient(token=token)
|
| 279 |
+
return client
|
| 280 |
+
else:
|
| 281 |
+
# Try to get token from Space secrets as fallback
|
| 282 |
+
if hasattr(st, 'secrets') and 'HF_TOKEN' in st.secrets:
|
| 283 |
+
client = InferenceClient(token=st.secrets['HF_TOKEN'])
|
| 284 |
+
return client
|
| 285 |
+
else:
|
| 286 |
+
return None
|
| 287 |
except Exception as e:
|
| 288 |
+
st.error(f"Error initializing inference client: {e}")
|
| 289 |
+
return None
|
|
|
|
|
|
|
| 290 |
|
| 291 |
# Chat interface
|
| 292 |
if "messages" not in st.session_state:
|
|
|
|
| 299 |
|
| 300 |
# User input
|
| 301 |
if prompt := st.chat_input("Type your message..."):
|
| 302 |
+
# Check if API token is available
|
| 303 |
+
if not hf_token_input:
|
| 304 |
+
st.error("⚠️ Please enter your HuggingFace API token in the sidebar to use translation.")
|
| 305 |
+
st.stop()
|
| 306 |
+
|
| 307 |
+
# Initialize inference client with user token
|
| 308 |
+
inference_client = get_inference_client(hf_token_input)
|
| 309 |
+
|
| 310 |
+
if not inference_client:
|
| 311 |
+
st.error("❌ Failed to initialize inference client. Please check your API token.")
|
| 312 |
+
st.stop()
|
| 313 |
+
|
| 314 |
# Add Coptic-specific prompt prefix if applicable
|
| 315 |
if selected_lang in ['cop', 'cop-sa', 'cop-bo'] and 'analysis_type' in locals():
|
| 316 |
full_prompt = f"{COPTIC_PROMPTS[analysis_type]} {prompt}"
|
| 317 |
+
|
| 318 |
# Add lexicon context for lexicon lookup
|
| 319 |
if analysis_type == 'lexicon_lookup' and coptic_lexicon:
|
| 320 |
words_in_prompt = prompt.split()
|
|
|
|
| 322 |
for word in words_in_prompt:
|
| 323 |
if word in coptic_lexicon:
|
| 324 |
lexicon_matches.append(f"{word} = {coptic_lexicon[word]}")
|
| 325 |
+
|
| 326 |
if lexicon_matches:
|
| 327 |
full_prompt += f"\n\nLexicon entries found: {'; '.join(lexicon_matches)}"
|
| 328 |
else:
|
| 329 |
full_prompt = prompt
|
| 330 |
+
|
| 331 |
st.session_state.messages.append({"role": "user", "content": full_prompt})
|
| 332 |
+
|
| 333 |
with st.chat_message("user"):
|
| 334 |
st.markdown(full_prompt)
|
| 335 |
+
|
| 336 |
# Generate response using HuggingFace Inference API
|
| 337 |
with st.chat_message("assistant"):
|
| 338 |
try:
|
|
|
|
| 363 |
|
| 364 |
except Exception as e:
|
| 365 |
st.error(f"❌ Error generating response: {str(e)}")
|
| 366 |
+
st.info("💡 Please verify your API token is valid and has not expired.")
|