Spaces:

renesistech
/

Notes

Build error

App Files Community

noumanjavaid committed on Apr 3, 2025

Commit

e637f4b

verified ·

1 Parent(s): 1e32418

Update app.py

Browse files

Files changed (1) hide show

app.py +67 -23

app.py CHANGED Viewed

@@ -16,14 +16,13 @@ from download import download_video_audio, delete_download
 MAX_FILE_SIZE = 41943040  # 40MB in bytes
 FILE_TOO_LARGE_MESSAGE = "File too large. Maximum size is 40MB."
-# Load environment variables
 load_dotenv()
-GROQ_API_KEY = os.environ.get("GROQ_API_KEY", None)
-audio_file_path = None
 # Initialize session states
 if 'api_key' not in st.session_state:
-    st.session_state.api_key = GROQ_API_KEY
 if 'recording' not in st.session_state:
     st.session_state.recording = False
@@ -34,9 +33,8 @@ if 'audio_data' not in st.session_state:
 if 'transcript' not in st.session_state:
     st.session_state.transcript = ""
-if 'groq' not in st.session_state:
-    if st.session_state.api_key:
-        st.session_state.groq = Groq(api_key=st.session_state.api_key)
 # Set page configuration
 st.set_page_config(
@@ -50,6 +48,17 @@ st.set_page_config(
 LLM_MODEL = "deepseek-r1-distill-llama-70b"
 TRANSCRIPTION_MODEL = "distil-whisper-large-v3-en"
 class GenerationStatistics:
     def __init__(self, input_time=0, output_time=0, input_tokens=0, output_tokens=0, total_time=0, model_name=LLM_MODEL):
         self.input_time = input_time
@@ -205,15 +214,13 @@ class AudioRecorder:
 def transcribe_audio_with_groq(audio_file_path):
     """Transcribe audio file using Groq's transcription API"""
-    if not st.session_state.api_key:
-        st.error("Please provide a valid Groq API key in the sidebar.")
         return ""
-    client = Groq(api_key=st.session_state.api_key)
     try:
         with open(audio_file_path, "rb") as file:
-            transcription = client.audio.transcriptions.create(
                 file=(audio_file_path, file.read()),
                 model=TRANSCRIPTION_MODEL,
                 response_format="verbose_json"
@@ -225,12 +232,10 @@ def transcribe_audio_with_groq(audio_file_path):
 def process_transcript(transcript):
     """Process transcript with Groq's DeepSeek model for highly structured notes"""
-    if not st.session_state.api_key:
-        st.error("Please provide a valid Groq API key in the sidebar.")
         return None
-    client = Groq(api_key=st.session_state.api_key)
     # Enhanced structure for better organization
     structure = {
         "Executive Summary": "",
@@ -309,7 +314,7 @@ def process_transcript(transcript):
         stats = GenerationStatistics(model_name=LLM_MODEL)
         start_time = time.time()
-        response = client.chat.completions.create(
             messages=[{"role": "user", "content": prompt}],
             model=LLM_MODEL,
             temperature=0.3,  # Lower temperature for more structured output
@@ -415,16 +420,55 @@ def main():
     # Sidebar for configuration
     with st.sidebar:
         st.header("Configuration")
-        api_key = st.text_input("Groq API Key", value=st.session_state.api_key or "", type="password")
-        if api_key:
-            st.session_state.api_key = api_key
-            if 'groq' not in st.session_state or st.session_state.groq is None:
-                st.session_state.groq = Groq(api_key=api_key)
         st.markdown("---")
         st.info("Using DeepSeek-R1-Distill-Llama-70B model for note generation and Distil Whisper for transcription")
     # Input methods tabs
     input_method = st.radio("Choose input method:", ["Live Recording", "Upload Audio", "YouTube URL", "Text Input"])

 MAX_FILE_SIZE = 41943040  # 40MB in bytes
 FILE_TOO_LARGE_MESSAGE = "File too large. Maximum size is 40MB."
+# Load environment variables in a secure way
 load_dotenv()
 # Initialize session states
 if 'api_key' not in st.session_state:
+    # Try to get API key from environment variable first
+    st.session_state.api_key = os.environ.get("GROQ_API_KEY", "")
 if 'recording' not in st.session_state:
     st.session_state.recording = False
 if 'transcript' not in st.session_state:
     st.session_state.transcript = ""
+if 'groq_client' not in st.session_state:
+    st.session_state.groq_client = None
 # Set page configuration
 st.set_page_config(
 LLM_MODEL = "deepseek-r1-distill-llama-70b"
 TRANSCRIPTION_MODEL = "distil-whisper-large-v3-en"
+# Initialize Groq client function
+def initialize_groq_client(api_key):
+    """Initialize Groq client with the provided API key"""
+    if not api_key:
+        return None
+    try:
+        return Groq(api_key=api_key)
+    except Exception as e:
+        st.error(f"Failed to initialize Groq client: {e}")
+        return None
 class GenerationStatistics:
     def __init__(self, input_time=0, output_time=0, input_tokens=0, output_tokens=0, total_time=0, model_name=LLM_MODEL):
         self.input_time = input_time
 def transcribe_audio_with_groq(audio_file_path):
     """Transcribe audio file using Groq's transcription API"""
+    if not st.session_state.groq_client:
+        st.error("Groq client is not initialized. Please check your API key.")
         return ""
     try:
         with open(audio_file_path, "rb") as file:
+            transcription = st.session_state.groq_client.audio.transcriptions.create(
                 file=(audio_file_path, file.read()),
                 model=TRANSCRIPTION_MODEL,
                 response_format="verbose_json"
 def process_transcript(transcript):
     """Process transcript with Groq's DeepSeek model for highly structured notes"""
+    if not st.session_state.groq_client:
+        st.error("Groq client is not initialized. Please check your API key.")
         return None
     # Enhanced structure for better organization
     structure = {
         "Executive Summary": "",
         stats = GenerationStatistics(model_name=LLM_MODEL)
         start_time = time.time()
+        response = st.session_state.groq_client.chat.completions.create(
             messages=[{"role": "user", "content": prompt}],
             model=LLM_MODEL,
             temperature=0.3,  # Lower temperature for more structured output
     # Sidebar for configuration
     with st.sidebar:
         st.header("Configuration")
+        # Improved API key handling
+        api_key_input = st.text_input(
+            "Groq API Key",
+            value=st.session_state.api_key,
+            type="password",
+            help="Enter your Groq API key. Get one at https://console.groq.com/keys"
+        )
+        # Only update if changed
+        if api_key_input != st.session_state.api_key:
+            st.session_state.api_key = api_key_input
+            # Reinitialize client with new key
+            st.session_state.groq_client = initialize_groq_client(api_key_input)
+            if st.session_state.groq_client:
+                st.success("✅ API key validated!")
+        # Initialize client if not done already
+        if st.session_state.api_key and not st.session_state.groq_client:
+            st.session_state.groq_client = initialize_groq_client(st.session_state.api_key)
+        # API key instructions
+        with st.expander("How to get a Groq API key"):
+            st.markdown("""
+            1. Visit [Groq Cloud Console](https://console.groq.com/)
+            2. Sign up or log in to your account
+            3. Navigate to API Keys in the sidebar
+            4. Click "Create API Key" and give it a name
+            5. Copy the generated key (you won't see it again!)
+            **Security tip**: For production use, store your API key as an environment variable:
+            ```bash
+            export GROQ_API_KEY="your-api-key-here"
+            ```
+            """)
         st.markdown("---")
         st.info("Using DeepSeek-R1-Distill-Llama-70B model for note generation and Distil Whisper for transcription")
+    # Check if API key is valid before proceeding
+    if not st.session_state.api_key:
+        st.warning("⚠️ Please enter your Groq API key in the sidebar to use ScribeWizard")
+        st.stop()
+    if not st.session_state.groq_client:
+        st.error("❌ Failed to initialize Groq client. Please check your API key.")
+        st.stop()
     # Input methods tabs
     input_method = st.radio("Choose input method:", ["Live Recording", "Upload Audio", "YouTube URL", "Text Input"])