Update app.py
app.py CHANGED
@@ -1,4 +1,5 @@
 import os
+import traceback
 
 # Try using a different directory path where you should have permissions
 os.environ['TRANSFORMERS_CACHE'] = '/tmp/model_cache'
@@ -15,17 +16,42 @@ from langchain_core.prompts import ChatPromptTemplate
 from dotenv import load_dotenv
 from src.prompt import *
 
-
 app = Flask(__name__)
 
 # Load environment variables - these will be set in Hugging Face Space secrets
 load_dotenv()  # Still useful for local development
 
+print("Starting application initialization")
+print(f"Python version: {os.sys.version}")
+
+# Add debugging endpoints
+@app.route("/test")
+def test():
+    return "Flask app is working. This is a test endpoint."
+
+@app.route("/check-env")
+def check_env():
+    has_pinecone = "Yes" if os.environ.get("PINECONE_API_KEY") else "No"
+    has_openai = "Yes" if os.environ.get("OPENAI_API_KEY") else "No"
+
+    # Check if keys appear valid (without revealing them)
+    pinecone_valid = len(os.environ.get("PINECONE_API_KEY", "")) > 10 if has_pinecone == "Yes" else "N/A"
+    openai_valid = os.environ.get("OPENAI_API_KEY", "").startswith("sk-") if has_openai == "Yes" else "N/A"
+
+    return f"Pinecone key present: {has_pinecone} (appears valid: {pinecone_valid})<br>OpenAI key present: {has_openai} (appears valid: {openai_valid})"
+
+print("Checking environment variables...")
 PINECONE_API_KEY = os.environ.get('PINECONE_API_KEY')
 OPENAI_API_KEY = os.environ.get('OPENAI_API_KEY')
 
+if not PINECONE_API_KEY:
+    print("WARNING: Missing PINECONE_API_KEY")
+if not OPENAI_API_KEY:
+    print("WARNING: Missing OPENAI_API_KEY")
+
 if not PINECONE_API_KEY or not OPENAI_API_KEY:
-
+    print("CRITICAL ERROR: Missing API keys")
+    # We'll continue anyway to allow debugging, but the app won't work properly
 
 os.environ["PINECONE_API_KEY"] = PINECONE_API_KEY
 os.environ["OPENAI_API_KEY"] = OPENAI_API_KEY
@@ -37,18 +63,39 @@ rag_chain = None
 def initialize_chain():
     global embeddings, rag_chain
     try:
+        print("Step 1: Starting to download embeddings")
         embeddings = download_hugging_face_embeddings()
+        print("Step 2: Successfully downloaded embeddings")
+
         index_name = "medprep"
+        print(f"Step 3: Connecting to Pinecone index: {index_name}")
+
+        try:
+            from pinecone import Pinecone as PineconeClient
+            pc = PineconeClient(api_key=PINECONE_API_KEY)
+            # List available indexes to verify connection
+            indexes = pc.list_indexes()
+            print(f"Available Pinecone indexes: {indexes}")
+
+            if index_name not in [idx.name for idx in indexes]:
+                print(f"WARNING: Index '{index_name}' not found in your Pinecone account!")
+        except Exception as e:
+            print(f"Failed to connect to Pinecone API: {e}")
 
-        # Embed each chunk and upsert the embeddings into your Pinecone index.
         docsearch = Pinecone.from_existing_index(
-
-
+            index_name=index_name,
+            embedding=embeddings
         )
+        print("Step 4: Successfully connected to Pinecone")
 
         retriever = docsearch.as_retriever(search_type="similarity", search_kwargs={"k":3})
+        print("Step 5: Created retriever")
 
+        print("Step 6: Initializing OpenAI")
         llm = OpenAI(temperature=0.4, max_tokens=500)
+        print("Step 7: OpenAI initialized")
+
+        print("Step 8: Creating prompt template")
         prompt = ChatPromptTemplate.from_messages(
             [
                 ("system", system_prompt),
@@ -56,16 +103,23 @@ def initialize_chain():
             ]
         )
 
+        print("Step 9: Creating QA chain")
         question_answer_chain = create_stuff_documents_chain(llm, prompt)
+
+        print("Step 10: Creating RAG chain")
         rag_chain = create_retrieval_chain(retriever, question_answer_chain)
-        print("RAG chain initialized successfully")
+        print("Step 11: RAG chain initialized successfully")
         return True
     except Exception as e:
         print(f"Failed to initialize RAG chain: {e}")
+        print(f"Error type: {type(e)}")
+        traceback.print_exc()
         return False
 
 # Initialize the chain when the application starts
-
+print("Starting chain initialization...")
+initialization_result = initialize_chain()
+print(f"Chain initialization result: {initialization_result}")
 
 @app.route("/")
 def index():
@@ -77,21 +131,31 @@ def chat():
 
     # Make sure chain is initialized
     if rag_chain is None:
+        print("RAG chain not initialized, attempting to initialize again...")
         if not initialize_chain():
             return "Error: System not initialized properly. Please check the logs."
 
     msg = request.form["msg"]
     try:
+        print(f"Processing message: {msg[:30]}...")  # Log only first 30 chars for privacy
         response = rag_chain.invoke({"input": msg})
+        print("Successfully generated response")
         return str(response["answer"])
     except Exception as e:
-
+        error_msg = f"Error processing request: {e}"
+        print(error_msg)
+        traceback.print_exc()
         return f"Error: {str(e)}"
 
 # Health check endpoint for monitoring
 @app.route("/health")
 def health_check():
-
+    is_initialized = rag_chain is not None
+    return jsonify({
+        "status": "healthy",
+        "rag_chain_initialized": is_initialized,
+        "embeddings_loaded": embeddings is not None
+    })
 
 if __name__ == '__main__':
     port = int(os.environ.get("PORT", 7860))
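
For reference, a minimal sketch of how the endpoints touched by this commit (/test, /check-env, /health) could be smoke-tested once the app is running. It assumes a local run on the default port 7860 from the PORT fallback above and that the requests package is installed; adjust the base URL for a deployed Space.

import requests

BASE_URL = "http://localhost:7860"  # assumption: local run using the default PORT fallback

# Plain-text debugging endpoints added in this commit
print(requests.get(f"{BASE_URL}/test").text)
print(requests.get(f"{BASE_URL}/check-env").text)

# /health now returns JSON describing initialization state
print(requests.get(f"{BASE_URL}/health").json())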