TimeCapsuleX committed on
Commit
fdbfbee
·
1 Parent(s): 3914cd6

Add application file

Browse files
Files changed (2) hide show
  1. __pycache__/app.cpython-311.pyc +0 -0
  2. app.py +108 -27
__pycache__/app.cpython-311.pyc CHANGED
Binary files a/__pycache__/app.cpython-311.pyc and b/__pycache__/app.cpython-311.pyc differ
 
app.py CHANGED
@@ -1,6 +1,7 @@
1
  import os
2
  import json
3
  import re
 
4
  import torch
5
  import gradio as gr
6
  import pandas as pd
@@ -25,6 +26,8 @@ QA_CHAIN = None
25
  RETRIEVER = None
26
  LLM = None
27
  PROMPT = None
 
 
28
  feedback_vector_store = None
29
  embeddings = None
30
 
@@ -42,23 +45,58 @@ def load_feedback_stats():
42
  feedback_df = pd.read_csv(FEEDBACK_FILE)
43
  if feedback_df.empty:
44
  return {}
 
 
45
  stats = feedback_df.groupby('action')['rating'].agg(['mean', 'count']).to_dict('index')
46
  return stats
47
  except pd.errors.EmptyDataError:
48
  return {}
49
 
50
- def save_feedback(action, rating, display_df):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
51
  if not action:
52
  return "Please select a recommendation from the table first.", display_df
 
 
 
 
 
 
 
53
  norm_action = normalize_action(action)
54
- new_feedback = pd.DataFrame([{'action': norm_action, 'rating': int(rating)}])
 
 
 
 
 
55
  if not os.path.exists(FEEDBACK_FILE):
56
  new_feedback.to_csv(FEEDBACK_FILE, index=False)
57
  else:
 
58
  new_feedback.to_csv(FEEDBACK_FILE, mode='a', header=False, index=False)
59
  build_feedback_db()
60
 
61
- msg = f"✅ Rating of {rating}/10 saved for: {action}"
62
 
63
  # Update the displayed table dynamically
64
  if display_df is not None and not display_df.empty:
@@ -91,19 +129,31 @@ def build_feedback_db():
91
  feedback_vector_store = FAISS.from_texts(highly_rated_actions, embeddings)
92
  print("✅ Feedback vector store is ready.")
93
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
94
  # --- build_rag_chain ---
95
  def build_rag_chain():
96
- global QA_CHAIN, RETRIEVER, LLM, PROMPT, embeddings
97
  try:
98
- print("Initializing local HuggingFace embedding model...")
99
- embeddings = HuggingFaceEmbeddings(
100
- model_name='all-MiniLM-L6-v2',
101
- model_kwargs={'device': DEVICE}
102
- )
103
- print("✅ Local embedding model loaded.")
104
-
105
- build_feedback_db()
106
-
107
  print(f"Loading FMEA data from {FMEA_DATA_FILE}...")
108
  fmea_df = pd.read_csv(FMEA_DATA_FILE).fillna("")
109
  documents = []
@@ -113,11 +163,31 @@ def build_rag_chain():
113
  if "Failure_Mode" in fmea_df.columns:
114
  metadata["source"] = str(row["Failure_Mode"])
115
  documents.append(Document(page_content=page_content, metadata=metadata))
 
 
 
 
116
  print(f"✅ Successfully loaded {len(documents)} records.")
117
 
118
- print("Creating embeddings and building main FAISS vector store...")
119
- main_vector_store = FAISS.from_documents(documents, embeddings)
120
- print("✅ Main vector store created successfully.")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
121
 
122
  # --- UPDATED TO USE LLAMA 3.3 VIA GROQ ---
123
  llm = ChatGroq(model_name="llama-3.3-70b-versatile", temperature=0.2)
@@ -139,10 +209,11 @@ def build_rag_chain():
139
 
140
  INSTRUCTIONS:
141
  Format your entire response as a single, valid JSON object with a key "recommendations" which is a list of 3 objects.
142
- Each object must have these keys: "rank", "action", "department", "ai_score", "new_S", "new_O", "new_D".
143
 
144
  - "rank": The rank of the recommendation (1, 2, 3).
145
  - "action": The recommended action text.
 
146
  - "department": The most likely responsible department.
147
  - "ai_score": Confidence score (1-100) for this recommendation.
148
  - "new_S": Your estimated new Severity score (1-10).
@@ -153,8 +224,6 @@ def build_rag_chain():
153
  """
154
  PROMPT = PromptTemplate(template=prompt_template, input_variables=["context", "question"])
155
 
156
- # Included the token-saving "k": 2 limit
157
- RETRIEVER = main_vector_store.as_retriever(search_kwargs={"k": 2})
158
  LLM = llm
159
  QA_CHAIN = True
160
  print("✅ RAG model is ready.")
@@ -165,7 +234,7 @@ def build_rag_chain():
165
 
166
  # --- 3. Gradio Interface Logic ---
167
  def fmea_rag_interface(mode, effect, cause, severity, occurrence, detection):
168
- if QA_CHAIN is None or RETRIEVER is None or LLM is None or PROMPT is None:
169
  return "RAG Model is not initialized.", pd.DataFrame(), ""
170
 
171
  rpn = severity * occurrence * detection
@@ -177,7 +246,10 @@ def fmea_rag_interface(mode, effect, cause, severity, occurrence, detection):
177
  f"The current scores are: Severity={severity}, Occurrence={occurrence}, Detection={detection}."
178
  )
179
 
180
- docs = RETRIEVER.invoke(query)
 
 
 
181
  context_from_history = "\n---\n".join([doc.page_content for doc in docs])
182
 
183
  context_from_feedback = ""
@@ -205,6 +277,8 @@ def fmea_rag_interface(mode, effect, cause, severity, occurrence, detection):
205
 
206
  data = json.loads(json_text)
207
  output_df = pd.DataFrame(data['recommendations'])
 
 
208
 
209
  feedback_stats = load_feedback_stats()
210
  default_stat = {'mean': 0, 'count': 0}
@@ -216,16 +290,19 @@ def fmea_rag_interface(mode, effect, cause, severity, occurrence, detection):
216
  output_df['new_O'] = output_df['new_O'].astype(int)
217
  output_df['new_D'] = output_df['new_D'].astype(int)
218
  output_df['new_RPN'] = output_df['new_S'] * output_df['new_O'] * output_df['new_D']
 
219
 
220
  rpn_change_list = [f"{int(rpn)} ➔ {int(new_rpn)}" for new_rpn in output_df['new_RPN']]
221
 
222
  display_df = pd.DataFrame({
223
  "Rank": output_df['rank'],
224
  "Recommended Action": output_df['action'],
 
225
  "Department": output_df['department'],
226
  "AI Confidence": [f"{score}%" for score in output_df['ai_score']],
227
  "Avg. Feedback": [f"{avg:.2f}/10 ({int(count)})" for avg, count in zip(output_df['avg_feedback'], output_df['feedback_count'])],
228
- "Revised RPN": rpn_change_list
 
229
  })
230
 
231
  except Exception as e:
@@ -270,8 +347,8 @@ if build_rag_chain():
270
  gr.Markdown("## 💡 Top 3 AI-Generated Recommendations")
271
  rpn_output = gr.Textbox(label="Current RPN", interactive=False)
272
  recommendations_output = gr.DataFrame(
273
- headers=["Rank", "Recommended Action", "Department", "AI Confidence", "Avg. Feedback", "Revised RPN"],
274
- datatype=["number", "str", "str", "str", "str", "str"]
275
  )
276
  df_state = gr.State()
277
 
@@ -279,8 +356,12 @@ if build_rag_chain():
279
  gr.Markdown("## ⭐ Provide Feedback")
280
  gr.Markdown("Click a row in the table above to select it, then submit your rating.")
281
  selected_action_text = gr.Textbox(label="Selected for Feedback", interactive=False)
282
- rating_slider = gr.Slider(minimum=1, maximum=10, step=1, value=8, label="Your Rating (1-10)")
283
- submit_feedback_btn = gr.Button("Submit Rating")
 
 
 
 
284
  feedback_status = gr.Textbox(label="Feedback Status", interactive=False)
285
 
286
  # FIX 1: Safer update_selection function
@@ -307,7 +388,7 @@ if build_rag_chain():
307
 
308
  submit_feedback_btn.click(
309
  fn=save_feedback,
310
- inputs=[selected_action_text, rating_slider, recommendations_output],
311
  outputs=[feedback_status, recommendations_output]
312
  )
313
 
 
1
  import os
2
  import json
3
  import re
4
+ from datetime import datetime, timezone
5
  import torch
6
  import gradio as gr
7
  import pandas as pd
 
26
  RETRIEVER = None
27
  LLM = None
28
  PROMPT = None
29
+ FMEA_DF = None
30
+ DOCUMENTS = None
31
  feedback_vector_store = None
32
  embeddings = None
33
 
 
45
  feedback_df = pd.read_csv(FEEDBACK_FILE)
46
  if feedback_df.empty:
47
  return {}
48
+ if "rating" not in feedback_df.columns:
49
+ return {}
50
  stats = feedback_df.groupby('action')['rating'].agg(['mean', 'count']).to_dict('index')
51
  return stats
52
  except pd.errors.EmptyDataError:
53
  return {}
54
 
55
+ def ensure_feedback_schema():
56
+ target_cols = ["action", "rating", "feedback_type", "timestamp_utc"]
57
+ if not os.path.exists(FEEDBACK_FILE):
58
+ return
59
+ try:
60
+ existing_df = pd.read_csv(FEEDBACK_FILE)
61
+ if existing_df.empty:
62
+ pd.DataFrame(columns=target_cols).to_csv(FEEDBACK_FILE, index=False)
63
+ return
64
+ changed = False
65
+ for col in target_cols:
66
+ if col not in existing_df.columns:
67
+ existing_df[col] = ""
68
+ changed = True
69
+ if changed:
70
+ existing_df = existing_df[target_cols]
71
+ existing_df.to_csv(FEEDBACK_FILE, index=False)
72
+ except pd.errors.EmptyDataError:
73
+ pd.DataFrame(columns=target_cols).to_csv(FEEDBACK_FILE, index=False)
74
+
75
+ def save_feedback(action, feedback_choice, display_df):
76
  if not action:
77
  return "Please select a recommendation from the table first.", display_df
78
+
79
+ choice_map = {
80
+ "πŸ‘ Thumbs Up": ("thumbs_up", 10),
81
+ "👎 Thumbs Down": ("thumbs_down", 3)
82
+ }
83
+ feedback_type, rating = choice_map.get(feedback_choice, ("thumbs_up", 10))
84
+ timestamp_utc = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S UTC")
85
  norm_action = normalize_action(action)
86
+ new_feedback = pd.DataFrame([{
87
+ 'action': norm_action,
88
+ 'rating': int(rating),
89
+ 'feedback_type': feedback_type,
90
+ 'timestamp_utc': timestamp_utc
91
+ }])
92
  if not os.path.exists(FEEDBACK_FILE):
93
  new_feedback.to_csv(FEEDBACK_FILE, index=False)
94
  else:
95
+ ensure_feedback_schema()
96
  new_feedback.to_csv(FEEDBACK_FILE, mode='a', header=False, index=False)
97
  build_feedback_db()
98
 
99
+ msg = f"✅ Feedback saved ({feedback_choice}) for: {action} at {timestamp_utc}"
100
 
101
  # Update the displayed table dynamically
102
  if display_df is not None and not display_df.empty:
 
129
  feedback_vector_store = FAISS.from_texts(highly_rated_actions, embeddings)
130
  print("✅ Feedback vector store is ready.")
131
 
132
+ def keyword_retrieve_documents(search_query: str, k: int = 2):
133
+ if FMEA_DF is None or DOCUMENTS is None or FMEA_DF.empty:
134
+ return []
135
+
136
+ tokens = [tok for tok in re.findall(r"[a-z0-9]+", str(search_query).lower()) if len(tok) >= 3]
137
+ if not tokens:
138
+ return DOCUMENTS[:k]
139
+
140
+ scores = []
141
+ for idx, text in enumerate(FMEA_DF["__search_text"]):
142
+ token_hits = sum(1 for tok in tokens if tok in text)
143
+ if token_hits:
144
+ scores.append((token_hits, idx))
145
+
146
+ if not scores:
147
+ return DOCUMENTS[:k]
148
+
149
+ scores.sort(key=lambda x: x[0], reverse=True)
150
+ top_indices = [idx for _, idx in scores[:k]]
151
+ return [DOCUMENTS[idx] for idx in top_indices]
152
+
153
  # --- build_rag_chain ---
154
  def build_rag_chain():
155
+ global QA_CHAIN, RETRIEVER, LLM, PROMPT, FMEA_DF, DOCUMENTS, feedback_vector_store, embeddings
156
  try:
 
 
 
 
 
 
 
 
 
157
  print(f"Loading FMEA data from {FMEA_DATA_FILE}...")
158
  fmea_df = pd.read_csv(FMEA_DATA_FILE).fillna("")
159
  documents = []
 
163
  if "Failure_Mode" in fmea_df.columns:
164
  metadata["source"] = str(row["Failure_Mode"])
165
  documents.append(Document(page_content=page_content, metadata=metadata))
166
+ search_cols = [c for c in ["Failure_Mode", "Effect", "Cause", "Recommended_Action", "Responsible_Department"] if c in fmea_df.columns]
167
+ fmea_df["__search_text"] = fmea_df[search_cols].astype(str).agg(" ".join, axis=1).str.lower()
168
+ FMEA_DF = fmea_df
169
+ DOCUMENTS = documents
170
  print(f"✅ Successfully loaded {len(documents)} records.")
171
 
172
+ print("Initializing local HuggingFace embedding model...")
173
+ try:
174
+ embeddings = HuggingFaceEmbeddings(
175
+ model_name='all-MiniLM-L6-v2',
176
+ model_kwargs={'device': DEVICE}
177
+ )
178
+ print("✅ Local embedding model loaded.")
179
+
180
+ build_feedback_db()
181
+
182
+ print("Creating embeddings and building main FAISS vector store...")
183
+ main_vector_store = FAISS.from_documents(documents, embeddings)
184
+ RETRIEVER = main_vector_store.as_retriever(search_kwargs={"k": 2})
185
+ print("✅ Main vector store created successfully.")
186
+ except Exception as embed_error:
187
+ embeddings = None
188
+ RETRIEVER = None
189
+ feedback_vector_store = None
190
+ print(f"⚠️ Embedding setup failed, using keyword retrieval fallback. Details: {embed_error}")
191
 
192
  # --- UPDATED TO USE LLAMA 3.3 VIA GROQ ---
193
  llm = ChatGroq(model_name="llama-3.3-70b-versatile", temperature=0.2)
 
209
 
210
  INSTRUCTIONS:
211
  Format your entire response as a single, valid JSON object with a key "recommendations" which is a list of 3 objects.
212
+ Each object must have these keys: "rank", "action", "action_details", "department", "ai_score", "new_S", "new_O", "new_D".
213
 
214
  - "rank": The rank of the recommendation (1, 2, 3).
215
  - "action": The recommended action text.
216
+ - "action_details": 2-3 sentences explaining why this action works and practical implementation notes.
217
  - "department": The most likely responsible department.
218
  - "ai_score": Confidence score (1-100) for this recommendation.
219
  - "new_S": Your estimated new Severity score (1-10).
 
224
  """
225
  PROMPT = PromptTemplate(template=prompt_template, input_variables=["context", "question"])
226
 
 
 
227
  LLM = llm
228
  QA_CHAIN = True
229
  print("✅ RAG model is ready.")
 
234
 
235
  # --- 3. Gradio Interface Logic ---
236
  def fmea_rag_interface(mode, effect, cause, severity, occurrence, detection):
237
+ if QA_CHAIN is None or LLM is None or PROMPT is None:
238
  return "RAG Model is not initialized.", pd.DataFrame(), ""
239
 
240
  rpn = severity * occurrence * detection
 
246
  f"The current scores are: Severity={severity}, Occurrence={occurrence}, Detection={detection}."
247
  )
248
 
249
+ if RETRIEVER is not None:
250
+ docs = RETRIEVER.invoke(query)
251
+ else:
252
+ docs = keyword_retrieve_documents(f"{mode} {effect} {cause}", k=2)
253
  context_from_history = "\n---\n".join([doc.page_content for doc in docs])
254
 
255
  context_from_feedback = ""
 
277
 
278
  data = json.loads(json_text)
279
  output_df = pd.DataFrame(data['recommendations'])
280
+ if 'action_details' not in output_df.columns:
281
+ output_df['action_details'] = "No additional details provided."
282
 
283
  feedback_stats = load_feedback_stats()
284
  default_stat = {'mean': 0, 'count': 0}
 
290
  output_df['new_O'] = output_df['new_O'].astype(int)
291
  output_df['new_D'] = output_df['new_D'].astype(int)
292
  output_df['new_RPN'] = output_df['new_S'] * output_df['new_O'] * output_df['new_D']
293
+ output_df['generated_at'] = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S UTC")
294
 
295
  rpn_change_list = [f"{int(rpn)} ➔ {int(new_rpn)}" for new_rpn in output_df['new_RPN']]
296
 
297
  display_df = pd.DataFrame({
298
  "Rank": output_df['rank'],
299
  "Recommended Action": output_df['action'],
300
+ "Action Details": output_df['action_details'],
301
  "Department": output_df['department'],
302
  "AI Confidence": [f"{score}%" for score in output_df['ai_score']],
303
  "Avg. Feedback": [f"{avg:.2f}/10 ({int(count)})" for avg, count in zip(output_df['avg_feedback'], output_df['feedback_count'])],
304
+ "Revised RPN": rpn_change_list,
305
+ "Generated At (UTC)": output_df['generated_at']
306
  })
307
 
308
  except Exception as e:
 
347
  gr.Markdown("## 💡 Top 3 AI-Generated Recommendations")
348
  rpn_output = gr.Textbox(label="Current RPN", interactive=False)
349
  recommendations_output = gr.DataFrame(
350
+ headers=["Rank", "Recommended Action", "Action Details", "Department", "AI Confidence", "Avg. Feedback", "Revised RPN", "Generated At (UTC)"],
351
+ datatype=["number", "str", "str", "str", "str", "str", "str", "str"]
352
  )
353
  df_state = gr.State()
354
 
 
356
  gr.Markdown("## ⭐ Provide Feedback")
357
  gr.Markdown("Click a row in the table above to select it, then submit your rating.")
358
  selected_action_text = gr.Textbox(label="Selected for Feedback", interactive=False)
359
+ feedback_choice = gr.Radio(
360
+ choices=["👍 Thumbs Up", "👎 Thumbs Down"],
361
+ value="👍 Thumbs Up",
362
+ label="Your Feedback"
363
+ )
364
+ submit_feedback_btn = gr.Button("Submit Feedback")
365
  feedback_status = gr.Textbox(label="Feedback Status", interactive=False)
366
 
367
  # FIX 1: Safer update_selection function
 
388
 
389
  submit_feedback_btn.click(
390
  fn=save_feedback,
391
+ inputs=[selected_action_text, feedback_choice, recommendations_output],
392
  outputs=[feedback_status, recommendations_output]
393
  )
394