Spaces:

AI-Agent-Exercise-2025
/

Operation_data_analysis2

Runtime error

App Files Files Community

MTeguri committed on Sep 17, 2025

Commit

cd0375c

1 Parent(s): 32c8275

Implement check_thresholds function and enhance run_troubleshooting: Add alert generation for threshold violations, improve empty checks, and ensure timestamp consistency with timezone handling.

Browse files

Files changed (1) hide show

app.py +98 -36

app.py CHANGED Viewed

@@ -94,84 +94,146 @@ import pytz # Import pytz for timezone conversion
 # Assuming the data loading and check_thresholds function from the previous cell are available
 # Definition of the troubleshooting execution function
 def run_troubleshooting():  # pre-change side of the diff; every exit path returns a str
     try:
-        # Get current time and calculate the time 24 hours ago
         current_time_utc = datetime.datetime.now(datetime.timezone.utc)
-        # UTC time 24 hours ago
         time_24_hours_ago_utc = current_time_utc - datetime.timedelta(hours=24)
-        # Filter sensor data for the last 24 hours
-        # Use the globally available sensor_df and filter it each time the function is called
-        global sensor_df
         recent_sensor_df = sensor_df[
-        (sensor_df['datetime'] >= time_24_hours_ago_utc) &
-        (sensor_df['datetime'] <= current_time_utc)
         ].copy()
-        # Ensure other dataframes are accessible (they are loaded globally once)
-        global threshold_df
-        global troubleshooting_df
-        # Run the threshold check
-        alerts_df = check_thresholds(recent_sensor_df, threshold_df) # Pass the filtered data
-        # Count the number of unique data numbers per timestamp
         grouped_alerts = alerts_df.groupby('timestamp')['data no.'].nunique()  # NOTE(review): presumably the source of the 'timestamp' KeyError the new version guards against - confirm
-        # Extract the timestamps that have more than one data number
         multiple_data_nos_timestamps = grouped_alerts[grouped_alerts > 1].index.tolist()
-        # Keep only the alerts whose timestamp has multiple data numbers
         filtered_alerts_df = alerts_df[alerts_df['timestamp'].isin(multiple_data_nos_timestamps)]
-        # Collect the data numbers into a list per timestamp
         data_nos_by_timestamp = filtered_alerts_df.groupby('timestamp')['data no.'].unique().apply(list)
-        # Build the result list
         result_list = []
         for timestamp, data_nos in data_nos_by_timestamp.items():
             data_nos_str = ', '.join(map(str, data_nos))
             result_list.append({"timestamp": timestamp, "data_nos": data_nos_str})
-        # Build the result DataFrame
-        result_df = pd.DataFrame(result_list)
-        # Convert timestamp to JST (time-zone conversion)
-        if not result_df.empty and 'timestamp' in result_df.columns:
-             JST = pytz.timezone('Asia/Tokyo')
-             result_df['timestamp'] = result_df['timestamp'].dt.tz_convert(JST)
-        # If no alerts, return "異常ありません"
         if result_df.empty:
             return "過去24時間 異常ありません"
-        # Convert the indicator-number strings of the troubleshooting DataFrame into lists of ints
-        troubleshooting_indicator_lists = troubleshooting_df['指標No.'].str.split(',').apply(lambda x: [int(i) for i in x])
-        # Convert the data-number strings of the result DataFrame into lists of ints
-        result_data_nos_lists = result_df['data_nos'].str.split(', ').apply(lambda x: [int(i) for i in x])
-        # Generate the output text
         output_text = ""
         for i, result_nos in enumerate(result_data_nos_lists):
             result_timestamp = result_df.loc[i, 'timestamp']
             for j, troubleshooting_nos in enumerate(troubleshooting_indicator_lists):
-                # Check whether the result's data numbers are a superset of the troubleshooting indicator numbers
                 if set(troubleshooting_nos).issubset(set(result_nos)):
-                    troubleshooting_situation = troubleshooting_df.loc[j, 'シチュエーション\n（対応が必要な状況）']
-                    troubleshooting_action = troubleshooting_df.loc[j, 'sub goal到達のために必要な行動\n（解決策）']
                     output_text += f"Timestamp: {result_timestamp}\n"
                     output_text += f"Trouble: {troubleshooting_situation}\n"
                     output_text += f"Troubleshooting: {troubleshooting_action}\n"
-                    output_text += "-" * 20 + "\n" # separator line
-        return output_text
     except Exception as e:  # any failure is reported to the caller as a message string
         return f"エラーが発生しました: {type(e).__name__} - {e}"
 # Gradio interface setup
 iface = gr.Interface(
     fn=run_troubleshooting,

 # Assuming the data loading and check_thresholds function from the previous cell are available
 # Definitions of the threshold-check and troubleshooting functions
def check_thresholds(sensor_df_filtered, threshold_df):
    """Return one alert row per sensor reading that violates a threshold.

    Args:
        sensor_df_filtered: DataFrame of sensor readings with one column per
            metric. When a ``"datetime"`` column is present its values are
            used as alert timestamps; otherwise the index labels are used.
        threshold_df: DataFrame with the columns ``"指標名"`` (metric name,
            matched against the sensor column names), ``"下限"`` (lower
            bound), ``"上限"`` (upper bound) and ``"No."`` (data number).
            Bounds that cannot be parsed as numbers are treated as "no
            bound". This frame is NOT modified.

    Returns:
        DataFrame with the fixed columns ``timestamp``, ``metric``,
        ``value``, ``status`` and ``data no.``. The columns exist even when
        no alert was produced, so callers can always select ``timestamp``.
    """
    alert_columns = ["timestamp", "metric", "value", "status", "data no."]
    alerts = []

    # Coerce the bounds into local Series instead of writing them back:
    # threshold_df is a shared, module-level frame in the caller.
    lower_bounds = pd.to_numeric(threshold_df["下限"], errors="coerce")
    upper_bounds = pd.to_numeric(threshold_df["上限"], errors="coerce")

    # Resolve the timestamps once and pair them with readings by position.
    # A per-row ``.loc[label, "datetime"]`` lookup returns a Series instead
    # of a scalar whenever index labels repeat.
    if "datetime" in sensor_df_filtered.columns:
        timestamps = sensor_df_filtered["datetime"].tolist()
    else:
        timestamps = sensor_df_filtered.index.tolist()

    threshold_rows = zip(
        threshold_df["指標名"], threshold_df["No."], lower_bounds, upper_bounds
    )
    for metric, data_no, min_val, max_val in threshold_rows:
        if metric not in sensor_df_filtered.columns:
            continue

        has_min = pd.notna(min_val)
        has_max = pd.notna(max_val)
        readings = pd.to_numeric(sensor_df_filtered[metric], errors="coerce")

        for timestamp, value in zip(timestamps, readings):
            if pd.isna(value):
                # Missing or non-numeric readings can never violate a bound.
                continue
            if has_min and value < min_val:
                alerts.append({
                    "timestamp": timestamp,
                    "metric": metric,
                    "value": value,
                    "status": f"下限値 {min_val} 未満",
                    "data no.": data_no,
                })
            if has_max and value > max_val:
                alerts.append({
                    "timestamp": timestamp,
                    "metric": metric,
                    "value": value,
                    "status": f"上限値 {max_val} 超過",
                    "data no.": data_no,
                })

    return pd.DataFrame(alerts, columns=alert_columns)
def _parse_indicator_numbers(raw):
    """Return the set of integer numbers found in a comma-separated value.

    Tokens that are not whole numbers (blank cells, ``nan``, free text) are
    ignored. Integral floats such as ``"1.0"`` are accepted, because a
    numeric column that contains missing values is stored as float.
    """
    numbers = set()
    for token in str(raw).split(','):
        try:
            number = float(token.strip())
        except ValueError:
            continue
        if number.is_integer():
            numbers.add(int(number))
    return numbers


def run_troubleshooting():
    """Build a troubleshooting report for the sensor data of the last 24 hours.

    Reads the module-level ``sensor_df``, ``threshold_df`` and
    ``troubleshooting_df`` frames. Alerts are produced by
    ``check_thresholds``; timestamps at which more than one distinct data
    number raised an alert are matched against the rows of
    ``troubleshooting_df``, and a row is reported when all of its indicator
    numbers are among the alerting data numbers of that timestamp.

    Returns:
        str: the report text (timestamps shown in Asia/Tokyo time), or a
        message explaining why there is nothing to report. Any exception is
        caught and returned as an error message string, so the caller always
        receives text.
    """
    situation_col = 'シチュエーション\n（対応が必要な状況）'
    action_col = 'sub goal到達のために必要な行動\n（解決策）'
    try:
        current_time_utc = datetime.datetime.now(datetime.timezone.utc)
        time_24_hours_ago_utc = current_time_utc - datetime.timedelta(hours=24)
        recent_sensor_df = sensor_df[
            (sensor_df['datetime'] >= time_24_hours_ago_utc)
            & (sensor_df['datetime'] <= current_time_utc)
        ].copy()
        alerts_df = check_thresholds(recent_sensor_df, threshold_df)

        # Bail out early so nothing below has to cope with an empty frame.
        if alerts_df.empty:
            return "過去24時間 異常ありません（アラート0件）"
        # Defensive: check_thresholds is expected to always provide this column.
        if 'timestamp' not in alerts_df.columns:
            return "過去24時間 異常ありません（アラート0件／timestamp列なし）"

        # Guarantee tz-aware UTC timestamps so the JST conversion cannot fail.
        if not pd.api.types.is_datetime64_any_dtype(alerts_df['timestamp']):
            alerts_df['timestamp'] = pd.to_datetime(
                alerts_df['timestamp'], errors='coerce', utc=True
            )
        elif alerts_df['timestamp'].dt.tz is None:
            alerts_df['timestamp'] = alerts_df['timestamp'].dt.tz_localize('UTC')

        # Keep only timestamps at which more than one distinct data number
        # alerted. The numbers stay as integer sets; they are not round-tripped
        # through a joined string, which dropped float-typed values.
        jst = pytz.timezone('Asia/Tokyo')
        simultaneous_alerts = []
        for timestamp, group in alerts_df.groupby('timestamp'):
            if group['data no.'].nunique() <= 1:
                continue
            alerting_numbers = set()
            for data_no in group['data no.'].unique():
                alerting_numbers |= _parse_indicator_numbers(data_no)
            simultaneous_alerts.append((timestamp.tz_convert(jst), alerting_numbers))
        if not simultaneous_alerts:
            return "過去24時間 異常ありません（複数指標の同時異常なし）"

        if '指標No.' not in troubleshooting_df.columns:
            return "設定テーブルに『指標No.』列が見つかりません。"

        # The column check is loop-invariant, so resolve the texts once.
        # Rows are paired by position, so the frame's index labels do not matter.
        row_count = len(troubleshooting_df)
        if (situation_col in troubleshooting_df.columns
                and action_col in troubleshooting_df.columns):
            situations = troubleshooting_df[situation_col].tolist()
            actions = troubleshooting_df[action_col].tolist()
        else:
            situations = ["（シチュエーション列なし）"] * row_count
            actions = ["（解決策列なし）"] * row_count

        rules = []
        for raw, situation, action in zip(
                troubleshooting_df['指標No.'], situations, actions):
            required_numbers = _parse_indicator_numbers(raw)
            # An empty set is a subset of everything: a row without usable
            # indicator numbers must not match every timestamp.
            if required_numbers:
                rules.append((required_numbers, situation, action))

        sections = []
        for result_timestamp, alerting_numbers in simultaneous_alerts:
            for required_numbers, situation, action in rules:
                if required_numbers <= alerting_numbers:
                    sections.append(
                        f"Timestamp: {result_timestamp}\n"
                        f"Trouble: {situation}\n"
                        f"Troubleshooting: {action}\n"
                        + "-" * 20 + "\n"
                    )
        if not sections:
            return "該当するトラブルシューティングの組み合わせはありませんでした。"
        return "".join(sections)
    except Exception as e:
        # UI boundary: report the failure as text instead of raising.
        return f"エラーが発生しました: {type(e).__name__} - {e}"
 # Gradio interface setup
 iface = gr.Interface(
     fn=run_troubleshooting,