Upload folder using huggingface_hub
Browse files
src/nodes/vectorizationAgentNode.py
CHANGED
|
@@ -6,7 +6,7 @@ Uses language-specific BERT models for Sinhala, Tamil, and English
|
|
| 6 |
|
| 7 |
import sys
|
| 8 |
import logging
|
| 9 |
-
from datetime import datetime
|
| 10 |
from typing import Dict, Any, List
|
| 11 |
from pathlib import Path
|
| 12 |
import numpy as np
|
|
@@ -794,7 +794,7 @@ Format your response in a clear, structured manner."""
|
|
| 794 |
"domain": "vectorization",
|
| 795 |
"category": "text_analysis",
|
| 796 |
"summary": f"Processed {len(embeddings)} texts with multilingual BERT models",
|
| 797 |
-
"timestamp": datetime.utcnow().isoformat(),
|
| 798 |
"severity": "low",
|
| 799 |
"impact_type": "analysis",
|
| 800 |
"confidence": 0.9,
|
|
@@ -820,7 +820,7 @@ Format your response in a clear, structured manner."""
|
|
| 820 |
"domain": "anomaly_detection",
|
| 821 |
"category": "ml_analysis",
|
| 822 |
"summary": f"ML Anomaly Detection: {len(anomalies)} anomalies found in {anomaly_results.get('total_analyzed', 0)} texts",
|
| 823 |
-
"timestamp": datetime.utcnow().isoformat(),
|
| 824 |
"severity": "high" if len(anomalies) > 5 else "medium",
|
| 825 |
"impact_type": "risk",
|
| 826 |
"confidence": 0.85,
|
|
@@ -840,7 +840,7 @@ Format your response in a clear, structured manner."""
|
|
| 840 |
"domain": "anomaly_detection",
|
| 841 |
"category": "anomaly",
|
| 842 |
"summary": f"Anomaly detected (score: {anomaly.get('anomaly_score', 0):.2f})",
|
| 843 |
-
"timestamp": datetime.utcnow().isoformat(),
|
| 844 |
"severity": (
|
| 845 |
"high"
|
| 846 |
if anomaly.get("anomaly_score", 0) > 0.7
|
|
@@ -863,7 +863,7 @@ Format your response in a clear, structured manner."""
|
|
| 863 |
"domain": "anomaly_detection",
|
| 864 |
"category": "system_info",
|
| 865 |
"summary": "ML model not trained yet - using severity-based fallback",
|
| 866 |
-
"timestamp": datetime.utcnow().isoformat(),
|
| 867 |
"severity": "low",
|
| 868 |
"impact_type": "info",
|
| 869 |
"confidence": 1.0,
|
|
@@ -878,7 +878,7 @@ Format your response in a clear, structured manner."""
|
|
| 878 |
"domain": "vectorization",
|
| 879 |
"category": "opportunity",
|
| 880 |
"summary": opp.get("description", "Opportunity detected"),
|
| 881 |
-
"timestamp": datetime.utcnow().isoformat(),
|
| 882 |
"severity": "medium",
|
| 883 |
"impact_type": "opportunity",
|
| 884 |
"confidence": opp.get("confidence", 0.7),
|
|
@@ -893,7 +893,7 @@ Format your response in a clear, structured manner."""
|
|
| 893 |
"domain": "vectorization",
|
| 894 |
"category": "threat",
|
| 895 |
"summary": threat.get("description", "Threat detected"),
|
| 896 |
-
"timestamp": datetime.utcnow().isoformat(),
|
| 897 |
"severity": "high",
|
| 898 |
"impact_type": "risk",
|
| 899 |
"confidence": threat.get("confidence", 0.7),
|
|
@@ -903,7 +903,7 @@ Format your response in a clear, structured manner."""
|
|
| 903 |
# Final output
|
| 904 |
final_output = {
|
| 905 |
"batch_id": batch_id,
|
| 906 |
-
"timestamp": datetime.utcnow().isoformat(),
|
| 907 |
"total_texts": len(embeddings),
|
| 908 |
"processing_stats": processing_stats,
|
| 909 |
"expert_summary": expert_summary,
|
|
|
|
| 6 |
|
| 7 |
import sys
|
| 8 |
import logging
|
| 9 |
+
from datetime import datetime, timezone
|
| 10 |
from typing import Dict, Any, List
|
| 11 |
from pathlib import Path
|
| 12 |
import numpy as np
|
|
|
|
| 794 |
"domain": "vectorization",
|
| 795 |
"category": "text_analysis",
|
| 796 |
"summary": f"Processed {len(embeddings)} texts with multilingual BERT models",
|
| 797 |
+
"timestamp": datetime.now(timezone.utc).isoformat(),
|
| 798 |
"severity": "low",
|
| 799 |
"impact_type": "analysis",
|
| 800 |
"confidence": 0.9,
|
|
|
|
| 820 |
"domain": "anomaly_detection",
|
| 821 |
"category": "ml_analysis",
|
| 822 |
"summary": f"ML Anomaly Detection: {len(anomalies)} anomalies found in {anomaly_results.get('total_analyzed', 0)} texts",
|
| 823 |
+
"timestamp": datetime.now(timezone.utc).isoformat(),
|
| 824 |
"severity": "high" if len(anomalies) > 5 else "medium",
|
| 825 |
"impact_type": "risk",
|
| 826 |
"confidence": 0.85,
|
|
|
|
| 840 |
"domain": "anomaly_detection",
|
| 841 |
"category": "anomaly",
|
| 842 |
"summary": f"Anomaly detected (score: {anomaly.get('anomaly_score', 0):.2f})",
|
| 843 |
+
"timestamp": datetime.now(timezone.utc).isoformat(),
|
| 844 |
"severity": (
|
| 845 |
"high"
|
| 846 |
if anomaly.get("anomaly_score", 0) > 0.7
|
|
|
|
| 863 |
"domain": "anomaly_detection",
|
| 864 |
"category": "system_info",
|
| 865 |
"summary": "ML model not trained yet - using severity-based fallback",
|
| 866 |
+
"timestamp": datetime.now(timezone.utc).isoformat(),
|
| 867 |
"severity": "low",
|
| 868 |
"impact_type": "info",
|
| 869 |
"confidence": 1.0,
|
|
|
|
| 878 |
"domain": "vectorization",
|
| 879 |
"category": "opportunity",
|
| 880 |
"summary": opp.get("description", "Opportunity detected"),
|
| 881 |
+
"timestamp": datetime.now(timezone.utc).isoformat(),
|
| 882 |
"severity": "medium",
|
| 883 |
"impact_type": "opportunity",
|
| 884 |
"confidence": opp.get("confidence", 0.7),
|
|
|
|
| 893 |
"domain": "vectorization",
|
| 894 |
"category": "threat",
|
| 895 |
"summary": threat.get("description", "Threat detected"),
|
| 896 |
+
"timestamp": datetime.now(timezone.utc).isoformat(),
|
| 897 |
"severity": "high",
|
| 898 |
"impact_type": "risk",
|
| 899 |
"confidence": threat.get("confidence", 0.7),
|
|
|
|
| 903 |
# Final output
|
| 904 |
final_output = {
|
| 905 |
"batch_id": batch_id,
|
| 906 |
+
"timestamp": datetime.now(timezone.utc).isoformat(),
|
| 907 |
"total_texts": len(embeddings),
|
| 908 |
"processing_stats": processing_stats,
|
| 909 |
"expert_summary": expert_summary,
|
src/utils/trending_detector.py
CHANGED
|
@@ -15,7 +15,7 @@ import json
|
|
| 15 |
import sqlite3
|
| 16 |
import hashlib
|
| 17 |
import logging
|
| 18 |
-
from datetime import datetime, timedelta
|
| 19 |
from typing import List, Dict, Any, Optional, Tuple
|
| 20 |
from pathlib import Path
|
| 21 |
|
|
@@ -110,7 +110,7 @@ class TrendingDetector:
|
|
| 110 |
|
| 111 |
def _get_hour_bucket(self, dt: datetime = None) -> str:
|
| 112 |
"""Get the hour bucket string (YYYY-MM-DD-HH)"""
|
| 113 |
-
dt = dt or datetime.utcnow()
|
| 114 |
return dt.strftime("%Y-%m-%d-%H")
|
| 115 |
|
| 116 |
def record_mention(
|
|
@@ -130,7 +130,7 @@ class TrendingDetector:
|
|
| 130 |
timestamp: When the mention occurred (default: now)
|
| 131 |
"""
|
| 132 |
topic_hash = self._topic_hash(topic)
|
| 133 |
-
ts = timestamp or datetime.utcnow()
|
| 134 |
hour_bucket = self._get_hour_bucket(ts)
|
| 135 |
|
| 136 |
with sqlite3.connect(self.db_path) as conn:
|
|
@@ -180,7 +180,7 @@ class TrendingDetector:
|
|
| 180 |
Momentum value (1.0 = normal, >2.0 = trending, >3.0 = spike)
|
| 181 |
"""
|
| 182 |
topic_hash = self._topic_hash(topic)
|
| 183 |
-
now = datetime.utcnow()
|
| 184 |
current_hour = self._get_hour_bucket(now)
|
| 185 |
|
| 186 |
with sqlite3.connect(self.db_path) as conn:
|
|
@@ -230,7 +230,7 @@ class TrendingDetector:
|
|
| 230 |
Returns:
|
| 231 |
List of trending topics with their momentum values
|
| 232 |
"""
|
| 233 |
-
now = datetime.utcnow()
|
| 234 |
current_hour = self._get_hour_bucket(now)
|
| 235 |
|
| 236 |
trending = []
|
|
@@ -291,7 +291,7 @@ class TrendingDetector:
|
|
| 291 |
List of hourly counts
|
| 292 |
"""
|
| 293 |
topic_hash = self._topic_hash(topic)
|
| 294 |
-
now = datetime.utcnow()
|
| 295 |
|
| 296 |
history = []
|
| 297 |
with sqlite3.connect(self.db_path) as conn:
|
|
@@ -320,7 +320,7 @@ class TrendingDetector:
|
|
| 320 |
Args:
|
| 321 |
days: Number of days to keep
|
| 322 |
"""
|
| 323 |
-
cutoff = datetime.utcnow() - timedelta(days=days)
|
| 324 |
cutoff_str = cutoff.isoformat()
|
| 325 |
cutoff_bucket = self._get_hour_bucket(cutoff)
|
| 326 |
|
|
|
|
| 15 |
import sqlite3
|
| 16 |
import hashlib
|
| 17 |
import logging
|
| 18 |
+
from datetime import datetime, timedelta, timezone
|
| 19 |
from typing import List, Dict, Any, Optional, Tuple
|
| 20 |
from pathlib import Path
|
| 21 |
|
|
|
|
| 110 |
|
| 111 |
def _get_hour_bucket(self, dt: datetime = None) -> str:
|
| 112 |
"""Get the hour bucket string (YYYY-MM-DD-HH)"""
|
| 113 |
+
dt = dt or datetime.now(timezone.utc)
|
| 114 |
return dt.strftime("%Y-%m-%d-%H")
|
| 115 |
|
| 116 |
def record_mention(
|
|
|
|
| 130 |
timestamp: When the mention occurred (default: now)
|
| 131 |
"""
|
| 132 |
topic_hash = self._topic_hash(topic)
|
| 133 |
+
ts = timestamp or datetime.now(timezone.utc)
|
| 134 |
hour_bucket = self._get_hour_bucket(ts)
|
| 135 |
|
| 136 |
with sqlite3.connect(self.db_path) as conn:
|
|
|
|
| 180 |
Momentum value (1.0 = normal, >2.0 = trending, >3.0 = spike)
|
| 181 |
"""
|
| 182 |
topic_hash = self._topic_hash(topic)
|
| 183 |
+
now = datetime.now(timezone.utc)
|
| 184 |
current_hour = self._get_hour_bucket(now)
|
| 185 |
|
| 186 |
with sqlite3.connect(self.db_path) as conn:
|
|
|
|
| 230 |
Returns:
|
| 231 |
List of trending topics with their momentum values
|
| 232 |
"""
|
| 233 |
+
now = datetime.now(timezone.utc)
|
| 234 |
current_hour = self._get_hour_bucket(now)
|
| 235 |
|
| 236 |
trending = []
|
|
|
|
| 291 |
List of hourly counts
|
| 292 |
"""
|
| 293 |
topic_hash = self._topic_hash(topic)
|
| 294 |
+
now = datetime.now(timezone.utc)
|
| 295 |
|
| 296 |
history = []
|
| 297 |
with sqlite3.connect(self.db_path) as conn:
|
|
|
|
| 320 |
Args:
|
| 321 |
days: Number of days to keep
|
| 322 |
"""
|
| 323 |
+
cutoff = datetime.now(timezone.utc) - timedelta(days=days)
|
| 324 |
cutoff_str = cutoff.isoformat()
|
| 325 |
cutoff_bucket = self._get_hour_bucket(cutoff)
|
| 326 |
|
vectorizer_anomaly_visualization.png
CHANGED
|
Git LFS Details
|
|
Git LFS Details
|