zenith-backend / core /diagnostics /security_scanner.py
teoat's picture
Upload folder using huggingface_hub
4ae946d verified
#!/usr/bin/env python3
"""
Advanced Security Scanner
Comprehensive security vulnerability assessment and compliance monitoring
"""
import asyncio
import logging
import os
import re
from dataclasses import asdict, dataclass
from datetime import datetime
from pathlib import Path
from typing import Any, Dict, List, Optional
from core.infrastructure.registry import kernel_registry
logger = logging.getLogger(__name__)
@dataclass
class SecurityVulnerability:
    """One finding reported by a security scan."""

    severity: str  # critical, high, medium, low, info
    category: str  # authentication, authorization, injection, xss, config, dependency
    title: str
    description: str
    affected_component: str
    cve_id: Optional[str]
    recommendation: str
    cvss_score: Optional[float]
    discovered_at: datetime

    def to_dict(self) -> Dict[str, Any]:
        """Return the fields as a plain dict with ``discovered_at`` as an ISO-8601 string."""
        # asdict() yields the raw datetime; override just that key so the
        # result can be passed straight to a JSON encoder.
        return {**asdict(self), "discovered_at": self.discovered_at.isoformat()}
@dataclass
class ComplianceStatus:
    """Result of assessing a single compliance standard."""

    standard: str  # pci_dss, gdpr, soc2, hipaa
    status: str  # compliant, partial, non_compliant
    score: float  # 0-100
    findings: List[str]
    last_assessed: datetime

    def to_dict(self) -> Dict[str, Any]:
        """Return the fields as a plain dict with ``last_assessed`` as an ISO-8601 string."""
        serialized = asdict(self)
        # Swap the datetime for its string form so the dict is JSON-friendly.
        serialized.update(last_assessed=self.last_assessed.isoformat())
        return serialized
class AdvancedSecurityScanner:
    """Security scanner that runs vulnerability scans and compliance assessments."""

    def __init__(self):
        """Record the creation time and set up empty result holders and the policy baseline."""
        self.start_time = datetime.now()
        self.vulnerabilities = []
        self.compliance_status = {}

        # Each policy group is built separately, then assembled below in the
        # same key order: password, session, api, encryption.
        password_policy = {
            "min_length": 12,
            "require_uppercase": True,
            "require_lowercase": True,
            "require_numbers": True,
            "require_symbols": True,
            "max_age_days": 90,
        }
        session_policy = {
            "timeout_minutes": 30,
            "max_concurrent_sessions": 3,
            "require_reauth": True,
        }
        api_policy = {
            "rate_limit_per_minute": 100,
            "require_https": True,
            "cors_restricted": True,
            "input_validation": True,
        }
        encryption_policy = {
            "min_key_length": 256,
            "algorithm": "AES-256-GCM",
            "key_rotation_days": 90,
        }

        # Security policies and configurations
        self.security_policies = {
            "password_policy": password_policy,
            "session_policy": session_policy,
            "api_policy": api_policy,
            "encryption_policy": encryption_policy,
        }
async def scan_authentication_security(self) -> List[SecurityVulnerability]:
    """Scan authentication mechanisms for vulnerabilities.

    Runs four independent checks; a skip or failure in one does not prevent
    the others from running:

    1. Password hashing: hashes a fixed probe password through
       ``kernel_registry.auth_service`` and looks for a bcrypt or Argon2
       marker in the result. Skipped (with a warning) when no auth service
       is registered.
    2. ``JWT_SECRET`` must be at least 32 characters long.
    3. ``JWT_ACCESS_TOKEN_EXPIRE_MINUTES`` (default ``"60"``) must not
       exceed 120; a non-integer value is logged and the check is skipped.
    4. ``DEFAULT_USERNAME`` must not be one of a few well-known default names.

    Returns:
        The findings in check order; empty when nothing was flagged.
    """
    vulnerabilities: List[SecurityVulnerability] = []
    current_time = datetime.now()

    # --- 1. Password hashing -------------------------------------------------
    # bcrypt hashes are identified by a "$2a$"/"$2b$"/"$2x$"/"$2y$" prefix and
    # normally do not contain the word "bcrypt", so the prefixes have to be
    # accepted alongside the algorithm names.
    strong_hash_markers = ("bcrypt", "argon2", "$2a$", "$2b$", "$2x$", "$2y$")
    try:
        auth_service = kernel_registry.auth_service
        if not auth_service:
            logger.warning("Auth service not registered in kernel. Skipping password hashing check.")
        else:
            # str() so that a bytes hash is inspected via its repr; substring
            # matching (not startswith) keeps that case working.
            hashed_password = str(auth_service.hash_password("TestPassword123!")).lower()
            if not any(marker in hashed_password for marker in strong_hash_markers):
                vulnerabilities.append(
                    SecurityVulnerability(
                        severity="high",
                        category="authentication",
                        title="Weak Password Hashing",
                        description="Password hashing algorithm may not meet security standards",
                        affected_component="auth_service",
                        cve_id=None,
                        recommendation="Implement bcrypt or Argon2 for password hashing",
                        cvss_score=7.5,
                        discovered_at=current_time,
                    )
                )
    except Exception:
        # The auth service lives outside this module; keep the scan
        # best-effort, but leave a trace instead of failing silently.
        logger.warning("Password hashing check failed", exc_info=True)

    # --- 2. JWT secret length ------------------------------------------------
    jwt_secret = os.getenv("JWT_SECRET", "")
    if len(jwt_secret) < 32:
        vulnerabilities.append(
            SecurityVulnerability(
                severity="critical",
                category="authentication",
                title="Weak JWT Secret",
                description="JWT secret is shorter than recommended minimum",
                affected_component="JWT configuration",
                cve_id=None,
                recommendation="Use JWT secret of at least 32 characters with high entropy",
                cvss_score=8.5,
                discovered_at=current_time,
            )
        )

    # --- 3. JWT token expiration --------------------------------------------
    raw_expiry = os.getenv("JWT_ACCESS_TOKEN_EXPIRE_MINUTES", "60")
    try:
        jwt_exp_minutes: Optional[int] = int(raw_expiry)
    except ValueError:
        logger.warning(
            "JWT_ACCESS_TOKEN_EXPIRE_MINUTES=%r is not an integer; skipping expiration check",
            raw_expiry,
        )
        jwt_exp_minutes = None
    if jwt_exp_minutes is not None and jwt_exp_minutes > 120:  # More than 2 hours
        vulnerabilities.append(
            SecurityVulnerability(
                severity="medium",
                category="authentication",
                title="Long JWT Token Expiration",
                description="JWT tokens have excessive expiration time",
                affected_component="JWT configuration",
                cve_id=None,
                recommendation="Reduce JWT token expiration to maximum 2 hours",
                cvss_score=5.5,
                discovered_at=current_time,
            )
        )

    # --- 4. Default credentials ---------------------------------------------
    # Only the username is available from the environment, so only the
    # username is compared.
    default_usernames = {"admin", "root", "user", "test"}
    if os.getenv("DEFAULT_USERNAME") in default_usernames:
        vulnerabilities.append(
            SecurityVulnerability(
                severity="critical",
                category="authentication",
                title="Default Credentials in Use",
                description="Default username is being used in production",
                affected_component="authentication",
                # NOTE(review): this id looks like a placeholder — confirm it,
                # or replace it with a CWE reference for default credentials.
                cve_id="CVE-2021-12345",
                recommendation="Change default credentials immediately",
                cvss_score=9.0,
                discovered_at=current_time,
            )
        )

    return vulnerabilities
async def scan_authorization_security(self) -> List[SecurityVulnerability]:
    """Check access-control configuration taken from the environment.

    Flags a disabled ``RBAC_ENABLED`` switch and every environment variable
    whose name ends in ``_KEY`` or ``_SECRET`` and whose value is shorter
    than 20 characters or is one of a few placeholder words.

    Returns:
        The findings; empty when nothing was flagged.
    """
    found = []
    scan_time = datetime.now()

    # Role-based access control: anything other than "true" counts as disabled.
    try:
        rbac_on = os.getenv("RBAC_ENABLED", "true").lower() == "true"
        if not rbac_on:
            found.append(
                SecurityVulnerability(
                    severity="high",
                    category="authorization",
                    title="Role-Based Access Control Disabled",
                    description="RBAC is not enabled, potentially exposing sensitive operations",
                    affected_component="authorization system",
                    cve_id=None,
                    recommendation="Enable and properly configure role-based access control",
                    cvss_score=7.0,
                    discovered_at=scan_time,
                )
            )
    except Exception:
        pass

    # Secret-like environment variables.
    placeholder_values = ("secret", "key", "password", "test")
    for name in list(os.environ):
        if not name.endswith(("_KEY", "_SECRET")):
            continue
        secret_value = os.getenv(name, "")
        too_short = len(secret_value) < 20
        if too_short or secret_value.lower() in placeholder_values:
            found.append(
                SecurityVulnerability(
                    severity="critical",
                    category="authorization",
                    title=f"Weak {name} Value",
                    description=f"Environment variable {name} has insufficient entropy",
                    affected_component="environment configuration",
                    cve_id=None,
                    recommendation=f"Use cryptographically secure random values for {name}",
                    cvss_score=8.0,
                    discovered_at=scan_time,
                )
            )

    return found
async def scan_input_validation_security(self) -> List[SecurityVulnerability]:
    """Scan for input validation and injection vulnerabilities.

    Three checks are performed:

    1. Up to 50 ``*.py`` files under ``<root>/backend`` are searched for
       regex patterns that suggest string-built SQL; at most one finding is
       reported per file.
    2. A finding is raised when no environment variable value mentions
       ``content-security-policy``.
    3. A finding is raised when ``SCAN_UPLOADS`` is set to anything other
       than ``"true"`` (case-insensitive; unset counts as ``"true"``).

    ``<root>`` is taken from the ``SECURITY_SCAN_ROOT`` environment variable
    and falls back to the path that used to be hard-coded here.

    Returns:
        The findings; empty when nothing was flagged.
    """
    vulnerabilities: List[SecurityVulnerability] = []
    current_time = datetime.now()

    project_root = Path(os.getenv("SECURITY_SCAN_ROOT", "/Users/Arief/Desktop/378x492"))
    backend_dir = project_root / "backend"

    # --- 1. SQL injection patterns ------------------------------------------
    sql_injection_patterns = [
        re.compile(pattern, re.IGNORECASE)
        for pattern in (
            r"SELECT.*\+.*%s",  # String concatenation in SQL
            r"execute\s*\(\s*['\"][^'\"]*%s[^'\"]*['\"]",  # Unsafe execute
            r"format\s*\(\s*['\"][^'\"]*\{\}[^'\"]*['\"]",  # Unsafe format
        )
    ]
    max_files = 50  # Limit the number of files read, for performance
    try:
        for index, py_file in enumerate(backend_dir.rglob("*.py")):
            if index >= max_files:
                break
            try:
                content = py_file.read_text(encoding="utf-8")
            except (OSError, UnicodeDecodeError) as exc:
                logger.debug("Skipping unreadable file %s: %s", py_file, exc)
                continue
            if any(pattern.search(content) for pattern in sql_injection_patterns):
                vulnerabilities.append(
                    SecurityVulnerability(
                        severity="high",
                        category="injection",
                        title="Potential SQL Injection",
                        description=f"SQL injection vulnerability pattern detected in {py_file.name}",
                        affected_component=str(py_file),
                        cve_id="CWE-89",
                        recommendation="Use parameterized queries and proper input validation",
                        cvss_score=8.5,
                        discovered_at=current_time,
                    )
                )
    except OSError as exc:
        # Directory traversal itself failed (e.g. permissions); keep the
        # remaining checks running.
        logger.warning("Could not walk %s for SQL injection scan: %s", backend_dir, exc)

    # --- 2. Content Security Policy -----------------------------------------
    csp_configured = any("content-security-policy" in value.lower() for value in os.environ.values())
    if not csp_configured:
        vulnerabilities.append(
            SecurityVulnerability(
                severity="medium",
                category="xss",
                title="Missing Content Security Policy",
                description="CSP header not configured to prevent XSS attacks",
                affected_component="security headers",
                cve_id=None,
                recommendation="Implement Content Security Policy header",
                cvss_score=5.5,
                discovered_at=current_time,
            )
        )

    # --- 3. File upload scanning --------------------------------------------
    # The flag is a real boolean; it used to be compared with the string
    # "False", which could never be equal, so this finding was unreachable.
    scan_uploads = os.getenv("SCAN_UPLOADS", "true").lower() == "true"
    if not scan_uploads:
        vulnerabilities.append(
            SecurityVulnerability(
                severity="medium",
                category="authorization",
                title="File Upload Scanning Disabled",
                description="Malicious file scanning is not enabled for uploads",
                affected_component="file upload system",
                cve_id="CWE-434",
                recommendation="Enable virus scanning for all file uploads",
                cvss_score=6.5,
                discovered_at=current_time,
            )
        )

    return vulnerabilities
async def scan_configuration_security(self) -> List[SecurityVulnerability]:
    """Scan configuration files and settings for security issues.

    Three checks are performed relative to the project root:

    1. A fixed list of configuration files is searched for credential-like
       assignments and for references to ``.env``; at most one finding is
       reported per file (the first matching pattern wins).
    2. A fixed list of sensitive files is flagged when the "others can read"
       permission bit is set.
    3. ``DEBUG=true`` together with ``ENVIRONMENT=production`` is flagged.

    The project root is taken from the ``SECURITY_SCAN_ROOT`` environment
    variable and falls back to the path that used to be hard-coded here.

    Returns:
        The findings; empty when nothing was flagged.
    """
    vulnerabilities: List[SecurityVulnerability] = []
    current_time = datetime.now()
    project_root = Path(os.getenv("SECURITY_SCAN_ROOT", "/Users/Arief/Desktop/378x492"))

    # --- 1. Sensitive data in configuration files ----------------------------
    sensitive_patterns = [
        (r"password\s*=\s*['\"][^'\"]{8,}['\"]", "weak_password"),
        (r"secret\s*=\s*['\"][^'\"]{20,}['\"]", "weak_secret"),
        (r"key\s*=\s*['\"][^'\"]{20,}['\"]", "weak_key"),
        (r"token\s*=\s*['\"][^'\"]{20,}['\"]", "weak_token"),
        (r"\.env", "environment_file_exposed"),
    ]
    config_files = [
        ".env",
        "config.py",
        "settings.py",
        "docker-compose.yml",
        "kubernetes.yaml",
    ]
    for config_file in config_files:
        config_path = project_root / config_file
        if not config_path.exists():
            continue
        try:
            content = config_path.read_text(encoding="utf-8")
        except (OSError, UnicodeDecodeError) as exc:
            logger.warning("Could not read %s for configuration scan: %s", config_path, exc)
            continue

        for pattern, issue_type in sensitive_patterns:
            if not re.search(pattern, content, re.IGNORECASE):
                continue
            if issue_type == "environment_file_exposed":
                severity = "high"
                title = "Potentially Exposed Environment File"
                description = f"Environment file {config_file} may be publicly accessible"
            else:
                severity = "critical"
                title = f"Weak {issue_type.replace('_', ' ').title()} in Configuration"
                description = f"Weak credential pattern found in {config_file}"
            vulnerabilities.append(
                SecurityVulnerability(
                    severity=severity,
                    category="config",
                    title=title,
                    description=description,
                    affected_component=str(config_path),
                    cve_id=None,
                    recommendation="Use strong, randomly generated secrets and proper file permissions",
                    cvss_score=(8.0 if severity == "critical" else 6.5),
                    discovered_at=current_time,
                )
            )
            break  # one finding per file is enough

    # --- 2. File permissions --------------------------------------------------
    sensitive_files = [".env", "config/secrets.yaml", "ssl/cert.pem", "ssl/key.pem"]
    for sensitive_file in sensitive_files:
        file_path = project_root / sensitive_file
        if not file_path.exists():
            continue
        try:
            mode = file_path.stat().st_mode
        except OSError as exc:
            logger.warning("Could not stat %s for permission check: %s", file_path, exc)
            continue
        if mode & 0o004:  # Others can read
            vulnerabilities.append(
                SecurityVulnerability(
                    severity="high",
                    category="config",
                    title=f"Insecure File Permissions: {sensitive_file}",
                    description=f"Sensitive file {sensitive_file} is readable by other users",
                    affected_component=str(file_path),
                    cve_id="CWE-732",
                    recommendation="Restrict file permissions to owner and group only (chmod 600)",
                    cvss_score=7.5,
                    discovered_at=current_time,
                )
            )

    # --- 3. Debug mode in production -----------------------------------------
    debug_enabled = os.getenv("DEBUG", "false").lower() == "true"
    in_production = os.getenv("ENVIRONMENT", "development").lower() == "production"
    if debug_enabled and in_production:
        vulnerabilities.append(
            SecurityVulnerability(
                severity="critical",
                category="config",
                title="Debug Mode in Production",
                description="Application is running in debug mode in production environment",
                affected_component="application configuration",
                cve_id=None,
                recommendation="Disable debug mode in production environment",
                cvss_score=9.0,
                discovered_at=current_time,
            )
        )

    return vulnerabilities
async def scan_dependency_vulnerabilities(self) -> List[SecurityVulnerability]:
    """Scan dependencies for known vulnerabilities.

    Two heuristic checks are performed relative to the project root:

    1. Every requirement in ``requirements.txt`` that carries a version
       specifier and names a package from a small built-in watch list is
       reported. The version is NOT compared with the constraint in the
       watch list — it is only echoed in the description — so a finding
       means "review this", not "confirmed vulnerable".
    2. Each known lock file is flagged when its text contains
       ``vulnerable`` or ``cve-`` (case-insensitive).

    The project root is taken from the ``SECURITY_SCAN_ROOT`` environment
    variable and falls back to the path that used to be hard-coded here.

    Returns:
        The findings; empty when nothing was flagged.
    """
    vulnerabilities: List[SecurityVulnerability] = []
    current_time = datetime.now()
    project_root = Path(os.getenv("SECURITY_SCAN_ROOT", "/Users/Arief/Desktop/378x492"))

    # Simplified watch list; a real implementation would query a
    # vulnerability database (e.g. via safety or snyk).
    vulnerable_packages = {
        "django": {"<3.2.0": "CVE-2023-43664"},
        "requests": {"<2.25.0": "CVE-2023-32681"},
        "urllib3": {"<1.26.0": "CVE-2023-45803"},
        "cryptography": {"<3.4.8": "CVE-2023-3817"},
    }

    # name, optional [extras], then the rest of the line (specifiers/markers).
    requirement_re = re.compile(r"^([A-Za-z0-9][A-Za-z0-9._-]*)\s*(?:\[[^\]]*\])?\s*(.*)$")
    # First version after a comparison operator. Multi-character operators
    # come first so "==" is not read as "=" followed by an empty version.
    version_re = re.compile(r"(?:===|==|~=|!=|<=|>=|<|>)\s*([^\s,;#]+)")

    # --- 1. requirements.txt --------------------------------------------------
    requirements_path = project_root / "requirements.txt"
    if requirements_path.exists():
        try:
            requirement_lines = requirements_path.read_text(encoding="utf-8").splitlines()
        except (OSError, UnicodeDecodeError) as exc:
            logger.warning("Could not read %s: %s", requirements_path, exc)
            requirement_lines = []

        for raw_line in requirement_lines:
            line = raw_line.strip()
            if not line or line.startswith("#"):
                continue
            parsed = requirement_re.match(line)
            if parsed is None:
                continue  # options such as "-r other.txt" or "--index-url ..."
            package_name, remainder = parsed.group(1), parsed.group(2)

            # Drop environment markers and inline comments before looking
            # for the version specifier.
            specifier = re.split(r"[;#]", remainder, maxsplit=1)[0]
            version_match = version_re.search(specifier)
            if version_match is None:
                continue  # requirements without a version specifier are not reported
            version_part = version_match.group(1)

            advisories = vulnerable_packages.get(package_name.lower())
            if not advisories:
                continue
            for cve_id in advisories.values():
                vulnerabilities.append(
                    SecurityVulnerability(
                        severity="high",
                        category="dependency",
                        title=f"Vulnerable Dependency: {package_name}",
                        description=f"{package_name} {version_part} may be vulnerable to {cve_id}",
                        affected_component=package_name,
                        cve_id=cve_id,
                        recommendation=f"Update {package_name} to a secure version",
                        cvss_score=7.5,
                        discovered_at=current_time,
                    )
                )

    # --- 2. Lock files -------------------------------------------------------
    package_locks = ["package-lock.json", "poetry.lock", "Pipfile.lock"]
    for lock_file in package_locks:
        lock_path = project_root / lock_file
        if not lock_path.exists():
            continue
        try:
            lock_content = lock_path.read_text(encoding="utf-8").lower()
        except (OSError, UnicodeDecodeError) as exc:
            logger.warning("Could not read %s: %s", lock_path, exc)
            continue
        # Check for known vulnerabilities in lock file (simplified)
        if "vulnerable" in lock_content or "cve-" in lock_content:
            vulnerabilities.append(
                SecurityVulnerability(
                    severity="medium",
                    category="dependency",
                    title=f"Potential Vulnerability in {lock_file}",
                    description="Lock file may contain vulnerable packages",
                    affected_component=lock_file,
                    cve_id=None,
                    recommendation="Update dependencies and regenerate lock file",
                    cvss_score=6.0,
                    discovered_at=current_time,
                )
            )

    return vulnerabilities
async def assess_compliance(self, standard: str) -> ComplianceStatus:
    """Score the current configuration against one compliance standard.

    Supported standards (matched case-insensitively) are ``pci_dss``,
    ``gdpr`` and ``soc2``. Each starts at 100 points and loses a fixed
    penalty for every failed check. 90 or more is ``compliant``, 70 or
    more is ``partial``, anything lower is ``non_compliant``.

    Args:
        standard: Name of the standard; echoed unchanged in the result.

    Returns:
        The assessment, or a ``not_assessed`` status with score 0.0 when
        the standard is not supported.
    """
    assessed_at = datetime.now()

    # Each entry: (callable returning True when the check FAILS, finding text, penalty).
    # Callables are evaluated lazily and in order, one standard at a time.
    checklists = {
        "pci_dss": (
            # Requirement 3: Protect cardholder data
            (lambda: not os.getenv("ENCRYPTION_KEY"), "Missing encryption for cardholder data", 20),
            # Requirement 4: Strong access control
            (
                lambda: os.getenv("RBAC_ENABLED", "true").lower() != "true",
                "Insufficient access control measures",
                15,
            ),
            # Requirement 6: Regular testing
            (lambda: not self._has_security_testing(), "No evidence of regular security testing", 10),
            # Requirement 7: Secure network
            (
                lambda: os.getenv("ENVIRONMENT", "development").lower() == "production"
                and os.getenv("DEBUG", "false").lower() == "true",
                "Debug mode enabled in production",
                25,
            ),
        ),
        "gdpr": (
            # Data protection
            (lambda: not os.getenv("ENCRYPTION_KEY"), "Insufficient data protection measures", 20),
            # Right to be forgotten
            (
                lambda: not self._has_data_deletion_capability(),
                "No data deletion mechanism for GDPR right to be forgotten",
                15,
            ),
            # Consent management
            (lambda: not self._has_consent_management(), "No consent management system", 10),
            # Data breach notification
            (lambda: not self._has_breach_notification(), "No breach notification system", 15),
        ),
        "soc2": (
            # Security controls
            (lambda: not self._has_monitoring(), "Insufficient security monitoring", 20),
            # Incident response
            (lambda: not self._has_incident_response(), "No incident response procedure", 15),
            # Change management
            (lambda: not self._has_change_management(), "No formal change management process", 10),
            # Data classification
            (lambda: not self._has_data_classification(), "No data classification system", 10),
        ),
    }

    checklist = checklists.get(standard.lower())
    if checklist is None:
        return ComplianceStatus(
            standard=standard,
            status="not_assessed",
            score=0.0,
            findings=["Standard not supported for assessment"],
            last_assessed=assessed_at,
        )

    score = 100.0
    problems = []
    for check_failed, message, penalty in checklist:
        if check_failed():
            problems.append(message)
            score -= penalty

    if score >= 90:
        status = "compliant"
    elif score >= 70:
        status = "partial"
    else:
        status = "non_compliant"

    return ComplianceStatus(
        standard=standard,
        status=status,
        score=score,
        findings=problems,
        last_assessed=assessed_at,
    )
def _has_security_testing(self) -> bool:
"""Check if security testing is configured"""
# Look for security testing configurations
security_tools = ["safety", "bandit", "semgrep", "snyk"]
return any(tool in os.getenv("SECURITY_TOOLS", "") for tool in security_tools)
def _has_data_deletion_capability(self) -> bool:
"""Check if data deletion mechanisms exist"""
# Look for user data deletion endpoints/services
return os.getenv("DATA_RETENTION_ENABLED", "true").lower() == "true"
def _has_consent_management(self) -> bool:
"""Check if consent management is available"""
return os.getenv("CONSENT_MANAGEMENT", "false").lower() == "true"
def _has_breach_notification(self) -> bool:
"""Check if breach notification is configured"""
return os.getenv("BREACH_NOTIFICATION_ENABLED", "false").lower() == "true"
def _has_monitoring(self) -> bool:
"""Check if security monitoring is enabled"""
return os.getenv("SECURITY_MONITORING", "true").lower() == "true"
def _has_incident_response(self) -> bool:
"""Check if incident response is configured"""
return os.getenv("INCIDENT_RESPONSE", "false").lower() == "true"
def _has_change_management(self) -> bool:
"""Check if change management process exists"""
return os.getenv("CHANGE_MANAGEMENT", "false").lower() == "true"
def _has_data_classification(self) -> bool:
"""Check if data classification system exists"""
return os.getenv("DATA_CLASSIFICATION", "false").lower() == "true"
async def generate_comprehensive_security_report(self) -> Dict[str, Any]:
    """Run every scan and compliance assessment and fold the results into one report.

    Returns:
        A dict with the keys ``security_score``, ``risk_level``,
        ``scan_timestamp``, ``summary``, ``vulnerabilities_by_category``,
        ``compliance_assessment``, ``recommendations`` and ``next_steps``.
    """
    report_time = datetime.now()

    # Start the five scans together; a scan that raises comes back as an
    # exception object instead of aborting the whole report.
    scan_coroutines = [
        self.scan_authentication_security(),
        self.scan_authorization_security(),
        self.scan_input_validation_security(),
        self.scan_configuration_security(),
        self.scan_dependency_vulnerabilities(),
    ]
    outcomes = await asyncio.gather(*scan_coroutines, return_exceptions=True)

    findings = []
    for module_index, outcome in enumerate(outcomes):
        if not isinstance(outcome, Exception):
            findings.extend(outcome)
            continue
        # A failed scan module is itself recorded as a medium finding.
        findings.append(
            SecurityVulnerability(
                severity="medium",
                category="scan_error",
                title=f"Security Scan Error {module_index}",
                description=f"Security scanning module {module_index} failed: {str(outcome)}",
                affected_component="security_scanner",
                cve_id=None,
                recommendation="Fix scanning configuration and retry",
                cvss_score=5.0,
                discovered_at=report_time,
            )
        )

    # Compliance is assessed one standard at a time, in this order.
    compliance_results = {}
    for standard in ("pci_dss", "gdpr", "soc2"):
        compliance_results[standard] = await self.assess_compliance(standard)

    def count_with_severity(level):
        return sum(1 for finding in findings if finding.severity == level)

    critical_count = count_with_severity("critical")
    high_count = count_with_severity("high")
    medium_count = count_with_severity("medium")
    low_count = count_with_severity("low")

    # Weighted score: start from 100 and subtract a penalty per finding,
    # then clamp into the 0-100 range.
    base_score = 100.0
    for occurrences, weight in (
        (critical_count, 25),
        (high_count, 15),
        (medium_count, 8),
        (low_count, 3),
    ):
        base_score -= occurrences * weight
    security_score = max(0, min(100, base_score))

    # The first rule that triggers decides the overall risk level.
    risk_rules = (
        (critical_count > 0, "critical"),
        (high_count > 2, "high"),
        (high_count > 0 or medium_count > 3, "medium"),
        (medium_count > 0 or low_count > 5, "low"),
    )
    risk_level = next((label for triggered, label in risk_rules if triggered), "minimal")

    # Severity-driven advice first, then one line per affected category.
    recommendations = []
    if critical_count > 0:
        recommendations.append("CRITICAL: Address all critical vulnerabilities immediately")
    if high_count > 0:
        recommendations.append("HIGH: Prioritize high-severity vulnerabilities within 30 days")
    category_advice = (
        ("authentication", "Strengthen authentication mechanisms with MFA"),
        ("authorization", "Review and tighten access controls"),
        ("injection", "Implement comprehensive input validation and parameterized queries"),
        ("config", "Secure configuration files and environment variables"),
        ("dependency", "Update all vulnerable dependencies immediately"),
    )
    for needle, advice in category_advice:
        if any(needle in finding.category for finding in findings):
            recommendations.append(advice)

    # Report key -> category value stored on the findings.
    report_categories = (
        ("authentication", "authentication"),
        ("authorization", "authorization"),
        ("injection", "injection"),
        ("xss", "xss"),
        ("configuration", "config"),
        ("dependency", "dependency"),
        ("network", "network"),
        ("scan_error", "scan_error"),
    )
    vulnerabilities_by_category = {
        report_key: [finding.to_dict() for finding in findings if finding.category == category]
        for report_key, category in report_categories
    }

    summary = {
        "total_vulnerabilities": len(findings),
        "critical": critical_count,
        "high": high_count,
        "medium": medium_count,
        "low": low_count,
        "scan_modules_executed": len(scan_coroutines),
        "scan_errors": sum(1 for outcome in outcomes if isinstance(outcome, Exception)),
    }

    return {
        "security_score": security_score,
        "risk_level": risk_level,
        "scan_timestamp": report_time.isoformat(),
        "summary": summary,
        "vulnerabilities_by_category": vulnerabilities_by_category,
        "compliance_assessment": {name: result.to_dict() for name, result in compliance_results.items()},
        "recommendations": recommendations,
        "next_steps": [
            "1. Address critical and high vulnerabilities immediately",
            "2. Implement automated security scanning in CI/CD pipeline",
            "3. Schedule regular penetration testing",
            "4. Establish security incident response procedures",
            "5. Monitor for new vulnerabilities regularly",
        ],
    }
# Global security scanner instance, created when this module is imported.
# Construction only initialises in-memory state (timestamp, empty result
# holders, policy baseline); no scan runs until a scan method is awaited.
security_scanner = AdvancedSecurityScanner()