kd7979148
/

XSS_Payload_Detector

@@ -23,7 +23,7 @@ from transformers import (
 )
 #################################################
-# 설정
 #################################################
 LOG_FILE = "access.log"
@@ -35,7 +35,7 @@ MAX_INPUT_LENGTH = 2000
 CHECK_INTERVAL = 0.2
 #################################################
-# SQLite 초기화
 #################################################
 conn = sqlite3.connect("xss_detection.db")
@@ -64,10 +64,10 @@ CREATE TABLE IF NOT EXISTS detections (
 conn.commit()
 #################################################
-# 모델 로드
 #################################################
-print("[+] 모델 로드 중...")
 tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
@@ -79,10 +79,10 @@ model.to(device)
 model.eval()
-print("[+] 모델 로드 완료")
 #################################################
-# 라벨
 #################################################
 labels = {
@@ -91,7 +91,7 @@ labels = {
 }
 #################################################
-# URL 여부
 #################################################
 def is_url(text):
@@ -103,7 +103,7 @@ def is_url(text):
     )
 #################################################
-# Unicode 정규화
 #################################################
 def normalize_unicode(text):
@@ -111,7 +111,7 @@ def normalize_unicode(text):
     return unicodedata.normalize("NFKC", text)
 #################################################
-# URL payload 추출
 #################################################
 def extract_url_payload(url):
@@ -127,7 +127,7 @@ def extract_url_payload(url):
         extracted = []
         #################################################
-        # parameter value 추출
         #################################################
         for key, values in params.items():
@@ -139,7 +139,7 @@ def extract_url_payload(url):
                 extracted.append(decoded)
         #################################################
-        # query 자체에 suspicious code 존재 시 추가
         #################################################
         if contains_suspicious_code(raw_query):
@@ -147,7 +147,7 @@ def extract_url_payload(url):
             extracted.append(raw_query)
         #################################################
-        # parameter 없으면 path 사용
         #################################################
         if not extracted:
@@ -161,7 +161,7 @@ def extract_url_payload(url):
         return url
 #################################################
-# suspicious code 존재 여부
 #################################################
 def contains_suspicious_code(text):
@@ -179,7 +179,7 @@ def contains_suspicious_code(text):
         "iframe",
         "svg",
-        # JS 실행
         "eval(",
         "alert(",
         "prompt(",
@@ -188,7 +188,7 @@ def contains_suspicious_code(text):
         "document.domain",
         "window.location",
-        # 난독화 / 우회
         "constructor",
         "fromcharcode",
         "\\x",
@@ -198,7 +198,7 @@ def contains_suspicious_code(text):
         "base64",
         "atob(",
-        # 특수 실행
         "srcdoc",
         "data:text/html",
         "vbscript:",
@@ -216,7 +216,7 @@ def contains_suspicious_code(text):
     return False
 #################################################
-# 로그 한 줄 파싱
 #################################################
 def parse_log_line(line):
@@ -249,7 +249,7 @@ def parse_log_line(line):
         return None, None
 #################################################
-# BERT 추론
 #################################################
 def predict_xss(text):
@@ -281,7 +281,7 @@ def predict_xss(text):
     return label, confidence
 #################################################
-# 로그 감시
 #################################################
 def follow(thefile):
@@ -301,10 +301,10 @@ def follow(thefile):
         yield line
 #################################################
-# 메인
 #################################################
-print(f"[+] 로그 감시 시작: {LOG_FILE}")
 with open(LOG_FILE, "r", encoding="utf-8", errors="ignore") as logfile:
@@ -327,7 +327,7 @@ with open(LOG_FILE, "r", encoding="utf-8", errors="ignore") as logfile:
             url = normalize_unicode(url)
             #################################################
-            # URL payload 추출
             #################################################
             if is_url(url):
@@ -339,7 +339,7 @@ with open(LOG_FILE, "r", encoding="utf-8", errors="ignore") as logfile:
                 target_text = url
             #################################################
-            # 길이 제한
             #################################################
             if len(target_text) > MAX_INPUT_LENGTH:
@@ -347,7 +347,7 @@ with open(LOG_FILE, "r", encoding="utf-8", errors="ignore") as logfile:
                 continue
             #################################################
-            # suspicious fragment 없으면 skip
             #################################################
             if not contains_suspicious_code(target_text):
@@ -355,13 +355,13 @@ with open(LOG_FILE, "r", encoding="utf-8", errors="ignore") as logfile:
                 continue
             #################################################
-            # ML 추론
             #################################################
             label, confidence = predict_xss(target_text)
             #################################################
-            # XSS 탐지 시 출력
             #################################################
             if label == "XSS":
@@ -375,7 +375,7 @@ with open(LOG_FILE, "r", encoding="utf-8", errors="ignore") as logfile:
                 print("==============================\n")
             #################################################
-            # DB 저장
             #################################################
             cursor.execute("""

 )
 #################################################
+# setting
 #################################################
 LOG_FILE = "access.log"
 CHECK_INTERVAL = 0.2
 #################################################
+# SQLite initialization
 #################################################
 conn = sqlite3.connect("xss_detection.db")
 conn.commit()
 #################################################
+# model load
 #################################################
+print("[+] Loading Model...")
 tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
 model.eval()
+print("[+] Loading Model Completed.")
 #################################################
+# label
 #################################################
 labels = {
 }
 #################################################
+# URL?
 #################################################
 def is_url(text):
     )
 #################################################
+# Unicode normalization
 #################################################
 def normalize_unicode(text):
     return unicodedata.normalize("NFKC", text)
 #################################################
+# URL payload extract
 #################################################
 def extract_url_payload(url):
         extracted = []
         #################################################
+        # parameter value
         #################################################
         for key, values in params.items():
                 extracted.append(decoded)
         #################################################
+        # Add when suspicious code exists in query itself
         #################################################
         if contains_suspicious_code(raw_query):
             extracted.append(raw_query)
         #################################################
+        # use the path when there are no parameters
         #################################################
         if not extracted:
         return url
 #################################################
+# suspicious code?
 #################################################
 def contains_suspicious_code(text):
         "iframe",
         "svg",
+        # JS execution
         "eval(",
         "alert(",
         "prompt(",
         "document.domain",
         "window.location",
+        # obfuscation / bypass
         "constructor",
         "fromcharcode",
         "\\x",
         "base64",
         "atob(",
+        # special execution
         "srcdoc",
         "data:text/html",
         "vbscript:",
     return False
 #################################################
+# log parsing
 #################################################
 def parse_log_line(line):
         return None, None
 #################################################
+# BERT inference
 #################################################
 def predict_xss(text):
     return label, confidence
 #################################################
+# log monitoring
 #################################################
 def follow(thefile):
         yield line
 #################################################
+# main
 #################################################
+print(f"[+] Start Monitoring Logs: {LOG_FILE}")
 with open(LOG_FILE, "r", encoding="utf-8", errors="ignore") as logfile:
             url = normalize_unicode(url)
             #################################################
+            # URL payload
             #################################################
             if is_url(url):
                 target_text = url
             #################################################
+            # length limit
             #################################################
             if len(target_text) > MAX_INPUT_LENGTH:
                 continue
             #################################################
+            # skip when no suspicious fragment exists
             #################################################
             if not contains_suspicious_code(target_text):
                 continue
             #################################################
+            # ML inference
             #################################################
             label, confidence = predict_xss(target_text)
             #################################################
+            # XSS detected
             #################################################
             if label == "XSS":
                 print("==============================\n")
             #################################################
+            # save to DB
             #################################################
             cursor.execute("""