ganeshkonapalli committed on
Commit
d8343dc
·
verified ·
1 Parent(s): 65f2808

Create config.py

Browse files
Files changed (1) hide show
  1. config.py +30 -0
config.py ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+
3
+ # --- Paths: everything below is anchored at the directory containing this file ---
4
+ BASE_DIR = os.path.abspath(os.path.dirname(__file__))
5
+ DATA_PATH = os.path.join(BASE_DIR, "data", "synthetic_transactions_samples_5000.csv")
6
+
7
+ MODEL_SAVE_DIR = os.path.join(BASE_DIR, "models")
8
+ LABEL_ENCODERS_PATH = os.path.join(MODEL_SAVE_DIR, "label_encoders.pkl")
9
+ TFIDF_VECTORIZER_PATH = os.path.join(MODEL_SAVE_DIR, "tfidf_vectorizer.pkl")
10
+ MODEL_PATH = os.path.join(MODEL_SAVE_DIR, "logreg_models.pkl") # Logistic Regression model file (presumably a pickle, per the .pkl extension)
11
+
12
+ # --- Columns: one text column name and the six label column names ---
13
+ TEXT_COLUMN = "Sanction_Context"
14
+ LABEL_COLUMNS = [
15
+ "Red_Flag_Reason",
16
+ "Maker_Action",
17
+ "Escalation_Level",
18
+ "Risk_Category",
19
+ "Risk_Drivers",
20
+ "Investigation_Outcome"
21
+ ]
22
+
23
+ # --- TF-IDF Settings (consumer not visible here; presumably vectorizer arguments - confirm) ---
24
+ TFIDF_MAX_FEATURES = 5000
25
+ NGRAM_RANGE = (1, 2)
26
+ USE_STOPWORDS = True
27
+
28
+ # --- Train/Test Split (presumably the seed and held-out fraction - confirm against the caller) ---
29
+ RANDOM_STATE = 42
30
+ TEST_SIZE = 0.2