File size: 722 Bytes
42c0474
 
1fa293a
 
42c0474
1fa293a
67a43ce
42c0474
a0e0dc6
42c0474
0aed451
42c0474
 
0aed451
 
42c0474
 
1fa293a
42c0474
 
67a43ce
42c0474
1fa293a
67a43ce
0aed451
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
import os

# --- Paths ---
MODEL_SAVE_DIR = "/tmp"  # Use writable directory

DATA_PATH = os.path.join(os.path.dirname(__file__), "data", "synthetic_transactions_samples_5000.csv")
MODEL_PATH = os.path.join(MODEL_SAVE_DIR, "logreg_model.pkl")
TFIDF_VECTORIZER_PATH = os.path.join(MODEL_SAVE_DIR, "tfidf_vectorizer.pkl")
LABEL_ENCODERS_PATH = os.path.join(MODEL_SAVE_DIR, "label_encoders.pkl")

# --- Columns ---
TEXT_COLUMN = "Sanction_Context"
LABEL_COLUMNS = [
    "Red_Flag_Reason", "Maker_Action", "Escalation_Level",
    "Risk_Category", "Risk_Drivers", "Investigation_Outcome"
]

# --- TF-IDF ---
TFIDF_MAX_FEATURES = 5000
NGRAM_RANGE = (1, 2)
USE_STOPWORDS = True

# --- Split ---
RANDOM_STATE = 42
TEST_SIZE = 0.2