Upload train_v38_2.py with huggingface_hub
Browse files
- train_v38_2.py +4 -1
train_v38_2.py
CHANGED
|
@@ -54,7 +54,7 @@ def safe_num(v, default=-1):
|
|
| 54 |
# 1. LOAD INTEGRATED FEATURE MATRIX
|
| 55 |
# ============================================================
|
| 56 |
print("=" * 70)
|
| 57 |
-
print(" V38.2 BARE MODEL: MULTI-SEED ENSEMBLE WITH
|
| 58 |
print("=" * 70)
|
| 59 |
|
| 60 |
df_raw = pd.read_csv(os.path.join(DATA_DIR, 'v38_2_integrated_features.csv'))
|
|
@@ -573,6 +573,9 @@ feature_groups = {
|
|
| 573 |
'Taste': [c for c in feature_cols if c.startswith('taste_')],
|
| 574 |
'Cuilu': [c for c in feature_cols if c.startswith('cuilu_')],
|
| 575 |
'Major': [c for c in feature_cols if c.startswith('major_') or c in ['has_secondary_major', 'has_college_division', 'is_undecided', 'has_major', 'school_major_count']],
|
|
|
|
|
|
|
|
|
|
| 576 |
}
|
| 577 |
|
| 578 |
for group_name, group_cols in feature_groups.items():
|
|
|
|
| 54 |
# 1. LOAD INTEGRATED FEATURE MATRIX
|
| 55 |
# ============================================================
|
| 56 |
print("=" * 70)
|
| 57 |
+
print(" V38.2 BARE MODEL v4: MULTI-SEED ENSEMBLE WITH 148 FEATURES (v4 + PS BERT + HS×Univ + Summer)")
|
| 58 |
print("=" * 70)
|
| 59 |
|
| 60 |
df_raw = pd.read_csv(os.path.join(DATA_DIR, 'v38_2_integrated_features.csv'))
|
|
|
|
| 573 |
'Taste': [c for c in feature_cols if c.startswith('taste_')],
|
| 574 |
'Cuilu': [c for c in feature_cols if c.startswith('cuilu_')],
|
| 575 |
'Major': [c for c in feature_cols if c.startswith('major_') or c in ['has_secondary_major', 'has_college_division', 'is_undecided', 'has_major', 'school_major_count']],
|
| 576 |
+
'PS BERT PCA': [c for c in feature_cols if c.startswith('ps_bert_')],
|
| 577 |
+
'HS×Univ History': [c for c in feature_cols if c.startswith('hs_') and any(k in c for k in ['hist', 'overall', 'smooth', 'apps', 'admits'])],
|
| 578 |
+
'Summer Programs': [c for c in feature_cols if c.startswith('summer_')],
|
| 579 |
}
|
| 580 |
|
| 581 |
for group_name, group_cols in feature_groups.items():
|