catninja123 committed on
Commit
49b6530
·
verified ·
1 Parent(s): 8cf6db2

Upload train_v38_2.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. train_v38_2.py +4 -1
train_v38_2.py CHANGED
@@ -54,7 +54,7 @@ def safe_num(v, default=-1):
54
  # 1. LOAD INTEGRATED FEATURE MATRIX
55
  # ============================================================
56
  print("=" * 70)
57
- print(" V38.2 BARE MODEL: MULTI-SEED ENSEMBLE WITH 116 FEATURES (v3 cleaned)")
58
  print("=" * 70)
59
 
60
  df_raw = pd.read_csv(os.path.join(DATA_DIR, 'v38_2_integrated_features.csv'))
@@ -573,6 +573,9 @@ feature_groups = {
573
  'Taste': [c for c in feature_cols if c.startswith('taste_')],
574
  'Cuilu': [c for c in feature_cols if c.startswith('cuilu_')],
575
  'Major': [c for c in feature_cols if c.startswith('major_') or c in ['has_secondary_major', 'has_college_division', 'is_undecided', 'has_major', 'school_major_count']],
 
 
 
576
  }
577
 
578
  for group_name, group_cols in feature_groups.items():
 
54
  # 1. LOAD INTEGRATED FEATURE MATRIX
55
  # ============================================================
56
  print("=" * 70)
57
+ print(" V38.2 BARE MODEL v4: MULTI-SEED ENSEMBLE WITH 148 FEATURES (v4 + PS BERT + HS×Univ + Summer)")
58
  print("=" * 70)
59
 
60
  df_raw = pd.read_csv(os.path.join(DATA_DIR, 'v38_2_integrated_features.csv'))
 
573
  'Taste': [c for c in feature_cols if c.startswith('taste_')],
574
  'Cuilu': [c for c in feature_cols if c.startswith('cuilu_')],
575
  'Major': [c for c in feature_cols if c.startswith('major_') or c in ['has_secondary_major', 'has_college_division', 'is_undecided', 'has_major', 'school_major_count']],
576
+ 'PS BERT PCA': [c for c in feature_cols if c.startswith('ps_bert_')],
577
+ 'HS×Univ History': [c for c in feature_cols if c.startswith('hs_') and any(k in c for k in ['hist', 'overall', 'smooth', 'apps', 'admits'])],
578
+ 'Summer Programs': [c for c in feature_cols if c.startswith('summer_')],
579
  }
580
 
581
  for group_name, group_cols in feature_groups.items():