Spaces:
Sleeping
Sleeping
| from imblearn.over_sampling import SMOTE | |
| import pandas as pd | |
| import numpy as np | |
| def run(df: pd.DataFrame, action: dict) -> dict: | |
| df_clean = df.dropna() | |
| if len(df_clean) < 20 or len(set(df_clean["label"])) < 2: | |
| return {"df": df, "log": "Augmenter skipped — insufficient clean data."} | |
| X = df_clean.drop("label", axis=1).values | |
| y = df_clean["label"].values | |
| try: | |
| sm = SMOTE(random_state=42) | |
| X_res, y_res = sm.fit_resample(X, y) | |
| df_out = pd.DataFrame(X_res, columns=df.columns[:-1]) | |
| df_out["label"] = y_res | |
| added = len(df_out) - len(df_clean) | |
| return {"df": df_out, "log": f"Augmenter added {added} synthetic samples."} | |
| except Exception as e: | |
| return {"df": df, "log": f"Augmenter failed: {str(e)}"} | |