Spaces:

donizetti-yoann
/

technova-ml-api

Sleeping

technova-ml-api / app /ml /preprocessing.py

github-actions

deploy: snapshot

5fa8558 about 2 months ago

370 Bytes

	import pandas as pd

	# Names of the free-text / categorical columns that normalize_text() trims
	# and lower-cases. A column listed here but absent from a given DataFrame is
	# skipped there. The trailing glosses are plain English translations of the
	# French column names, added for readers only.
	TEXT_COLUMNS = [
	    "genre",  # gender
	    "statut_marital",  # marital status
	    "departement",  # department
	    "poste",  # job position
	    "domaine_etude",  # field of study
	    "frequence_deplacement",  # travel frequency
	]


	def normalize_text(
	    df: pd.DataFrame, columns: "list[str] | None" = None
	) -> pd.DataFrame:
	    """Return a copy of *df* with its text columns stripped and lower-cased.

	    Args:
	        df: Input frame. It is never modified; all work happens on a copy.
	        columns: Names of the columns to normalise. Defaults to the
	            module-level ``TEXT_COLUMNS``. Names that are not present in
	            *df* are silently skipped.

	    Returns:
	        A new DataFrame in which every selected column that exists has been
	        cast to string, had leading/trailing whitespace removed and been
	        lower-cased. Missing entries (``None``/``NaN``/``pd.NA``) are left
	        as they were instead of being turned into text.
	    """
	    if columns is None:
	        columns = TEXT_COLUMNS

	    result = df.copy()
	    for name in columns:
	        if name not in result.columns:
	            continue
	        raw = result[name]
	        cleaned = raw.astype(str).str.strip().str.lower()
	        # astype(str) stringifies missing values (None -> "None",
	        # NaN -> "nan"), which would then pass for a real category.
	        # Put the original missing markers back wherever the input was null.
	        result[name] = cleaned.where(raw.notna(), raw)
	    return result