Spaces:

KLEB38
/

OC_P5

Sleeping

App Files Files Community

KLEB38 committed on Feb 25

Commit

2f42479

1 Parent(s): 060e228

feat:added predict endpoint with Pydantic validation

Browse files

Files changed (3) hide show

app/main.py +79 -6
app/pipeline_rh.joblib +2 -2
app/schemas.py +32 -0

app/main.py CHANGED Viewed

@@ -1,24 +1,97 @@
 from fastapi import FastAPI
 import joblib
 app = FastAPI() # On crée l'outil (le guichet)
 # Au démarrage, on charge ton pipeline
 model = joblib.load('app/pipeline_rh.joblib')
 @app.get("/") # La page d'accueil de ton API
 def read_root():
-    return {"message": "Bienvenue sur l'API RH de Futurisys"}
 @app.post("/predict")
-def predict(data: dict):
     # 1. On transforme le dictionnaire reçu en DataFrame pandas
-    df = pd.DataFrame([data])
     # 2. On utilise le pipeline pour faire la prédiction
     prediction = model.predict(df)
-    # 3. On renvoie le résultat au format JSON
     return {
-        "statut_employe": int(prediction[0])
-    }

 from fastapi import FastAPI
+import pandas as pd
 import joblib
+from app.schemas import EmployeeInput
 app = FastAPI() # Create the API application object
 # When the module is imported, load the serialized pipeline from disk
 model = joblib.load('app/pipeline_rh.joblib')
+# Fields of study treated as consistent with each department; for a listed
+# department, any other field of study is flagged as inconsistent.
+_CONSISTENT_FIELDS = {
+    "Commercial": ("Marketing",),
+    "Consulting": ("Infra & Cloud", "Transformation Digitale"),
+    "Ressources Humaines": ("Ressources Humaines", "Entrepreunariat"),
+}
+def inconsistency(df):
+    """Flag a mismatch between an employee's department and field of study.
+
+    Despite its name, ``df`` is a single record: ``predict`` passes each row
+    through ``DataFrame.apply(..., axis=1)``. Only item access by the keys
+    ``"departement"`` and ``"domaine_etude"`` is needed.
+
+    Returns:
+        0 when the field of study is listed for the department, 1 when it is
+        not, and None when the department is not one of the three listed.
+    """
+    matching_fields = _CONSISTENT_FIELDS.get(df["departement"])
+    if matching_fields is None:
+        # NOTE(review): unlisted departments yield None in the feature column;
+        # confirm the fitted pipeline tolerates a missing value here.
+        return None
+    return 0 if df["domaine_etude"] in matching_fields else 1
+def promotion(df):
+    """Flag managerial stagnation for one employee record.
+
+    ``df`` is a single record (a row passed by ``DataFrame.apply``), read by
+    key. Returns 1 when both the years under the current manager and the
+    years since the last promotion are greater than 4, otherwise 0.
+    """
+    stagnating = (
+        df["annes_sous_responsable_actuel"] > 4
+        and df["annees_depuis_la_derniere_promotion"] > 4
+    )
+    return 1 if stagnating else 0
+def developpement(df):
+    """Flag development stagnation for one employee record.
+
+    ``df`` is a single record (a row passed by ``DataFrame.apply``), read by
+    key. Returns 1 when the employee has spent at least 2 years in the company
+    and followed at most 1 training, otherwise 0 (which covers a tenure of
+    0 or 1 year).
+    """
+    tenure = df["annees_dans_l_entreprise"]
+    # A tenure of 0 can never satisfy ``>= 2``, so no separate zero check is needed.
+    under_trained = tenure >= 2 and df["nb_formations_suivies"] <= 1
+    return 1 if under_trained else 0
+def depart(x):
+    """Translate a predicted class (0 or 1) into a human-readable message.
+
+    Returns None for any value other than 0 or 1.
+    """
+    messages = {
+        0: "The staff has a LOW probability of resigning",
+        1: "The staff has a HIGH probability of resigning",
+    }
+    return messages.get(x)
 @app.get("/") # Landing page of the API
 def read_root():
+    """Return the welcome message served at the API root."""
+    welcome = {"message": "Welcome to the FUTURISYS HR predictor API"}
+    return welcome
 @app.post("/predict")
+def predict(data: EmployeeInput):
     # 1. On transforme le dictionnaire reçu en DataFrame pandas
+    df = pd.DataFrame([data.model_dump()])
+    # Encodage binaire non inclus dans le pipeline:
+    df['genre']= df["genre"].map({"M": 1, "F": 0})
+    df['heure_supplementaires']= df["heure_supplementaires"].map({"Oui": 1, "Non": 0})
+    # Changement de type pour augmentation salaire precedente (non inclus dans pipeline)
+    df["augementation_salaire_precedente"] = df["augementation_salaire_precedente"].apply(lambda x: float(x[:-1]) / 100)
+    dft = df[[item for item in df.columns if item.startswith("satisfaction")]].copy()
+    dft.loc[:, "overall_satisfaction"] = dft.mean(
+        axis=1
+    )
+    df["overall_satisfaction"] = dft["overall_satisfaction"].copy()
+    df["expertise_inconcistency"] = df.apply(inconsistency, axis=1)
+    df["managarial_stagnation"] = df.apply(promotion, axis=1)
+    df["developpement_stagnation"] = df.apply(developpement, axis=1)
     # 2. On utilise le pipeline pour faire la prédiction
     prediction = model.predict(df)
+        # 3. On renvoie le résultat au format JSON
     return {
+        "statut_employe": depart(int(prediction[0]))
+    }

app/pipeline_rh.joblib CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d2f9f36f06fd2578a274d7661a710f7c0693dad3ecc83e2c2f80b5ad674852f9
-size 197529

 version https://git-lfs.github.com/spec/v1
+oid sha256:a5e9e643a821334a5580ea7b58e4211a4acce4b7b2c010907cce800f7e711a4e
+size 204942

app/schemas.py CHANGED Viewed

	@@ -0,0 +1,32 @@

+from pydantic import BaseModel, Field
+from typing import Literal
+class EmployeeInput(BaseModel):
+    """Request body of the ``/predict`` endpoint: one employee record.
+
+    Every field is required (``Field(...)``) and carries a French alias.
+    Because ``populate_by_name`` is enabled, a value may be supplied under
+    either the alias or the Python field name.
+
+    NOTE(review): ``predict`` builds its DataFrame from ``model_dump()``, so the
+    field names below become column names. Their spelling (e.g. ``annes_``,
+    ``augementation_``) is presumably what the pipeline was trained with;
+    confirm before renaming any of them.
+    """
+    # Categorical fields. Only ``genre`` and ``heure_supplementaires`` are
+    # restricted to fixed values; the others accept any string.
+    genre: Literal["M", "F"] = Field(..., alias="Genre")
+    statut_marital: str = Field(..., alias="Statut Marital")
+    departement: str = Field(..., alias="Département")
+    poste: str = Field(..., alias="Poste")
+    domaine_etude: str = Field(..., alias="Domaine d'étude")
+    frequence_deplacement: str = Field(..., alias="Fréquence de déplacement")
+    heure_supplementaires: Literal["Oui", "Non"] = Field(..., alias="Heures supplémentaires")
+    # Numeric fields, validated as integers; no range constraints are declared.
+    age: int = Field(..., alias="Âge")
+    revenu_mensuel: int = Field(..., alias="Revenu mensuel")
+    nombre_experiences_precedentes: int = Field(..., alias="Nombre d'expériences précédentes")
+    annee_experience_totale: int = Field(..., alias="Années d'expérience totale")
+    annees_dans_l_entreprise: int = Field(..., alias="Années dans l'entreprise")
+    annees_dans_le_poste_actuel: int = Field(..., alias="Années dans le poste actuel")
+    nb_formations_suivies: int = Field(..., alias="Nombre de formations suivies")
+    distance_domicile_travail: int = Field(..., alias="Distance domicile-travail")
+    niveau_education: int = Field(..., alias="Niveau d'éducation")
+    annees_depuis_la_derniere_promotion: int = Field(..., alias="Années depuis la dernière promotion")
+    annes_sous_responsable_actuel: int = Field(..., alias="Années sous responsable actuel")
+    satisfaction_employee_environnement: int = Field(..., alias="Satisfaction environnement")
+    note_evaluation_precedente: int = Field(..., alias="Note évaluation précédente")
+    satisfaction_employee_nature_travail: int = Field(..., alias="Satisfaction nature du travail")
+    satisfaction_employee_equipe: int = Field(..., alias="Satisfaction équipe")
+    satisfaction_employee_equilibre_pro_perso: int = Field(..., alias="Satisfaction équilibre pro/perso")
+    note_evaluation_actuelle: int = Field(..., alias="Note évaluation actuelle")
+    # Received as text; ``predict`` in app/main.py converts it to a fraction.
+    augementation_salaire_precedente: str = Field(..., alias="Augmentation salaire précédente")
+    # Accept input keyed by field name as well as by alias.
+    model_config = {"populate_by_name": True}