nivakaran committed on
Commit
6cc90ac
·
verified ·
1 Parent(s): 1883a7b

Create training_pipeline/__init__.py

Browse files
src/constants/training_pipeline/__init__.py ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import sys
3
+ import numpy as np
4
+ import pandas as pd
5
+
6
+ """
7
+ Common constants shared across the training pipeline
8
+ """
9
+
10
+ TARGET_COLUMN="Time_taken(min)"
11
+ PIPELINE_NAME:str = "DeliveryTimePrediction"
12
+ ARTIFACT_DIR:str = "Artifacts"
13
+ FILE_NAME:str = "final_data.csv"
14
+
15
+ TRAIN_FILE_NAME:str = "train.csv"
16
+ TEST_FILE_NAME: str = "test.csv"
17
+
18
+
19
+ SCHEMA_FILE_PATH=os.path.join("data_schema", "schema.yaml")
20
+
21
+ SAVED_MODEL_DIR=os.path.join("saved_models")
22
+ MODEL_FILE_NAME= "model.pkl"
23
+
24
+ """
25
+ Data Ingestion related constants start with the DATA_INGESTION prefix
26
+ """
27
+
28
+ DATA_INGESTION_COLLECTION_NAME: str ="DeliveryTimePrediction"
29
+ DATA_INGESTION_DATABASE_NAME: str ="NIVASYSTEM"
30
+ DATA_INGESTION_DIR_NAME: str = "data_ingestion"
31
+ DATA_INGESTION_FEATURE_STORE_DIR: str = "feature_store"
32
+ DATA_INGESTION_INGESTED_DIR: str = "ingested"
33
+ DATA_INGESTION_TRAIN_TEST_SPLIT_RATION: float = 0.2
34
+
35
+ """
36
+ Data Validation related constants start with the DATA_VALIDATION prefix
37
+ """
38
+ DATA_VALIDATION_DIR_NAME:str = "data_validation"
39
+ DATA_VALIDATION_VALID_DIR: str = "validated"
40
+ DATA_VALIDATION_INVALID_DIR: str = "invalid"
41
+ DATA_VALIDATION_DRIFT_REPORT_DIR: str = "drift_report"
42
+ DATA_VALIDATION_DRIFT_REPORT_FILE_NAME:str = "report.yaml"
43
+ PREPROCESSING_OBJECT_FILE_NAME:str="preprocessing.pkl"
44
+
45
+ """
46
+ Data Transformation related constants start with the DATA_TRANSFORMATION prefix
47
+ """
48
+
49
+ DATA_TRANSFORMATION_DIR_NAME: str = "data_transformation"
50
+ DATA_TRANSFORMATION_TRANSFORMED_DATA_DIR: str="transformed"
51
+ DATA_TRANSFORMATION_TRANSFORMED_OBJECT_DIR: str="transformed_object"
52
+
53
+ ## Parameters for the KNN imputer used to replace NaN values
54
+ DATA_TRANSFORMATION_IMPUTER_PARAMS: dict={
55
+ "missing_values": np.nan,
56
+ "n_neighbors": 3,
57
+ "weights": "uniform"
58
+ }
59
+
60
+
61
+ DATA_TRANSFORMATION_TRAIN_FILE_PATH:str = "train.npy"  # same ".npy" extension as DATA_TRANSFORMATION_TEST_FILE_PATH (was "train.py")
62
+ DATA_TRANSFORMATION_TEST_FILE_PATH:str = "test.npy"
63
+
64
+ """
65
+ Model Trainer related constants start with the MODEL_TRAINER prefix
66
+ """
67
+
68
+ MODEL_TRAINER_DIR_NAME:str = "model_trainer"
69
+ MODEL_TRAINER_TRAINED_MODEL_DIR:str="trained_model"
70
+ MODEL_TRAINER_TRAINED_MODEL_NAME: str="model.pkl"
71
+ MODEL_TRAINER_EXPECTED_SCORE: float=0.6
72
+ MODEL_TRAINER_OVER_FITTING_UNDER_FITTING_THRESHOLD:float= 0.05
73
+ MODEL_TRAINER_OVER_FIITING_UNDER_FITTING_THRESHOLD:float=0.05
74
+
75
+ TRAINING_BUCKET_NAME="deliveryprediction"