{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "
| \n", " | Unnamed: 0 | \n", "Store | \n", "DayOfWeek | \n", "Date | \n", "Sales | \n", "Customers | \n", "Promo | \n", "StateHoliday | \n", "SchoolHoliday | \n", "StoreType | \n", "Assortment | \n", "CompetitionDistance | \n", "CompetitionOpenSinceMonth | \n", "CompetitionOpenSinceYear | \n", "Promo2 | \n", "Promo2SinceWeek | \n", "Promo2SinceYear | \n", "PromoInterval | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "0 | \n", "1 | \n", "5 | \n", "2015-07-31 | \n", "5263 | \n", "555 | \n", "1 | \n", "0 | \n", "1 | \n", "Large Store | \n", "basic | \n", "1270 | \n", "9 | \n", "2008 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| 1 | \n", "1 | \n", "2 | \n", "5 | \n", "2015-07-31 | \n", "6064 | \n", "625 | \n", "1 | \n", "0 | \n", "1 | \n", "Small Shop | \n", "basic | \n", "570 | \n", "11 | \n", "2007 | \n", "1 | \n", "13 | \n", "2010 | \n", "Jan,Apr,Jul,Oct | \n", "
| 2 | \n", "2 | \n", "3 | \n", "5 | \n", "2015-07-31 | \n", "8314 | \n", "821 | \n", "1 | \n", "0 | \n", "1 | \n", "Small Shop | \n", "basic | \n", "14130 | \n", "12 | \n", "2006 | \n", "1 | \n", "14 | \n", "2011 | \n", "Jan,Apr,Jul,Oct | \n", "
| 3 | \n", "3 | \n", "4 | \n", "5 | \n", "2015-07-31 | \n", "13995 | \n", "1498 | \n", "1 | \n", "0 | \n", "1 | \n", "Large Store | \n", "extended | \n", "620 | \n", "9 | \n", "2009 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| 4 | \n", "4 | \n", "5 | \n", "5 | \n", "2015-07-31 | \n", "4822 | \n", "559 | \n", "1 | \n", "0 | \n", "1 | \n", "Small Shop | \n", "basic | \n", "29910 | \n", "4 | \n", "2015 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| \n", " | PromoInterval | \n", "StoreType | \n", "Assortment | \n", "StateHoliday | \n", "Store | \n", "Customers | \n", "Promo | \n", "SchoolHoliday | \n", "CompetitionDistance | \n", "CompetitionOpenSinceMonth | \n", "CompetitionOpenSinceYear | \n", "Sales | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "0 | \n", "Large Store | \n", "basic | \n", "0 | \n", "1 | \n", "555 | \n", "1 | \n", "1 | \n", "1270 | \n", "9 | \n", "2008 | \n", "5263 | \n", "
| 1 | \n", "Jan,Apr,Jul,Oct | \n", "Small Shop | \n", "basic | \n", "0 | \n", "2 | \n", "625 | \n", "1 | \n", "1 | \n", "570 | \n", "11 | \n", "2007 | \n", "6064 | \n", "
| 2 | \n", "Jan,Apr,Jul,Oct | \n", "Small Shop | \n", "basic | \n", "0 | \n", "3 | \n", "821 | \n", "1 | \n", "1 | \n", "14130 | \n", "12 | \n", "2006 | \n", "8314 | \n", "
| 3 | \n", "0 | \n", "Large Store | \n", "extended | \n", "0 | \n", "4 | \n", "1498 | \n", "1 | \n", "1 | \n", "620 | \n", "9 | \n", "2009 | \n", "13995 | \n", "
| 4 | \n", "0 | \n", "Small Shop | \n", "basic | \n", "0 | \n", "5 | \n", "559 | \n", "1 | \n", "1 | \n", "29910 | \n", "4 | \n", "2015 | \n", "4822 | \n", "
| \n", " | PromoInterval | \n", "StoreType | \n", "Assortment | \n", "StateHoliday | \n", "Store | \n", "Customers | \n", "Promo | \n", "SchoolHoliday | \n", "CompetitionDistance | \n", "CompetitionOpenSinceMonth | \n", "CompetitionOpenSinceYear | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|
| 795018 | \n", "Jan,Apr,Jul,Oct | \n", "Small Shop | \n", "basic | \n", "0 | \n", "650 | \n", "636 | \n", "1 | \n", "0 | \n", "1420 | \n", "10 | \n", "2012 | \n", "
| 463276 | \n", "Jan,Apr,Jul,Oct | \n", "Small Shop | \n", "basic | \n", "0 | \n", "72 | \n", "261 | \n", "0 | \n", "0 | \n", "2200 | \n", "12 | \n", "2009 | \n", "
| 268352 | \n", "0 | \n", "Medium Store | \n", "extra | \n", "0 | \n", "733 | \n", "3567 | \n", "1 | \n", "0 | \n", "860 | \n", "10 | \n", "1999 | \n", "
| 67308 | \n", "0 | \n", "Small Shop | \n", "extended | \n", "0 | \n", "796 | \n", "791 | \n", "1 | \n", "0 | \n", "7180 | \n", "11 | \n", "2012 | \n", "
| 482458 | \n", "0 | \n", "Small Shop | \n", "extended | \n", "0 | \n", "301 | \n", "480 | \n", "0 | \n", "0 | \n", "4510 | \n", "3 | \n", "2015 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 259178 | \n", "Feb,May,Aug,Nov | \n", "Small Shop | \n", "basic | \n", "0 | \n", "1013 | \n", "217 | \n", "0 | \n", "0 | \n", "630 | \n", "2 | \n", "2015 | \n", "
| 365838 | \n", "Jan,Apr,Jul,Oct | \n", "Small Shop | \n", "extended | \n", "0 | \n", "11 | \n", "1394 | \n", "1 | \n", "0 | \n", "960 | \n", "11 | \n", "2011 | \n", "
| 131932 | \n", "0 | \n", "Small Shop | \n", "basic | \n", "0 | \n", "376 | \n", "796 | \n", "0 | \n", "0 | \n", "160 | \n", "8 | \n", "2012 | \n", "
| 671155 | \n", "0 | \n", "Hypermarket | \n", "extended | \n", "0 | \n", "76 | \n", "885 | \n", "0 | \n", "0 | \n", "19960 | \n", "3 | \n", "2006 | \n", "
| 121958 | \n", "Feb,May,Aug,Nov | \n", "Small Shop | \n", "basic | \n", "0 | \n", "446 | \n", "684 | \n", "1 | \n", "0 | \n", "340 | \n", "10 | \n", "2000 | \n", "
633253 rows × 11 columns
\n", "Pipeline(steps=[('encoding',\n",
" ColumnTransformer(remainder='passthrough',\n",
" transformers=[('ohe',\n",
" OneHotEncoder(handle_unknown='ignore'),\n",
" ['PromoInterval', 'StoreType',\n",
" 'Assortment'])])),\n",
" ('scaler', StandardScaler()),\n",
" ('model',\n",
" XGBRegressor(base_score=None, booster=None, callbacks=None,\n",
" colsample_bylevel=None, colsample_bynode=None,\n",
" colsample_bytree=None, device=None,...\n",
" feature_types=None, gamma=None, grow_policy=None,\n",
" importance_type=None,\n",
" interaction_constraints=None, learning_rate=0.1,\n",
" max_bin=None, max_cat_threshold=None,\n",
" max_cat_to_onehot=None, max_delta_step=None,\n",
" max_depth=13, max_leaves=None,\n",
" min_child_weight=None, missing=nan,\n",
" monotone_constraints=None, multi_strategy=None,\n",
" n_estimators=None, n_jobs=None,\n",
" num_parallel_tree=None, random_state=None, ...))])In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. Pipeline(steps=[('encoding',\n",
" ColumnTransformer(remainder='passthrough',\n",
" transformers=[('ohe',\n",
" OneHotEncoder(handle_unknown='ignore'),\n",
" ['PromoInterval', 'StoreType',\n",
" 'Assortment'])])),\n",
" ('scaler', StandardScaler()),\n",
" ('model',\n",
" XGBRegressor(base_score=None, booster=None, callbacks=None,\n",
" colsample_bylevel=None, colsample_bynode=None,\n",
" colsample_bytree=None, device=None,...\n",
" feature_types=None, gamma=None, grow_policy=None,\n",
" importance_type=None,\n",
" interaction_constraints=None, learning_rate=0.1,\n",
" max_bin=None, max_cat_threshold=None,\n",
" max_cat_to_onehot=None, max_delta_step=None,\n",
" max_depth=13, max_leaves=None,\n",
" min_child_weight=None, missing=nan,\n",
" monotone_constraints=None, multi_strategy=None,\n",
" n_estimators=None, n_jobs=None,\n",
" num_parallel_tree=None, random_state=None, ...))])ColumnTransformer(remainder='passthrough',\n",
" transformers=[('ohe', OneHotEncoder(handle_unknown='ignore'),\n",
" ['PromoInterval', 'StoreType', 'Assortment'])])['PromoInterval', 'StoreType', 'Assortment']
OneHotEncoder(handle_unknown='ignore')
['StateHoliday', 'Store', 'Customers', 'Promo', 'SchoolHoliday', 'CompetitionDistance', 'CompetitionOpenSinceMonth', 'CompetitionOpenSinceYear']
passthrough
StandardScaler()
XGBRegressor(base_score=None, booster=None, callbacks=None,\n",
" colsample_bylevel=None, colsample_bynode=None,\n",
" colsample_bytree=None, device=None, early_stopping_rounds=None,\n",
" enable_categorical=False, eval_metric=None, feature_types=None,\n",
" gamma=None, grow_policy=None, importance_type=None,\n",
" interaction_constraints=None, learning_rate=0.1, max_bin=None,\n",
" max_cat_threshold=None, max_cat_to_onehot=None,\n",
" max_delta_step=None, max_depth=13, max_leaves=None,\n",
" min_child_weight=None, missing=nan, monotone_constraints=None,\n",
" multi_strategy=None, n_estimators=None, n_jobs=None,\n",
" num_parallel_tree=None, random_state=None, ...)| \n", " | PromoInterval | \n", "StoreType | \n", "Assortment | \n", "StateHoliday | \n", "Store | \n", "Customers | \n", "Promo | \n", "SchoolHoliday | \n", "CompetitionDistance | \n", "CompetitionOpenSinceMonth | \n", "CompetitionOpenSinceYear | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|
| 795018 | \n", "Jan,Apr,Jul,Oct | \n", "Small Shop | \n", "basic | \n", "0 | \n", "650 | \n", "636 | \n", "1 | \n", "0 | \n", "1420 | \n", "10 | \n", "2012 | \n", "
| 463276 | \n", "Jan,Apr,Jul,Oct | \n", "Small Shop | \n", "basic | \n", "0 | \n", "72 | \n", "261 | \n", "0 | \n", "0 | \n", "2200 | \n", "12 | \n", "2009 | \n", "
| 268352 | \n", "0 | \n", "Medium Store | \n", "extra | \n", "0 | \n", "733 | \n", "3567 | \n", "1 | \n", "0 | \n", "860 | \n", "10 | \n", "1999 | \n", "
| 67308 | \n", "0 | \n", "Small Shop | \n", "extended | \n", "0 | \n", "796 | \n", "791 | \n", "1 | \n", "0 | \n", "7180 | \n", "11 | \n", "2012 | \n", "
| 482458 | \n", "0 | \n", "Small Shop | \n", "extended | \n", "0 | \n", "301 | \n", "480 | \n", "0 | \n", "0 | \n", "4510 | \n", "3 | \n", "2015 | \n", "
| \n", " | PromoInterval | \n", "StoreType | \n", "Assortment | \n", "StateHoliday | \n", "Store | \n", "Customers | \n", "Promo | \n", "SchoolHoliday | \n", "CompetitionDistance | \n", "CompetitionOpenSinceMonth | \n", "CompetitionOpenSinceYear | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "Jan,Apr,Jul,Oct | \n", "Small Shop | \n", "basic | \n", "0 | \n", "650 | \n", "636 | \n", "1 | \n", "0 | \n", "1420 | \n", "10 | \n", "2012 | \n", "