{ "cells": [ { "cell_type": "markdown", "id": "e3ce0e00-756c-4aae-a196-df3872ceeca5", "metadata": {}, "source": [ "# 1.Objective " ] }, { "cell_type": "raw", "id": "f94857d4-976d-4546-a5ab-883839b0f8df", "metadata": {}, "source": [ "Predict rainfall in Australia from the provided weather data using an ANN model, together with optimization techniques such as batch normalization." ] }, { "cell_type": "markdown", "id": "4c772b8e-baee-406f-9841-2485207b03f2", "metadata": {}, "source": [ "# 2.Libraries " ] }, { "cell_type": "code", "execution_count": 1, "id": "45af91ed-01ef-46ec-9674-78a72f8bd0a1", "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import warnings\n", "import numpy as np\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "from sklearn.preprocessing import LabelEncoder\n", "from sklearn import preprocessing\n", "from sklearn.model_selection import train_test_split\n", "import torch\n", "from sklearn.metrics import roc_auc_score\n", "import torch.nn as nn\n", "import torch.optim as optim\n", "from sklearn.metrics import accuracy_score, confusion_matrix\n", "from sklearn.metrics import classification_report\n", "import pickle \n", "# Ignore all warnings\n", "warnings.filterwarnings('ignore')\n" ] }, { "cell_type": "markdown", "id": "b0c7e4f8-4c24-4909-91dc-73e3876a1331", "metadata": {}, "source": [ "# 3.Data description " ] }, { "cell_type": "code", "execution_count": 2, "id": "6968d7b7-ef34-4418-838f-a66f607d6ff1", "metadata": {}, "outputs": [], "source": [ "#reading the dataset\n", "df = pd.read_csv('weatherAUS.csv')\n" ] }, { "cell_type": "code", "execution_count": 3, "id": "5fa0e7cc-fcd0-4daf-bc69-6cb70f07a964", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | Date | \n", "Location | \n", "MinTemp | \n", "MaxTemp | \n", "Rainfall | \n", "Evaporation | \n", "Sunshine | \n", "WindGustDir | \n", "WindGustSpeed | \n", "WindDir9am | \n", "... | \n", "Humidity9am | \n", "Humidity3pm | \n", "Pressure9am | \n", "Pressure3pm | \n", "Cloud9am | \n", "Cloud3pm | \n", "Temp9am | \n", "Temp3pm | \n", "RainToday | \n", "RainTomorrow | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "2008-12-01 | \n", "Albury | \n", "13.4 | \n", "22.9 | \n", "0.6 | \n", "NaN | \n", "NaN | \n", "W | \n", "44.0 | \n", "W | \n", "... | \n", "71.0 | \n", "22.0 | \n", "1007.7 | \n", "1007.1 | \n", "8.0 | \n", "NaN | \n", "16.9 | \n", "21.8 | \n", "No | \n", "No | \n", "
| 1 | \n", "2008-12-02 | \n", "Albury | \n", "7.4 | \n", "25.1 | \n", "0.0 | \n", "NaN | \n", "NaN | \n", "WNW | \n", "44.0 | \n", "NNW | \n", "... | \n", "44.0 | \n", "25.0 | \n", "1010.6 | \n", "1007.8 | \n", "NaN | \n", "NaN | \n", "17.2 | \n", "24.3 | \n", "No | \n", "No | \n", "
| 2 | \n", "2008-12-03 | \n", "Albury | \n", "12.9 | \n", "25.7 | \n", "0.0 | \n", "NaN | \n", "NaN | \n", "WSW | \n", "46.0 | \n", "W | \n", "... | \n", "38.0 | \n", "30.0 | \n", "1007.6 | \n", "1008.7 | \n", "NaN | \n", "2.0 | \n", "21.0 | \n", "23.2 | \n", "No | \n", "No | \n", "
| 3 | \n", "2008-12-04 | \n", "Albury | \n", "9.2 | \n", "28.0 | \n", "0.0 | \n", "NaN | \n", "NaN | \n", "NE | \n", "24.0 | \n", "SE | \n", "... | \n", "45.0 | \n", "16.0 | \n", "1017.6 | \n", "1012.8 | \n", "NaN | \n", "NaN | \n", "18.1 | \n", "26.5 | \n", "No | \n", "No | \n", "
| 4 | \n", "2008-12-05 | \n", "Albury | \n", "17.5 | \n", "32.3 | \n", "1.0 | \n", "NaN | \n", "NaN | \n", "W | \n", "41.0 | \n", "ENE | \n", "... | \n", "82.0 | \n", "33.0 | \n", "1010.8 | \n", "1006.0 | \n", "7.0 | \n", "8.0 | \n", "17.8 | \n", "29.7 | \n", "No | \n", "No | \n", "
5 rows × 23 columns
\n", "| \n", " | MinTemp | \n", "MaxTemp | \n", "Rainfall | \n", "Evaporation | \n", "Sunshine | \n", "WindGustSpeed | \n", "WindSpeed9am | \n", "WindSpeed3pm | \n", "Humidity9am | \n", "Humidity3pm | \n", "Pressure9am | \n", "Pressure3pm | \n", "Cloud9am | \n", "Cloud3pm | \n", "Temp9am | \n", "Temp3pm | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| count | \n", "143975.000000 | \n", "144199.000000 | \n", "142199.000000 | \n", "82670.000000 | \n", "75625.000000 | \n", "135197.000000 | \n", "143693.000000 | \n", "142398.000000 | \n", "142806.000000 | \n", "140953.000000 | \n", "130395.00000 | \n", "130432.000000 | \n", "89572.000000 | \n", "86102.000000 | \n", "143693.000000 | \n", "141851.00000 | \n", "
| mean | \n", "12.194034 | \n", "23.221348 | \n", "2.360918 | \n", "5.468232 | \n", "7.611178 | \n", "40.035230 | \n", "14.043426 | \n", "18.662657 | \n", "68.880831 | \n", "51.539116 | \n", "1017.64994 | \n", "1015.255889 | \n", "4.447461 | \n", "4.509930 | \n", "16.990631 | \n", "21.68339 | \n", "
| std | \n", "6.398495 | \n", "7.119049 | \n", "8.478060 | \n", "4.193704 | \n", "3.785483 | \n", "13.607062 | \n", "8.915375 | \n", "8.809800 | \n", "19.029164 | \n", "20.795902 | \n", "7.10653 | \n", "7.037414 | \n", "2.887159 | \n", "2.720357 | \n", "6.488753 | \n", "6.93665 | \n", "
| min | \n", "-8.500000 | \n", "-4.800000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "6.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "980.50000 | \n", "977.100000 | \n", "0.000000 | \n", "0.000000 | \n", "-7.200000 | \n", "-5.40000 | \n", "
| 25% | \n", "7.600000 | \n", "17.900000 | \n", "0.000000 | \n", "2.600000 | \n", "4.800000 | \n", "31.000000 | \n", "7.000000 | \n", "13.000000 | \n", "57.000000 | \n", "37.000000 | \n", "1012.90000 | \n", "1010.400000 | \n", "1.000000 | \n", "2.000000 | \n", "12.300000 | \n", "16.60000 | \n", "
| 50% | \n", "12.000000 | \n", "22.600000 | \n", "0.000000 | \n", "4.800000 | \n", "8.400000 | \n", "39.000000 | \n", "13.000000 | \n", "19.000000 | \n", "70.000000 | \n", "52.000000 | \n", "1017.60000 | \n", "1015.200000 | \n", "5.000000 | \n", "5.000000 | \n", "16.700000 | \n", "21.10000 | \n", "
| 75% | \n", "16.900000 | \n", "28.200000 | \n", "0.800000 | \n", "7.400000 | \n", "10.600000 | \n", "48.000000 | \n", "19.000000 | \n", "24.000000 | \n", "83.000000 | \n", "66.000000 | \n", "1022.40000 | \n", "1020.000000 | \n", "7.000000 | \n", "7.000000 | \n", "21.600000 | \n", "26.40000 | \n", "
| max | \n", "33.900000 | \n", "48.100000 | \n", "371.000000 | \n", "145.000000 | \n", "14.500000 | \n", "135.000000 | \n", "130.000000 | \n", "87.000000 | \n", "100.000000 | \n", "100.000000 | \n", "1041.00000 | \n", "1039.600000 | \n", "9.000000 | \n", "9.000000 | \n", "40.200000 | \n", "46.70000 | \n", "