{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "provenance": [] }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" } }, "cells": [ { "cell_type": "markdown", "source": [ "# 1. Dados do aluno" ], "metadata": { "id": "O7LBoNEix_QA" } }, { "cell_type": "markdown", "source": [ "# 2. Objetivo" ], "metadata": { "id": "PpGJ0wPTyM1Z" } }, { "cell_type": "markdown", "source": [ "# 3. Motivação" ], "metadata": { "id": "g8LqqYHuyQbk" } }, { "cell_type": "markdown", "source": [ "# 4. Modelagem" ], "metadata": { "id": "_5VTISRTySj0" } }, { "cell_type": "code", "execution_count": 1, "metadata": { "id": "SMnEqgfJx7Or" }, "outputs": [], "source": [ "from pathlib import Path\n", "import torch, numpy as np, pandas as pd\n", "from fastai.data.transforms import RandomSplitter\n", "from torch import tensor" ] }, { "cell_type": "code", "source": [ "np.set_printoptions(linewidth=140)\n", "torch.set_printoptions(linewidth=140, sci_mode=False, edgeitems=7)\n", "pd.set_option('display.width', 140)" ], "metadata": { "id": "6bzlrHd71ZMV" }, "execution_count": 2, "outputs": [] }, { "cell_type": "code", "source": [ "path = Path('/content/drive/MyDrive/Software Engeneering/8th - Semester/ML/cars')\n", "path" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "xA9J1Qan1zCH", "outputId": "5fbf6638-2953-4366-9cf6-98bbd5f91633" }, "execution_count": 3, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "Path('/content/drive/MyDrive/Software Engeneering/8th - Semester/ML/cars')" ] }, "metadata": {}, "execution_count": 3 } ] }, { "cell_type": "markdown", "source": [ "## 4.1 Limpando os dados" ], "metadata": { "id": "mo7hHO8s1zX9" } }, { "cell_type": "markdown", "source": [ "Este é um dataset de dados tabulares - os dados estão na forma de uma tabela. Ele é fornecido como um arquivo de valores separados por vírgulas (CSV). 
Podemos abri-lo usando a biblioteca *pandas*, que criará um DataFrame." ], "metadata": { "id": "HUHC6ehD2R6-" } }, { "cell_type": "code", "source": [ "df = pd.read_csv(path/'Car_Purchasing_Data.csv')\n", "df" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 609 }, "id": "BO-LP-Zr2jP8", "outputId": "a979fe3d-81dd-4a20-8815-ef8971105176" }, "execution_count": 4, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ " Customer Name Customer e-mail Country Gender Age Annual Salary Credit Card Debt \\\n", "0 Martina Avila cubilia.Curae.Phasellus@quisaccumsanconvallis.edu USA 0 42 62812.09301 11609.380910 \n", "1 Harlan Barnes eu.dolor@diam.co.uk USA 0 41 66646.89292 9572.957136 \n", "2 Naomi Rodriquez vulputate.mauris.sagittis@ametconsectetueradipiscing.co.uk USA 1 43 53798.55112 11160.355060 \n", "3 Jade Cunningham malesuada@dignissim.com USA 1 58 79370.03798 14426.164850 \n", "4 Cedric Leach felis.ullamcorper.viverra@egetmollislectus.net USA 1 57 59729.15130 5358.712177 \n", ".. ... ... ... ... ... ... ... \n", "495 Walter ligula@Cumsociis.ca USA 0 41 71942.40291 6995.902524 \n", "496 Vanna Cum.sociis.natoque@Sedmolestie.edu USA 1 38 56039.49793 12301.456790 \n", "497 Pearl penatibus.et@massanonante.com USA 1 54 68888.77805 10611.606860 \n", "498 Nell Quisque.varius@arcuVivamussit.net USA 1 59 49811.99062 14013.034510 \n", "499 Marla Camaron.marla@hotmail.com USA 1 47 61370.67766 9391.341628 \n", "\n", " Net Worth Car Purchase Amount \n", "0 238961.2505 35321.45877 \n", "1 530973.9078 45115.52566 \n", "2 638467.1773 42925.70921 \n", "3 548599.0524 67422.36313 \n", "4 560304.0671 55915.46248 \n", ".. ... ... \n", "495 541670.1016 48901.44342 \n", "496 360419.0988 31491.41457 \n", "497 764531.3203 64147.28888 \n", "498 337826.6382 45442.15353 \n", "499 462946.4924 45107.22566 \n", "\n", "[500 rows x 9 columns]" ], "text/html": [ "\n", "
| \n", " | Customer Name | \n", "Customer e-mail | \n", "Country | \n", "Gender | \n", "Age | \n", "Annual Salary | \n", "Credit Card Debt | \n", "Net Worth | \n", "Car Purchase Amount | \n", "
|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "Martina Avila | \n", "cubilia.Curae.Phasellus@quisaccumsanconvallis.edu | \n", "USA | \n", "0 | \n", "42 | \n", "62812.09301 | \n", "11609.380910 | \n", "238961.2505 | \n", "35321.45877 | \n", "
| 1 | \n", "Harlan Barnes | \n", "eu.dolor@diam.co.uk | \n", "USA | \n", "0 | \n", "41 | \n", "66646.89292 | \n", "9572.957136 | \n", "530973.9078 | \n", "45115.52566 | \n", "
| 2 | \n", "Naomi Rodriquez | \n", "vulputate.mauris.sagittis@ametconsectetueradipiscing.co.uk | \n", "USA | \n", "1 | \n", "43 | \n", "53798.55112 | \n", "11160.355060 | \n", "638467.1773 | \n", "42925.70921 | \n", "
| 3 | \n", "Jade Cunningham | \n", "malesuada@dignissim.com | \n", "USA | \n", "1 | \n", "58 | \n", "79370.03798 | \n", "14426.164850 | \n", "548599.0524 | \n", "67422.36313 | \n", "
| 4 | \n", "Cedric Leach | \n", "felis.ullamcorper.viverra@egetmollislectus.net | \n", "USA | \n", "1 | \n", "57 | \n", "59729.15130 | \n", "5358.712177 | \n", "560304.0671 | \n", "55915.46248 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 495 | \n", "Walter | \n", "ligula@Cumsociis.ca | \n", "USA | \n", "0 | \n", "41 | \n", "71942.40291 | \n", "6995.902524 | \n", "541670.1016 | \n", "48901.44342 | \n", "
| 496 | \n", "Vanna | \n", "Cum.sociis.natoque@Sedmolestie.edu | \n", "USA | \n", "1 | \n", "38 | \n", "56039.49793 | \n", "12301.456790 | \n", "360419.0988 | \n", "31491.41457 | \n", "
| 497 | \n", "Pearl | \n", "penatibus.et@massanonante.com | \n", "USA | \n", "1 | \n", "54 | \n", "68888.77805 | \n", "10611.606860 | \n", "764531.3203 | \n", "64147.28888 | \n", "
| 498 | \n", "Nell | \n", "Quisque.varius@arcuVivamussit.net | \n", "USA | \n", "1 | \n", "59 | \n", "49811.99062 | \n", "14013.034510 | \n", "337826.6382 | \n", "45442.15353 | \n", "
| 499 | \n", "Marla | \n", "Camaron.marla@hotmail.com | \n", "USA | \n", "1 | \n", "47 | \n", "61370.67766 | \n", "9391.341628 | \n", "462946.4924 | \n", "45107.22566 | \n", "
500 rows × 9 columns
\n", "| \n", " | Gender | \n", "Age | \n", "Annual Salary | \n", "Credit Card Debt | \n", "Net Worth | \n", "Car Purchase Amount | \n", "
|---|---|---|---|---|---|---|
| count | \n", "500.000000 | \n", "500.000000 | \n", "500.000000 | \n", "500.000000 | \n", "500.000000 | \n", "500.000000 | \n", "
| mean | \n", "0.506000 | \n", "46.224000 | \n", "62127.239608 | \n", "9607.645049 | \n", "431475.713625 | \n", "44209.799218 | \n", "
| std | \n", "0.500465 | \n", "7.990339 | \n", "11703.378228 | \n", "3489.187973 | \n", "173536.756340 | \n", "10773.178744 | \n", "
| min | \n", "0.000000 | \n", "20.000000 | \n", "20000.000000 | \n", "100.000000 | \n", "20000.000000 | \n", "9000.000000 | \n", "
| 25% | \n", "0.000000 | \n", "41.000000 | \n", "54391.977195 | \n", "7397.515792 | \n", "299824.195900 | \n", "37629.896040 | \n", "
| 50% | \n", "1.000000 | \n", "46.000000 | \n", "62915.497035 | \n", "9655.035568 | \n", "426750.120650 | \n", "43997.783390 | \n", "
| 75% | \n", "1.000000 | \n", "52.000000 | \n", "70117.862005 | \n", "11798.867487 | \n", "557324.478725 | \n", "51254.709517 | \n", "
| max | \n", "1.000000 | \n", "70.000000 | \n", "100000.000000 | \n", "20000.000000 | \n", "1000000.000000 | \n", "80000.000000 | \n", "
| \n", " | Gender | \n", "Age | \n", "Annual Salary | \n", "Credit Card Debt | \n", "Net Worth | \n", "Car Purchase Amount | \n", "
|---|---|---|---|---|---|---|
| 0 | \n", "0 | \n", "42 | \n", "62812.09301 | \n", "11609.380910 | \n", "238961.2505 | \n", "35321.45877 | \n", "
| 1 | \n", "0 | \n", "41 | \n", "66646.89292 | \n", "9572.957136 | \n", "530973.9078 | \n", "45115.52566 | \n", "
| 2 | \n", "1 | \n", "43 | \n", "53798.55112 | \n", "11160.355060 | \n", "638467.1773 | \n", "42925.70921 | \n", "
| 3 | \n", "1 | \n", "58 | \n", "79370.03798 | \n", "14426.164850 | \n", "548599.0524 | \n", "67422.36313 | \n", "
| 4 | \n", "1 | \n", "57 | \n", "59729.15130 | \n", "5358.712177 | \n", "560304.0671 | \n", "55915.46248 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 495 | \n", "0 | \n", "41 | \n", "71942.40291 | \n", "6995.902524 | \n", "541670.1016 | \n", "48901.44342 | \n", "
| 496 | \n", "1 | \n", "38 | \n", "56039.49793 | \n", "12301.456790 | \n", "360419.0988 | \n", "31491.41457 | \n", "
| 497 | \n", "1 | \n", "54 | \n", "68888.77805 | \n", "10611.606860 | \n", "764531.3203 | \n", "64147.28888 | \n", "
| 498 | \n", "1 | \n", "59 | \n", "49811.99062 | \n", "14013.034510 | \n", "337826.6382 | \n", "45442.15353 | \n", "
| 499 | \n", "1 | \n", "47 | \n", "61370.67766 | \n", "9391.341628 | \n", "462946.4924 | \n", "45107.22566 | \n", "
500 rows × 6 columns
\n", "