{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": { "id": "hvn1t3fB94IS" }, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "from sklearn.impute import SimpleImputer\n", "from sklearn.preprocessing import Normalizer\n", "from sklearn.preprocessing import LabelEncoder, OneHotEncoder \n", "from sklearn.model_selection import train_test_split \n", "from sklearn.preprocessing import StandardScaler \n", "from sklearn.preprocessing import KBinsDiscretizer" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 415 }, "id": "3RatXS8B_E-Q", "outputId": "30fe42a0-bb38-4223-8118-2dfcc8bcf546" }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
mpgcylindersdisplacementhorsepowerweightaccelerationmodel yearorigincar name
018.08307.0130.0350412.0701chevrolet chevelle malibu
115.08350.0165.0369311.5701buick skylark 320
218.08318.0150.0343611.0701plymouth satellite
316.08304.0150.0343312.0701amc rebel sst
417.08302.0140.0344910.5701ford torino
..............................
39327.04140.086.0279015.6821ford mustang gl
39444.0497.052.0213024.6822vw pickup
39532.04135.084.0229511.6821dodge rampage
39628.04120.079.0262518.6821ford ranger
39731.04119.082.0272019.4821chevy s-10
\n", "

398 rows × 9 columns

\n", "
" ], "text/plain": [ " mpg cylinders displacement horsepower weight acceleration \\\n", "0 18.0 8 307.0 130.0 3504 12.0 \n", "1 15.0 8 350.0 165.0 3693 11.5 \n", "2 18.0 8 318.0 150.0 3436 11.0 \n", "3 16.0 8 304.0 150.0 3433 12.0 \n", "4 17.0 8 302.0 140.0 3449 10.5 \n", ".. ... ... ... ... ... ... \n", "393 27.0 4 140.0 86.0 2790 15.6 \n", "394 44.0 4 97.0 52.0 2130 24.6 \n", "395 32.0 4 135.0 84.0 2295 11.6 \n", "396 28.0 4 120.0 79.0 2625 18.6 \n", "397 31.0 4 119.0 82.0 2720 19.4 \n", "\n", " model year origin car name \n", "0 70 1 chevrolet chevelle malibu \n", "1 70 1 buick skylark 320 \n", "2 70 1 plymouth satellite \n", "3 70 1 amc rebel sst \n", "4 70 1 ford torino \n", ".. ... ... ... \n", "393 82 1 ford mustang gl \n", "394 82 2 vw pickup \n", "395 82 1 dodge rampage \n", "396 82 1 ford ranger \n", "397 82 1 chevy s-10 \n", "\n", "[398 rows x 9 columns]" ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df = pd.read_csv(\"auto-mpg.csv\")\n", "df" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "id": "BcC6Y8tS_SMY" }, "outputs": [], "source": [ "from sklearn.impute import MissingIndicator\n", "\n", "# Flag the rows with missing values, one boolean column per affected feature.\n", "# np.nan is the canonical spelling; the np.NaN alias was removed in NumPy 2.0.\n", "missing_indicator = MissingIndicator(missing_values=np.nan)\n", "missing_mask = missing_indicator.fit_transform(df)\n", "# features_ holds the positions of the columns that contained missing values,\n", "# so the labels follow the data instead of being hard-coded.\n", "indicator = pd.DataFrame(missing_mask, columns=df.columns[missing_indicator.features_])" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 417 }, "id": "6_zl5F0VCOj1", "outputId": "bb0dbe42-d9c1-470f-d3a1-cbe2aeb1caa3" }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
mpgcylindersdisplacementhorsepowerweightaccelerationmodel yearorigincar name
018.08.0307.0130.03504.012.070.01chevrolet chevelle malibu
115.08.0350.0165.03693.011.570.01buick skylark 320
218.08.0318.0150.03436.011.070.01plymouth satellite
316.08.0304.0150.03433.012.070.01amc rebel sst
417.08.0302.0140.03449.010.570.01ford torino
..............................
39327.04.0140.086.02790.015.682.01ford mustang gl
39444.04.097.052.02130.024.682.02vw pickup
39532.04.0135.084.02295.011.682.01dodge rampage
39628.04.0120.079.02625.018.682.01ford ranger
39731.04.0119.082.02720.019.482.01chevy s-10
\n", "

398 rows × 9 columns

\n", "
" ], "text/plain": [ " mpg cylinders displacement horsepower weight acceleration \\\n", "0 18.0 8.0 307.0 130.0 3504.0 12.0 \n", "1 15.0 8.0 350.0 165.0 3693.0 11.5 \n", "2 18.0 8.0 318.0 150.0 3436.0 11.0 \n", "3 16.0 8.0 304.0 150.0 3433.0 12.0 \n", "4 17.0 8.0 302.0 140.0 3449.0 10.5 \n", ".. ... ... ... ... ... ... \n", "393 27.0 4.0 140.0 86.0 2790.0 15.6 \n", "394 44.0 4.0 97.0 52.0 2130.0 24.6 \n", "395 32.0 4.0 135.0 84.0 2295.0 11.6 \n", "396 28.0 4.0 120.0 79.0 2625.0 18.6 \n", "397 31.0 4.0 119.0 82.0 2720.0 19.4 \n", "\n", " model year origin car name \n", "0 70.0 1 chevrolet chevelle malibu \n", "1 70.0 1 buick skylark 320 \n", "2 70.0 1 plymouth satellite \n", "3 70.0 1 amc rebel sst \n", "4 70.0 1 ford torino \n", ".. ... ... ... \n", "393 82.0 1 ford mustang gl \n", "394 82.0 2 vw pickup \n", "395 82.0 1 dodge rampage \n", "396 82.0 1 ford ranger \n", "397 82.0 1 chevy s-10 \n", "\n", "[398 rows x 9 columns]" ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Replace missing values with the mean of their column.\n", "# Positions 1:7 select cylinders through model year; mpg, origin and car name are left untouched.\n", "# The imputed values are written back into df in place.\n", "imputer = SimpleImputer(missing_values=np.nan, strategy='mean') \n", "imputer = imputer.fit(df.iloc[:, 1:7])\n", "df.iloc[:, 1:7] = imputer.transform(df.iloc[:, 1:7])\n", "df" ] }, { "cell_type": "code", "execution_count": 5, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 417 }, "id": "L_iJCWXxGitn", "outputId": "726891eb-1007-4244-a040-305e14e34b80" }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
cylindersdisplacementhorsepowerweightaccelerationmodel yearorigincar name
08.0307.0130.03504.012.070.01chevrolet chevelle malibu
18.0350.0165.03693.011.570.01buick skylark 320
28.0318.0150.03436.011.070.01plymouth satellite
38.0304.0150.03433.012.070.01amc rebel sst
48.0302.0140.03449.010.570.01ford torino
...........................
3934.0140.086.02790.015.682.01ford mustang gl
3944.097.052.02130.024.682.02vw pickup
3954.0135.084.02295.011.682.01dodge rampage
3964.0120.079.02625.018.682.01ford ranger
3974.0119.082.02720.019.482.01chevy s-10
\n", "

398 rows × 8 columns

\n", "
" ], "text/plain": [ " cylinders displacement horsepower weight acceleration model year \\\n", "0 8.0 307.0 130.0 3504.0 12.0 70.0 \n", "1 8.0 350.0 165.0 3693.0 11.5 70.0 \n", "2 8.0 318.0 150.0 3436.0 11.0 70.0 \n", "3 8.0 304.0 150.0 3433.0 12.0 70.0 \n", "4 8.0 302.0 140.0 3449.0 10.5 70.0 \n", ".. ... ... ... ... ... ... \n", "393 4.0 140.0 86.0 2790.0 15.6 82.0 \n", "394 4.0 97.0 52.0 2130.0 24.6 82.0 \n", "395 4.0 135.0 84.0 2295.0 11.6 82.0 \n", "396 4.0 120.0 79.0 2625.0 18.6 82.0 \n", "397 4.0 119.0 82.0 2720.0 19.4 82.0 \n", "\n", " origin car name \n", "0 1 chevrolet chevelle malibu \n", "1 1 buick skylark 320 \n", "2 1 plymouth satellite \n", "3 1 amc rebel sst \n", "4 1 ford torino \n", ".. ... ... \n", "393 1 ford mustang gl \n", "394 2 vw pickup \n", "395 1 dodge rampage \n", "396 1 ford ranger \n", "397 1 chevy s-10 \n", "\n", "[398 rows x 8 columns]" ] }, "execution_count": 5, "metadata": {}, "output_type": "execute_result" } ], "source": [ "X = df.iloc[:,1:]\n", "Y = df.iloc[:,0]\n", "X" ] }, { "cell_type": "code", "execution_count": 6, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "MO1WYelyJ9nu", "outputId": "3ecbb3b3-9d03-42f3-a88b-c5321a8f7590" }, "outputs": [ { "data": { "text/plain": [ "array([[ 4.70902366, 2.94798968, 3.40749723, ..., 4.35694676,\n", " 18.95488984, 1.24836677],\n", " [ 4.70902366, 3.36090028, 4.32490032, ..., 4.17540731,\n", " 18.95488984, 1.24836677],\n", " [ 4.70902366, 3.05361797, 3.93172757, ..., 3.99386786,\n", " 18.95488984, 1.24836677],\n", " ...,\n", " [ 2.35451183, 1.29634725, 2.20176744, ..., 4.2117152 ,\n", " 22.20429953, 1.24836677],\n", " [ 2.35451183, 1.15230867, 2.07070985, ..., 6.75326748,\n", " 22.20429953, 1.24836677],\n", " [ 2.35451183, 1.1427061 , 2.1493444 , ..., 7.04373059,\n", " 22.20429953, 1.24836677]])" ] }, "execution_count": 6, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Feature scaling with StandardScaler.\n", "# with_mean=False skips centering, so each column is only divided by its\n", "# standard deviation: x_scaled = x / s (the default would give (x - u) / s).\n", "\n", 
"sc_X = StandardScaler(with_mean=False)\n", "X = sc_X.fit_transform(X.drop(['car name'], axis=1))\n", "X" ] }, { "cell_type": "code", "execution_count": 7, "metadata": { "id": "8Py_CmGKW1VH" }, "outputs": [], "source": [ "# Normalizer (imported in the first cell) rescales each row to unit L2 norm.\n", "nm = Normalizer()\n", "x_sc = nm.fit_transform(X)\n", "# Note: wrapping the array in a fresh DataFrame replaces the feature names with 0..6.\n", "X = pd.DataFrame(x_sc)\n" ] }, { "cell_type": "code", "execution_count": 8, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 434 }, "id": "Gxn8BV79XDPU", "outputId": "8952fc72-b2e4-4504-ae6b-d13bc44a4025" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "(398, 8)\n" ] }, { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
0123456car name
00.2246290.1406250.1625440.1976260.2078350.9041840.059549chevroletchevellemalibu
10.2221040.1585190.2039860.2059440.1969350.8940180.058880buickskylark320
20.2244280.1455330.1873830.1936170.1903440.9033730.059496plymouthsatellite
30.2238690.1387790.1869160.1929660.2071310.9011240.059348amcrebelsst
40.2255060.1388740.1757300.1952830.1825650.9077120.059782fordtorino
...........................
3930.1003980.0573250.0961200.1406610.2415180.9468080.053231fordmustanggl
3940.0966350.0382290.0559410.1033610.3665810.9113200.102472vwpickup
3950.1021040.0562160.0954800.1176710.1826420.9628930.054136dodgerampage
3960.0994090.0486510.0874260.1310380.2851260.9374760.052707fordranger
3970.0989660.0480310.0903420.1351760.2960660.9333040.052472chevys-10
\n", "

398 rows × 8 columns

\n", "
" ], "text/plain": [ " 0 1 2 3 4 5 6 \\\n", "0 0.224629 0.140625 0.162544 0.197626 0.207835 0.904184 0.059549 \n", "1 0.222104 0.158519 0.203986 0.205944 0.196935 0.894018 0.058880 \n", "2 0.224428 0.145533 0.187383 0.193617 0.190344 0.903373 0.059496 \n", "3 0.223869 0.138779 0.186916 0.192966 0.207131 0.901124 0.059348 \n", "4 0.225506 0.138874 0.175730 0.195283 0.182565 0.907712 0.059782 \n", ".. ... ... ... ... ... ... ... \n", "393 0.100398 0.057325 0.096120 0.140661 0.241518 0.946808 0.053231 \n", "394 0.096635 0.038229 0.055941 0.103361 0.366581 0.911320 0.102472 \n", "395 0.102104 0.056216 0.095480 0.117671 0.182642 0.962893 0.054136 \n", "396 0.099409 0.048651 0.087426 0.131038 0.285126 0.937476 0.052707 \n", "397 0.098966 0.048031 0.090342 0.135176 0.296066 0.933304 0.052472 \n", "\n", " car name \n", "0 chevroletchevellemalibu \n", "1 buickskylark320 \n", "2 plymouthsatellite \n", "3 amcrebelsst \n", "4 fordtorino \n", ".. ... \n", "393 fordmustanggl \n", "394 vwpickup \n", "395 dodgerampage \n", "396 fordranger \n", "397 chevys-10 \n", "\n", "[398 rows x 8 columns]" ] }, "execution_count": 8, "metadata": {}, "output_type": "execute_result" } ], "source": [ "X['car name'] = df.iloc[:,-1]\n", "X['car name'] = X['car name'].str.replace(\" \",\"\")\n", "\n", "print(X.shape)\n", "X" ] }, { "cell_type": "code", "execution_count": 14, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 437 }, "id": "eRJ_GIQhQuj4", "outputId": "894cbc23-0378-4258-c08c-b85285df137e", "scrolled": true }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:3: DeprecationWarning: `np.int` is a deprecated alias for the builtin `int`. To silence this warning, use `int` by itself. Doing this will not modify any behavior and is safe. When replacing `np.int`, you may wish to use e.g. `np.int64` or `np.int32` to specify the precision. 
If you wish to review your current use, check the release note link for additional information.\n", "Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations\n", " This is separate from the ipykernel package so we can avoid doing imports until\n" ] }, { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
0123456789...294295296297298299300301302303
00000000000...0000000000
10000000000...0000000000
20000000000...0000000000
30000000000...0000000000
40000000000...0000000000
..................................................................
3930000000000...0000000000
3940000000000...0000001000
3950000000000...0000000000
3960000000000...0000000000
3970000000000...0000000000
\n", "

398 rows × 304 columns

\n", "
" ], "text/plain": [ " 0 1 2 3 4 5 6 7 8 9 ... 294 295 296 \\\n", "0 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 \n", "1 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 \n", "2 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 \n", "3 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 \n", "4 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 \n", ".. ... ... ... ... ... ... ... ... ... ... ... ... ... ... \n", "393 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 \n", "394 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 \n", "395 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 \n", "396 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 \n", "397 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 \n", "\n", " 297 298 299 300 301 302 303 \n", "0 0 0 0 0 0 0 0 \n", "1 0 0 0 0 0 0 0 \n", "2 0 0 0 0 0 0 0 \n", "3 0 0 0 0 0 0 0 \n", "4 0 0 0 0 0 0 0 \n", ".. ... ... ... ... ... ... ... \n", "393 0 0 0 0 0 0 0 \n", "394 0 0 0 1 0 0 0 \n", "395 0 0 0 0 0 0 0 \n", "396 0 0 0 0 0 0 0 \n", "397 0 0 0 0 0 0 0 \n", "\n", "[398 rows x 304 columns]" ] }, "execution_count": 14, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Encoder test: one-hot encode the car name column.\n", "# OneHotEncoder is already imported in the first cell.\n", "# dtype=int replaces the np.int alias (deprecated in NumPy 1.20, removed in 1.24).\n", "# The encoder returns a sparse matrix by default, so no sparse= flag is passed\n", "# (that keyword was renamed to sparse_output in scikit-learn 1.2).\n", "onehot = OneHotEncoder(dtype=int)\n", "nominals = pd.DataFrame(\n", "    onehot.fit_transform(X[['car name']]).toarray()\n", ")\n", "nominals" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Data Visualization" ] }, { "cell_type": "code", "execution_count": 25, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "Text(0.5, 1.0, 'x^2')" ] }, "execution_count": 25, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "\n", "import matplotlib.pyplot as plt\n", "\n", "\n", "x = [1,2,3,4,5]\n", "\n", "y = [1,4,9,16,25]\n", "\n", "# plotting the points\n", "plt.plot(x, y, color='green', linestyle='dashed', linewidth = 3,\n", " marker='o', markerfacecolor='red', markersize=12)\n", "\n", "\n", "plt.xlabel('x - axis: numbers')\n", "\n", "plt.ylabel('y - axis: Square(x)')\n", "\n", "\n", "plt.title('x^2')\n", "\n", "\n", "\n" ] }, { "cell_type": "code", "execution_count": 32, "metadata": {}, "outputs": [ { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAYIAAAEWCAYAAABrDZDcAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDMuMC4zLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvnQurowAAFB1JREFUeJzt3Xu0ZGV95vHvw0VBQO2e7iASxlYGjaxkQNNBUZKgjhPCylKJSw1BxAkunCiDGBjHMYngmDXiqGQyQZMBRVEuoxFQEo2RAGODgqGbtNLYiXhpAkigkSgXJU43v/mjdsfi2Oec6qZ3bc55v5+1atWufan9e6tO1XP2pd6dqkKS1K6dhi5AkjQsg0CSGmcQSFLjDAJJapxBIEmNMwgkqXEGgZqU5CNJ/mCA9a5IUkl2mfa6pdkYBHrUS7IhyY+SLJsxfm33pbpimMoeHbrX4N/MGDdI0GlhMgi0UHwbOHrLgyQ/B+w+XDk/NtR/925VaEcxCLRQfAx4zdjj44CPbnmQ5BeS3Dn+5Zjk5UnWzvGcy5JcnuS+JF9I8pSxZf8oya1J7k2yJskvjk07Pcknk5yf5F7gtTOfOMnuSd6X5JYk309yTZLx4DomyT8kuTvJ744td0iSa5N8L8kdSc5K8pix6ZXkjUluBm5Osqqb9JUk9yd51RztlbbKINBCcR3w+CTPTLIz8Crg/C0Tq+p64LvAi8eWeTWjAJnNMcA7gWXAWuCCsWnXAwcDS4ELgT9LstvY9JcCnwSeOGO5Ld4L/DzwvO453gI8NDb9MOAZwIuAtyd5Zjd+M/DmrqZDu+lvmPHcLwOeAxxYVb/UjTuoqvasqo/P0V5pqwwCLSRbtgpeDPwdcPuM6ecx+vInyVLgVxh9ic/mM1W1qqr+Gfhd4NAk+wFU1flV9d2q2lRV7wMey+iLe4trq+pTVfVQVf1w/EmT7AT8FvCmqrq9qjZX1Ze69Wzxjqr6YVV9BfgKcFC33jVVdV233g3A/wZ+eUbd76qqe2auV9pe7mPUQvIxYBXwVMZ2C405H1ifZE/glcDVVXXHHM9365aBqro/yT3Ak4Fbk5wCvK57XMDjGf2X/hPLbsUyYDfgm3PM849jwz8A9gRI8nTgTGAl8DhGn9E1s9Ut7QhuEWjBqKpbGB00PhK4ZCvTbweuBY4CjmXu3UIA+20Z6MJjKfCd7njAf2EUJkuq6onA94GMr26O570beBDYf571b82fMNraOaCqHg+8bcZ651v3aIaq11bV723H+tUgg0ALzfHAC6vqgVmmf5TR/vifAy6d57mOTHJYdzD2ncCXq+pWYC9gE7AR2CXJ2xltEUykqh4CzgXOTPLkJDsnOTTJYydYfC/gXu
D+JD8D/PYEy9wJPG3S+qSZDAItKFX1zapaPccslwJPAS6dIyy2uBA4DbiH0YHdY7rxfwX8JfB14BZG/91v6+6YU4EbGR10vgd4N5N93k4FfhO4DzgHmOTg7+nAed2ZRq8ESPKnSX5/G2tWo+KFabTYJPkm8Pqq+uuha5EWArcItKgkeTmjfehXDl2LtFB41pAWjST/FzgQOLbbTy9pAu4akqTGuWtIkhq3IHYNLVu2rFasWDF0GZK0oKxZs+buqlo+33wLIghWrFjB6tVznTEoSZopyS2TzOeuIUlqnEEgSY0zCCSpcQaBJDXOIJCkxhkEktS43oIgyX5JrkqyPslNSd7UjT89ye1J1na3I/uqQZI0vz5/R7AJOKWqbkiyF7AmyeXdtD+sqvf2uG5J0oR6C4LuEoF3dMP3JVkP7NvX+iRJ22cqxwiSrACeBXy5G3Vikq8mOTfJklmWOSHJ6iSrN27cOI0yJS0WyeK5TUHvQdBdC/Zi4OSqupfRNVn3Bw5mtMXwvq0tV1VnV9XKqlq5fPm8XWVIkrZTr0GQZFdGIXBBVV0CUFV3VtXmrr/4c4BD+qxBkjS3Ps8aCvAhYH1VnTk2fp+x2Y4C1vVVgyRpfn2eNfR84FjgxiRru3FvA45OcjCjywluAF7fYw2SpHn0edbQNcDWjnR8tq91SpK2nb8slqTGGQSS1DiDQJIaZxBIUuMMAklqnEEgSY0zCCSpcQaBJDXOIJCkxhkEktQ4g0CSGmcQSFLjDAJJapxBIEmNMwgkqXEGgSQ1ziCQpMYZBJLUOINAkhpnEEhS4wwCSWqcQSBJjTMIJKlxBoEkNc4gkKTGGQSS1DiDQJIaZxBIUuMMAklqnEEgSY0zCCSpcQaBJDWutyBIsl+Sq5KsT3JTkjd145cmuTzJzd39kr5qkCTNr88tgk3AKVX1TOC5wBuTHAi8Fbiiqg4ArugeS5IG0lsQVNUdVXVDN3wfsB7YF3gpcF4323nAy/qqQZI0v6kcI0iyAngW8GVg76q6A0ZhAfzULMuckGR1ktUbN26cRpmS1KTegyDJnsDFwMlVde+ky1XV2VW1sqpWLl++vL8CJalxvQZBkl0ZhcAFVXVJN/rOJPt00/cB7uqzBknS3Po8ayjAh4D1VXXm2KTLgOO64eOAT/dVgyRpfrv0+NzPB44Fbkyythv3NuAM4BNJjgf+AXhFjzVIkubRWxBU1TVAZpn8or7WK0naNv6yWJIaZxBIUuMMAklqnEEgSY0zCCSpcQaBJDXOIJCkxhkEktQ4g0CSGmcQSFLjDAJJapxBIEmNMwgkqXEGgSQ1ziCQpMYZBJLUOINAkhpnEEhS4wwCSWqcQSBJjTMIJKlxBoEkNc4gkKTGGQSS1DiDQJIaZxBIUuMMAklq3C5DFyBpx8s7MnQJO0ydVkOXsOi5RSBJjTMIJKlxBoEkNc4gkKTG9RYESc5NcleSdWPjTk9ye5K13e3IvtYvSZpMn1sEHwGO2Mr4P6yqg7vbZ3tcvyRpAr0FQVWtAu7p6/klSTvGvEGQZI8kO3XDT0/ykiS7PoJ1npjkq92uoyWP4HkkSTvAJFsEq4DdkuwLXAH8B0a7fbbHnwD7AwcDdwDvm23GJCckWZ1k9caNG7dzdZKk+UwSBKmqHwC/DvxxVR0FHLg9K6uqO6tqc1U9BJwDHDLHvGdX1cqqWrl8+fLtWZ0kaQITBUGSQ4FjgM9047ara4ok+4w9PApYN9u8kqTpmOQL/WTgvwKXVtVNSZ4GXDXfQkkuAg4HliW5DTgNODzJwUABG4DXb2fdkqQdZN4gqKovAF8Ye/wt4KQJljt6K6M/tE3VSZJ6N2sQJPmfVXVykj9n9B/8w1TVS3qtTJI0FXNtEXysu3/vNAqRJA1j1iCoqjXd4Pqqumt8WpJn9FqVJGlqJjlr6Ookr9zyIMkpwKX9lSRJmqZJzho6HDg7ySuAvYH1zHH+vyRpYZl3i6Cq7gA+BxwKrAA+WlX391yXJG
lK5t0iSHI5o+4gfhb4aeDcJKuq6tS+i5Mk9W+SYwTvr6rXVNX3qmod8Dzg+z3XJUmakkl+UPapGY83Ae/srSJJ0lRN0g31c5Ncn+T+JD9KsjmJWwSStEhMsmvoLOBo4GZgd+B1wPv7LEqSND0T9SJaVd9IsnNVbQY+nORLPdclSZqSSYLgB0keA6xN8j8YnUG0R79lSZKmZZJdQ8d2850IPADsB7y8z6IkSdMzyVlDt3SDDwLv6LccSdK0TbJFIElaxAwCSWrcNgVBkif1VYgkaRjbukXw2V6qkCQNZluDIL1UIUkazLYGwTm9VCFJGsw2BUFVfaCvQiRJw/CsIUlqnEEgSY2bpBvqE5MsmUYxkqTpm2SL4EnA9Uk+keSIJJ45JEmLyCQXr/894ADgQ8BrgZuT/Pck+/dcmyRpCiY6RlBVBfxjd9sELAE+2XVLLUlawObtfTTJScBxwN3AB4H/XFX/L8lOjK5a9pZ+S5Qk9WmSC9MsA359rDtqAKrqoSS/1k9ZkqRpmeR6BG+fY9r6HVuOJGna/B2BJDXOIJCkxvUWBEnOTXJXknVj45YmuTzJzd29P1STpIH1uUXwEeCIGePeClxRVQcAV3SPJUkD6i0IqmoVcM+M0S8FzuuGzwNe1tf6JUmTmfYxgr2r6g6A7v6nZpsxyQlJVidZvXHjxqkVKEmtedQeLK6qs6tqZVWtXL58+dDlSNKiNe0guDPJPgDd/V1TXr8kaYZpB8FljLqroLv/9JTXL0maoc/TRy8CrgWekeS2JMcDZwAvTnIz8OLusSRpQJP0NbRdquroWSa9qK91SpK23aP2YLEkaToMAklqXG+7hqTBLaarqlYNXYEWMbcIJKlxBoEkNc4gkKTGGQSS1DiDQJIaZxBIUuMMAklqnEEgSY0zCCSpcQaBJDXOIJCkxhkEktQ4g0CSGmcQSFLjDAJJapxBIEmNMwgkqXEGgSQ1ziCQpMYZBJLUOINAkhpnEEhS4wwCSWqcQSBJjTMIJKlxBoEkNc4gkKTGGQSS1DiDQJIat8sQK02yAbgP2AxsqqqVQ9QhSRooCDovqKq7B1y/JAl3DUlS84YKggI+n2RNkhO2NkOSE5KsTrJ648aNUy5PktoxVBA8v6qeDfwq8MYkvzRzhqo6u6pWVtXK5cuXT79CSWrEIEFQVd/p7u8CLgUOGaIOSdIAQZBkjyR7bRkG/j2wbtp1SJJGhjhraG/g0iRb1n9hVX1ugDokSQwQBFX1LeCgaa9XkrR1nj4qSY0zCCSpcQaBJDVuyC4mNAV5R4YuYYeo02roEqRFyy0CSWqcQSBJjTMIJKlxBoEkNc4gkKTGGQSS1DiDQJIaZxBIUuMMAklqnEEgSY0zCCSpcQaBJDXOIJCkxhkEktQ4g0CSGmcQSFLjDAJJapxBIEmNMwgkqXEGgSQ1ziCQpMYZBJLUOINAkhpnEEhS43YZuoDeJUNXsONUDV2BpEXILQJJapxBIEmNMwgkqXEGgSQ1bpAgSHJEkr9P8o0kbx2iBknSyNSDIMnOwPuBXwUOBI5OcuC065AkjQyxRXAI8I2q+lZV/Qj4P8BLB6hDksQwvyPYF7h17PFtwHNmzpTkBOCE7uH9Sf5+CrU9EsuAu3tdw6P3NxG9tz2nt9t2wPf+0WkhvPdPmWSmIYJga636iV9KVdXZwNn9l7NjJFldVSuHrmMItr3NtkPb7V9MbR9i19BtwH5jj38a+M4AdUiSGCYIrgcOSPLUJI8BfgO4bIA6JEkMsGuoqjYlORH4K2Bn4NyqumnadfRgwezG6oFtb1fL7V80bU/ZkZkkNc1fFktS4wwCSWqcQaA5JXlikjcMXcc0jLc1yeFJ/mLomoaU5KQk65NcMHQtQxhr/z8t9q5wDALN54lAE0HAdrS16zJlsXoDcGRVHbO9T5CRhfo9s6X9S6rqjKGL6dNCfYOmLsnvJFnX3U5OsqL7b+GcJDcl+XyS3bt590/yuSRrklyd5GeGrv8ROA
PYP8naJB9O8hKAJJcmObcbPj7JH3TDD3udBqx7e/xLW4H3AHsm+WSSv0tyQTL6iWeSDUnenuQa4BWzvd9Jlie5OMn13e35wzVt2yT5U+BpwGVJTknyqSRfTXJdkn/bzXN6klPHllnXfS62fDY+ANzAw383tCDMaP+bk5yV5Ande79TN8/jktyaZNcF/5mvKm/z3ICfB24E9gD2BG4CngVsAg7u5vkE8Opu+ArggG74OcCVQ7fhEbR9BbCuG/4N4D3d8N8A13XDHwZ+ZbbXaeg2bGdbDwe+z+gHjzsB1wKHddM2AG8ZW26r7zdw4dgy/xpYP3Qbt/H12MCoG4U/Bk7rxr0QWNsNnw6cOjb/uu41XAE8BDx36DbsoPa/FjirG/dp4AXd8KuAD871N7BQbov/msU7xmHApVX1AECSS4BfBL5dVWu7edYAK5LsCTwP+LP8uI+Qx0653r5cDZzc9Rb7NWBJkn2AQ4GTgN9i66/T3w5U7yP1N1V1G0C3lbACuKab9vFu/Fzv978DDhwb//gke1XVff2XvkMdBrwcoKquTPKvkjxhnmVuqarr+i9t6j7OKACuYvSP0QcWw2feIJjMbL0+/fPY8GZgd0b/PX6vqg7uvaopq6rbkywBjgBWAUuBVwL3V9V9yaO3Z7TtNPP9Hf+8PNDdz/V+7wQcWlU/7Km+aZmtf7BNPHz38m5jww+wOF0GvCvJUkZbwFcy2gJe0J95jxFMZhXwsm6f4B7AUYz+O/4JVXUv8O0kr4B/OVh20PRK3eHuA/Yae3wtcDKj1+Rq4FR+/FpM/Do9Ss1s67zmeb8/D5y4Zd4kC/WLYhVwDIzOpgLu7tq9AXh2N/7ZwFMHqm9qqup+RrtF/wj4i6ravBg+8wbBBKrqBuAjjP4Avgx8EPinORY5Bjg+yVcY7SdfsNdbqKrvAl/sDgS+h9EX+y5V9Q1GBwKXduO2+jpV1YLZLTTeVkYHiyc12/t9ErCyO8j6NeA/7tCCp+d0unYwOqB+XDf+YmBpt9vst4GvD1Pe1H0ceHV3v8WC/szbxYQkNc4tAklqnEEgSY0zCCSpcQaBJDXOIJCkxhkE0hQkWZnkfw1dh7Q1nj4qSY1zi0BNSvIL3Q+9dkuyR9eD7M9uw/Irul4mb+huz+vGH5Xkr7tfl+6T5OtJnpSx6xsk+eWMenNdm+Rvk2zTr5mlHc0tAjUro66zd2PUR9RtVfWubVj2ccBDVfVgkgOAi6pqZTftfOA6Rn0yXVBVF3VdM5xaVb+W5M+BM6rqi12HZQ9W1aYd2zppcnY6p5b9N+B64EFG3UFsi12Bs7r+gzYDTx+b9p8Ydcl8XVVdtJVlvwicmdGVvy7Z0sOpNBR3DallSxldN2EvHt5zJgBJ3ji2C+fJMya/GbgTOAhYCTxmbNq+jPrj3ztbuTpXja529TpGWyLXLbiLmGjRMQjUsrOB3wcuAN49c2JVvb+qDu5u35kx+QnAHVX1EHAssDNAkl0YXajnN4H1wO/MfN4k+1fVjVX1bmA1YBBoUO4aUpOSvAbYVFUXZnTd4S8leWFVXTnhU3wAuLjrevgqftz//tuAq6vq6q5XzuuTfGbGsicneQGjXUpfA/7yETdIegQ8WCxJjXPXkCQ1ziCQpMYZBJLUOINAkhpnEEhS4wwCSWqcQSBJjfv/58LQj1fiX+sAAAAASUVORK5CYII=\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "import matplotlib.pyplot as plt\n", "\n", "# x-coordinates of left sides of bars\n", "left = [1, 2, 3, 4, 5]\n", "\n", "# heights of bars\n", "height = [1,4,9,16,25]\n", "\n", "# labels for bars\n", "tick_label = ['one', 'two', 'three', 'four', 'five']\n", "\n", "# plotting a bar chart\n", "plt.bar(left, height, tick_label = tick_label,\n", "\t\twidth = 0.8, color = ['red', 'green'])\n", "\n", "# naming the x-axis\n", "plt.xlabel('x - axis')\n", "# naming the y-axis\n", "plt.ylabel('y - axis')\n", "# plot title\n", "plt.title('My bar chart!')\n", "\n", "# function to show the plot\n", "plt.show()\n", "\n" ] }, { "cell_type": "code", "execution_count": 22, "metadata": {}, "outputs": [ { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXwAAAEWCAYAAABliCz2AAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDMuMC4zLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvnQurowAAFRFJREFUeJzt3Xm0ZWWd3vHvI4XIDMLVJUN1OdC0RqOwSoZgbEVMAxpwQFuiqDSm2m5tMRqNrjYirclaJq3BThs6pQwOiFGkFO0WRYFuNTJUATLbLQhSgFAIWoADg7/8cfZtbop7T526dfed3u9nrbPu2fvsc97fvrvqOe99zz7vTlUhSVr8HjPXBUiSZoeBL0mNMPAlqREGviQ1wsCXpEYY+JLUCANfi1aS05N8aMjj9yV5ymzWJM0lA1/zQpKbkjyQZNcN1l+RpJIsm+k2q2q7qrpxI3W9IMnamW5bmgsGvuaTHwNHjy8keRaw9dyV078kW8x1DWqHga/55DPA6ycsvwH49PhCkucmuSPJkgnrXpnkiiGvuXOSv01yb5KLkzx1wnMrydO6+4cnubbb7tYk/zHJtsDXgd264Z/7kuyWZKskJyW5rbudlGSrCa/77iS3d4+9aYN2Tk9ycpK/S3I/8MIkL0lyeZL1SW5J8oEJr7Wse/6x3WP3JHlz97u4MsnPk/z1dH/haouBr/nkImCHJE/ver5/CHx2/MGquhT4GfDiCc95HYM3iqkcDZwI7Az8CPgvU2x3CvDHVbU98Ezg/Kq6HzgMuK0b/tmuqm4D/hw4AHgO8GxgP+B9AEkOBd4BHAI8Dfj9Sdr6d10d2wPfBe5n8Ea3E/AS4E+SvGyD5+wP7NX9Tk7qajgE+BfAq5NM1o70/zHwNd+M9/JfDFwP3LrB459iEPIkeTzwB8Dnhrze2VV1SVU9BJzBIKQn8yDwjCQ7VNU9VXXZkNd8LfAXVXVnVa1j8IZyTPfYq4HTquqaqvpl99iGvlJV36uq31bVr6vqwqq6qlu+EjiTR79RfLDb9psM3iDO7Nq/FfgOsM+QeiXAwNf88xkGPeA3MmE4Z4LPAv82yXYMwvU7VXX7kNf76YT7vwS2m2K7VwKHAzcn+fskBw55zd2Amycs39ytG3/slgmPTbw/6bok+ye5IMm6JL8A3
gzsusFz7phw/1eTLE+1X9I/M/A1r1TVzQw+vD0cOHuSx28Fvg+8nEGvethwzqa0e2lVHQk8Afgy8IXxhybZ/DbgdyYsL+3WAdwO7DHhsT0na26D5c8B5wB7VtWOwN8A2aQdkEZg4Gs+Og44uBtDn8yngXcDzwJWbW5jSR6b5LVJdqyqB4H1wMPdw3cAuyTZccJTzgTel2SsO430/TzyWcMXgGO7zyG26R7bmO2Bu6vq10n2Y/AXjjTjDHzNO1V1Q1WtHrLJKgY97FVD3hQ21THATUnWMxhSeV1Xy/UMAv7G7oyY3YAPAauBK4GrgMu6dVTV14G/Ai5g8CHx97vX/82Qtv8U+Isk9zJ4g/jCkG2laYsXQNFClOQGBmfVfGuuaxkmydOBq4Gtug+OpTljD18LTpJXMhgHP3+ua5lMkpd3w0Q7Ax8GvmrYaz4w8LWgJLkQOBl4S1X9do7LmcofA+uAGxh8FvAnc1uONOCQjiQ1wh6+JDViycY3mT277rprLVu2bK7LkKQFY82aNXdV1dgo286rwF+2bBmrVw87G0+SNFGSmze+1YBDOpLUCANfkhph4EtSIwx8SWqEgS9JjTDwJakRvQV+kr2TXDHhtj7J2/tqT5I0XG/n4VfVD+kuJ9ddn/RWZmDucknS9MzWkM6LgBu6qxlJkubAbH3T9jUMLiLxKElWACsAli5dOkvlaKHLif1fAbBOcGJBLS699/CTPBY4AvjiZI9X1cqqWl5Vy8fGRpoOQpI0DbMxpHMYcFlV3TELbUmSpjAbgX80UwznSJJmT6+Bn2Qb4MXA2X22I0nauF4/tK2qXwK79NmGJGk0ftNWkhph4EtSIwx8SWqEgS9JjTDwJakRBr4kNcLAl6RGGPiS1AgDX5IaYeBLUiMMfElqhIEvSY0w8CWpEQa+JDXCwJekRhj4ktQIA1+SGmHgS1IjDHxJaoSBL0mN6DXwk+yU5Kwk1ye5LsmBfbYnSZrakp5f/2PAuVV1VJLHAtv03J4kaQq9BX6SHYDnA28EqKoHgAf6ak+SNFyfQzpPAdYBpyW5PMknk2y74UZJViRZnWT1unXreixHktrWZ+AvAfYFTq6qfYD7gfdsuFFVrayq5VW1fGxsrMdyJKltfQb+WmBtVV3cLZ/F4A1AkjQHegv8qvopcEuSvbtVLwKu7as9SdJwfZ+l82fAGd0ZOjcCx/bcniRpCr0GflVdASzvsw1J0mj8pq0kNcLAl6RGGPiS1AgDX5IaYeBLUiMMfElqhIEvSY0w8CWpEQa+JDXCwJekRhj4ktQIA1+SGmHgS1IjDHxJaoSBL0mNMPAlqREGviQ1wsCXpEYY+JLUCANfkhph4EtSI5b0+eJJbgLuBR4GHqqq5X22J0maWq+B33lhVd01C+1IkoZwSEeSGtF34BfwzSRrkqyYbIMkK5KsTrJ63bp1PZcjSe3qO/APqqp9gcOAtyR5/oYbVNXKqlpeVcvHxsZ6LkeS2tVr4FfVbd3PO4FVwH59tidJmlpvgZ9k2yTbj98H/g1wdV/tSZKG6/MsnScCq5KMt/O5qjq3x/YkSUP0FvhVdSPw7L5eX5K0aTwtU5IaYeBLUiM2GvhJtknyn5N8olveK8lL+y9NkjSTRunhnwb8BjiwW14LfKi3iiRJvRgl8J9aVf8NeBCgqn4FpNeqJEkzbpTAfyDJ1gymSSDJUxn0+CVJC8gop2WeAJwL7JnkDOAg4I19FiVJmnkbDfyqOi/JZcABDIZyjne6Y0laeKYM/CT7brDq9u7n0iRLq+qy/sqSJM20YT38jwx5rICDZ7gWSVKPpgz8qnrhbBYiSerXRsfwkzwO+FPgeQx69t8B/qaqft1zbZKkGTTKWTqfZnAh8v/ZLR8NfAZ4VV9FSZJm3iiBv3dVTZz18oIkP+irIElSP0b54tXlSQ4YX0iyP/C9/kqSJPVhlB7+/sDrk/ykW14KXJfkKqCq6l/2Vp0kacaMEviH9l6FJKl3o3zT9uYkz
wb+dbfqO1XlGL4kLTCjzId/PHAG8ITu9tkkf9Z3YZKkmTXKkM5xwP5VdT9Akg8D3+eR0zQlSQvAKGfpBHh4wvLDbMJ8+Em2SHJ5kq9tanGSpJkzSg//NODiJKu65ZcBp2xCG8cD1wE7bGJtkqQZtNEeflV9FDgWuBu4Bzi2qk4a5cWT7AG8BPjk5hQpSdp8owzpAGwD3FtVHwPWJnnyiM87CXg38NupNkiyIsnqJKvXrVs34stKkjbVKGfpnAD8J+C93aotgc+O8LyXAndW1Zph21XVyqpaXlXLx8bGRihZkjQdo/TwXw4cAdwPUFW3AduP8LyDgCOS3AR8Hjg4yUbfKCRJ/RjpIuZVVTxyEfNtR3nhqnpvVe1RVcuA1wDnV9Xrpl2pJGmzjBL4X0jyv4Gdkvx74FvAJ/otS5I000aZWuEvk7wYWA/8LvD+qjpvUxqpqguBC6dToCRpZoxyHj7AVcDWDIZ1ruqvHElSX0Y5S+dNwCXAK4CjgIuS/FHfhUmSZtYoPfx3AftU1c8AkuwC/F/g1D4LkyTNrFE+tF3L4Jq24+4FbumnHElSX0bp4d/KYC6drzAYwz8SuCTJO+Cfp16QJM1zowT+Dd1t3Fe6n6N8+UqSNE+MclrmibNRiCSpX6NOniZJWuAMfElqxJSB313KkCSvmr1yJEl9GdbDPzzJljwyLbIkaQEb9qHtucBdwLZJ1jO4jm2N/6wqL1koSQvIlD38qnpXVe0I/G1V7VBV20/8OYs1SpJmwCinZR6Z5InAc7tVF1eV1yKUpAVmlMnTXsVg8rRXAa9m8C3bo/ouTJI0s0b5pu37gOdW1Z0AScYYXATlrD4LkyTNrFHOw3/MeNh3fjbi8yRJ88goPfxzk3wDOLNb/kPg7/orSZLUh1E+tH1XklcAz2NwSubKqlrVe2WSpBk10iUOq+ps4Oyea5Ek9cixeElqRG+Bn+RxSS5J8oMk1yRxmmVJmkMjDelM02+Ag6vqvm5Onu8m+XpVXdRjm5KkKUyrh5/kAxvbpgbu6xa37G41nfYkSZtvuj38NaNslGSLbtunAR+vqosn2WYFsAJg6dKl0ywHcmKm/dxR1Qm+X0lauKbVw6+qr4643cNV9RxgD2C/JM+cZJuVVbW8qpaPjY1NpxxJ0ghGmUtnjySrkqxLckeSLyXZY1MaqaqfAxcCh06zTknSZhqlh38acA7wJGB34KvduqGSjCXZqbu/NXAIcP30S5UkbY5RAn+sqk6rqoe62+nAKGMvTwIuSHIlcClwXlV9bTNqlSRthlE+tL0ryet4ZC6doxlMoDZUVV0J7LMZtUmSZtAoPfw/YjAP/k+B24GjunWSpAVklMnTfgIcMQu1SJJ6NGXgJ3n/kOdVVX2wh3okST0Z1sO/f5J12wLHAbsABr4kLSBTBn5VfWT8fpLtgeOBY4HPAx+Z6nmSpPlp6Bh+kscD7wBeC3wK2Leq7pmNwiRJM2vYGP5/B14BrASeNWEiNEnSAjTstMx3ArsB7wNuS7K+u92bZP3slCdJminDxvC9GpYkLSKGuiQ1wsCXpEYY+JLUCANfkhph4EtSIwx8SWqEgS9JjTDwJakRBr4kNcLAl6RGGPiS1IjeAj/JnkkuSHJdkmuSHN9XW5KkjdvoNW03w0PAO6vqsu4CKmuSnFdV1/bYpiRpCr318Kvq9qq6rLt/L3AdsHtf7UmShpuVMfwky4B9gItnoz1J0qP1OaQDQJLtgC8Bb6+qR104JckKYAXA0qVL+y6nFzkxvbdRJ5RtzxPud3/m434vJr328JNsySDsz6iqsyfbpqpWVtXyqlo+NjbWZzmS1LQ+z9IJcApwXVV9tK92JEmj6bOHfxBwDHBwkiu62+E9tidJGqK3Mfyq+i7Q/6CfJGkkftNWkhph4EtSIwx8SWqEgS9JjTDwJakRBr4kNcLAl6RGGPiS1AgDX5IaYeBLUiMMfElqhIEvSY0w8CWpEQa+JDXCwJekRhj4ktQIA1+SG
mHgS1IjDHxJaoSBL0mNMPAlqRG9BX6SU5PcmeTqvtqQJI2uzx7+6cChPb6+JGkT9Bb4VfUPwN19vb4kadMsmesCkqwAVgAsXbp0jquR5recmN7bqBOq9zYWksX0O5/zD22ramVVLa+q5WNjY3NdjiQtWnMe+JKk2WHgS1Ij+jwt80zg+8DeSdYmOa6vtiRJG9fbh7ZVdXRfry1J2nQO6UhSIwx8SWqEgS9JjTDwJakRBr4kNcLAl6RGGPiS1AgDX5IaYeBLUiMMfElqhIEvSY0w8CWpEQa+JDXCwJekRhj4ktQIA1+SGmHgS1IjDHxJaoSBL0mNMPAlqREGviQ1otfAT3Jokh8m+VGS9/TZliRpuN4CP8kWwMeBw4BnAEcneUZf7UmShuuzh78f8KOqurGqHgA+DxzZY3uSpCFSVf28cHIUcGhVvalbPgbYv6reusF2K4AV3eLewA83oZldgbtmoNyFxv1ui/vdlk3d79+pqrFRNlwyvXpGkknWPerdpapWAiun1UCyuqqWT+e5C5n73Rb3uy197nefQzprgT0nLO8B3NZje5KkIfoM/EuBvZI8OcljgdcA5/TYniRpiN6GdKrqoSRvBb4BbAGcWlXXzHAz0xoKWgTc77a4323pbb97+9BWkjS/+E1bSWqEgS9JjViQgd/KlA1J9kxyQZLrklyT5Phu/eOTnJfkn7qfO891rX1IskWSy5N8rVt+cpKLu/3+P93JAItKkp2SnJXk+u64H9jQ8f4P3b/zq5OcmeRxi/GYJzk1yZ1Jrp6wbtJjnIG/6rLuyiT7bk7bCy7wG5uy4SHgnVX1dOAA4C3dvr4H+HZV7QV8u1tejI4Hrpuw/GHgf3T7fQ9w3JxU1a+PAedW1e8Bz2aw/4v+eCfZHXgbsLyqnsngRI/XsDiP+enAoRusm+oYHwbs1d1WACdvTsMLLvBpaMqGqrq9qi7r7t/L4D//7gz291PdZp8CXjY3FfYnyR7AS4BPdssBDgbO6jZZdPudZAfg+cApAFX1QFX9nAaOd2cJsHWSJcA2wO0swmNeVf8A3L3B6qmO8ZHAp2vgImCnJE+abtsLMfB3B26ZsLy2W7eoJVkG7ANcDDyxqm6HwZsC8IS5q6w3JwHvBn7bLe8C/LyqHuqWF+NxfwqwDjitG8r6ZJJtaeB4V9WtwF8CP2EQ9L8A1rD4j/m4qY7xjObdQgz8kaZsWEySbAd8CXh7Va2f63r6luSlwJ1VtWbi6kk2XWzHfQmwL3ByVe0D3M8iHL6ZTDdmfSTwZGA3YFsGwxkbWmzHfGNm9N/9Qgz8pqZsSLIlg7A/o6rO7lbfMf5nXffzzrmqrycHAUckuYnBkN3BDHr8O3V/7sPiPO5rgbVVdXG3fBaDN4DFfrwBDgF+XFXrqupB4GzgX7H4j/m4qY7xjObdQgz8ZqZs6MatTwGuq6qPTnjoHOAN3f03AF+Z7dr6VFXvrao9qmoZg+N7flW9FrgAOKrbbDHu90+BW5Ls3a16EXAti/x4d34CHJBkm+7f/fi+L+pjPsFUx/gc4PXd2ToHAL8YH/qZlqpacDfgcOAfgRuAP5/renrcz+cx+PPtSuCK7nY4g/HsbwP/1P18/FzX2uPv4AXA17r7TwEuAX4EfBHYaq7r62F/nwOs7o75l4GdWznewInA9cDVwGeArRbjMQfOZPA5xYMMevDHTXWMGQzpfLzLuqsYnMU07badWkGSGrEQh3QkSdNg4EtSIwx8SWqEgS9JjTDwJakRBr4kNcLAl6RGGPgSkOTLSdZ087Gv6NYdl+Qfk1yY5BNJ/rpbP5bkS0ku7W4HzW310mj84pXE4AIUVXV3kq0ZTN/xB8D3GMxlcy9wPvCDqnprks8B/6uqvptkKfCNGlyzQJrXlmx8E6kJb0vy8u7+nsAxwN9X1d0ASb4I/G73+CHAMwZTvgCwQ5Lta3DNAmneMvDVvCQvYBDiB1bVL5NcCPwQmKrX/phu21/NToXSzHAMX4Idg
Xu6sP89BpeT3Ab4/SQ7d9PzvnLC9t8E3jq+kOQ5s1qtNE0GvgTnAkuSXAl8ELgIuBX4rwyuMPYtBlP1/qLb/m3A8u6i0tcCb579kqVN54e20hSSbFdV93U9/FXAqVW1aq7rkqbLHr40tQ8kuYLB/Ow/ZjA/vbRg2cOXpEbYw5ekRhj4ktQIA1+SGmHgS1IjDHxJasT/A1BvsrGjWAfuAAAAAElFTkSuQmCC\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "import matplotlib.pyplot as plt\n", "\n", "# Raw observations: one age per person. plt.hist() derives the per-bin\n", "# frequencies from these values.\n", "ages = [2, 5, 70, 40, 30, 45, 50, 45, 43, 40, 44,\n", "        60, 7, 13, 57, 18, 90, 77, 32, 21, 20, 40]\n", "\n", "# Histogram span and number of equal-width intervals. The names avoid\n", "# `range`: assigning to it rebinds the builtin for the whole kernel session,\n", "# so any later range(...) call would fail with a TypeError.\n", "age_span = (0, 100)\n", "n_bins = 10\n", "\n", "# Draw the histogram; bins/range are passed by keyword so the call does not\n", "# rely on positional argument order.\n", "plt.hist(ages, bins=n_bins, range=age_span, color='green',\n", "         histtype='bar', rwidth=0.8)\n", "\n", "# x-axis label\n", "plt.xlabel('age')\n", "# frequency (y-axis) label\n", "plt.ylabel('No. of people')\n", "# plot title\n", "plt.title('My histogram')\n", "\n", "# render the figure\n", "plt.show()\n" ] }, { "cell_type": "code", "execution_count": 31, "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "import matplotlib.pyplot as plt\n", "\n", "# Sample data: the integers 1..10 and their squares.\n", "x = [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]\n", "y = [value * value for value in x]\n", "\n", "# Draw on an explicit Axes rather than the implicit pyplot state machine.\n", "fig, ax = plt.subplots()\n", "ax.scatter(x, y, s=30, marker='o', color='green', label='stars')\n", "\n", "# Axis labels, title and legend.\n", "ax.set_xlabel('x - axis')\n", "ax.set_ylabel('y - axis')\n", "ax.set_title('My scatter plot!')\n", "ax.legend()\n", "\n", "# Render the figure.\n", "plt.show()\n" ] }, { "cell_type": "code", "execution_count": 33, "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "import matplotlib.pyplot as plt\n", "\n", "# Wedge labels, their relative sizes, and one matplotlib colour code per wedge.\n", "activities = ['php', 'java', 'python', 'c']\n", "slices = [3, 7, 8, 6]\n", "colors = ['r', 'y', 'g', 'b']\n", "\n", "# Styling for the whole chart; the third wedge ('python') is offset from the\n", "# centre via `explode`, and each wedge is annotated with its percentage.\n", "pie_options = {\n", "    'startangle': 90,\n", "    'shadow': True,\n", "    'explode': (0, 0, 0.1, 0),\n", "    'radius': 1.2,\n", "    'autopct': '%1.1f%%',\n", "}\n", "\n", "# Draw the pie on an explicit Axes, then attach the legend.\n", "fig, ax = plt.subplots()\n", "ax.pie(slices, labels=activities, colors=colors, **pie_options)\n", "ax.legend()\n", "\n", "# Render the figure.\n", "plt.show()\n" ] }, { "cell_type": "code", "execution_count": 34, "metadata": { "scrolled": true }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
mpgcylindersdisplacementhorsepowerweightaccelerationmodel yearorigincar name
018.08307.0130.0350412.0701chevrolet chevelle malibu
115.08350.0165.0369311.5701buick skylark 320
218.08318.0150.0343611.0701plymouth satellite
316.08304.0150.0343312.0701amc rebel sst
417.08302.0140.0344910.5701ford torino
\n", "
" ], "text/plain": [ " mpg cylinders displacement horsepower weight acceleration \\\n", "0 18.0 8 307.0 130.0 3504 12.0 \n", "1 15.0 8 350.0 165.0 3693 11.5 \n", "2 18.0 8 318.0 150.0 3436 11.0 \n", "3 16.0 8 304.0 150.0 3433 12.0 \n", "4 17.0 8 302.0 140.0 3449 10.5 \n", "\n", " model year origin car name \n", "0 70 1 chevrolet chevelle malibu \n", "1 70 1 buick skylark 320 \n", "2 70 1 plymouth satellite \n", "3 70 1 amc rebel sst \n", "4 70 1 ford torino " ] }, "execution_count": 34, "metadata": {}, "output_type": "execute_result" } ], "source": [ "data = pd.read_csv(\"auto-mpg.csv\")\n", "data.head()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Group by in Data frame" ] }, { "cell_type": "code", "execution_count": 50, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/anaconda3/lib/python3.7/site-packages/matplotlib/axes/_base.py:239: FutureWarning: Support for multi-dimensional indexing (e.g. `obj[:, None]`) is deprecated and will be removed in a future version. Convert to a numpy array before indexing instead.\n", " y = y[:, np.newaxis]\n" ] }, { "data": { "text/plain": [ "[]" ] }, "execution_count": 50, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "x=data.groupby(\"cylinders\")['horsepower'].mean()\n", "y=set(data['cylinders'])\n", "y=list(y)\n", "plt.plot(y, x, color='green', linestyle='dashed', linewidth = 3,marker='o', markerfacecolor='red', markersize=12)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Filtering a Data Frame" ] }, { "cell_type": "code", "execution_count": 54, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 54, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXoAAAD8CAYAAAB5Pm/hAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDMuMC4zLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvnQurowAAD1tJREFUeJzt3X+s3Xddx/Hny3UMI+g2ejeb/fAOUiODSFnqMkWSyYzbitqhjGxR1hBI/bEZiBrtNAH8g4R/AIORkSJzRWA/lB9r2ECXAoJ/bNCNMTrLXIHJSpu1gAwMitl4+8f5XHq43N57e+4953SfPh/Jyfl+P9/POd93v/eT1/mez/me01QVkqR+/di0C5AkjZdBL0mdM+glqXMGvSR1zqCXpM4Z9JLUOYNekjpn0EtS5wx6SercmmkXALB27dqanZ2ddhmS9JRy7733fr2qZpbqd1wE/ezsLLt37552GZL0lJLkP5fTz6kbSeqcQS9JnTPoJalzBr0kdc6gl6TOGfSS1DmDXpI6Z9BLUucMeknqnEEvaUmz2+6YdglaAYNekjpn0EtS5wx6SeqcQS9JUzKpzz4MeknqnEEvSZ0z6CWpcwa9JHXOoJekCZv0F9AMeknqnEEvSZ0z6CWpcwa9dAz8ca8TSy9/b4Nekjpn0EtS5wx6SeqcQS9JnTPotWy9fDAlnWgMeknqnEEvqUu+Az3CoJekzhn0ktS5JYM+yTlJPpFkb5IHk7y2tZ+e5K4kD7f701p7krw9yb4kDyS5YNz/CEnS0S3njP4J4E+q6rnARcC1Sc4HtgG7qmo9sKutA1wOrG+3rcANq161JGnZlgz6qjpYVfe15e8Ae4GzgM3AjtZtB3BFW94MvKcG7gZOTbJu1SuXJC3LMc3RJ5kFXgjcA5xZVQdh8GIAnNG6nQU8OvSw/a1NkjQFyw76JM8APgC8rqq+vVjXBdpqgefbmmR3kt2HDx9ebhkawey2O7zUTDqBLSvok5zMIOTfV1UfbM2PzU3JtPtDrX0/cM7Qw88GDsx/zqraXlUbq2rjzMzMqPVLkpawnKtuArwb2FtVbx3atBPY0pa3ALcPtV/Trr65CHh8bopHkjR5a5bR50XAK4EvJLm/tf0F8GbgtiSvBr4KXNm23QlsAvYB3wVetaoVS5KOyZJBX1X/xsLz7gCXLNC/gGtXWJckaZX4zVhJ6pxB3yGvsJE0zKCXpM4Z9JLUOYNeOgH4pbkTm0EvSZ0z6CWpcwa9JHXOoJekzhn0ktQ5g16SOmfQS1LnDHpJ6pxBrxNKb18c6unfovEx6CWpcwa9JHXOoJekzhn0ktQ5g16SOmfQS1LnDHpJ6pxBL0mdM+glqXMGvSR1
zqCXpM4Z9JLUOYNekjpn0EtS5wx6SeqcQS9JnTPoJalzBr2ecvxflaRjY9BLUucMep2QfFegE4lBL0mdM+glqXNLBn2SG5McSrJnqO2NSb6W5P522zS07fok+5I8lOTScRUuSVqe5ZzR3wRctkD726pqQ7vdCZDkfOAq4HntMe9IctJqFStJOnZLBn1VfQr45jKfbzNwS1V9r6q+AuwDLlxBfZKkFVrJHP11SR5oUzuntbazgEeH+uxvbZKkKRk16G8AngNsAA4Cb2ntWaBvLfQESbYm2Z1k9+HDh0csQ5K0lJGCvqoeq6onq+r7wLs4Mj2zHzhnqOvZwIGjPMf2qtpYVRtnZmZGKUOStAwjBX2SdUOrLwPmrsjZCVyV5JQk5wHrgc+srERJ0kqsWapDkpuBi4G1SfYDbwAuTrKBwbTMI8DvAVTVg0luA/4deAK4tqqeHE/pkqTlWDLoq+rqBZrfvUj/NwFvWklRWrm5r/g/8uaXTrkSSdPmN2MlqXMGvSR1zqCXpM4Z9JLUOYO+E/6+uqSjMeglqXMGvSR1zqCXpM4Z9JLUOYNekjpn0EtS5wx6SeqcQS9JnTPoJalzBr0kdc6gl6TOGfSS1LkTKuhnt93hj39JOuGcUEEvSScig16SOmfQS1LnDHpJ6pxBL0mdM+glqXMGvSR1zqCXpM4Z9JLUOYNekjpn0EtS5wx6SeqcQS9JnXvKB/38X6T01ykl6Yc95YNekrQ4g16SOmfQS1LnDHpJ6tySQZ/kxiSHkuwZajs9yV1JHm73p7X2JHl7kn1JHkhywTiLlyQtbTln9DcBl81r2wbsqqr1wK62DnA5sL7dtgI3rE6ZkqRRLRn0VfUp4JvzmjcDO9ryDuCKofb31MDdwKlJ1q1WsZKkYzfqHP2ZVXUQoN2f0drPAh4d6re/tUmSpmS1P4zNAm21YMdka5LdSXYfPnx4lcuQJM0ZNegfm5uSafeHWvt+4JyhfmcDBxZ6gqraXlUbq2rjzMzMiGVIkpYyatDvBLa05S3A7UPt17Srby4CHp+b4pEkTceapTokuRm4GFibZD/wBuDNwG1JXg18Fbiydb8T2ATsA74LvGoMNUuSjsGSQV9VVx9l0yUL9C3g2pUWJUlaPX4zVpI6Z9BLUucMeknqnEEvSZ0z6CWpcwa9JHXOoJekzhn0ktQ5g16SOmfQS1LnDHpJ6pxBL0mdM+glqXMGvSR1zqCXpM4Z9JLUOYNekjpn0EtS5wx6SeqcQS9JnTPoJalzBr0kdc6gl6TOGfSS1DmDXpI6Z9BLUucMeknqnEEvSZ0z6CWpcwa9JHXOoJekzhn0ktQ5g16SOmfQS1LnDHpJ6pxBL0mdW7OSByd5BPgO8CTwRFVtTHI6cCswCzwCvKKq/mtlZUqSRrUaZ/S/UlUbqmpjW98G7Kqq9cCuti5JmpJxTN1sBna05R3AFWPYhyRpmVYa9AX8S5J7k2xtbWdW1UGAdn/GCvchSVqBFc3RAy+qqgNJzgDuSvLF5T6wvTBsBTj33HNXWIYk6WhWdEZfVQfa/SHgQ8CFwGNJ1gG0+0NHeez2qtpYVRtnZmZWUoYkaREjB32Sn0jyzLll4NeAPcBOYEvrtgW4faVFSpJGt5KpmzOBDyWZe573V9XHknwWuC3Jq4GvAleuvExJ0qhGDvqq+jLwggXavwFcspKiJEmrx2/GSlLnDHpJ6pxBL0mdM+glqXMGvSR1zqCXpM4Z9JLUOYNekjpn0EtS5wx6SeqcQS9JnTPoJalzBr0kdc6gl6TOGfSS1DmDXpI6Z9BLUucMeknqnEEvSZ0z6CWpcwa9JHXOoJekzhn0ktQ5g16SOmfQS1LnDHpJ6pxBL0mdM+glqXMGvSR1zqCXpM4Z9JLUOYNekjpn0EtS5wx6SeqcQS9JnTPoJalzYwv6JJcleSjJviTbxrUfSdLixhL0SU4C/ha4HDgfuDrJ+ePYlyRpceM6o78Q2FdVX66q/wNuATaPaV+SpEWM
K+jPAh4dWt/f2iRJE5aqWv0nTa4ELq2q17T1VwIXVtUfDfXZCmxtq88H9qx6IatjLfD1aRdxFNY2GmsbjbUdu3HX9TNVNbNUpzVj2vl+4Jyh9bOBA8Mdqmo7sB0gye6q2jimWlbE2kZjbaOxttEcr7UdL3WNa+rms8D6JOcleRpwFbBzTPuSJC1iLGf0VfVEkuuAfwZOAm6sqgfHsS9J0uLGNXVDVd0J3LnM7tvHVccqsLbRWNtorG00x2ttx0VdY/kwVpJ0/PAnECSpcxMJ+iTnJPlEkr1JHkzy2tb+xiRfS3J/u20aesz17ecTHkpy6RRqu3WorkeS3N/aZ5P8z9C2d46xtqcn+UySz7fa/qq1n5fkniQPtzqf1tpPaev72vbZCdf1vvb32pPkxiQnt/aLkzw+dMxeP466lqjtpiRfGaphQ2tPkre3Y/ZAkgumUNunh+o6kOTDrX1ix22oxpOSfC7JR9r6VMfaInVNfawtUtvUx9qPqKqx34B1wAVt+ZnAfzD4aYQ3An+6QP/zgc8DpwDnAV8CTppkbfP6vAV4fVueBfZM6LgFeEZbPhm4B7gIuA24qrW/E/iDtvyHwDvb8lXArROua1PbFuDmobouBj4y5WN2E/DyBfpvAj7aHncRcM+ka5vX5wPANZM+bkP7/2Pg/XP7nfZYW6SuqY+1RWqb+libf5vIGX1VHayq+9ryd4C9LP5N2c3ALVX1var6CrCPwc8qTLy2JAFewWAwTVQN/HdbPbndCngJ8E+tfQdwRVve3NZp2y9p9U+krqq6s20r4DMMvj8xUYscs6PZDLynPe5u4NQk66ZRW5JnMvjbfngc+19KkrOBlwJ/19bDlMfaQnXB4GKPaY+1o9W2iImNtfkmPkff3uK9kMHZDMB17W3MjUlOa21T+QmFBWoDeDHwWFU9PNR2Xnur9q9JXjzmmk7KYNroEHAXg3c336qqJ1qX4WPzg+PWtj8OPGsSdVXVPUPbTgZeCXxs6CG/2KYsPprkeeOoaRm1vamNtbclOaW1TXSsLXbcgJcBu6rq20NtEztuwF8DfwZ8v60/i+NgrC1Q1w9Me6wtUtvUx9qwiQZ9kmcweGv6ujaYbwCeA2wADjKYIoHBW5v5xnp50AK1zbmaHz6bPwicW1UvpL1lS/KT46qrqp6sqg0MzlguBJ67ULd2P7HjNr+uJM8f2vwO4FNV9em2fh+Dr2q/APgbxnzGepTargd+DvgF4HTgz1v3iY61JY7b/LE2seOW5NeBQ1V173DzAl0nOtaOUtewqY21RWo7LsbasIkFfXvl/QDwvqr6IEBVPdYG/veBd3FkembJn1AYd22tfQ3wW8Ctc21tOukbbfleBmfYPzuu2ob2+y3gkwzm9k5ttcEPH5sfHLe2/aeAb06orsvaft8AzDB4EZzr8+25KYsafL/i5CRrx1nX/NraFF1V1feAv2dKY22h2gCSPKvVdMdQn0ketxcBv5nkEQa/NvsSBmer0x5rP1JXkve2/U57rC1Y2/E21mByV90EeDewt6reOtQ+PD/1Mo78sNlO4Kr2yf55wHoG83ATq635VeCLVbV/qP9MBr+3T5Jnt9q+PKbaZpKc2pZ/vNWzF/gE8PLWbQtwe1ve2dZp2z/e5jAnUdcXk7wGuBS4ur14z/X/6bn52yQXMhh331jtupaobV1rC4N55uGxdk27IuIi4PGqOjjJ2trmKxl8mPe/Q/0ndtyq6vqqOruqZhl8uPrxqvodpjzWjlLX7x4PY22R2qY+1hYqdhKfSv8yg7coDwD3t9sm4B+AL7T2ncC6ocf8JYOz5YeAyyddWx359Pz35/X/beBBBlcF3Qf8xhhr+3ngc622PRy58ufZDF749gH/CJzS2p/e1ve17c+ecF1PtL/Z3HGca79u6JjdDfzSFI7Zx9tY2wO8lyNXv4TBf5LzpbZ946Rra9s+yeCdx3D/iR23efu9mCNXkEx1rC1S19TH2iK1TX2szb/5zVhJ6pzf
jJWkzhn0ktQ5g16SOmfQS1LnDHpJ6pxBL0mdM+glqXMGvSR17v8B1vJdBEr84DAAAAAASUVORK5CYII=\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "# Keep only the 8-cylinder cars. The boolean mask is evaluated once and the\n", "# filtered frame reused, so both series come from exactly the same rows.\n", "eight_cyl = data[data['cylinders'] == 8]\n", "x = eight_cyl['displacement']\n", "y = eight_cyl['horsepower']\n", "\n", "# One bar per row: displacement on the x-axis, horsepower as the bar height.\n", "plt.bar(x, y)\n", "plt.xlabel('displacement')\n", "plt.ylabel('horsepower')\n", "plt.title('Horsepower vs. displacement (8-cylinder cars)')\n", "\n", "# plt.show() renders the figure and keeps the BarContainer repr out of the\n", "# cell output.\n", "plt.show()" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "colab": { "collapsed_sections": [], "name": "DS_PRAC-2_18it089.ipynb", "provenance": [] }, "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.7.3" } }, "nbformat": 4, "nbformat_minor": 1 }