{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Exercise 13\n", "\n", "This particular Automobile Data Set includes a good mix of categorical values as well as continuous values and serves as a useful example that is relatively easy to understand. Because domain understanding is an important aspect of deciding how to encode categorical values, this data set makes a good case study." ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Read the data into Pandas" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | symboling | \n", "normalized_losses | \n", "make | \n", "fuel_type | \n", "aspiration | \n", "num_doors | \n", "body_style | \n", "drive_wheels | \n", "engine_location | \n", "wheel_base | \n", "... | \n", "engine_size | \n", "fuel_system | \n", "bore | \n", "stroke | \n", "compression_ratio | \n", "horsepower | \n", "peak_rpm | \n", "city_mpg | \n", "highway_mpg | \n", "price | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "3 | \n", "NaN | \n", "alfa-romero | \n", "gas | \n", "std | \n", "two | \n", "convertible | \n", "rwd | \n", "front | \n", "88.6 | \n", "... | \n", "130 | \n", "mpfi | \n", "3.47 | \n", "2.68 | \n", "9.0 | \n", "111.0 | \n", "5000.0 | \n", "21 | \n", "27 | \n", "13495.0 | \n", "
1 | \n", "3 | \n", "NaN | \n", "alfa-romero | \n", "gas | \n", "std | \n", "two | \n", "convertible | \n", "rwd | \n", "front | \n", "88.6 | \n", "... | \n", "130 | \n", "mpfi | \n", "3.47 | \n", "2.68 | \n", "9.0 | \n", "111.0 | \n", "5000.0 | \n", "21 | \n", "27 | \n", "16500.0 | \n", "
2 | \n", "1 | \n", "NaN | \n", "alfa-romero | \n", "gas | \n", "std | \n", "two | \n", "hatchback | \n", "rwd | \n", "front | \n", "94.5 | \n", "... | \n", "152 | \n", "mpfi | \n", "2.68 | \n", "3.47 | \n", "9.0 | \n", "154.0 | \n", "5000.0 | \n", "19 | \n", "26 | \n", "16500.0 | \n", "
3 | \n", "2 | \n", "164.0 | \n", "audi | \n", "gas | \n", "std | \n", "four | \n", "sedan | \n", "fwd | \n", "front | \n", "99.8 | \n", "... | \n", "109 | \n", "mpfi | \n", "3.19 | \n", "3.40 | \n", "10.0 | \n", "102.0 | \n", "5500.0 | \n", "24 | \n", "30 | \n", "13950.0 | \n", "
4 | \n", "2 | \n", "164.0 | \n", "audi | \n", "gas | \n", "std | \n", "four | \n", "sedan | \n", "4wd | \n", "front | \n", "99.4 | \n", "... | \n", "136 | \n", "mpfi | \n", "3.19 | \n", "3.40 | \n", "8.0 | \n", "115.0 | \n", "5500.0 | \n", "18 | \n", "22 | \n", "17450.0 | \n", "
5 rows × 26 columns
\n", "\n", " | make | \n", "fuel_type | \n", "aspiration | \n", "num_doors | \n", "body_style | \n", "drive_wheels | \n", "engine_location | \n", "engine_type | \n", "num_cylinders | \n", "fuel_system | \n", "
---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "alfa-romero | \n", "gas | \n", "std | \n", "two | \n", "convertible | \n", "rwd | \n", "front | \n", "dohc | \n", "four | \n", "mpfi | \n", "
1 | \n", "alfa-romero | \n", "gas | \n", "std | \n", "two | \n", "convertible | \n", "rwd | \n", "front | \n", "dohc | \n", "four | \n", "mpfi | \n", "
2 | \n", "alfa-romero | \n", "gas | \n", "std | \n", "two | \n", "hatchback | \n", "rwd | \n", "front | \n", "ohcv | \n", "six | \n", "mpfi | \n", "
3 | \n", "audi | \n", "gas | \n", "std | \n", "four | \n", "sedan | \n", "fwd | \n", "front | \n", "ohc | \n", "four | \n", "mpfi | \n", "
4 | \n", "audi | \n", "gas | \n", "std | \n", "four | \n", "sedan | \n", "4wd | \n", "front | \n", "ohc | \n", "five | \n", "mpfi | \n", "