{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "\n", "import matplotlib.pyplot as plt\n", "\n", "from sklearn.model_selection import train_test_split\n", "from sklearn.feature_selection import (\n", " f_regression,\n", " SelectKBest,\n", " SelectFromModel,\n", ")\n", "\n", "from sklearn.linear_model import Lasso\n", "\n", "from feature_engine.wrappers import SklearnTransformerWrapper" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | Id | \n", "MSSubClass | \n", "MSZoning | \n", "LotFrontage | \n", "LotArea | \n", "Street | \n", "Alley | \n", "LotShape | \n", "LandContour | \n", "Utilities | \n", "... | \n", "PoolArea | \n", "PoolQC | \n", "Fence | \n", "MiscFeature | \n", "MiscVal | \n", "MoSold | \n", "YrSold | \n", "SaleType | \n", "SaleCondition | \n", "SalePrice | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1 | \n", "60 | \n", "RL | \n", "65.0 | \n", "8450 | \n", "Pave | \n", "NaN | \n", "Reg | \n", "Lvl | \n", "AllPub | \n", "... | \n", "0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0 | \n", "2 | \n", "2008 | \n", "WD | \n", "Normal | \n", "208500 | \n", "
1 | \n", "2 | \n", "20 | \n", "RL | \n", "80.0 | \n", "9600 | \n", "Pave | \n", "NaN | \n", "Reg | \n", "Lvl | \n", "AllPub | \n", "... | \n", "0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0 | \n", "5 | \n", "2007 | \n", "WD | \n", "Normal | \n", "181500 | \n", "
2 | \n", "3 | \n", "60 | \n", "RL | \n", "68.0 | \n", "11250 | \n", "Pave | \n", "NaN | \n", "IR1 | \n", "Lvl | \n", "AllPub | \n", "... | \n", "0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0 | \n", "9 | \n", "2008 | \n", "WD | \n", "Normal | \n", "223500 | \n", "
3 | \n", "4 | \n", "70 | \n", "RL | \n", "60.0 | \n", "9550 | \n", "Pave | \n", "NaN | \n", "IR1 | \n", "Lvl | \n", "AllPub | \n", "... | \n", "0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0 | \n", "2 | \n", "2006 | \n", "WD | \n", "Abnorml | \n", "140000 | \n", "
4 | \n", "5 | \n", "60 | \n", "RL | \n", "84.0 | \n", "14260 | \n", "Pave | \n", "NaN | \n", "IR1 | \n", "Lvl | \n", "AllPub | \n", "... | \n", "0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0 | \n", "12 | \n", "2008 | \n", "WD | \n", "Normal | \n", "250000 | \n", "
5 rows × 81 columns
\n", "\n", " | LotArea | \n", "Neighborhood | \n", "HouseStyle | \n", "MasVnrArea | \n", "ExterQual | \n", "MSZoning | \n", "Street | \n", "Alley | \n", "LotShape | \n", "LandContour | \n", "... | \n", "GarageType | \n", "GarageFinish | \n", "GarageQual | \n", "GarageCond | \n", "PavedDrive | \n", "PoolQC | \n", "Fence | \n", "MiscFeature | \n", "SaleType | \n", "SaleCondition | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
529 | \n", "32668 | \n", "Crawfor | \n", "1Story | \n", "0.0 | \n", "Gd | \n", "RL | \n", "Pave | \n", "0 | \n", "IR1 | \n", "Lvl | \n", "... | \n", "Attchd | \n", "RFn | \n", "TA | \n", "TA | \n", "Y | \n", "0 | \n", "0 | \n", "0 | \n", "WD | \n", "Alloca | \n", "
491 | \n", "9490 | \n", "NAmes | \n", "1.5Fin | \n", "0.0 | \n", "TA | \n", "RL | \n", "Pave | \n", "0 | \n", "Reg | \n", "Lvl | \n", "... | \n", "Attchd | \n", "Unf | \n", "TA | \n", "TA | \n", "Y | \n", "0 | \n", "MnPrv | \n", "0 | \n", "WD | \n", "Normal | \n", "
459 | \n", "7015 | \n", "BrkSide | \n", "1.5Fin | \n", "161.0 | \n", "TA | \n", "RL | \n", "Pave | \n", "0 | \n", "IR1 | \n", "Bnk | \n", "... | \n", "Detchd | \n", "Unf | \n", "TA | \n", "TA | \n", "Y | \n", "0 | \n", "0 | \n", "0 | \n", "WD | \n", "Normal | \n", "
279 | \n", "10005 | \n", "ClearCr | \n", "2Story | \n", "299.0 | \n", "TA | \n", "RL | \n", "Pave | \n", "0 | \n", "Reg | \n", "Lvl | \n", "... | \n", "Attchd | \n", "Fin | \n", "TA | \n", "TA | \n", "Y | \n", "0 | \n", "0 | \n", "0 | \n", "WD | \n", "Normal | \n", "
655 | \n", "1680 | \n", "BrDale | \n", "2Story | \n", "381.0 | \n", "TA | \n", "RM | \n", "Pave | \n", "0 | \n", "Reg | \n", "Lvl | \n", "... | \n", "Detchd | \n", "Unf | \n", "TA | \n", "TA | \n", "Y | \n", "0 | \n", "0 | \n", "0 | \n", "WD | \n", "Family | \n", "
5 rows × 48 columns
\n", "\n", " | MSSubClass | \n", "MSZoning | \n", "LotFrontage | \n", "LotArea | \n", "Alley | \n", "LotShape | \n", "LandContour | \n", "Utilities | \n", "LotConfig | \n", "LandSlope | \n", "... | \n", "GarageType | \n", "GarageFinish | \n", "GarageQual | \n", "GarageCond | \n", "PavedDrive | \n", "PoolQC | \n", "Fence | \n", "MiscFeature | \n", "SaleType | \n", "SaleCondition | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
529 | \n", "20 | \n", "RL | \n", "0.0 | \n", "32668 | \n", "0 | \n", "IR1 | \n", "Lvl | \n", "AllPub | \n", "CulDSac | \n", "Gtl | \n", "... | \n", "Attchd | \n", "RFn | \n", "TA | \n", "TA | \n", "Y | \n", "0 | \n", "0 | \n", "0 | \n", "WD | \n", "Alloca | \n", "
491 | \n", "50 | \n", "RL | \n", "79.0 | \n", "9490 | \n", "0 | \n", "Reg | \n", "Lvl | \n", "AllPub | \n", "Inside | \n", "Gtl | \n", "... | \n", "Attchd | \n", "Unf | \n", "TA | \n", "TA | \n", "Y | \n", "0 | \n", "MnPrv | \n", "0 | \n", "WD | \n", "Normal | \n", "
459 | \n", "50 | \n", "RL | \n", "0.0 | \n", "7015 | \n", "0 | \n", "IR1 | \n", "Bnk | \n", "AllPub | \n", "Corner | \n", "Gtl | \n", "... | \n", "Detchd | \n", "Unf | \n", "TA | \n", "TA | \n", "Y | \n", "0 | \n", "0 | \n", "0 | \n", "WD | \n", "Normal | \n", "
279 | \n", "60 | \n", "RL | \n", "83.0 | \n", "10005 | \n", "0 | \n", "Reg | \n", "Lvl | \n", "AllPub | \n", "Inside | \n", "Gtl | \n", "... | \n", "Attchd | \n", "Fin | \n", "TA | \n", "TA | \n", "Y | \n", "0 | \n", "0 | \n", "0 | \n", "WD | \n", "Normal | \n", "
655 | \n", "160 | \n", "RM | \n", "21.0 | \n", "1680 | \n", "0 | \n", "Reg | \n", "Lvl | \n", "AllPub | \n", "Inside | \n", "Gtl | \n", "... | \n", "Detchd | \n", "Unf | \n", "TA | \n", "TA | \n", "Y | \n", "0 | \n", "0 | \n", "0 | \n", "WD | \n", "Family | \n", "
5 rows × 67 columns
\n", "