{ "cells": [ { "cell_type": "code", "execution_count": null, "id": "79abe757", "metadata": {}, "outputs": [], "source": [ "# Below code from https://inria.github.io/scikit-learn-mooc/python_scripts/datasets_ames_housing.html" ] }, { "cell_type": "code", "execution_count": 1, "id": "011cbba9", "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "\n", "# Read the CSV, parsing \"?\" entries as missing values (NaN).\n", "ames_housing = pd.read_csv(\"HousingData.csv\", na_values=\"?\")\n", "\n", "# Drop the Id, Longitude and Latitude columns in a single call.\n", "ames_housing = ames_housing.drop(columns=[\"Id\", \"Longitude\", \"Latitude\"])" ] }, { "cell_type": "code", "execution_count": 2, "id": "34c771e5", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | MS_SubClass | \n", "MS_Zoning | \n", "Lot_Frontage | \n", "Lot_Area | \n", "Street | \n", "Alley | \n", "Lot_Shape | \n", "Land_Contour | \n", "Utilities | \n", "Lot_Config | \n", "... | \n", "Pool_Area | \n", "Pool_QC | \n", "Fence | \n", "Misc_Feature | \n", "Misc_Val | \n", "Mo_Sold | \n", "Year_Sold | \n", "Sale_Type | \n", "Sale_Condition | \n", "Sale_Price | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "One_Story_1946_and_Newer_All_Styles | \n", "Residential_Low_Density | \n", "141 | \n", "31770 | \n", "Pave | \n", "No_Alley_Access | \n", "Slightly_Irregular | \n", "Lvl | \n", "AllPub | \n", "Corner | \n", "... | \n", "0 | \n", "No_Pool | \n", "No_Fence | \n", "NaN | \n", "0 | \n", "5 | \n", "2010 | \n", "WD | \n", "Normal | \n", "215000 | \n", "
| 1 | \n", "One_Story_1946_and_Newer_All_Styles | \n", "Residential_High_Density | \n", "80 | \n", "11622 | \n", "Pave | \n", "No_Alley_Access | \n", "Regular | \n", "Lvl | \n", "AllPub | \n", "Inside | \n", "... | \n", "0 | \n", "No_Pool | \n", "Minimum_Privacy | \n", "NaN | \n", "0 | \n", "6 | \n", "2010 | \n", "WD | \n", "Normal | \n", "105000 | \n", "
| 2 | \n", "One_Story_1946_and_Newer_All_Styles | \n", "Residential_Low_Density | \n", "81 | \n", "14267 | \n", "Pave | \n", "No_Alley_Access | \n", "Slightly_Irregular | \n", "Lvl | \n", "AllPub | \n", "Corner | \n", "... | \n", "0 | \n", "No_Pool | \n", "No_Fence | \n", "Gar2 | \n", "12500 | \n", "6 | \n", "2010 | \n", "WD | \n", "Normal | \n", "172000 | \n", "
| 3 | \n", "One_Story_1946_and_Newer_All_Styles | \n", "Residential_Low_Density | \n", "93 | \n", "11160 | \n", "Pave | \n", "No_Alley_Access | \n", "Regular | \n", "Lvl | \n", "AllPub | \n", "Corner | \n", "... | \n", "0 | \n", "No_Pool | \n", "No_Fence | \n", "NaN | \n", "0 | \n", "4 | \n", "2010 | \n", "WD | \n", "Normal | \n", "244000 | \n", "
| 4 | \n", "Two_Story_1946_and_Newer | \n", "Residential_Low_Density | \n", "74 | \n", "13830 | \n", "Pave | \n", "No_Alley_Access | \n", "Slightly_Irregular | \n", "Lvl | \n", "AllPub | \n", "Inside | \n", "... | \n", "0 | \n", "No_Pool | \n", "Minimum_Privacy | \n", "NaN | \n", "0 | \n", "3 | \n", "2010 | \n", "WD | \n", "Normal | \n", "189900 | \n", "
5 rows × 79 columns
\n", "