Skip to content

Instantly share code, notes, and snippets.

@fhiyo
Last active April 15, 2018 17:02
Show Gist options
  • Save fhiyo/d514d0f83efe22bdd262a8593d9b6efa to your computer and use it in GitHub Desktop.
Save fhiyo/d514d0f83efe22bdd262a8593d9b6efa to your computer and use it in GitHub Desktop.
(Kaggle's house prices competition) sample randomForest regression with Julia
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"# Sample RandomForest regression with Julia\n",
"Sample kernel with Julia (version: 0.6.2)."
]
},
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Julia's version: 0.6.2\n"
]
},
{
"data": {
"text/plain": [
"3-element Array{String,1}:\n",
" \"DataFrames: 0.10.1\" \n",
" \"DecisionTree: 0.6.5\"\n",
" \"ScikitLearn: 0.3.0\" "
]
},
"execution_count": 1,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# version info\n",
"println(\"Julia's version: \", VERSION)\n",
"function versions(packages, keys)\n",
" map(k -> @sprintf(\"%s: %s\", k, packages[k]), keys)\n",
"end\n",
"\n",
"versions(Pkg.installed(), [\"DataFrames\", \"DecisionTree\", \"ScikitLearn\"])"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [],
"source": [
"using DataFrames\n",
"using DecisionTree\n",
"using ScikitLearn \n",
"\n",
"using ScikitLearn: fit! \n",
"using ScikitLearn: predict\n",
"using ScikitLearn.CrossValidation: cross_val_score"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Id\n",
"Summary Stats:\n",
"Mean: 730.500000\n",
"Minimum: 1.000000\n",
"1st Quartile: 365.750000\n",
"Median: 730.500000\n",
"3rd Quartile: 1095.250000\n",
"Maximum: 1460.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"MSSubClass\n",
"Summary Stats:\n",
"Mean: 56.897260\n",
"Minimum: 20.000000\n",
"1st Quartile: 20.000000\n",
"Median: 50.000000\n",
"3rd Quartile: 70.000000\n",
"Maximum: 190.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"MSZoning\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 5\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"LotFrontage\n",
"Summary Stats:\n",
"Mean: 70.049958\n",
"Minimum: 21.000000\n",
"1st Quartile: 59.000000\n",
"Median: 69.000000\n",
"3rd Quartile: 80.000000\n",
"Maximum: 313.000000\n",
"Length: 1201\n",
"Type: Int64\n",
"Number Missing: 259\n",
"% Missing: 17.739726\n",
"\n",
"LotArea\n",
"Summary Stats:\n",
"Mean: 10516.828082\n",
"Minimum: 1300.000000\n",
"1st Quartile: 7553.500000\n",
"Median: 9478.500000\n",
"3rd Quartile: 11601.500000\n",
"Maximum: 215245.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Street\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 2\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Alley\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 3\n",
"Number Missing: 1369\n",
"% Missing: 93.767123\n",
"\n",
"LotShape\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 4\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"LandContour\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 4\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Utilities\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 2\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"LotConfig\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 5\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"LandSlope\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 3\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Neighborhood\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 25\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Condition1\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 9\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Condition2\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 8\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"BldgType\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 5\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"HouseStyle\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 8\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"OverallQual\n",
"Summary Stats:\n",
"Mean: 6.099315\n",
"Minimum: 1.000000\n",
"1st Quartile: 5.000000\n",
"Median: 6.000000\n",
"3rd Quartile: 7.000000\n",
"Maximum: 10.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"OverallCond\n",
"Summary Stats:\n",
"Mean: 5.575342\n",
"Minimum: 1.000000\n",
"1st Quartile: 5.000000\n",
"Median: 5.000000\n",
"3rd Quartile: 6.000000\n",
"Maximum: 9.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"YearBuilt\n",
"Summary Stats:\n",
"Mean: 1971.267808\n",
"Minimum: 1872.000000\n",
"1st Quartile: 1954.000000\n",
"Median: 1973.000000\n",
"3rd Quartile: 2000.000000\n",
"Maximum: 2010.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"YearRemodAdd\n",
"Summary Stats:\n",
"Mean: 1984.865753\n",
"Minimum: 1950.000000\n",
"1st Quartile: 1967.000000\n",
"Median: 1994.000000\n",
"3rd Quartile: 2004.000000\n",
"Maximum: 2010.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"RoofStyle\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 6\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"RoofMatl\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 8\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Exterior1st\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 15\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Exterior2nd\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 16\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"MasVnrType\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 5\n",
"Number Missing: 8\n",
"% Missing: 0.547945\n",
"\n",
"MasVnrArea\n",
"Summary Stats:\n",
"Mean: 103.685262\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 166.000000\n",
"Maximum: 1600.000000\n",
"Length: 1452\n",
"Type: Int64\n",
"Number Missing: 8\n",
"% Missing: 0.547945\n",
"\n",
"ExterQual\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 4\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"ExterCond\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 5\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Foundation\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 6\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"BsmtQual\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 5\n",
"Number Missing: 37\n",
"% Missing: 2.534247\n",
"\n",
"BsmtCond\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 5\n",
"Number Missing: 37\n",
"% Missing: 2.534247\n",
"\n",
"BsmtExposure\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 5\n",
"Number Missing: 38\n",
"% Missing: 2.602740\n",
"\n",
"BsmtFinType1\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 7\n",
"Number Missing: 37\n",
"% Missing: 2.534247\n",
"\n",
"BsmtFinSF1\n",
"Summary Stats:\n",
"Mean: 443.639726\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 383.500000\n",
"3rd Quartile: 712.250000\n",
"Maximum: 5644.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"BsmtFinType2\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 7\n",
"Number Missing: 38\n",
"% Missing: 2.602740\n",
"\n",
"BsmtFinSF2\n",
"Summary Stats:\n",
"Mean: 46.549315\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 0.000000\n",
"Maximum: 1474.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"BsmtUnfSF\n",
"Summary Stats:\n",
"Mean: 567.240411\n",
"Minimum: 0.000000\n",
"1st Quartile: 223.000000\n",
"Median: 477.500000\n",
"3rd Quartile: 808.000000\n",
"Maximum: 2336.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"TotalBsmtSF\n",
"Summary Stats:\n",
"Mean: 1057.429452\n",
"Minimum: 0.000000\n",
"1st Quartile: 795.750000\n",
"Median: 991.500000\n",
"3rd Quartile: 1298.250000\n",
"Maximum: 6110.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Heating\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 6\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"HeatingQC\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 5\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"CentralAir\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 2\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Electrical\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 6\n",
"Number Missing: 1\n",
"% Missing: 0.068493\n",
"\n",
"x1stFlrSF\n",
"Summary Stats:\n",
"Mean: 1162.626712\n",
"Minimum: 334.000000\n",
"1st Quartile: 882.000000\n",
"Median: 1087.000000\n",
"3rd Quartile: 1391.250000\n",
"Maximum: 4692.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"x2ndFlrSF\n",
"Summary Stats:\n",
"Mean: 346.992466\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 728.000000\n",
"Maximum: 2065.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"LowQualFinSF\n",
"Summary Stats:\n",
"Mean: 5.844521\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 0.000000\n",
"Maximum: 572.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"GrLivArea\n",
"Summary Stats:\n",
"Mean: 1515.463699\n",
"Minimum: 334.000000\n",
"1st Quartile: 1129.500000\n",
"Median: 1464.000000\n",
"3rd Quartile: 1776.750000\n",
"Maximum: 5642.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"BsmtFullBath\n",
"Summary Stats:\n",
"Mean: 0.425342\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 1.000000\n",
"Maximum: 3.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"BsmtHalfBath\n",
"Summary Stats:\n",
"Mean: 0.057534\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 0.000000\n",
"Maximum: 2.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"FullBath\n",
"Summary Stats:\n",
"Mean: 1.565068\n",
"Minimum: 0.000000\n",
"1st Quartile: 1.000000\n",
"Median: 2.000000\n",
"3rd Quartile: 2.000000\n",
"Maximum: 3.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"HalfBath\n",
"Summary Stats:\n",
"Mean: 0.382877\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 1.000000\n",
"Maximum: 2.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"BedroomAbvGr\n",
"Summary Stats:\n",
"Mean: 2.866438\n",
"Minimum: 0.000000\n",
"1st Quartile: 2.000000\n",
"Median: 3.000000\n",
"3rd Quartile: 3.000000\n",
"Maximum: 8.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"KitchenAbvGr\n",
"Summary Stats:\n",
"Mean: 1.046575\n",
"Minimum: 0.000000\n",
"1st Quartile: 1.000000\n",
"Median: 1.000000\n",
"3rd Quartile: 1.000000\n",
"Maximum: 3.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"KitchenQual\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 4\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"TotRmsAbvGrd\n",
"Summary Stats:\n",
"Mean: 6.517808\n",
"Minimum: 2.000000\n",
"1st Quartile: 5.000000\n",
"Median: 6.000000\n",
"3rd Quartile: 7.000000\n",
"Maximum: 14.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Functional\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 7\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"Fireplaces\n",
"Summary Stats:\n",
"Mean: 0.613014\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 1.000000\n",
"3rd Quartile: 1.000000\n",
"Maximum: 3.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"FireplaceQu\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 6\n",
"Number Missing: 690\n",
"% Missing: 47.260274\n",
"\n",
"GarageType\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 7\n",
"Number Missing: 81\n",
"% Missing: 5.547945\n",
"\n",
"GarageYrBlt\n",
"Summary Stats:\n",
"Mean: 1978.506164\n",
"Minimum: 1900.000000\n",
"1st Quartile: 1961.000000\n",
"Median: 1980.000000\n",
"3rd Quartile: 2002.000000\n",
"Maximum: 2010.000000\n",
"Length: 1379\n",
"Type: Int64\n",
"Number Missing: 81\n",
"% Missing: 5.547945\n",
"\n",
"GarageFinish\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 4\n",
"Number Missing: 81\n",
"% Missing: 5.547945\n",
"\n",
"GarageCars\n",
"Summary Stats:\n",
"Mean: 1.767123\n",
"Minimum: 0.000000\n",
"1st Quartile: 1.000000\n",
"Median: 2.000000\n",
"3rd Quartile: 2.000000\n",
"Maximum: 4.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"GarageArea\n",
"Summary Stats:\n",
"Mean: 472.980137\n",
"Minimum: 0.000000\n",
"1st Quartile: 334.500000\n",
"Median: 480.000000\n",
"3rd Quartile: 576.000000\n",
"Maximum: 1418.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"GarageQual\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 6\n",
"Number Missing: 81\n",
"% Missing: 5.547945\n",
"\n",
"GarageCond\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 6\n",
"Number Missing: 81\n",
"% Missing: 5.547945\n",
"\n",
"PavedDrive\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 3\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"WoodDeckSF\n",
"Summary Stats:\n",
"Mean: 94.244521\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 168.000000\n",
"Maximum: 857.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"OpenPorchSF\n",
"Summary Stats:\n",
"Mean: 46.660274\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 25.000000\n",
"3rd Quartile: 68.000000\n",
"Maximum: 547.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"EnclosedPorch\n",
"Summary Stats:\n",
"Mean: 21.954110\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 0.000000\n",
"Maximum: 552.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"x3SsnPorch\n",
"Summary Stats:\n",
"Mean: 3.409589\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 0.000000\n",
"Maximum: 508.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"ScreenPorch\n",
"Summary Stats:\n",
"Mean: 15.060959\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 0.000000\n",
"Maximum: 480.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"PoolArea\n",
"Summary Stats:\n",
"Mean: 2.758904\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 0.000000\n",
"Maximum: 738.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"PoolQC\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 4\n",
"Number Missing: 1453\n",
"% Missing: 99.520548\n",
"\n",
"Fence\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 5\n",
"Number Missing: 1179\n",
"% Missing: 80.753425\n",
"\n",
"MiscFeature\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 5\n",
"Number Missing: 1406\n",
"% Missing: 96.301370\n",
"\n",
"MiscVal\n",
"Summary Stats:\n",
"Mean: 43.489041\n",
"Minimum: 0.000000\n",
"1st Quartile: 0.000000\n",
"Median: 0.000000\n",
"3rd Quartile: 0.000000\n",
"Maximum: 15500.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"MoSold\n",
"Summary Stats:\n",
"Mean: 6.321918\n",
"Minimum: 1.000000\n",
"1st Quartile: 5.000000\n",
"Median: 6.000000\n",
"3rd Quartile: 8.000000\n",
"Maximum: 12.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"YrSold\n",
"Summary Stats:\n",
"Mean: 2007.815753\n",
"Minimum: 2006.000000\n",
"1st Quartile: 2007.000000\n",
"Median: 2008.000000\n",
"3rd Quartile: 2009.000000\n",
"Maximum: 2010.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"SaleType\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 9\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"SaleCondition\n",
"Summary Stats:\n",
"Length: 1460\n",
"Type: String\n",
"Number Unique: 6\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n",
"SalePrice\n",
"Summary Stats:\n",
"Mean: 180921.195890\n",
"Minimum: 34900.000000\n",
"1st Quartile: 129975.000000\n",
"Median: 163000.000000\n",
"3rd Quartile: 214000.000000\n",
"Maximum: 755000.000000\n",
"Length: 1460\n",
"Type: Int64\n",
"Number Missing: 0\n",
"% Missing: 0.000000\n",
"\n"
]
},
{
"data": {
"text/plain": [
"1459-element DataArrays.DataArray{Int64,1}:\n",
" 1461\n",
" 1462\n",
" 1463\n",
" 1464\n",
" 1465\n",
" 1466\n",
" 1467\n",
" 1468\n",
" 1469\n",
" 1470\n",
" 1471\n",
" 1472\n",
" 1473\n",
" ⋮\n",
" 2908\n",
" 2909\n",
" 2910\n",
" 2911\n",
" 2912\n",
" 2913\n",
" 2914\n",
" 2915\n",
" 2916\n",
" 2917\n",
" 2918\n",
" 2919"
]
},
"execution_count": 3,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Load data\n",
"train = readtable(\"../data/raw/train.csv\")\n",
"describe(train)\n",
"\n",
"test = readtable(\"../data/raw/test.csv\")\n",
"test_id = test[:Id] # preserve test id"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<table class=\"data-frame\"><thead><tr><th></th><th>Id</th><th>MSSubClass</th><th>MSZoning</th><th>LotFrontage</th><th>LotArea</th><th>Street</th><th>Alley</th><th>LotShape</th><th>LandContour</th><th>Utilities</th><th>LotConfig</th><th>LandSlope</th><th>Neighborhood</th><th>Condition1</th><th>Condition2</th><th>BldgType</th><th>HouseStyle</th><th>OverallQual</th><th>OverallCond</th><th>YearBuilt</th><th>YearRemodAdd</th><th>RoofStyle</th><th>RoofMatl</th><th>Exterior1st</th><th>Exterior2nd</th><th>MasVnrType</th><th>MasVnrArea</th><th>ExterQual</th><th>ExterCond</th><th>Foundation</th><th>BsmtQual</th><th>BsmtCond</th><th>BsmtExposure</th><th>BsmtFinType1</th><th>BsmtFinSF1</th><th>BsmtFinType2</th><th>BsmtFinSF2</th><th>BsmtUnfSF</th><th>TotalBsmtSF</th><th>Heating</th><th>HeatingQC</th><th>CentralAir</th><th>Electrical</th><th>x1stFlrSF</th><th>x2ndFlrSF</th><th>LowQualFinSF</th><th>GrLivArea</th><th>BsmtFullBath</th><th>BsmtHalfBath</th><th>FullBath</th><th>HalfBath</th><th>BedroomAbvGr</th><th>KitchenAbvGr</th><th>KitchenQual</th><th>TotRmsAbvGrd</th><th>Functional</th><th>Fireplaces</th><th>FireplaceQu</th><th>GarageType</th><th>GarageYrBlt</th><th>GarageFinish</th><th>GarageCars</th><th>GarageArea</th><th>GarageQual</th><th>GarageCond</th><th>PavedDrive</th><th>WoodDeckSF</th><th>OpenPorchSF</th><th>EnclosedPorch</th><th>x3SsnPorch</th><th>ScreenPorch</th><th>PoolArea</th><th>PoolQC</th><th>Fence</th><th>MiscFeature</th><th>MiscVal</th><th>MoSold</th><th>YrSold</th><th>SaleType</th><th>SaleCondition</th></tr></thead><tbody><tr><th>1</th><td>1461</td><td>20</td><td>RH</td><td>80</td><td>11622</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>NAmes</td><td>Feedr</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>5</td><td>6</td><td>1961</td><td>1961</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>None</td><td>0</td><td>TA</td><td>TA</td><td>CBlock</td><td>TA</td><td>TA</td><td>No</td><td>Rec</
td><td>468</td><td>LwQ</td><td>144</td><td>270</td><td>882</td><td>GasA</td><td>TA</td><td>Y</td><td>SBrkr</td><td>896</td><td>0</td><td>0</td><td>896</td><td>0</td><td>0</td><td>1</td><td>0</td><td>2</td><td>1</td><td>TA</td><td>5</td><td>Typ</td><td>0</td><td>NA</td><td>Attchd</td><td>1961</td><td>Unf</td><td>1</td><td>730</td><td>TA</td><td>TA</td><td>Y</td><td>140</td><td>0</td><td>0</td><td>0</td><td>120</td><td>0</td><td>NA</td><td>MnPrv</td><td>NA</td><td>0</td><td>6</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>2</th><td>1462</td><td>20</td><td>RL</td><td>81</td><td>14267</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Corner</td><td>Gtl</td><td>NAmes</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>6</td><td>6</td><td>1958</td><td>1958</td><td>Hip</td><td>CompShg</td><td>Wd Sdng</td><td>Wd Sdng</td><td>BrkFace</td><td>108</td><td>TA</td><td>TA</td><td>CBlock</td><td>TA</td><td>TA</td><td>No</td><td>ALQ</td><td>923</td><td>Unf</td><td>0</td><td>406</td><td>1329</td><td>GasA</td><td>TA</td><td>Y</td><td>SBrkr</td><td>1329</td><td>0</td><td>0</td><td>1329</td><td>0</td><td>0</td><td>1</td><td>1</td><td>3</td><td>1</td><td>Gd</td><td>6</td><td>Typ</td><td>0</td><td>NA</td><td>Attchd</td><td>1958</td><td>Unf</td><td>1</td><td>312</td><td>TA</td><td>TA</td><td>Y</td><td>393</td><td>36</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>Gar2</td><td>12500</td><td>6</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>3</th><td>1463</td><td>60</td><td>RL</td><td>74</td><td>13830</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>Gilbert</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>2Story</td><td>5</td><td>5</td><td>1997</td><td>1998</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>None</td><td>0</td><td>TA</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>No</td><td>GLQ</td><td>791</td><td>Unf</td><td>0</td><td>137</td><td>92
8</td><td>GasA</td><td>Gd</td><td>Y</td><td>SBrkr</td><td>928</td><td>701</td><td>0</td><td>1629</td><td>0</td><td>0</td><td>2</td><td>1</td><td>3</td><td>1</td><td>TA</td><td>6</td><td>Typ</td><td>1</td><td>TA</td><td>Attchd</td><td>1997</td><td>Fin</td><td>2</td><td>482</td><td>TA</td><td>TA</td><td>Y</td><td>212</td><td>34</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>MnPrv</td><td>NA</td><td>0</td><td>3</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>4</th><td>1464</td><td>60</td><td>RL</td><td>78</td><td>9978</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>Gilbert</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>2Story</td><td>6</td><td>6</td><td>1998</td><td>1998</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>BrkFace</td><td>20</td><td>TA</td><td>TA</td><td>PConc</td><td>TA</td><td>TA</td><td>No</td><td>GLQ</td><td>602</td><td>Unf</td><td>0</td><td>324</td><td>926</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>926</td><td>678</td><td>0</td><td>1604</td><td>0</td><td>0</td><td>2</td><td>1</td><td>3</td><td>1</td><td>Gd</td><td>7</td><td>Typ</td><td>1</td><td>Gd</td><td>Attchd</td><td>1998</td><td>Fin</td><td>2</td><td>470</td><td>TA</td><td>TA</td><td>Y</td><td>360</td><td>36</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>6</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>5</th><td>1465</td><td>120</td><td>RL</td><td>43</td><td>5005</td><td>Pave</td><td>NA</td><td>IR1</td><td>HLS</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>StoneBr</td><td>Norm</td><td>Norm</td><td>TwnhsE</td><td>1Story</td><td>8</td><td>5</td><td>1992</td><td>1992</td><td>Gable</td><td>CompShg</td><td>HdBoard</td><td>HdBoard</td><td>None</td><td>0</td><td>Gd</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>No</td><td>ALQ</td><td>263</td><td>Unf</td><td>0</td><td>1017</td><td>1280</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><t
d>1280</td><td>0</td><td>0</td><td>1280</td><td>0</td><td>0</td><td>2</td><td>0</td><td>2</td><td>1</td><td>Gd</td><td>5</td><td>Typ</td><td>0</td><td>NA</td><td>Attchd</td><td>1992</td><td>RFn</td><td>2</td><td>506</td><td>TA</td><td>TA</td><td>Y</td><td>0</td><td>82</td><td>0</td><td>0</td><td>144</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>1</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>6</th><td>1466</td><td>60</td><td>RL</td><td>75</td><td>10000</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Corner</td><td>Gtl</td><td>Gilbert</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>2Story</td><td>6</td><td>5</td><td>1993</td><td>1994</td><td>Gable</td><td>CompShg</td><td>HdBoard</td><td>HdBoard</td><td>None</td><td>0</td><td>TA</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>No</td><td>Unf</td><td>0</td><td>Unf</td><td>0</td><td>763</td><td>763</td><td>GasA</td><td>Gd</td><td>Y</td><td>SBrkr</td><td>763</td><td>892</td><td>0</td><td>1655</td><td>0</td><td>0</td><td>2</td><td>1</td><td>3</td><td>1</td><td>TA</td><td>7</td><td>Typ</td><td>1</td><td>TA</td><td>Attchd</td><td>1993</td><td>Fin</td><td>2</td><td>440</td><td>TA</td><td>TA</td><td>Y</td><td>157</td><td>84</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>4</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>7</th><td>1467</td><td>20</td><td>RL</td><td>NA</td><td>7980</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>Gilbert</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>6</td><td>7</td><td>1992</td><td>2007</td><td>Gable</td><td>CompShg</td><td>HdBoard</td><td>HdBoard</td><td>None</td><td>0</td><td>TA</td><td>Gd</td><td>PConc</td><td>Gd</td><td>TA</td><td>No</td><td>ALQ</td><td>935</td><td>Unf</td><td>0</td><td>233</td><td>1168</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1187</td><td>0</td><td>0</td><td>1187</td><td>1</td><td>0</td><td>2
</td><td>0</td><td>3</td><td>1</td><td>TA</td><td>6</td><td>Typ</td><td>0</td><td>NA</td><td>Attchd</td><td>1992</td><td>Fin</td><td>2</td><td>420</td><td>TA</td><td>TA</td><td>Y</td><td>483</td><td>21</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>GdPrv</td><td>Shed</td><td>500</td><td>3</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>8</th><td>1468</td><td>60</td><td>RL</td><td>63</td><td>8402</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>Gilbert</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>2Story</td><td>6</td><td>5</td><td>1998</td><td>1998</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>None</td><td>0</td><td>TA</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>No</td><td>Unf</td><td>0</td><td>Unf</td><td>0</td><td>789</td><td>789</td><td>GasA</td><td>Gd</td><td>Y</td><td>SBrkr</td><td>789</td><td>676</td><td>0</td><td>1465</td><td>0</td><td>0</td><td>2</td><td>1</td><td>3</td><td>1</td><td>TA</td><td>7</td><td>Typ</td><td>1</td><td>Gd</td><td>Attchd</td><td>1998</td><td>Fin</td><td>2</td><td>393</td><td>TA</td><td>TA</td><td>Y</td><td>0</td><td>75</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>5</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>9</th><td>1469</td><td>20</td><td>RL</td><td>85</td><td>10176</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>Gilbert</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>7</td><td>5</td><td>1990</td><td>1990</td><td>Gable</td><td>CompShg</td><td>HdBoard</td><td>HdBoard</td><td>None</td><td>0</td><td>TA</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>Gd</td><td>GLQ</td><td>637</td><td>Unf</td><td>0</td><td>663</td><td>1300</td><td>GasA</td><td>Gd</td><td>Y</td><td>SBrkr</td><td>1341</td><td>0</td><td>0</td><td>1341</td><td>1</td><td>0</td><td>1</td><td>1</td><td>2</td><td>1</td><td>Gd</td><td>5</td><td>Typ<
/td><td>1</td><td>Po</td><td>Attchd</td><td>1990</td><td>Unf</td><td>2</td><td>506</td><td>TA</td><td>TA</td><td>Y</td><td>192</td><td>0</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>2</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>10</th><td>1470</td><td>20</td><td>RL</td><td>70</td><td>8400</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>Corner</td><td>Gtl</td><td>NAmes</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>4</td><td>5</td><td>1970</td><td>1970</td><td>Gable</td><td>CompShg</td><td>Plywood</td><td>Plywood</td><td>None</td><td>0</td><td>TA</td><td>TA</td><td>CBlock</td><td>TA</td><td>TA</td><td>No</td><td>ALQ</td><td>804</td><td>Rec</td><td>78</td><td>0</td><td>882</td><td>GasA</td><td>TA</td><td>Y</td><td>SBrkr</td><td>882</td><td>0</td><td>0</td><td>882</td><td>1</td><td>0</td><td>1</td><td>0</td><td>2</td><td>1</td><td>TA</td><td>4</td><td>Typ</td><td>0</td><td>NA</td><td>Attchd</td><td>1970</td><td>Fin</td><td>2</td><td>525</td><td>TA</td><td>TA</td><td>Y</td><td>240</td><td>0</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>MnPrv</td><td>NA</td><td>0</td><td>4</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>11</th><td>1471</td><td>120</td><td>RH</td><td>26</td><td>5858</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>FR2</td><td>Gtl</td><td>NAmes</td><td>Norm</td><td>Norm</td><td>TwnhsE</td><td>1Story</td><td>7</td><td>5</td><td>1999</td><td>1999</td><td>Gable</td><td>CompShg</td><td>MetalSd</td><td>MetalSd</td><td>None</td><td>0</td><td>Gd</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>No</td><td>GLQ</td><td>1051</td><td>BLQ</td><td>0</td><td>354</td><td>1405</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1337</td><td>0</td><td>0</td><td>1337</td><td>1</td><td>0</td><td>2</td><td>0</td><td>2</td><td>1</td><td>Gd</td><td>5</td><td>Typ</td><td>1</td><td>Fa</td><td>Attchd</td><td>1999</td><td>Fin</td><td>2<
/td><td>511</td><td>TA</td><td>TA</td><td>Y</td><td>203</td><td>68</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>6</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>12</th><td>1472</td><td>160</td><td>RM</td><td>21</td><td>1680</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>BrDale</td><td>Norm</td><td>Norm</td><td>Twnhs</td><td>2Story</td><td>6</td><td>5</td><td>1971</td><td>1971</td><td>Gable</td><td>CompShg</td><td>HdBoard</td><td>HdBoard</td><td>BrkFace</td><td>504</td><td>TA</td><td>TA</td><td>CBlock</td><td>TA</td><td>TA</td><td>No</td><td>Rec</td><td>156</td><td>Unf</td><td>0</td><td>327</td><td>483</td><td>GasA</td><td>TA</td><td>Y</td><td>SBrkr</td><td>483</td><td>504</td><td>0</td><td>987</td><td>0</td><td>0</td><td>1</td><td>1</td><td>2</td><td>1</td><td>TA</td><td>5</td><td>Typ</td><td>0</td><td>NA</td><td>Detchd</td><td>1971</td><td>Unf</td><td>1</td><td>264</td><td>TA</td><td>TA</td><td>Y</td><td>275</td><td>0</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>2</td><td>2010</td><td>COD</td><td>Normal</td></tr><tr><th>13</th><td>1473</td><td>160</td><td>RM</td><td>21</td><td>1680</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>BrDale</td><td>Norm</td><td>Norm</td><td>Twnhs</td><td>2Story</td><td>5</td><td>5</td><td>1971</td><td>1971</td><td>Gable</td><td>CompShg</td><td>HdBoard</td><td>HdBoard</td><td>BrkFace</td><td>492</td><td>TA</td><td>TA</td><td>CBlock</td><td>TA</td><td>TA</td><td>No</td><td>Rec</td><td>300</td><td>Unf</td><td>0</td><td>225</td><td>525</td><td>GasA</td><td>TA</td><td>Y</td><td>SBrkr</td><td>525</td><td>567</td><td>0</td><td>1092</td><td>0</td><td>0</td><td>1</td><td>1</td><td>3</td><td>1</td><td>TA</td><td>6</td><td>Typ</td><td>0</td><td>NA</td><td>Detchd</td><td>1997</td><td>Unf</td><td>1</td><td>320</td><td>TA</td><td>TA</td><td>Y</td><td>0
</td><td>0</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>3</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>14</th><td>1474</td><td>160</td><td>RL</td><td>24</td><td>2280</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>FR2</td><td>Gtl</td><td>NPkVill</td><td>Norm</td><td>Norm</td><td>Twnhs</td><td>2Story</td><td>6</td><td>6</td><td>1975</td><td>1975</td><td>Gable</td><td>CompShg</td><td>Plywood</td><td>Brk Cmn</td><td>None</td><td>0</td><td>TA</td><td>TA</td><td>CBlock</td><td>TA</td><td>TA</td><td>No</td><td>ALQ</td><td>514</td><td>Unf</td><td>0</td><td>341</td><td>855</td><td>GasA</td><td>TA</td><td>Y</td><td>SBrkr</td><td>855</td><td>601</td><td>0</td><td>1456</td><td>0</td><td>0</td><td>2</td><td>1</td><td>3</td><td>1</td><td>Gd</td><td>6</td><td>Typ</td><td>1</td><td>TA</td><td>Attchd</td><td>1975</td><td>Unf</td><td>2</td><td>440</td><td>TA</td><td>TA</td><td>Y</td><td>173</td><td>0</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>6</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>15</th><td>1475</td><td>120</td><td>RL</td><td>24</td><td>2280</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>FR2</td><td>Gtl</td><td>NPkVill</td><td>Norm</td><td>Norm</td><td>Twnhs</td><td>1Story</td><td>7</td><td>6</td><td>1975</td><td>1975</td><td>Gable</td><td>CompShg</td><td>Plywood</td><td>Brk 
Cmn</td><td>None</td><td>0</td><td>TA</td><td>TA</td><td>CBlock</td><td>Gd</td><td>TA</td><td>No</td><td>Unf</td><td>0</td><td>Unf</td><td>0</td><td>836</td><td>836</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>836</td><td>0</td><td>0</td><td>836</td><td>0</td><td>0</td><td>1</td><td>0</td><td>2</td><td>1</td><td>TA</td><td>4</td><td>Typ</td><td>0</td><td>NA</td><td>Attchd</td><td>1975</td><td>Unf</td><td>1</td><td>308</td><td>TA</td><td>TA</td><td>Y</td><td>0</td><td>30</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>6</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>16</th><td>1476</td><td>60</td><td>RL</td><td>102</td><td>12858</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>NridgHt</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>2Story</td><td>9</td><td>5</td><td>2009</td><td>2010</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>Stone</td><td>162</td><td>Ex</td><td>TA</td><td>PConc</td><td>Ex</td><td>TA</td><td>No</td><td>Unf</td><td>0</td><td>Unf</td><td>0</td><td>1590</td><td>1590</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1627</td><td>707</td><td>0</td><td>2334</td><td>0</td><td>0</td><td>2</td><td>1</td><td>3</td><td>1</td><td>Ex</td><td>10</td><td>Typ</td><td>1</td><td>Gd</td><td>Attchd</td><td>2009</td><td>Fin</td><td>3</td><td>751</td><td>TA</td><td>TA</td><td>Y</td><td>144</td><td>133</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>1</td><td>2010</td><td>New</td><td>Partial</td></tr><tr><th>17</th><td>1477</td><td>20</td><td>RL</td><td>94</td><td>12883</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Corner</td><td>Gtl</td><td>NridgHt</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>8</td><td>5</td><td>2009</td><td>2010</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>Stone</td><td>256</td><td>Gd</td><td>TA</td><td>P
Conc</td><td>Gd</td><td>TA</td><td>No</td><td>Unf</td><td>0</td><td>Unf</td><td>0</td><td>1544</td><td>1544</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1544</td><td>0</td><td>0</td><td>1544</td><td>0</td><td>0</td><td>2</td><td>0</td><td>3</td><td>1</td><td>Gd</td><td>7</td><td>Typ</td><td>0</td><td>NA</td><td>Attchd</td><td>2009</td><td>RFn</td><td>3</td><td>868</td><td>TA</td><td>TA</td><td>Y</td><td>0</td><td>35</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>6</td><td>2010</td><td>New</td><td>Partial</td></tr><tr><th>18</th><td>1478</td><td>20</td><td>RL</td><td>90</td><td>11520</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>NridgHt</td><td>PosN</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>9</td><td>5</td><td>2005</td><td>2005</td><td>Hip</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>BrkFace</td><td>615</td><td>Gd</td><td>TA</td><td>PConc</td><td>Ex</td><td>TA</td><td>No</td><td>GLQ</td><td>110</td><td>Unf</td><td>0</td><td>1588</td><td>1698</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1698</td><td>0</td><td>0</td><td>1698</td><td>0</td><td>0</td><td>2</td><td>0</td><td>3</td><td>1</td><td>Ex</td><td>7</td><td>Typ</td><td>1</td><td>Gd</td><td>Attchd</td><td>2005</td><td>Fin</td><td>3</td><td>730</td><td>TA</td><td>TA</td><td>Y</td><td>192</td><td>74</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>6</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>19</th><td>1479</td><td>20</td><td>RL</td><td>79</td><td>14122</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>NridgHt</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>8</td><td>5</td><td>2005</td><td>2006</td><td>Hip</td><td>CompShg</td><td>CemntBd</td><td>CmentBd</td><td>BrkFace</td><td>240</td><td>Gd</td><td>TA</td><td>PConc</td><td>Ex</td><td>TA</td><td>No</td><td>GLQ</td><td>
28</td><td>Unf</td><td>0</td><td>1794</td><td>1822</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1822</td><td>0</td><td>0</td><td>1822</td><td>0</td><td>0</td><td>2</td><td>0</td><td>3</td><td>1</td><td>Ex</td><td>8</td><td>Typ</td><td>1</td><td>Gd</td><td>Attchd</td><td>2005</td><td>RFn</td><td>3</td><td>678</td><td>TA</td><td>TA</td><td>Y</td><td>0</td><td>119</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>2</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>20</th><td>1480</td><td>20</td><td>RL</td><td>110</td><td>14300</td><td>Pave</td><td>NA</td><td>Reg</td><td>HLS</td><td>AllPub</td><td>Inside</td><td>Mod</td><td>NridgHt</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>9</td><td>5</td><td>2003</td><td>2004</td><td>Hip</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>BrkFace</td><td>1095</td><td>Ex</td><td>TA</td><td>PConc</td><td>Ex</td><td>TA</td><td>Gd</td><td>GLQ</td><td>1373</td><td>Unf</td><td>0</td><td>1473</td><td>2846</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>2696</td><td>0</td><td>0</td><td>2696</td><td>1</td><td>0</td><td>2</td><td>1</td><td>3</td><td>1</td><td>Ex</td><td>10</td><td>Typ</td><td>2</td><td>Gd</td><td>Attchd</td><td>2003</td><td>Fin</td><td>3</td><td>958</td><td>TA</td><td>TA</td><td>Y</td><td>220</td><td>150</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>6</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>21</th><td>1481</td><td>60</td><td>RL</td><td>105</td><td>13650</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>Corner</td><td>Gtl</td><td>NridgHt</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>2Story</td><td>8</td><td>5</td><td>2002</td><td>2002</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>BrkFace</td><td>232</td><td>Gd</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>Gd</td><td>GLQ</td><td>578</td><td>Unf</td><td>0</td><td>1093</td><td>167
1</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1687</td><td>563</td><td>0</td><td>2250</td><td>1</td><td>0</td><td>2</td><td>1</td><td>3</td><td>1</td><td>Gd</td><td>7</td><td>Typ</td><td>1</td><td>Ex</td><td>Attchd</td><td>2002</td><td>Fin</td><td>3</td><td>756</td><td>TA</td><td>TA</td><td>Y</td><td>238</td><td>130</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>6</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>22</th><td>1482</td><td>120</td><td>RL</td><td>41</td><td>7132</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>NridgHt</td><td>Norm</td><td>Norm</td><td>TwnhsE</td><td>1Story</td><td>8</td><td>5</td><td>2006</td><td>2006</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>Stone</td><td>178</td><td>Gd</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>Mn</td><td>GLQ</td><td>24</td><td>Unf</td><td>0</td><td>1346</td><td>1370</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1370</td><td>0</td><td>0</td><td>1370</td><td>0</td><td>0</td><td>2</td><td>0</td><td>2</td><td>1</td><td>Gd</td><td>6</td><td>Typ</td><td>1</td><td>Gd</td><td>Attchd</td><td>2006</td><td>RFn</td><td>2</td><td>484</td><td>TA</td><td>TA</td><td>Y</td><td>120</td><td>49</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>4</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>23</th><td>1483</td><td>20</td><td>RL</td><td>100</td><td>18494</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Corner</td><td>Gtl</td><td>Gilbert</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>6</td><td>5</td><td>2005</td><td>2005</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>None</td><td>0</td><td>Gd</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>No</td><td>Unf</td><td>0</td><td>Unf</td><td>0</td><td>1324</td><td>1324</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><t
d>1324</td><td>0</td><td>0</td><td>1324</td><td>0</td><td>0</td><td>2</td><td>0</td><td>3</td><td>1</td><td>Gd</td><td>6</td><td>Typ</td><td>0</td><td>NA</td><td>Attchd</td><td>2005</td><td>Fin</td><td>2</td><td>430</td><td>TA</td><td>TA</td><td>Y</td><td>36</td><td>23</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>1</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>24</th><td>1484</td><td>120</td><td>RL</td><td>43</td><td>3203</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>Blmngtn</td><td>Norm</td><td>Norm</td><td>TwnhsE</td><td>1Story</td><td>7</td><td>5</td><td>2006</td><td>2006</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>BrkFace</td><td>14</td><td>Gd</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>Av</td><td>GLQ</td><td>16</td><td>Unf</td><td>0</td><td>1129</td><td>1145</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1145</td><td>0</td><td>0</td><td>1145</td><td>0</td><td>0</td><td>2</td><td>0</td><td>2</td><td>1</td><td>Gd</td><td>6</td><td>Typ</td><td>0</td><td>NA</td><td>Attchd</td><td>2006</td><td>Fin</td><td>2</td><td>437</td><td>TA</td><td>TA</td><td>Y</td><td>100</td><td>116</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>1</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>25</th><td>1485</td><td>80</td><td>RL</td><td>67</td><td>13300</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>Gilbert</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>SLvl</td><td>7</td><td>5</td><td>2004</td><td>2004</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>None</td><td>0</td><td>Gd</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>No</td><td>GLQ</td><td>326</td><td>Unf</td><td>0</td><td>58</td><td>384</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>744</td><td>630</td><td>0</td><td>1374</td><td>1</td><td>0</
td><td>2</td><td>1</td><td>3</td><td>1</td><td>Gd</td><td>7</td><td>Typ</td><td>1</td><td>Gd</td><td>BuiltIn</td><td>2004</td><td>Fin</td><td>2</td><td>400</td><td>TA</td><td>TA</td><td>Y</td><td>100</td><td>0</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>6</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>26</th><td>1486</td><td>60</td><td>RL</td><td>63</td><td>8577</td><td>Pave</td><td>NA</td><td>IR1</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>Gilbert</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>2Story</td><td>7</td><td>5</td><td>2004</td><td>2004</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>None</td><td>0</td><td>Gd</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>No</td><td>Unf</td><td>0</td><td>Unf</td><td>0</td><td>847</td><td>847</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>847</td><td>886</td><td>0</td><td>1733</td><td>0</td><td>0</td><td>2</td><td>1</td><td>3</td><td>1</td><td>Gd</td><td>7</td><td>Typ</td><td>1</td><td>Gd</td><td>BuiltIn</td><td>2004</td><td>Fin</td><td>2</td><td>433</td><td>TA</td><td>TA</td><td>Y</td><td>144</td><td>48</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>4</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>27</th><td>1487</td><td>60</td><td>RL</td><td>60</td><td>17433</td><td>Pave</td><td>NA</td><td>IR2</td><td>Lvl</td><td>AllPub</td><td>CulDSac</td><td>Gtl</td><td>NoRidge</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>2Story</td><td>8</td><td>5</td><td>1998</td><td>1998</td><td>Hip</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>BrkFace</td><td>114</td><td>Gd</td><td>TA</td><td>PConc</td><td>Ex</td><td>TA</td><td>No</td><td>Unf</td><td>0</td><td>Unf</td><td>0</td><td>1629</td><td>1629</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1645</td><td>830</td><td>0</td><td>2475</td><td>0</td><td>0</td><td>2</td><td>1</td><td>4</td><td>1</td><td>Gd</td><td>7</
td><td>Typ</td><td>1</td><td>TA</td><td>Attchd</td><td>1998</td><td>Fin</td><td>3</td><td>962</td><td>TA</td><td>TA</td><td>Y</td><td>23</td><td>172</td><td>0</td><td>0</td><td>256</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>1</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>28</th><td>1488</td><td>20</td><td>RL</td><td>73</td><td>8987</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>Somerst</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>8</td><td>5</td><td>2005</td><td>2006</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>BrkFace</td><td>226</td><td>Gd</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>NA</td><td>Unf</td><td>0</td><td>Unf</td><td>0</td><td>1595</td><td>1595</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1595</td><td>0</td><td>0</td><td>1595</td><td>0</td><td>0</td><td>2</td><td>0</td><td>2</td><td>1</td><td>Gd</td><td>6</td><td>Typ</td><td>1</td><td>Gd</td><td>Attchd</td><td>2005</td><td>RFn</td><td>3</td><td>880</td><td>TA</td><td>TA</td><td>Y</td><td>144</td><td>0</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>5</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>29</th><td>1489</td><td>20</td><td>FV</td><td>92</td><td>9215</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>Inside</td><td>Gtl</td><td>Somerst</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>7</td><td>5</td><td>2009</td><td>2010</td><td>Hip</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>None</td><td>0</td><td>Gd</td><td>TA</td><td>PConc</td><td>Gd</td><td>TA</td><td>No</td><td>Unf</td><td>0</td><td>Unf</td><td>0</td><td>1218</td><td>1218</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1218</td><td>0</td><td>0</td><td>1218</td><td>0</td><td>0</td><td>2</td><td>0</td><td>2</td><td>1</td><td>Gd</td><td>4</td><td>Typ</td><td>0</td><td>NA</td><td>Attchd</td><td>2009</td>
<td>RFn</td><td>2</td><td>676</td><td>TA</td><td>TA</td><td>Y</td><td>0</td><td>136</td><td>0</td><td>0</td><td>0</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>4</td><td>2010</td><td>New</td><td>Partial</td></tr><tr><th>30</th><td>1490</td><td>20</td><td>FV</td><td>84</td><td>10440</td><td>Pave</td><td>NA</td><td>Reg</td><td>Lvl</td><td>AllPub</td><td>Corner</td><td>Gtl</td><td>Somerst</td><td>Norm</td><td>Norm</td><td>1Fam</td><td>1Story</td><td>6</td><td>5</td><td>2005</td><td>2005</td><td>Gable</td><td>CompShg</td><td>VinylSd</td><td>VinylSd</td><td>None</td><td>0</td><td>Gd</td><td>TA</td><td>PConc</td><td>Ex</td><td>TA</td><td>No</td><td>GLQ</td><td>1414</td><td>Unf</td><td>0</td><td>54</td><td>1468</td><td>GasA</td><td>Ex</td><td>Y</td><td>SBrkr</td><td>1468</td><td>0</td><td>0</td><td>1468</td><td>1</td><td>0</td><td>2</td><td>0</td><td>2</td><td>1</td><td>Gd</td><td>6</td><td>Typ</td><td>1</td><td>Gd</td><td>Attchd</td><td>2005</td><td>Fin</td><td>2</td><td>528</td><td>TA</td><td>TA</td><td>Y</td><td>0</td><td>102</td><td>0</td><td>0</td><td>216</td><td>0</td><td>NA</td><td>NA</td><td>NA</td><td>0</td><td>5</td><td>2010</td><td>WD</td><td>Normal</td></tr><tr><th>&vellip;</th><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><
td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td><td>&vellip;</td></tr></tbody></table>"
],
"text/plain": [
"1459×80 DataFrames.DataFrame\n",
"│ Row │ Id │ MSSubClass │ MSZoning │ LotFrontage │ LotArea │ Street │ Alley │\n",
"├──────┼──────┼────────────┼──────────┼─────────────┼─────────┼────────┼───────┤\n",
"│ 1 │ 1461 │ 20 │ \"RH\" │ 80 │ 11622 │ \"Pave\" │ NA │\n",
"│ 2 │ 1462 │ 20 │ \"RL\" │ 81 │ 14267 │ \"Pave\" │ NA │\n",
"│ 3 │ 1463 │ 60 │ \"RL\" │ 74 │ 13830 │ \"Pave\" │ NA │\n",
"│ 4 │ 1464 │ 60 │ \"RL\" │ 78 │ 9978 │ \"Pave\" │ NA │\n",
"│ 5 │ 1465 │ 120 │ \"RL\" │ 43 │ 5005 │ \"Pave\" │ NA │\n",
"│ 6 │ 1466 │ 60 │ \"RL\" │ 75 │ 10000 │ \"Pave\" │ NA │\n",
"│ 7 │ 1467 │ 20 │ \"RL\" │ NA │ 7980 │ \"Pave\" │ NA │\n",
"│ 8 │ 1468 │ 60 │ \"RL\" │ 63 │ 8402 │ \"Pave\" │ NA │\n",
"│ 9 │ 1469 │ 20 │ \"RL\" │ 85 │ 10176 │ \"Pave\" │ NA │\n",
"│ 10 │ 1470 │ 20 │ \"RL\" │ 70 │ 8400 │ \"Pave\" │ NA │\n",
"│ 11 │ 1471 │ 120 │ \"RH\" │ 26 │ 5858 │ \"Pave\" │ NA │\n",
"⋮\n",
"│ 1448 │ 2908 │ 20 │ \"RL\" │ 58 │ 10172 │ \"Pave\" │ NA │\n",
"│ 1449 │ 2909 │ 90 │ \"RL\" │ NA │ 11836 │ \"Pave\" │ NA │\n",
"│ 1450 │ 2910 │ 180 │ \"RM\" │ 21 │ 1470 │ \"Pave\" │ NA │\n",
"│ 1451 │ 2911 │ 160 │ \"RM\" │ 21 │ 1484 │ \"Pave\" │ NA │\n",
"│ 1452 │ 2912 │ 20 │ \"RL\" │ 80 │ 13384 │ \"Pave\" │ NA │\n",
"│ 1453 │ 2913 │ 160 │ \"RM\" │ 21 │ 1533 │ \"Pave\" │ NA │\n",
"│ 1454 │ 2914 │ 160 │ \"RM\" │ 21 │ 1526 │ \"Pave\" │ NA │\n",
"│ 1455 │ 2915 │ 160 │ \"RM\" │ 21 │ 1936 │ \"Pave\" │ NA │\n",
"│ 1456 │ 2916 │ 160 │ \"RM\" │ 21 │ 1894 │ \"Pave\" │ NA │\n",
"│ 1457 │ 2917 │ 20 │ \"RL\" │ 160 │ 20000 │ \"Pave\" │ NA │\n",
"│ 1458 │ 2918 │ 85 │ \"RL\" │ 62 │ 10441 │ \"Pave\" │ NA │\n",
"│ 1459 │ 2919 │ 60 │ \"RL\" │ 74 │ 9627 │ \"Pave\" │ NA │\n",
"\n",
"│ Row │ LotShape │ LandContour │ Utilities │ LotConfig │ LandSlope │\n",
"├──────┼──────────┼─────────────┼───────────┼───────────┼───────────┤\n",
"│ 1 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 2 │ \"IR1\" │ \"Lvl\" │ \"AllPub\" │ \"Corner\" │ \"Gtl\" │\n",
"│ 3 │ \"IR1\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 4 │ \"IR1\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 5 │ \"IR1\" │ \"HLS\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 6 │ \"IR1\" │ \"Lvl\" │ \"AllPub\" │ \"Corner\" │ \"Gtl\" │\n",
"│ 7 │ \"IR1\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 8 │ \"IR1\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 9 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 10 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Corner\" │ \"Gtl\" │\n",
"│ 11 │ \"IR1\" │ \"Lvl\" │ \"AllPub\" │ \"FR2\" │ \"Gtl\" │\n",
"⋮\n",
"│ 1448 │ \"IR1\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 1449 │ \"IR1\" │ \"Lvl\" │ \"AllPub\" │ \"Corner\" │ \"Gtl\" │\n",
"│ 1450 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 1451 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 1452 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Mod\" │\n",
"│ 1453 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 1454 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 1455 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 1456 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 1457 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 1458 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Gtl\" │\n",
"│ 1459 │ \"Reg\" │ \"Lvl\" │ \"AllPub\" │ \"Inside\" │ \"Mod\" │\n",
"\n",
"│ Row │ Neighborhood │ Condition1 │ Condition2 │ BldgType │ HouseStyle │\n",
"├──────┼──────────────┼────────────┼────────────┼──────────┼────────────┤\n",
"│ 1 │ \"NAmes\" │ \"Feedr\" │ \"Norm\" │ \"1Fam\" │ \"1Story\" │\n",
"│ 2 │ \"NAmes\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"1Story\" │\n",
"│ 3 │ \"Gilbert\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"2Story\" │\n",
"│ 4 │ \"Gilbert\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"2Story\" │\n",
"│ 5 │ \"StoneBr\" │ \"Norm\" │ \"Norm\" │ \"TwnhsE\" │ \"1Story\" │\n",
"│ 6 │ \"Gilbert\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"2Story\" │\n",
"│ 7 │ \"Gilbert\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"1Story\" │\n",
"│ 8 │ \"Gilbert\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"2Story\" │\n",
"│ 9 │ \"Gilbert\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"1Story\" │\n",
"│ 10 │ \"NAmes\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"1Story\" │\n",
"│ 11 │ \"NAmes\" │ \"Norm\" │ \"Norm\" │ \"TwnhsE\" │ \"1Story\" │\n",
"⋮\n",
"│ 1448 │ \"Mitchel\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"1Story\" │\n",
"│ 1449 │ \"Mitchel\" │ \"Norm\" │ \"Norm\" │ \"Duplex\" │ \"1Story\" │\n",
"│ 1450 │ \"MeadowV\" │ \"Norm\" │ \"Norm\" │ \"Twnhs\" │ \"SFoyer\" │\n",
"│ 1451 │ \"MeadowV\" │ \"Norm\" │ \"Norm\" │ \"TwnhsE\" │ \"2Story\" │\n",
"│ 1452 │ \"Mitchel\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"1Story\" │\n",
"│ 1453 │ \"MeadowV\" │ \"Norm\" │ \"Norm\" │ \"Twnhs\" │ \"2Story\" │\n",
"│ 1454 │ \"MeadowV\" │ \"Norm\" │ \"Norm\" │ \"Twnhs\" │ \"2Story\" │\n",
"│ 1455 │ \"MeadowV\" │ \"Norm\" │ \"Norm\" │ \"Twnhs\" │ \"2Story\" │\n",
"│ 1456 │ \"MeadowV\" │ \"Norm\" │ \"Norm\" │ \"TwnhsE\" │ \"2Story\" │\n",
"│ 1457 │ \"Mitchel\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"1Story\" │\n",
"│ 1458 │ \"Mitchel\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"SFoyer\" │\n",
"│ 1459 │ \"Mitchel\" │ \"Norm\" │ \"Norm\" │ \"1Fam\" │ \"2Story\" │\n",
"\n",
"│ Row │ OverallQual │ OverallCond │ YearBuilt │ YearRemodAdd │ RoofStyle │\n",
"├──────┼─────────────┼─────────────┼───────────┼──────────────┼───────────┤\n",
"│ 1 │ 5 │ 6 │ 1961 │ 1961 │ \"Gable\" │\n",
"│ 2 │ 6 │ 6 │ 1958 │ 1958 │ \"Hip\" │\n",
"│ 3 │ 5 │ 5 │ 1997 │ 1998 │ \"Gable\" │\n",
"│ 4 │ 6 │ 6 │ 1998 │ 1998 │ \"Gable\" │\n",
"│ 5 │ 8 │ 5 │ 1992 │ 1992 │ \"Gable\" │\n",
"│ 6 │ 6 │ 5 │ 1993 │ 1994 │ \"Gable\" │\n",
"│ 7 │ 6 │ 7 │ 1992 │ 2007 │ \"Gable\" │\n",
"│ 8 │ 6 │ 5 │ 1998 │ 1998 │ \"Gable\" │\n",
"│ 9 │ 7 │ 5 │ 1990 │ 1990 │ \"Gable\" │\n",
"│ 10 │ 4 │ 5 │ 1970 │ 1970 │ \"Gable\" │\n",
"│ 11 │ 7 │ 5 │ 1999 │ 1999 │ \"Gable\" │\n",
"⋮\n",
"│ 1448 │ 5 │ 7 │ 1968 │ 2003 │ \"Gable\" │\n",
"│ 1449 │ 5 │ 5 │ 1970 │ 1970 │ \"Gable\" │\n",
"│ 1450 │ 4 │ 6 │ 1970 │ 1970 │ \"Gable\" │\n",
"│ 1451 │ 4 │ 4 │ 1972 │ 1972 │ \"Gable\" │\n",
"│ 1452 │ 5 │ 5 │ 1969 │ 1979 │ \"Gable\" │\n",
"│ 1453 │ 4 │ 5 │ 1970 │ 1970 │ \"Gable\" │\n",
"│ 1454 │ 4 │ 5 │ 1970 │ 1970 │ \"Gable\" │\n",
"│ 1455 │ 4 │ 7 │ 1970 │ 1970 │ \"Gable\" │\n",
"│ 1456 │ 4 │ 5 │ 1970 │ 1970 │ \"Gable\" │\n",
"│ 1457 │ 5 │ 7 │ 1960 │ 1996 │ \"Gable\" │\n",
"│ 1458 │ 5 │ 5 │ 1992 │ 1992 │ \"Gable\" │\n",
"│ 1459 │ 7 │ 5 │ 1993 │ 1994 │ \"Gable\" │\n",
"\n",
"│ Row │ RoofMatl │ Exterior1st │ Exterior2nd │ MasVnrType │ MasVnrArea │\n",
"├──────┼───────────┼─────────────┼─────────────┼────────────┼────────────┤\n",
"│ 1 │ \"CompShg\" │ \"VinylSd\" │ \"VinylSd\" │ \"None\" │ 0 │\n",
"│ 2 │ \"CompShg\" │ \"Wd Sdng\" │ \"Wd Sdng\" │ \"BrkFace\" │ 108 │\n",
"│ 3 │ \"CompShg\" │ \"VinylSd\" │ \"VinylSd\" │ \"None\" │ 0 │\n",
"│ 4 │ \"CompShg\" │ \"VinylSd\" │ \"VinylSd\" │ \"BrkFace\" │ 20 │\n",
"│ 5 │ \"CompShg\" │ \"HdBoard\" │ \"HdBoard\" │ \"None\" │ 0 │\n",
"│ 6 │ \"CompShg\" │ \"HdBoard\" │ \"HdBoard\" │ \"None\" │ 0 │\n",
"│ 7 │ \"CompShg\" │ \"HdBoard\" │ \"HdBoard\" │ \"None\" │ 0 │\n",
"│ 8 │ \"CompShg\" │ \"VinylSd\" │ \"VinylSd\" │ \"None\" │ 0 │\n",
"│ 9 │ \"CompShg\" │ \"HdBoard\" │ \"HdBoard\" │ \"None\" │ 0 │\n",
"│ 10 │ \"CompShg\" │ \"Plywood\" │ \"Plywood\" │ \"None\" │ 0 │\n",
"│ 11 │ \"CompShg\" │ \"MetalSd\" │ \"MetalSd\" │ \"None\" │ 0 │\n",
"⋮\n",
"│ 1448 │ \"CompShg\" │ \"Plywood\" │ \"Plywood\" │ \"None\" │ 0 │\n",
"│ 1449 │ \"CompShg\" │ \"Plywood\" │ \"Plywood\" │ \"None\" │ 0 │\n",
"│ 1450 │ \"CompShg\" │ \"CemntBd\" │ \"CmentBd\" │ \"None\" │ 0 │\n",
"│ 1451 │ \"CompShg\" │ \"CemntBd\" │ \"CmentBd\" │ \"None\" │ 0 │\n",
"│ 1452 │ \"CompShg\" │ \"Plywood\" │ \"Plywood\" │ \"BrkFace\" │ 194 │\n",
"│ 1453 │ \"CompShg\" │ \"CemntBd\" │ \"CmentBd\" │ \"None\" │ 0 │\n",
"│ 1454 │ \"CompShg\" │ \"CemntBd\" │ \"CmentBd\" │ \"None\" │ 0 │\n",
"│ 1455 │ \"CompShg\" │ \"CemntBd\" │ \"CmentBd\" │ \"None\" │ 0 │\n",
"│ 1456 │ \"CompShg\" │ \"CemntBd\" │ \"CmentBd\" │ \"None\" │ 0 │\n",
"│ 1457 │ \"CompShg\" │ \"VinylSd\" │ \"VinylSd\" │ \"None\" │ 0 │\n",
"│ 1458 │ \"CompShg\" │ \"HdBoard\" │ \"Wd Shng\" │ \"None\" │ 0 │\n",
"│ 1459 │ \"CompShg\" │ \"HdBoard\" │ \"HdBoard\" │ \"BrkFace\" │ 94 │\n",
"\n",
"│ Row │ ExterQual │ ExterCond │ Foundation │ BsmtQual │ BsmtCond │\n",
"├──────┼───────────┼───────────┼────────────┼──────────┼──────────┤\n",
"│ 1 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"TA\" │ \"TA\" │\n",
"│ 2 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"TA\" │ \"TA\" │\n",
"│ 3 │ \"TA\" │ \"TA\" │ \"PConc\" │ \"Gd\" │ \"TA\" │\n",
"│ 4 │ \"TA\" │ \"TA\" │ \"PConc\" │ \"TA\" │ \"TA\" │\n",
"│ 5 │ \"Gd\" │ \"TA\" │ \"PConc\" │ \"Gd\" │ \"TA\" │\n",
"│ 6 │ \"TA\" │ \"TA\" │ \"PConc\" │ \"Gd\" │ \"TA\" │\n",
"│ 7 │ \"TA\" │ \"Gd\" │ \"PConc\" │ \"Gd\" │ \"TA\" │\n",
"│ 8 │ \"TA\" │ \"TA\" │ \"PConc\" │ \"Gd\" │ \"TA\" │\n",
"│ 9 │ \"TA\" │ \"TA\" │ \"PConc\" │ \"Gd\" │ \"TA\" │\n",
"│ 10 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"TA\" │ \"TA\" │\n",
"│ 11 │ \"Gd\" │ \"TA\" │ \"PConc\" │ \"Gd\" │ \"TA\" │\n",
"⋮\n",
"│ 1448 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"TA\" │ \"TA\" │\n",
"│ 1449 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"TA\" │ \"TA\" │\n",
"│ 1450 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"Gd\" │ \"TA\" │\n",
"│ 1451 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"TA\" │ \"TA\" │\n",
"│ 1452 │ \"TA\" │ \"TA\" │ \"PConc\" │ \"TA\" │ \"TA\" │\n",
"│ 1453 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"TA\" │ \"TA\" │\n",
"│ 1454 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"TA\" │ \"TA\" │\n",
"│ 1455 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"TA\" │ \"TA\" │\n",
"│ 1456 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"TA\" │ \"TA\" │\n",
"│ 1457 │ \"TA\" │ \"TA\" │ \"CBlock\" │ \"TA\" │ \"TA\" │\n",
"│ 1458 │ \"TA\" │ \"TA\" │ \"PConc\" │ \"Gd\" │ \"TA\" │\n",
"│ 1459 │ \"TA\" │ \"TA\" │ \"PConc\" │ \"Gd\" │ \"TA\" │\n",
"\n",
"│ Row │ BsmtExposure │ BsmtFinType1 │ BsmtFinSF1 │ BsmtFinType2 │ BsmtFinSF2 │\n",
"├──────┼──────────────┼──────────────┼────────────┼──────────────┼────────────┤\n",
"│ 1 │ \"No\" │ \"Rec\" │ 468 │ \"LwQ\" │ 144 │\n",
"│ 2 │ \"No\" │ \"ALQ\" │ 923 │ \"Unf\" │ 0 │\n",
"│ 3 │ \"No\" │ \"GLQ\" │ 791 │ \"Unf\" │ 0 │\n",
"│ 4 │ \"No\" │ \"GLQ\" │ 602 │ \"Unf\" │ 0 │\n",
"│ 5 │ \"No\" │ \"ALQ\" │ 263 │ \"Unf\" │ 0 │\n",
"│ 6 │ \"No\" │ \"Unf\" │ 0 │ \"Unf\" │ 0 │\n",
"│ 7 │ \"No\" │ \"ALQ\" │ 935 │ \"Unf\" │ 0 │\n",
"│ 8 │ \"No\" │ \"Unf\" │ 0 │ \"Unf\" │ 0 │\n",
"│ 9 │ \"Gd\" │ \"GLQ\" │ 637 │ \"Unf\" │ 0 │\n",
"│ 10 │ \"No\" │ \"ALQ\" │ 804 │ \"Rec\" │ 78 │\n",
"│ 11 │ \"No\" │ \"GLQ\" │ 1051 │ \"BLQ\" │ 0 │\n",
"⋮\n",
"│ 1448 │ \"No\" │ \"ALQ\" │ 441 │ \"Unf\" │ 0 │\n",
"│ 1449 │ \"No\" │ \"BLQ\" │ 149 │ \"Unf\" │ 0 │\n",
"│ 1450 │ \"Av\" │ \"GLQ\" │ 522 │ \"Unf\" │ 0 │\n",
"│ 1451 │ \"No\" │ \"Rec\" │ 252 │ \"Unf\" │ 0 │\n",
"│ 1452 │ \"Av\" │ \"Rec\" │ 119 │ \"BLQ\" │ 344 │\n",
"│ 1453 │ \"No\" │ \"Rec\" │ 408 │ \"Unf\" │ 0 │\n",
"│ 1454 │ \"No\" │ \"Unf\" │ 0 │ \"Unf\" │ 0 │\n",
"│ 1455 │ \"No\" │ \"Unf\" │ 0 │ \"Unf\" │ 0 │\n",
"│ 1456 │ \"No\" │ \"Rec\" │ 252 │ \"Unf\" │ 0 │\n",
"│ 1457 │ \"No\" │ \"ALQ\" │ 1224 │ \"Unf\" │ 0 │\n",
"│ 1458 │ \"Av\" │ \"GLQ\" │ 337 │ \"Unf\" │ 0 │\n",
"│ 1459 │ \"Av\" │ \"LwQ\" │ 758 │ \"Unf\" │ 0 │\n",
"\n",
"│ Row │ BsmtUnfSF │ TotalBsmtSF │ Heating │ HeatingQC │ CentralAir │\n",
"├──────┼───────────┼─────────────┼─────────┼───────────┼────────────┤\n",
"│ 1 │ 270 │ 882 │ \"GasA\" │ \"TA\" │ \"Y\" │\n",
"│ 2 │ 406 │ 1329 │ \"GasA\" │ \"TA\" │ \"Y\" │\n",
"│ 3 │ 137 │ 928 │ \"GasA\" │ \"Gd\" │ \"Y\" │\n",
"│ 4 │ 324 │ 926 │ \"GasA\" │ \"Ex\" │ \"Y\" │\n",
"│ 5 │ 1017 │ 1280 │ \"GasA\" │ \"Ex\" │ \"Y\" │\n",
"│ 6 │ 763 │ 763 │ \"GasA\" │ \"Gd\" │ \"Y\" │\n",
"│ 7 │ 233 │ 1168 │ \"GasA\" │ \"Ex\" │ \"Y\" │\n",
"│ 8 │ 789 │ 789 │ \"GasA\" │ \"Gd\" │ \"Y\" │\n",
"│ 9 │ 663 │ 1300 │ \"GasA\" │ \"Gd\" │ \"Y\" │\n",
"│ 10 │ 0 │ 882 │ \"GasA\" │ \"TA\" │ \"Y\" │\n",
"│ 11 │ 354 │ 1405 │ \"GasA\" │ \"Ex\" │ \"Y\" │\n",
"⋮\n",
"│ 1448 │ 423 │ 864 │ \"GasA\" │ \"Ex\" │ \"Y\" │\n",
"│ 1449 │ 1503 │ 1652 │ \"GasA\" │ \"TA\" │ \"Y\" │\n",
"│ 1450 │ 108 │ 630 │ \"GasA\" │ \"TA\" │ \"Y\" │\n",
"│ 1451 │ 294 │ 546 │ \"GasA\" │ \"TA\" │ \"Y\" │\n",
"│ 1452 │ 641 │ 1104 │ \"GasA\" │ \"Fa\" │ \"Y\" │\n",
"│ 1453 │ 138 │ 546 │ \"GasA\" │ \"TA\" │ \"Y\" │\n",
"│ 1454 │ 546 │ 546 │ \"GasA\" │ \"TA\" │ \"Y\" │\n",
"│ 1455 │ 546 │ 546 │ \"GasA\" │ \"Gd\" │ \"Y\" │\n",
"│ 1456 │ 294 │ 546 │ \"GasA\" │ \"TA\" │ \"Y\" │\n",
"│ 1457 │ 0 │ 1224 │ \"GasA\" │ \"Ex\" │ \"Y\" │\n",
"│ 1458 │ 575 │ 912 │ \"GasA\" │ \"TA\" │ \"Y\" │\n",
"│ 1459 │ 238 │ 996 │ \"GasA\" │ \"Ex\" │ \"Y\" │\n",
"\n",
"│ Row │ Electrical │ x1stFlrSF │ x2ndFlrSF │ LowQualFinSF │ GrLivArea │\n",
"├──────┼────────────┼───────────┼───────────┼──────────────┼───────────┤\n",
"│ 1 │ \"SBrkr\" │ 896 │ 0 │ 0 │ 896 │\n",
"│ 2 │ \"SBrkr\" │ 1329 │ 0 │ 0 │ 1329 │\n",
"│ 3 │ \"SBrkr\" │ 928 │ 701 │ 0 │ 1629 │\n",
"│ 4 │ \"SBrkr\" │ 926 │ 678 │ 0 │ 1604 │\n",
"│ 5 │ \"SBrkr\" │ 1280 │ 0 │ 0 │ 1280 │\n",
"│ 6 │ \"SBrkr\" │ 763 │ 892 │ 0 │ 1655 │\n",
"│ 7 │ \"SBrkr\" │ 1187 │ 0 │ 0 │ 1187 │\n",
"│ 8 │ \"SBrkr\" │ 789 │ 676 │ 0 │ 1465 │\n",
"│ 9 │ \"SBrkr\" │ 1341 │ 0 │ 0 │ 1341 │\n",
"│ 10 │ \"SBrkr\" │ 882 │ 0 │ 0 │ 882 │\n",
"│ 11 │ \"SBrkr\" │ 1337 │ 0 │ 0 │ 1337 │\n",
"⋮\n",
"│ 1448 │ \"SBrkr\" │ 874 │ 0 │ 0 │ 874 │\n",
"│ 1449 │ \"SBrkr\" │ 1652 │ 0 │ 0 │ 1652 │\n",
"│ 1450 │ \"SBrkr\" │ 630 │ 0 │ 0 │ 630 │\n",
"│ 1451 │ \"SBrkr\" │ 546 │ 546 │ 0 │ 1092 │\n",
"│ 1452 │ \"SBrkr\" │ 1360 │ 0 │ 0 │ 1360 │\n",
"│ 1453 │ \"SBrkr\" │ 546 │ 546 │ 0 │ 1092 │\n",
"│ 1454 │ \"SBrkr\" │ 546 │ 546 │ 0 │ 1092 │\n",
"│ 1455 │ \"SBrkr\" │ 546 │ 546 │ 0 │ 1092 │\n",
"│ 1456 │ \"SBrkr\" │ 546 │ 546 │ 0 │ 1092 │\n",
"│ 1457 │ \"SBrkr\" │ 1224 │ 0 │ 0 │ 1224 │\n",
"│ 1458 │ \"SBrkr\" │ 970 │ 0 │ 0 │ 970 │\n",
"│ 1459 │ \"SBrkr\" │ 996 │ 1004 │ 0 │ 2000 │\n",
"\n",
"│ Row │ BsmtFullBath │ BsmtHalfBath │ FullBath │ HalfBath │ BedroomAbvGr │\n",
"├──────┼──────────────┼──────────────┼──────────┼──────────┼──────────────┤\n",
"│ 1 │ 0 │ 0 │ 1 │ 0 │ 2 │\n",
"│ 2 │ 0 │ 0 │ 1 │ 1 │ 3 │\n",
"│ 3 │ 0 │ 0 │ 2 │ 1 │ 3 │\n",
"│ 4 │ 0 │ 0 │ 2 │ 1 │ 3 │\n",
"│ 5 │ 0 │ 0 │ 2 │ 0 │ 2 │\n",
"│ 6 │ 0 │ 0 │ 2 │ 1 │ 3 │\n",
"│ 7 │ 1 │ 0 │ 2 │ 0 │ 3 │\n",
"│ 8 │ 0 │ 0 │ 2 │ 1 │ 3 │\n",
"│ 9 │ 1 │ 0 │ 1 │ 1 │ 2 │\n",
"│ 10 │ 1 │ 0 │ 1 │ 0 │ 2 │\n",
"│ 11 │ 1 │ 0 │ 2 │ 0 │ 2 │\n",
"⋮\n",
"│ 1448 │ 1 │ 0 │ 1 │ 0 │ 3 │\n",
"│ 1449 │ 0 │ 0 │ 2 │ 0 │ 4 │\n",
"│ 1450 │ 1 │ 0 │ 1 │ 0 │ 1 │\n",
"│ 1451 │ 0 │ 0 │ 1 │ 1 │ 3 │\n",
"│ 1452 │ 1 │ 0 │ 1 │ 0 │ 3 │\n",
"│ 1453 │ 0 │ 0 │ 1 │ 1 │ 3 │\n",
"│ 1454 │ 0 │ 0 │ 1 │ 1 │ 3 │\n",
"│ 1455 │ 0 │ 0 │ 1 │ 1 │ 3 │\n",
"│ 1456 │ 0 │ 0 │ 1 │ 1 │ 3 │\n",
"│ 1457 │ 1 │ 0 │ 1 │ 0 │ 4 │\n",
"│ 1458 │ 0 │ 1 │ 1 │ 0 │ 3 │\n",
"│ 1459 │ 0 │ 0 │ 2 │ 1 │ 3 │\n",
"\n",
"│ Row │ KitchenAbvGr │ KitchenQual │ TotRmsAbvGrd │ Functional │ Fireplaces │\n",
"├──────┼──────────────┼─────────────┼──────────────┼────────────┼────────────┤\n",
"│ 1 │ 1 │ \"TA\" │ 5 │ \"Typ\" │ 0 │\n",
"│ 2 │ 1 │ \"Gd\" │ 6 │ \"Typ\" │ 0 │\n",
"│ 3 │ 1 │ \"TA\" │ 6 │ \"Typ\" │ 1 │\n",
"│ 4 │ 1 │ \"Gd\" │ 7 │ \"Typ\" │ 1 │\n",
"│ 5 │ 1 │ \"Gd\" │ 5 │ \"Typ\" │ 0 │\n",
"│ 6 │ 1 │ \"TA\" │ 7 │ \"Typ\" │ 1 │\n",
"│ 7 │ 1 │ \"TA\" │ 6 │ \"Typ\" │ 0 │\n",
"│ 8 │ 1 │ \"TA\" │ 7 │ \"Typ\" │ 1 │\n",
"│ 9 │ 1 │ \"Gd\" │ 5 │ \"Typ\" │ 1 │\n",
"│ 10 │ 1 │ \"TA\" │ 4 │ \"Typ\" │ 0 │\n",
"│ 11 │ 1 │ \"Gd\" │ 5 │ \"Typ\" │ 1 │\n",
"⋮\n",
"│ 1448 │ 1 │ \"TA\" │ 5 │ \"Typ\" │ 0 │\n",
"│ 1449 │ 2 │ \"TA\" │ 8 │ \"Typ\" │ 0 │\n",
"│ 1450 │ 1 │ \"TA\" │ 3 │ \"Typ\" │ 0 │\n",
"│ 1451 │ 1 │ \"TA\" │ 5 │ \"Typ\" │ 0 │\n",
"│ 1452 │ 1 │ \"TA\" │ 8 │ \"Typ\" │ 1 │\n",
"│ 1453 │ 1 │ \"TA\" │ 5 │ \"Typ\" │ 0 │\n",
"│ 1454 │ 1 │ \"TA\" │ 5 │ \"Typ\" │ 0 │\n",
"│ 1455 │ 1 │ \"TA\" │ 5 │ \"Typ\" │ 0 │\n",
"│ 1456 │ 1 │ \"TA\" │ 6 │ \"Typ\" │ 0 │\n",
"│ 1457 │ 1 │ \"TA\" │ 7 │ \"Typ\" │ 1 │\n",
"│ 1458 │ 1 │ \"TA\" │ 6 │ \"Typ\" │ 0 │\n",
"│ 1459 │ 1 │ \"TA\" │ 9 │ \"Typ\" │ 1 │\n",
"\n",
"│ Row │ FireplaceQu │ GarageType │ GarageYrBlt │ GarageFinish │ GarageCars │\n",
"├──────┼─────────────┼────────────┼─────────────┼──────────────┼────────────┤\n",
"│ 1 │ NA │ \"Attchd\" │ 1961 │ \"Unf\" │ 1 │\n",
"│ 2 │ NA │ \"Attchd\" │ 1958 │ \"Unf\" │ 1 │\n",
"│ 3 │ \"TA\" │ \"Attchd\" │ 1997 │ \"Fin\" │ 2 │\n",
"│ 4 │ \"Gd\" │ \"Attchd\" │ 1998 │ \"Fin\" │ 2 │\n",
"│ 5 │ NA │ \"Attchd\" │ 1992 │ \"RFn\" │ 2 │\n",
"│ 6 │ \"TA\" │ \"Attchd\" │ 1993 │ \"Fin\" │ 2 │\n",
"│ 7 │ NA │ \"Attchd\" │ 1992 │ \"Fin\" │ 2 │\n",
"│ 8 │ \"Gd\" │ \"Attchd\" │ 1998 │ \"Fin\" │ 2 │\n",
"│ 9 │ \"Po\" │ \"Attchd\" │ 1990 │ \"Unf\" │ 2 │\n",
"│ 10 │ NA │ \"Attchd\" │ 1970 │ \"Fin\" │ 2 │\n",
"│ 11 │ \"Fa\" │ \"Attchd\" │ 1999 │ \"Fin\" │ 2 │\n",
"⋮\n",
"│ 1448 │ NA │ \"Attchd\" │ 1968 │ \"RFn\" │ 1 │\n",
"│ 1449 │ NA │ \"2Types\" │ 1970 │ \"Unf\" │ 3 │\n",
"│ 1450 │ NA │ NA │ NA │ NA │ 0 │\n",
"│ 1451 │ NA │ \"Attchd\" │ 1972 │ \"Unf\" │ 1 │\n",
"│ 1452 │ \"TA\" │ \"Attchd\" │ 1969 │ \"RFn\" │ 1 │\n",
"│ 1453 │ NA │ \"CarPort\" │ 1970 │ \"Unf\" │ 1 │\n",
"│ 1454 │ NA │ NA │ NA │ NA │ 0 │\n",
"│ 1455 │ NA │ NA │ NA │ NA │ 0 │\n",
"│ 1456 │ NA │ \"CarPort\" │ 1970 │ \"Unf\" │ 1 │\n",
"│ 1457 │ \"TA\" │ \"Detchd\" │ 1960 │ \"Unf\" │ 2 │\n",
"│ 1458 │ NA │ NA │ NA │ NA │ 0 │\n",
"│ 1459 │ \"TA\" │ \"Attchd\" │ 1993 │ \"Fin\" │ 3 │\n",
"\n",
"│ Row │ GarageArea │ GarageQual │ GarageCond │ PavedDrive │ WoodDeckSF │\n",
"├──────┼────────────┼────────────┼────────────┼────────────┼────────────┤\n",
"│ 1 │ 730 │ \"TA\" │ \"TA\" │ \"Y\" │ 140 │\n",
"│ 2 │ 312 │ \"TA\" │ \"TA\" │ \"Y\" │ 393 │\n",
"│ 3 │ 482 │ \"TA\" │ \"TA\" │ \"Y\" │ 212 │\n",
"│ 4 │ 470 │ \"TA\" │ \"TA\" │ \"Y\" │ 360 │\n",
"│ 5 │ 506 │ \"TA\" │ \"TA\" │ \"Y\" │ 0 │\n",
"│ 6 │ 440 │ \"TA\" │ \"TA\" │ \"Y\" │ 157 │\n",
"│ 7 │ 420 │ \"TA\" │ \"TA\" │ \"Y\" │ 483 │\n",
"│ 8 │ 393 │ \"TA\" │ \"TA\" │ \"Y\" │ 0 │\n",
"│ 9 │ 506 │ \"TA\" │ \"TA\" │ \"Y\" │ 192 │\n",
"│ 10 │ 525 │ \"TA\" │ \"TA\" │ \"Y\" │ 240 │\n",
"│ 11 │ 511 │ \"TA\" │ \"TA\" │ \"Y\" │ 203 │\n",
"⋮\n",
"│ 1448 │ 288 │ \"TA\" │ \"TA\" │ \"Y\" │ 0 │\n",
"│ 1449 │ 928 │ \"TA\" │ \"TA\" │ \"Y\" │ 0 │\n",
"│ 1450 │ 0 │ NA │ NA │ \"Y\" │ 0 │\n",
"│ 1451 │ 253 │ \"TA\" │ \"Fa\" │ \"Y\" │ 0 │\n",
"│ 1452 │ 336 │ \"TA\" │ \"TA\" │ \"Y\" │ 160 │\n",
"│ 1453 │ 286 │ \"TA\" │ \"TA\" │ \"Y\" │ 0 │\n",
"│ 1454 │ 0 │ NA │ NA │ \"Y\" │ 0 │\n",
"│ 1455 │ 0 │ NA │ NA │ \"Y\" │ 0 │\n",
"│ 1456 │ 286 │ \"TA\" │ \"TA\" │ \"Y\" │ 0 │\n",
"│ 1457 │ 576 │ \"TA\" │ \"TA\" │ \"Y\" │ 474 │\n",
"│ 1458 │ 0 │ NA │ NA │ \"Y\" │ 80 │\n",
"│ 1459 │ 650 │ \"TA\" │ \"TA\" │ \"Y\" │ 190 │\n",
"\n",
"│ Row │ OpenPorchSF │ EnclosedPorch │ x3SsnPorch │ ScreenPorch │ PoolArea │\n",
"├──────┼─────────────┼───────────────┼────────────┼─────────────┼──────────┤\n",
"│ 1 │ 0 │ 0 │ 0 │ 120 │ 0 │\n",
"│ 2 │ 36 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 3 │ 34 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 4 │ 36 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 5 │ 82 │ 0 │ 0 │ 144 │ 0 │\n",
"│ 6 │ 84 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 7 │ 21 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 8 │ 75 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 9 │ 0 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 10 │ 0 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 11 │ 68 │ 0 │ 0 │ 0 │ 0 │\n",
"⋮\n",
"│ 1448 │ 120 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 1449 │ 0 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 1450 │ 0 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 1451 │ 0 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 1452 │ 0 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 1453 │ 0 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 1454 │ 34 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 1455 │ 0 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 1456 │ 24 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 1457 │ 0 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 1458 │ 32 │ 0 │ 0 │ 0 │ 0 │\n",
"│ 1459 │ 48 │ 0 │ 0 │ 0 │ 0 │\n",
"\n",
"│ Row │ PoolQC │ Fence │ MiscFeature │ MiscVal │ MoSold │ YrSold │ SaleType │\n",
"├──────┼────────┼─────────┼─────────────┼─────────┼────────┼────────┼──────────┤\n",
"│ 1 │ NA │ \"MnPrv\" │ NA │ 0 │ 6 │ 2010 │ \"WD\" │\n",
"│ 2 │ NA │ NA │ \"Gar2\" │ 12500 │ 6 │ 2010 │ \"WD\" │\n",
"│ 3 │ NA │ \"MnPrv\" │ NA │ 0 │ 3 │ 2010 │ \"WD\" │\n",
"│ 4 │ NA │ NA │ NA │ 0 │ 6 │ 2010 │ \"WD\" │\n",
"│ 5 │ NA │ NA │ NA │ 0 │ 1 │ 2010 │ \"WD\" │\n",
"│ 6 │ NA │ NA │ NA │ 0 │ 4 │ 2010 │ \"WD\" │\n",
"│ 7 │ NA │ \"GdPrv\" │ \"Shed\" │ 500 │ 3 │ 2010 │ \"WD\" │\n",
"│ 8 │ NA │ NA │ NA │ 0 │ 5 │ 2010 │ \"WD\" │\n",
"│ 9 │ NA │ NA │ NA │ 0 │ 2 │ 2010 │ \"WD\" │\n",
"│ 10 │ NA │ \"MnPrv\" │ NA │ 0 │ 4 │ 2010 │ \"WD\" │\n",
"│ 11 │ NA │ NA │ NA │ 0 │ 6 │ 2010 │ \"WD\" │\n",
"⋮\n",
"│ 1448 │ NA │ NA │ NA │ 0 │ 10 │ 2006 │ \"WD\" │\n",
"│ 1449 │ NA │ NA │ NA │ 0 │ 3 │ 2006 │ \"WD\" │\n",
"│ 1450 │ NA │ NA │ NA │ 0 │ 4 │ 2006 │ \"WD\" │\n",
"│ 1451 │ NA │ NA │ NA │ 0 │ 5 │ 2006 │ \"WD\" │\n",
"│ 1452 │ NA │ NA │ NA │ 0 │ 5 │ 2006 │ \"WD\" │\n",
"│ 1453 │ NA │ NA │ NA │ 0 │ 12 │ 2006 │ \"WD\" │\n",
"│ 1454 │ NA │ \"GdPrv\" │ NA │ 0 │ 6 │ 2006 │ \"WD\" │\n",
"│ 1455 │ NA │ NA │ NA │ 0 │ 6 │ 2006 │ \"WD\" │\n",
"│ 1456 │ NA │ NA │ NA │ 0 │ 4 │ 2006 │ \"WD\" │\n",
"│ 1457 │ NA │ NA │ NA │ 0 │ 9 │ 2006 │ \"WD\" │\n",
"│ 1458 │ NA │ \"MnPrv\" │ \"Shed\" │ 700 │ 7 │ 2006 │ \"WD\" │\n",
"│ 1459 │ NA │ NA │ NA │ 0 │ 11 │ 2006 │ \"WD\" │\n",
"\n",
"│ Row │ SaleCondition │\n",
"├──────┼───────────────┤\n",
"│ 1 │ \"Normal\" │\n",
"│ 2 │ \"Normal\" │\n",
"│ 3 │ \"Normal\" │\n",
"│ 4 │ \"Normal\" │\n",
"│ 5 │ \"Normal\" │\n",
"│ 6 │ \"Normal\" │\n",
"│ 7 │ \"Normal\" │\n",
"│ 8 │ \"Normal\" │\n",
"│ 9 │ \"Normal\" │\n",
"│ 10 │ \"Normal\" │\n",
"│ 11 │ \"Normal\" │\n",
"⋮\n",
"│ 1448 │ \"Normal\" │\n",
"│ 1449 │ \"Normal\" │\n",
"│ 1450 │ \"Normal\" │\n",
"│ 1451 │ \"Normal\" │\n",
"│ 1452 │ \"Normal\" │\n",
"│ 1453 │ \"Abnorml\" │\n",
"│ 1454 │ \"Normal\" │\n",
"│ 1455 │ \"Normal\" │\n",
"│ 1456 │ \"Abnorml\" │\n",
"│ 1457 │ \"Abnorml\" │\n",
"│ 1458 │ \"Normal\" │\n",
"│ 1459 │ \"Normal\" │"
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"train_X = deepcopy(train)\n",
"delete!(train_X, :SalePrice)\n",
"train_y = deepcopy(train[:SalePrice])\n",
"test_X = deepcopy(test)"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"simpleencode (generic function with 1 method)"
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"@sk_import preprocessing: LabelEncoder \n",
"labelencoder = LabelEncoder()\n",
"\n",
"# Label-encode, in place, every column of `df` that is a DataArray{String,1}.\n",
"# Columns of any other type are left untouched. fit_transform! is called on the\n",
"# shared `labelencoder` once per encoded column.\n",
"function simpleencode(df)\n",
"    for name in names(df)\n",
"        column = df[:, name]\n",
"        # Guard clause: only String-typed DataArray columns are encoded.\n",
"        isa(column, DataArrays.DataArray{String,1}) || continue\n",
"        df[:, name] = fit_transform!(labelencoder, column)\n",
"    end\n",
"end"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [],
"source": [
"simpleencode(train_X)\n",
"simpleencode(test_X)"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"fillna (generic function with 1 method)"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Fill missing values and rescale every column of `df` in place.\n",
"#\n",
"# For each column: take the median of its non-NA entries, convert the column to\n",
"# a Float64 DataArray, overwrite the NA entries with that median, then (for every\n",
"# column except :SalePrice) divide the column by its maximum.\n",
"#\n",
"# NOTE(review): the maximum is taken from `df` itself, so data frames passed in\n",
"# separate calls are each scaled by their own maxima -- confirm this is intended.\n",
"function fillna(df)\n",
"    for col in names(df)\n",
"        # Median of the observed values, computed before the Float64 conversion.\n",
"        m = median(dropna(df[:, col]))\n",
"        df[:, col] = convert(DataArrays.DataArray{Float64,1}, df[:, col])\n",
"        df[isna.(df[:, col]), col] = m\n",
"        if col != :SalePrice\n",
"            # Normalization\n",
"            # Skip the division when the maximum is 0: an all-zero column would\n",
"            # otherwise become 0/0 = NaN.\n",
"            colmax = maximum(df[:, col])\n",
"            if colmax != 0\n",
"                df[:, col] /= colmax\n",
"            end\n",
"        end\n",
"    end\n",
"end"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [],
"source": [
"fillna(train_X)\n",
"fillna(test_X)"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"1460-element DataArrays.DataArray{Float64,1}:\n",
" 12.2477\n",
" 12.109 \n",
" 12.3172\n",
" 11.8494\n",
" 12.4292\n",
" 11.8706\n",
" 12.6346\n",
" 12.2061\n",
" 11.7745\n",
" 11.6784\n",
" 11.7714\n",
" 12.7513\n",
" 11.8776\n",
" ⋮ \n",
" 11.6263\n",
" 11.4295\n",
" 11.8204\n",
" 12.5676\n",
" 11.8845\n",
" 11.3445\n",
" 12.1281\n",
" 12.0725\n",
" 12.2549\n",
" 12.4931\n",
" 11.8645\n",
" 11.9016"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"features = [:MSSubClass, :MSZoning, :LotFrontage, :LotArea, :Street, :LotShape, :LandContour, :Utilities,\n",
" :LotConfig, :LandSlope, :Neighborhood, :Condition1, :Condition2, :BldgType, :HouseStyle,\n",
" :OverallQual, :OverallCond, :YearBuilt, :YearRemodAdd, :RoofStyle, :RoofMatl, :Exterior1st,\n",
" :Exterior2nd, :MasVnrType, :MasVnrArea, :ExterQual, :ExterCond, :Foundation, :BsmtQual,\n",
" :BsmtCond, :BsmtExposure, :BsmtFinType1, :BsmtFinSF1, :BsmtFinType2, :BsmtFinSF2, :BsmtUnfSF,\n",
" :TotalBsmtSF, :Heating, :HeatingQC, :CentralAir, :Electrical, :x1stFlrSF, :x2ndFlrSF, :LowQualFinSF,\n",
" :GrLivArea, :BsmtFullBath, :BsmtHalfBath, :FullBath, :HalfBath, :BedroomAbvGr, :KitchenAbvGr,\n",
" :KitchenQual, :TotRmsAbvGrd, :Functional, :Fireplaces, :GarageType, :GarageYrBlt, :GarageFinish,\n",
" :GarageCars, :GarageArea, :GarageQual, :GarageCond, :PavedDrive, :WoodDeckSF, :OpenPorchSF,\n",
" :EnclosedPorch, :x3SsnPorch, :ScreenPorch, :PoolArea, :MiscVal, :MoSold, :YrSold, :SaleType,\n",
" :SaleCondition]\n",
"\n",
"train_X = train_X[features]\n",
"test_X = test_X[features]\n",
"\n",
"train_y = log(train_y)"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"DecisionTree.RandomForestRegressor(0, 5, 100, 0.7, -1, MersenneTwister(UInt32[0x2260c660, 0x859edcf8, 0x8cb1b74b, 0x36a7bd04], Base.dSFMT.DSFMT_state(Int32[1728377803, 1073510784, -1426080803, 1073638834, 1526305482, 1072896906, 635323365, 1073540432, 729237756, 1073120764 … 1973961609, 1073348858, 2006398861, 1072853698, -923552792, 380851979, 379299954, 1933571904, 382, 0]), [1.77966, 1.90178, 1.19422, 1.80794, 1.40771, 1.1778, 1.73983, 1.04134, 1.95272, 1.0517 … 1.81721, 1.85347, 1.20855, 1.37782, 1.13193, 1.39421, 1.78027, 1.88269, 1.62524, 1.15302], 16), #undef)"
]
},
"execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"rf = RandomForestRegressor(ntrees=100)"
]
},
{
"cell_type": "code",
"execution_count": 11,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"5-element Array{Float64,1}:\n",
" 0.0180812\n",
" 0.0247816\n",
" 0.0210321\n",
" 0.0172874\n",
" 0.0226158"
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Negate the five per-fold scores returned by cross_val_score.\n",
"-cross_val_score(rf, Matrix{Float64}(train_X), Vector{Float64}(train_y); cv=5)"
]
},
{
"cell_type": "code",
"execution_count": 12,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"DecisionTree.RandomForestRegressor(0, 5, 100, 0.7, -1, MersenneTwister(UInt32[0x2260c660, 0x859edcf8, 0x8cb1b74b, 0x36a7bd04], Base.dSFMT.DSFMT_state(Int32[-1763565617, 1072972762, -1620770262, 1072744832, -795533503, 1073542149, -1018999408, 1072753247, 1466164648, 1072969700 … -346694294, 1073283632, 473949148, 1072965301, -1078901000, -1965756237, 1131152006, 1913764482, 382, 0]), [1.26657, 1.04919, 1.80958, 1.05722, 1.26365, 1.23275, 1.73405, 1.21416, 1.61863, 1.42897 … 1.6701, 1.87049, 1.09712, 1.96342, 1.15374, 1.44459, 1.85263, 1.48102, 1.56303, 1.25945], 222), Ensemble of Decision Trees\n",
"Trees: 100\n",
"Avg Leaves: 338.12\n",
"Avg Depth: 19.73)"
]
},
"execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"fit!(rf, Matrix{Float64}(train_X), Vector{Float64}(train_y))"
]
},
{
"cell_type": "code",
"execution_count": 13,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"1459-element Array{Float64,1}:\n",
" 11.7982\n",
" 11.9792\n",
" 12.0241\n",
" 12.0874\n",
" 12.3244\n",
" 12.0207\n",
" 11.9593\n",
" 11.9599\n",
" 12.2785\n",
" 11.7537\n",
" 12.3239\n",
" 11.4588\n",
" 11.5952\n",
" ⋮ \n",
" 11.7931\n",
" 11.8884\n",
" 11.4767\n",
" 11.426 \n",
" 11.895 \n",
" 11.5121\n",
" 11.419 \n",
" 11.4623\n",
" 11.5128\n",
" 11.9206\n",
" 11.7408\n",
" 12.4708"
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"pred_y = predict(rf, Matrix{Float64}(test_X))"
]
},
{
"cell_type": "code",
"execution_count": 14,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"1459-element Array{Float64,1}:\n",
" 1.3301e5 \n",
" 1.59408e5\n",
" 1.66723e5\n",
" 1.77611e5\n",
" 2.2513e5 \n",
" 1.66161e5\n",
" 1.56267e5\n",
" 1.56357e5\n",
" 2.15017e5\n",
" 1.27228e5\n",
" 225020.0 \n",
" 94728.1 \n",
" 1.08574e5\n",
" ⋮ \n",
" 1.32335e5\n",
" 1.45569e5\n",
" 96438.5 \n",
" 91672.9 \n",
" 1.46526e5\n",
" 99917.7 \n",
" 91031.6 \n",
" 95059.7 \n",
" 99984.0 \n",
" 1.50328e5\n",
" 1.25596e5\n",
" 260618.0 "
]
},
"execution_count": 14,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"pred_y = exp.(pred_y)"
]
},
{
"cell_type": "code",
"execution_count": 15,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<table class=\"data-frame\"><thead><tr><th></th><th>Id</th><th>SalePrice</th></tr></thead><tbody><tr><th>1</th><td>1461</td><td>133009.66685967916</td></tr><tr><th>2</th><td>1462</td><td>159407.64150038888</td></tr><tr><th>3</th><td>1463</td><td>166722.83167579595</td></tr><tr><th>4</th><td>1464</td><td>177611.17986166128</td></tr><tr><th>5</th><td>1465</td><td>225129.695972366</td></tr><tr><th>6</th><td>1466</td><td>166161.35890505844</td></tr><tr><th>7</th><td>1467</td><td>156267.45373057236</td></tr><tr><th>8</th><td>1468</td><td>156356.88134079557</td></tr><tr><th>9</th><td>1469</td><td>215017.29300964973</td></tr><tr><th>10</th><td>1470</td><td>127227.5868916092</td></tr><tr><th>11</th><td>1471</td><td>225019.97136354764</td></tr><tr><th>12</th><td>1472</td><td>94728.10828776367</td></tr><tr><th>13</th><td>1473</td><td>108573.5556118873</td></tr><tr><th>14</th><td>1474</td><td>147809.67413035568</td></tr><tr><th>15</th><td>1475</td><td>156481.6306589185</td></tr><tr><th>16</th><td>1476</td><td>325140.92031862517</td></tr><tr><th>17</th><td>1477</td><td>248105.09648656717</td></tr><tr><th>18</th><td>1478</td><td>295077.1290869469</td></tr><tr><th>19</th><td>1479</td><td>281295.15522332885</td></tr><tr><th>20</th><td>1480</td><td>370835.86239633267</td></tr><tr><th>21</th><td>1481</td><td>296345.6401443147</td></tr><tr><th>22</th><td>1482</td><td>230170.0743827182</td></tr><tr><th>23</th><td>1483</td><td>156872.5872147922</td></tr><tr><th>24</th><td>1484</td><td>188830.0108018649</td></tr><tr><th>25</th><td>1485</td><td>169061.66298186404</td></tr><tr><th>26</th><td>1486</td><td>223235.11076146842</td></tr><tr><th>27</th><td>1487</td><td>300209.83974822285</td></tr><tr><th>28</th><td>1488</td><td>247156.18962597597</td></tr><tr><th>29</th><td>1489</td><td>205890.72802189583</td></tr><tr><th>30</th><td>1490</td><td>171871.85723943423</td></tr><tr><th>&vellip;</th><td>&vellip;</td><td>&vellip;</td></tr></tbody></table>"
],
"text/plain": [
"1459×2 DataFrames.DataFrame\n",
"│ Row │ Id │ SalePrice │\n",
"├──────┼──────┼───────────┤\n",
"│ 1 │ 1461 │ 1.3301e5 │\n",
"│ 2 │ 1462 │ 1.59408e5 │\n",
"│ 3 │ 1463 │ 1.66723e5 │\n",
"│ 4 │ 1464 │ 1.77611e5 │\n",
"│ 5 │ 1465 │ 2.2513e5 │\n",
"│ 6 │ 1466 │ 1.66161e5 │\n",
"│ 7 │ 1467 │ 1.56267e5 │\n",
"│ 8 │ 1468 │ 1.56357e5 │\n",
"│ 9 │ 1469 │ 2.15017e5 │\n",
"│ 10 │ 1470 │ 1.27228e5 │\n",
"│ 11 │ 1471 │ 225020.0 │\n",
"⋮\n",
"│ 1448 │ 2908 │ 1.32335e5 │\n",
"│ 1449 │ 2909 │ 1.45569e5 │\n",
"│ 1450 │ 2910 │ 96438.5 │\n",
"│ 1451 │ 2911 │ 91672.9 │\n",
"│ 1452 │ 2912 │ 1.46526e5 │\n",
"│ 1453 │ 2913 │ 99917.7 │\n",
"│ 1454 │ 2914 │ 91031.6 │\n",
"│ 1455 │ 2915 │ 95059.7 │\n",
"│ 1456 │ 2916 │ 99984.0 │\n",
"│ 1457 │ 2917 │ 1.50328e5 │\n",
"│ 1458 │ 2918 │ 1.25596e5 │\n",
"│ 1459 │ 2919 │ 260618.0 │"
]
},
"execution_count": 15,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"submit = DataFrame(Id=test_id, SalePrice=pred_y)"
]
},
{
"cell_type": "code",
"execution_count": 16,
"metadata": {},
"outputs": [],
"source": [
"writetable(\"../data/result/submit.csv\", submit, separator=',', header=true)"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Julia 0.6.2",
"language": "julia",
"name": "julia-0.6"
},
"language_info": {
"file_extension": ".jl",
"mimetype": "application/julia",
"name": "julia",
"version": "0.6.2"
}
},
"nbformat": 4,
"nbformat_minor": 2
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment