From baa7d06cdc2a6fbeacaea4025189d1b12125d7be Mon Sep 17 00:00:00 2001 From: Alexander Hess Date: Tue, 9 Jul 2024 16:42:10 +0200 Subject: [PATCH] Run notebooks with updates and custom kernel --- 00_data_cleaning.ipynb | 32 +-- 01_pairwise_correlations.ipynb | 10 +- 02_descriptive_visualizations.ipynb | 28 +- 03_predictive_models.ipynb | 262 ++++++++++-------- data/data_clean_with_transformations.csv | 10 +- ...clean_with_transformations_and_factors.csv | 10 +- 6 files changed, 189 insertions(+), 163 deletions(-) diff --git a/00_data_cleaning.ipynb b/00_data_cleaning.ipynb index 547dc52..193d84b 100644 --- a/00_data_cleaning.ipynb +++ b/00_data_cleaning.ipynb @@ -1480,7 +1480,7 @@ "for column, mapping_info in LABEL_COLUMNS.items():\n", " # Note that .unique() returns a numpy array with integer dtype in cases\n", " # where the provided data can be casted as such (e.g., \"Overall Qual\" column).\n", - " values_in_data = set(str(x) for x in df[column].unique() if x is not np.NaN)\n", + " values_in_data = set(str(x) for x in df[column].unique() if x is not np.nan)\n", " values_in_description = set(mapping_info[\"lookups\"].keys())\n", " assert values_in_data <= values_in_description" ] @@ -1877,7 +1877,7 @@ "output_type": "stream", "text": [ "\n", - "MultiIndex: 2930 entries, (1, 526301100) to (2930, 924151050)\n", + "MultiIndex: 2930 entries, (np.int64(1), np.int64(526301100)) to (np.int64(2930), np.int64(924151050))\n", "Data columns (total 19 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", @@ -2208,7 +2208,7 @@ "output_type": "stream", "text": [ "\n", - "MultiIndex: 2930 entries, (1, 526301100) to (2930, 924151050)\n", + "MultiIndex: 2930 entries, (np.int64(1), np.int64(526301100)) to (np.int64(2930), np.int64(924151050))\n", "Data columns (total 14 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", @@ -2765,7 +2765,7 @@ "output_type": "stream", "text": [ "\n", - "MultiIndex: 2930 entries, (1, 526301100) to (2930, 924151050)\n", + "MultiIndex: 2930 entries, (np.int64(1), np.int64(526301100)) to (np.int64(2930), np.int64(924151050))\n", "Data columns (total 23 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", @@ -3320,7 +3320,7 @@ "output_type": "stream", "text": [ "\n", - "MultiIndex: 2930 entries, (1, 526301100) to (2930, 924151050)\n", + "MultiIndex: 2930 entries, (np.int64(1), np.int64(526301100)) to (np.int64(2930), np.int64(924151050))\n", "Data columns (total 23 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", @@ -3382,9 +3382,7 @@ "
" ] }, - "metadata": { - "needs_background": "light" - }, + "metadata": {}, "output_type": "display_data" } ], @@ -3404,9 +3402,7 @@ "
" ] }, - "metadata": { - "needs_background": "light" - }, + "metadata": {}, "output_type": "display_data" } ], @@ -3426,9 +3422,7 @@ "
" ] }, - "metadata": { - "needs_background": "light" - }, + "metadata": {}, "output_type": "display_data" } ], @@ -3448,9 +3442,7 @@ "
" ] }, - "metadata": { - "needs_background": "light" - }, + "metadata": {}, "output_type": "display_data" } ], @@ -4331,9 +4323,9 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3", + "display_name": "ames-housing", "language": "python", - "name": "python3" + "name": "ames-housing" }, "language_info": { "codemirror_mode": { @@ -4345,7 +4337,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.5" + "version": "3.12.4" } }, "nbformat": 4, diff --git a/01_pairwise_correlations.ipynb b/01_pairwise_correlations.ipynb index cb59e95..096fdef 100644 --- a/01_pairwise_correlations.ipynb +++ b/01_pairwise_correlations.ipynb @@ -1178,8 +1178,8 @@ " cmap = sns.diverging_palette(240, 0, as_cmap=True)\n", " # Adjust the labels' font size.\n", " labels = data.columns\n", - " ax.set_xticklabels(labels, fontsize=10)\n", - " ax.set_yticklabels(labels, fontsize=10)\n", + " ax.set_xticks(range(len(labels)), labels=labels, fontsize=10)\n", + " ax.set_yticks(range(len(labels)), labels=labels, fontsize=10)\n", " # Plot it.\n", " sns.heatmap(\n", " data, vmin=-1, vmax=1, cmap=cmap, center=0, linewidths=.5,\n", @@ -2404,9 +2404,9 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3", + "display_name": "ames-housing", "language": "python", - "name": "python3" + "name": "ames-housing" }, "language_info": { "codemirror_mode": { @@ -2418,7 +2418,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.5" + "version": "3.12.4" } }, "nbformat": 4, diff --git a/02_descriptive_visualizations.ipynb b/02_descriptive_visualizations.ipynb index e33f795..4b06eb6 100644 --- a/02_descriptive_visualizations.ipynb +++ b/02_descriptive_visualizations.ipynb @@ -1319,7 +1319,7 @@ "sns.boxplot(x=\"Neighborhood\", y=\"SalePrice\", data=df, ax=ax)\n", "ax.set_title(\"Prices by Neighborhood\", fontsize=24)\n", "ax.set_xlabel(\"Neighborhood\", fontsize=18)\n", - "ax.set_xticklabels(ax.get_xticklabels(), rotation=45)\n", + "ax.tick_params(axis='x', labelrotation = 45)\n", "ax.set_ylabel(\"House Price\", fontsize=18);" ] }, @@ -1336,7 +1336,7 @@ "metadata": {}, "outputs": [], "source": [ - "neighborhood = pd.get_dummies(df[\"Neighborhood\"], prefix=\"nhood\")\n", + "neighborhood = pd.get_dummies(df[\"Neighborhood\"], prefix=\"nhood\", dtype=int)\n", "df = pd.concat([df, neighborhood], axis=1)\n", "del df[\"Neighborhood\"]" ] @@ -1827,7 +1827,7 @@ "metadata": {}, "outputs": [], "source": [ - "build_type = pd.get_dummies(df[\"Bldg Type\"], prefix=\"build_type\")\n", + "build_type = pd.get_dummies(df[\"Bldg Type\"], prefix=\"build_type\", dtype=int)\n", "df = pd.concat([df, build_type], axis=1)\n", "del df[\"Bldg Type\"]" ] @@ -2118,7 +2118,7 @@ "PosA 24\n", "RRNn 11\n", "RRNe 6\n", - "dtype: int64" + "Name: count, dtype: int64" ] }, "execution_count": 34, @@ -2527,13 +2527,14 @@ { "data": { "text/plain": [ + "Foundation\n", "PConc 1282\n", "CBlock 1242\n", "BrkTil 310\n", "Slab 48\n", "Stone 11\n", "Wood 5\n", - "Name: Foundation, dtype: int64" + "Name: count, dtype: int64" ] }, "execution_count": 50, @@ -2580,7 +2581,7 @@ "metadata": {}, "outputs": [], "source": [ - "foundation = pd.get_dummies(df[\"Foundation\"], prefix=\"found\")\n", + "foundation = pd.get_dummies(df[\"Foundation\"], prefix=\"found\", dtype=int)\n", "# Only keep the top 3 realizations.\n", "del foundation[\"found_Slab\"]\n", "del foundation[\"found_Stone\"]\n", @@ -2958,6 +2959,7 @@ { "data": { "text/plain": [ + "MS Zoning\n", "RL 2252\n", "RM 459\n", "FV 131\n", @@ -2966,7 +2968,7 @@ "A 2\n", "I 2\n", "RP 0\n", - "Name: MS Zoning, dtype: int64" + "Name: count, dtype: int64" ] }, "execution_count": 67, @@ -3161,13 +3163,14 @@ { "data": { "text/plain": [ + "Sale Condition\n", "Normal 2396\n", "Partial 233\n", "Abnorml 189\n", "Family 46\n", "Alloca 22\n", "AdjLand 12\n", - "Name: Sale Condition, dtype: int64" + "Name: count, dtype: int64" ] }, "execution_count": 77, @@ -3437,9 +3440,10 @@ { "data": { "text/plain": [ + "Street\n", "Pave 2886\n", "Grvl 12\n", - "Name: Street, dtype: int64" + "Name: count, dtype: int64" ] }, "execution_count": 87, @@ -4948,9 +4952,9 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3", + "display_name": "ames-housing", "language": "python", - "name": "python3" + "name": "ames-housing" }, "language_info": { "codemirror_mode": { @@ -4962,7 +4966,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.5" + "version": "3.12.4" } }, "nbformat": 4, diff --git a/03_predictive_models.ipynb b/03_predictive_models.ipynb index ddcb3a2..f11c1cb 100644 --- a/03_predictive_models.ipynb +++ b/03_predictive_models.ipynb @@ -143,7 +143,7 @@ "output_type": "stream", "text": [ "\n", - "MultiIndex: 2898 entries, (144, 535153070) to (867, 907253130)\n", + "MultiIndex: 2898 entries, (np.int64(144), np.int64(535153070)) to (np.int64(867), np.int64(907253130))\n", "Columns: 248 entries, 1st Flr SF to SalePrice\n", "dtypes: float64(19), int64(229)\n", "memory usage: 5.7 MB\n" @@ -2720,7 +2720,7 @@ "output_type": "stream", "text": [ "\n", - "MultiIndex: 2883 entries, (2775, 907175060) to (2660, 902325050)\n", + "MultiIndex: 2883 entries, (np.int64(2775), np.int64(907175060)) to (np.int64(2660), np.int64(902325050))\n", "Columns: 109 entries, 1st Flr SF to SalePrice (box-cox-0)\n", "dtypes: float64(27), int64(82)\n", "memory usage: 2.6 MB\n" @@ -3861,7 +3861,7 @@ "output_type": "stream", "text": [ "\n", - "MultiIndex: 2883 entries, (2775, 907175060) to (2660, 902325050)\n", + "MultiIndex: 2883 entries, (np.int64(2775), np.int64(907175060)) to (np.int64(2660), np.int64(902325050))\n", "Columns: 32 entries, 1st Flr SF to SalePrice (box-cox-0)\n", "dtypes: float64(16), int64(16)\n", "memory usage: 906.2 KB\n" @@ -4371,11 +4371,11 @@ { "data": { "text/plain": [ - "{'bias': 14349804.0,\n", - " 'mae': 18498417.0,\n", - " 'max_dev': 5072252036.0,\n", - " 'r2': -106245976.863,\n", - " 'rmse': 820848886.0}" + "{'bias': np.float64(25204734.0),\n", + " 'mae': np.float64(32984598.0),\n", + " 'max_dev': np.float64(9091844797.0),\n", + " 'r2': np.float64(-374439996.215),\n", + " 'rmse': np.float64(1541948537.0)}" ] }, "execution_count": 26, @@ -4417,11 +4417,11 @@ { "data": { "text/plain": [ - "{'bias': -2.0,\n", - " 'mae': 15277.0,\n", - " 'max_dev': 126472.0,\n", - " 'r2': 0.919,\n", - " 'rmse': 21829.0}" + "{'bias': np.float64(-2.0),\n", + " 'mae': np.float64(15277.0),\n", + " 'max_dev': np.float64(126472.0),\n", + " 'r2': np.float64(0.919),\n", + " 'rmse': np.float64(21829.0)}" ] }, "execution_count": 27, @@ -4456,11 +4456,11 @@ { "data": { "text/plain": [ - "{'bias': -820.0,\n", - " 'mae': 12807.0,\n", - " 'max_dev': 114579.0,\n", - " 'r2': 0.938,\n", - " 'rmse': 19106.0}" + "{'bias': np.float64(-820.0),\n", + " 'mae': np.float64(12807.0),\n", + " 'max_dev': np.float64(114579.0),\n", + " 'r2': np.float64(0.938),\n", + " 'rmse': np.float64(19106.0)}" ] }, "execution_count": 28, @@ -4502,11 +4502,11 @@ { "data": { "text/plain": [ - "{'bias': 4.0,\n", - " 'mae': 18369.0,\n", - " 'max_dev': 142946.0,\n", - " 'r2': 0.887,\n", - " 'rmse': 25682.0}" + "{'bias': np.float64(102.0),\n", + " 'mae': np.float64(18352.0),\n", + " 'max_dev': np.float64(142260.0),\n", + " 'r2': np.float64(0.887),\n", + " 'rmse': np.float64(25648.0)}" ] }, "execution_count": 29, @@ -4541,11 +4541,11 @@ { "data": { "text/plain": [ - "{'bias': -1342.0,\n", - " 'mae': 16126.0,\n", - " 'max_dev': 140216.0,\n", - " 'r2': 0.906,\n", - " 'rmse': 23335.0}" + "{'bias': np.float64(-1461.0),\n", + " 'mae': np.float64(16125.0),\n", + " 'max_dev': np.float64(140115.0),\n", + " 'r2': np.float64(0.906),\n", + " 'rmse': np.float64(23331.0)}" ] }, "execution_count": 30, @@ -4624,11 +4624,11 @@ { "data": { "text/plain": [ - "{'bias': 278.0,\n", - " 'mae': 20892.0,\n", - " 'max_dev': 269314.0,\n", - " 'r2': 0.817,\n", - " 'rmse': 33496.0}" + "{'bias': np.float64(278.0),\n", + " 'mae': np.float64(20892.0),\n", + " 'max_dev': np.float64(269314.0),\n", + " 'r2': np.float64(0.817),\n", + " 'rmse': np.float64(33496.0)}" ] }, "execution_count": 33, @@ -4692,11 +4692,11 @@ { "data": { "text/plain": [ - "{'bias': -49.0,\n", - " 'mae': 17488.0,\n", - " 'max_dev': 134191.0,\n", - " 'r2': 0.896,\n", - " 'rmse': 24529.0}" + "{'bias': np.float64(-49.0),\n", + " 'mae': np.float64(17488.0),\n", + " 'max_dev': np.float64(134191.0),\n", + " 'r2': np.float64(0.896),\n", + " 'rmse': np.float64(24529.0)}" ] }, "execution_count": 35, @@ -4753,11 +4753,11 @@ { "data": { "text/plain": [ - "{'bias': -861.0,\n", - " 'mae': 14346.0,\n", - " 'max_dev': 129044.0,\n", - " 'r2': 0.923,\n", - " 'rmse': 21081.0}" + "{'bias': np.float64(-861.0),\n", + " 'mae': np.float64(14346.0),\n", + " 'max_dev': np.float64(129044.0),\n", + " 'r2': np.float64(0.923),\n", + " 'rmse': np.float64(21081.0)}" ] }, "execution_count": 37, @@ -4821,11 +4821,11 @@ { "data": { "text/plain": [ - "{'bias': -11.0,\n", - " 'mae': 23344.0,\n", - " 'max_dev': 152485.0,\n", - " 'r2': 0.827,\n", - " 'rmse': 31672.0}" + "{'bias': np.float64(-11.0),\n", + " 'mae': np.float64(23344.0),\n", + " 'max_dev': np.float64(152485.0),\n", + " 'r2': np.float64(0.827),\n", + " 'rmse': np.float64(31672.0)}" ] }, "execution_count": 39, @@ -4882,11 +4882,11 @@ { "data": { "text/plain": [ - "{'bias': -877.0,\n", - " 'mae': 16619.0,\n", - " 'max_dev': 143135.0,\n", - " 'r2': 0.899,\n", - " 'rmse': 24205.0}" + "{'bias': np.float64(-877.0),\n", + " 'mae': np.float64(16619.0),\n", + " 'max_dev': np.float64(143135.0),\n", + " 'r2': np.float64(0.899),\n", + " 'rmse': np.float64(24205.0)}" ] }, "execution_count": 41, @@ -4964,11 +4964,11 @@ { "data": { "text/plain": [ - "{'bias': 152.0,\n", - " 'mae': 17064.0,\n", - " 'max_dev': 263561.0,\n", - " 'r2': 0.853,\n", - " 'rmse': 29970.0}" + "{'bias': np.float64(152.0),\n", + " 'mae': np.float64(17064.0),\n", + " 'max_dev': np.float64(263561.0),\n", + " 'r2': np.float64(0.853),\n", + " 'rmse': np.float64(29970.0)}" ] }, "execution_count": 44, @@ -5032,11 +5032,11 @@ { "data": { "text/plain": [ - "{'bias': -6.0,\n", - " 'mae': 15248.0,\n", - " 'max_dev': 126366.0,\n", - " 'r2': 0.919,\n", - " 'rmse': 21835.0}" + "{'bias': np.float64(-6.0),\n", + " 'mae': np.float64(15248.0),\n", + " 'max_dev': np.float64(126366.0),\n", + " 'r2': np.float64(0.919),\n", + " 'rmse': np.float64(21835.0)}" ] }, "execution_count": 46, @@ -5093,11 +5093,11 @@ { "data": { "text/plain": [ - "{'bias': -840.0,\n", - " 'mae': 12803.0,\n", - " 'max_dev': 113756.0,\n", - " 'r2': 0.938,\n", - " 'rmse': 19073.0}" + "{'bias': np.float64(-840.0),\n", + " 'mae': np.float64(12803.0),\n", + " 'max_dev': np.float64(113756.0),\n", + " 'r2': np.float64(0.938),\n", + " 'rmse': np.float64(19073.0)}" ] }, "execution_count": 48, @@ -5161,11 +5161,11 @@ { "data": { "text/plain": [ - "{'bias': 4.0,\n", - " 'mae': 18342.0,\n", - " 'max_dev': 142600.0,\n", - " 'r2': 0.887,\n", - " 'rmse': 25659.0}" + "{'bias': np.float64(4.0),\n", + " 'mae': np.float64(18342.0),\n", + " 'max_dev': np.float64(142600.0),\n", + " 'r2': np.float64(0.887),\n", + " 'rmse': np.float64(25659.0)}" ] }, "execution_count": 50, @@ -5222,11 +5222,11 @@ { "data": { "text/plain": [ - "{'bias': -1400.0,\n", - " 'mae': 16105.0,\n", - " 'max_dev': 139398.0,\n", - " 'r2': 0.907,\n", - " 'rmse': 23280.0}" + "{'bias': np.float64(-1400.0),\n", + " 'mae': np.float64(16105.0),\n", + " 'max_dev': np.float64(139398.0),\n", + " 'r2': np.float64(0.907),\n", + " 'rmse': np.float64(23280.0)}" ] }, "execution_count": 52, @@ -5280,11 +5280,11 @@ { "data": { "text/plain": [ - "{'bias': -26.0,\n", - " 'mae': 15322.0,\n", - " 'max_dev': 164505.0,\n", - " 'r2': 0.898,\n", - " 'rmse': 25354.0}" + "{'bias': np.float64(-26.0),\n", + " 'mae': np.float64(15322.0),\n", + " 'max_dev': np.float64(164505.0),\n", + " 'r2': np.float64(0.898),\n", + " 'rmse': np.float64(25354.0)}" ] }, "execution_count": 54, @@ -5326,11 +5326,11 @@ { "data": { "text/plain": [ - "{'bias': -70.0,\n", - " 'mae': 14916.0,\n", - " 'max_dev': 137911.0,\n", - " 'r2': 0.91,\n", - " 'rmse': 22813.0}" + "{'bias': np.float64(-70.0),\n", + " 'mae': np.float64(14916.0),\n", + " 'max_dev': np.float64(137911.0),\n", + " 'r2': np.float64(0.91),\n", + " 'rmse': np.float64(22813.0)}" ] }, "execution_count": 55, @@ -5365,11 +5365,11 @@ { "data": { "text/plain": [ - "{'bias': -1996.0,\n", - " 'mae': 14952.0,\n", - " 'max_dev': 141360.0,\n", - " 'r2': 0.908,\n", - " 'rmse': 23000.0}" + "{'bias': np.float64(-1996.0),\n", + " 'mae': np.float64(14952.0),\n", + " 'max_dev': np.float64(141360.0),\n", + " 'r2': np.float64(0.908),\n", + " 'rmse': np.float64(23000.0)}" ] }, "execution_count": 56, @@ -5411,11 +5411,11 @@ { "data": { "text/plain": [ - "{'bias': -165.0,\n", - " 'mae': 16042.0,\n", - " 'max_dev': 143762.0,\n", - " 'r2': 0.898,\n", - " 'rmse': 24274.0}" + "{'bias': np.float64(-165.0),\n", + " 'mae': np.float64(16042.0),\n", + " 'max_dev': np.float64(143762.0),\n", + " 'r2': np.float64(0.898),\n", + " 'rmse': np.float64(24274.0)}" ] }, "execution_count": 57, @@ -5450,11 +5450,11 @@ { "data": { "text/plain": [ - "{'bias': -2250.0,\n", - " 'mae': 16356.0,\n", - " 'max_dev': 146888.0,\n", - " 'r2': 0.893,\n", - " 'rmse': 24785.0}" + "{'bias': np.float64(-2250.0),\n", + " 'mae': np.float64(16356.0),\n", + " 'max_dev': np.float64(146888.0),\n", + " 'r2': np.float64(0.893),\n", + " 'rmse': np.float64(24785.0)}" ] }, "execution_count": 58, @@ -5508,7 +5508,10 @@ { "data": { "text/plain": [ - "[('rf', 25354.0), ('ridge', 29970.0), ('lasso', 33496.0), ('lm', 820848886.0)]" + "[('rf', np.float64(25354.0)),\n", + " ('ridge', np.float64(29970.0)),\n", + " ('lasso', np.float64(33496.0)),\n", + " ('lm', np.float64(1541948537.0))]" ] }, "execution_count": 60, @@ -5528,7 +5531,10 @@ { "data": { "text/plain": [ - "[('lm', 21829.0), ('ridge', 21835.0), ('rf', 22813.0), ('lasso', 24529.0)]" + "[('lm', np.float64(21829.0)),\n", + " ('ridge', np.float64(21835.0)),\n", + " ('rf', np.float64(22813.0)),\n", + " ('lasso', np.float64(24529.0))]" ] }, "execution_count": 61, @@ -5548,7 +5554,10 @@ { "data": { "text/plain": [ - "[('ridge', 19073.0), ('lm', 19106.0), ('lasso', 21081.0), ('rf', 23000.0)]" + "[('ridge', np.float64(19073.0)),\n", + " ('lm', np.float64(19106.0)),\n", + " ('lasso', np.float64(21081.0)),\n", + " ('rf', np.float64(23000.0))]" ] }, "execution_count": 62, @@ -5568,7 +5577,10 @@ { "data": { "text/plain": [ - "[('rf', 24274.0), ('ridge', 25659.0), ('lm', 25682.0), ('lasso', 31672.0)]" + "[('rf', np.float64(24274.0)),\n", + " ('lm', np.float64(25648.0)),\n", + " ('ridge', np.float64(25659.0)),\n", + " ('lasso', np.float64(31672.0))]" ] }, "execution_count": 63, @@ -5588,7 +5600,10 @@ { "data": { "text/plain": [ - "[('ridge', 23280.0), ('lm', 23335.0), ('lasso', 24205.0), ('rf', 24785.0)]" + "[('ridge', np.float64(23280.0)),\n", + " ('lm', np.float64(23331.0)),\n", + " ('lasso', np.float64(24205.0)),\n", + " ('rf', np.float64(24785.0))]" ] }, "execution_count": 64, @@ -5615,7 +5630,10 @@ { "data": { "text/plain": [ - "[('rf', 0.898), ('ridge', 0.853), ('lasso', 0.817), ('lm', -106245976.863)]" + "[('rf', np.float64(0.898)),\n", + " ('ridge', np.float64(0.853)),\n", + " ('lasso', np.float64(0.817)),\n", + " ('lm', np.float64(-374439996.215))]" ] }, "execution_count": 65, @@ -5635,7 +5653,10 @@ { "data": { "text/plain": [ - "[('lm', 0.919), ('ridge', 0.919), ('rf', 0.91), ('lasso', 0.896)]" + "[('lm', np.float64(0.919)),\n", + " ('ridge', np.float64(0.919)),\n", + " ('rf', np.float64(0.91)),\n", + " ('lasso', np.float64(0.896))]" ] }, "execution_count": 66, @@ -5655,7 +5676,10 @@ { "data": { "text/plain": [ - "[('lm', 0.938), ('ridge', 0.938), ('lasso', 0.923), ('rf', 0.908)]" + "[('lm', np.float64(0.938)),\n", + " ('ridge', np.float64(0.938)),\n", + " ('lasso', np.float64(0.923)),\n", + " ('rf', np.float64(0.908))]" ] }, "execution_count": 67, @@ -5675,7 +5699,10 @@ { "data": { "text/plain": [ - "[('rf', 0.898), ('lm', 0.887), ('ridge', 0.887), ('lasso', 0.827)]" + "[('rf', np.float64(0.898)),\n", + " ('lm', np.float64(0.887)),\n", + " ('ridge', np.float64(0.887)),\n", + " ('lasso', np.float64(0.827))]" ] }, "execution_count": 68, @@ -5695,7 +5722,10 @@ { "data": { "text/plain": [ - "[('ridge', 0.907), ('lm', 0.906), ('lasso', 0.899), ('rf', 0.893)]" + "[('ridge', np.float64(0.907)),\n", + " ('lm', np.float64(0.906)),\n", + " ('lasso', np.float64(0.899)),\n", + " ('rf', np.float64(0.893))]" ] }, "execution_count": 69, @@ -5710,9 +5740,9 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3", + "display_name": "ames-housing", "language": "python", - "name": "python3" + "name": "ames-housing" }, "language_info": { "codemirror_mode": { @@ -5724,7 +5754,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.5" + "version": "3.12.4" } }, "nbformat": 4, diff --git a/data/data_clean_with_transformations.csv b/data/data_clean_with_transformations.csv index 5ab98b4..288bf25 100644 --- a/data/data_clean_with_transformations.csv +++ b/data/data_clean_with_transformations.csv @@ -351,7 +351,7 @@ Order,PID,1st Flr SF,1st Flr SF (box-cox-0),2nd Flr SF,3Ssn Porch,Alley,Bedroom 352,527132090,1478.0,7.298445101508147,0.0,0.0,NA,2,1Fam,TA,Av,1,0,Gd,1077.0,341.0,0.0,GLQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,CemntBd,CemntBd,NA,NA,0,PConc,2,Typ,495.0,2,TA,Fin,TA,Attchd,1478.0,7.298445101508147,0,GasA,Ex,1Story,1,TA,Lvl,Gtl,7380.0,14.367200464938653,Corner,IR1,0.0,120,RL,0.0,None,NA,0.0,7,StoneBr,43.0,5,8,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,5,3.0,1418.0,211.0,2896.0,19.622362214685307,AllPub,168.0,1998,1998,2009,240000.0,12.388394202324129 353,527146010,1734.0,7.458186157340487,0.0,0.0,NA,2,TwnhsE,TA,No,1,0,Gd,846.0,741.0,0.0,GLQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,Gd,CemntBd,CemntBd,NA,NA,0,PConc,2,Typ,528.0,2,TA,RFn,TA,Attchd,1734.0,7.458186157340487,0,GasA,Ex,1Story,1,Gd,Lvl,Gtl,8013.0,14.56854934744058,Corner,IR1,0.0,120,RL,0.0,None,NA,0.0,9,StoneBr,50.0,5,8,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,6,3.0,1587.0,102.0,3321.0,20.306016067856913,AllPub,52.0,1995,1996,2009,239500.0,12.386308695833106 354,527161040,751.0,6.621405651764134,631.0,0.0,NA,3,1Fam,TA,No,0,0,Gd,195.0,189.0,0.0,GLQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,Gd,VinylSd,VinylSd,NA,TA,1,PConc,2,Typ,396.0,2,TA,Fin,TA,BuiltIn,1382.0,7.231287004327616,1,GasA,Gd,SLvl,1,TA,Lvl,Gtl,8923.0,14.834252319425625,Inside,IR1,0.0,080,RL,0.0,None,NA,0.0,2,Gilbert,0.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,7,2.5,384.0,256.0,1766.0,17.303249574220334,AllPub,256.0,1998,1998,2009,177500.0,12.086725887897607 -355,527162110,885.0,6.785587645007929,833.0,0.0,NA,3,1Fam,TA,No,0,0,Gd,832.0,0.0,0.0,Unf,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,VinylSd,VinylSd,NA,TA,1,PConc,2,Typ,427.0,2,TA,Fin,TA,Attchd,1718.0,7.4489161025442,1,GasA,Gd,2Story,1,TA,Lvl,Gtl,10141.0,15.15405917561631,Corner,IR1,0.0,060,RL,40.0,BrkFace,NA,0.0,12,Gilbert,94.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,291.0,Pave,7,2.5,832.0,385.0,2550.0,19.003691717103283,AllPub,0.0,1998,1998,2009,185000.0,12.128111104060462 +355,527162110,885.0,6.785587645007929,833.0,0.0,NA,3,1Fam,TA,No,0,0,Gd,832.0,0.0,0.0,Unf,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,VinylSd,VinylSd,NA,TA,1,PConc,2,Typ,427.0,2,TA,Fin,TA,Attchd,1718.0,7.4489161025442,1,GasA,Gd,2Story,1,TA,Lvl,Gtl,10141.0,15.15405917561631,Corner,IR1,0.0,060,RL,40.0,BrkFace,NA,0.0,12,Gilbert,94.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,291.0,Pave,7,2.5,832.0,385.0,2550.0,19.00369171710328,AllPub,0.0,1998,1998,2009,185000.0,12.128111104060462 356,527162120,952.0,6.858565034791365,684.0,0.0,NA,3,1Fam,TA,No,1,0,Gd,476.0,476.0,0.0,GLQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,Gd,VinylSd,VinylSd,NA,TA,1,PConc,2,Typ,440.0,2,TA,Fin,TA,Attchd,1636.0,7.400009517162692,1,GasA,Gd,2Story,1,TA,Lvl,Gtl,7500.0,14.406534966757283,Inside,Reg,0.0,060,RL,0.0,None,NA,0.0,10,Gilbert,84.0,5,6,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,7,3.5,952.0,84.0,2588.0,19.07480946817217,AllPub,0.0,1998,1999,2009,191000.0,12.160028707028767 357,527163040,799.0,6.683360945766275,772.0,0.0,NA,3,1Fam,TA,No,0,0,Gd,799.0,0.0,0.0,Unf,Unf,Y,Norm,Norm,SBrkr,0.0,TA,Gd,VinylSd,VinylSd,NA,TA,1,PConc,2,Typ,380.0,2,TA,RFn,TA,Attchd,1571.0,7.359467638255621,1,GasA,Gd,2Story,1,TA,Lvl,Gtl,7837.0,14.51404532104361,Inside,IR1,0.0,060,RL,0.0,None,NA,0.0,5,Gilbert,40.0,7,6,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,7,2.5,799.0,40.0,2370.0,18.654821409606946,AllPub,0.0,1993,1994,2009,178000.0,12.089538829274222 358,527163070,680.0,6.522092798170152,790.0,0.0,NA,3,1Fam,Gd,No,0,0,Gd,370.0,310.0,0.0,ALQ,Unf,Y,Norm,Norm,SBrkr,0.0,Gd,Ex,VinylSd,VinylSd,NA,TA,1,PConc,2,Typ,420.0,2,TA,Fin,TA,BuiltIn,1470.0,7.293017679772782,1,GasA,Gd,2Story,1,TA,Lvl,Gtl,9765.0,15.059201296829725,Corner,IR2,0.0,060,RL,68.0,BrkFace,Shed,480.0,4,Gilbert,63.0,8,6,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,6,2.5,680.0,295.0,2150.0,18.198382041699816,AllPub,232.0,1993,1993,2009,185000.0,12.128111104060462 @@ -545,7 +545,7 @@ Order,PID,1st Flr SF,1st Flr SF (box-cox-0),2nd Flr SF,3Ssn Porch,Alley,Bedroom 550,531452260,754.0,6.625392368007956,786.0,0.0,NA,3,1Fam,TA,No,1,0,Gd,122.0,36.0,596.0,LwQ,GLQ,Y,RRAe,Norm,SBrkr,0.0,TA,Gd,VinylSd,VinylSd,NA,NA,0,PConc,2,Typ,495.0,2,TA,RFn,TA,Attchd,1540.0,7.3395376954076745,1,GasA,Ex,2Story,1,Gd,Lvl,Gtl,9109.0,14.885540064062317,Inside,Reg,0.0,060,RL,0.0,None,NA,0.0,10,SawyerW,32.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,6,3.5,754.0,172.0,2294.0,18.50112687133047,AllPub,140.0,1994,1994,2009,184000.0,12.122691036591123 551,531453100,698.0,6.548219102762372,702.0,0.0,NA,3,1Fam,TA,No,0,0,Gd,345.0,331.0,0.0,Rec,Unf,Y,Norm,Norm,SBrkr,0.0,Gd,TA,VinylSd,VinylSd,NA,NA,0,CBlock,2,Typ,465.0,2,TA,RFn,TA,Attchd,1400.0,7.24422751560335,1,GasA,TA,2Story,1,TA,Lvl,Gtl,10274.0,15.186855822557384,CulDSac,IR1,0.0,060,RL,141.0,BrkFace,NA,0.0,7,SawyerW,48.0,7,6,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,6,2.5,676.0,48.0,2076.0,18.036445788849743,AllPub,0.0,1986,1986,2009,162000.0,11.99535161421452 552,531475220,964.0,6.871091294610546,918.0,0.0,NA,4,Duplx,NA,NA,0,0,NA,0.0,0.0,0.0,NA,NA,Y,Norm,Norm,SBrkr,0.0,TA,TA,Wd Sdng,WdShing,NA,TA,2,Slab,2,Typ,612.0,2,TA,Unf,TA,Attchd,1882.0,7.540090320145325,0,GasA,TA,2Story,2,TA,Lvl,Gtl,8250.0,14.64026616916342,Inside,Reg,0.0,090,RL,0.0,None,NA,0.0,5,SawyerW,0.0,7,6,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,8,2.0,0.0,0.0,1882.0,17.588839942548756,AllPub,0.0,1981,1981,2009,160000.0,11.982929094215963 -553,531477020,841.0,6.734591659972948,0.0,0.0,NA,2,1Fam,Fa,No,0,0,TA,721.0,0.0,0.0,Unf,Unf,Y,Feedr,Norm,SBrkr,24.0,Fa,Fa,Wd Sdng,AsbShng,NA,NA,0,CBlock,1,Typ,294.0,1,TA,Unf,TA,CarPort,841.0,6.734591659972948,0,GasA,Gd,1Story,1,TA,Lvl,Gtl,8400.0,14.68470426970406,Inside,Reg,0.0,020,RH,0.0,None,NA,0.0,9,SawyerW,0.0,4,4,N,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,4,1.0,721.0,274.0,1562.0,16.762371023178837,AllPub,250.0,1950,1950,2009,82000.0,11.314474526246391 +553,531477020,841.0,6.734591659972948,0.0,0.0,NA,2,1Fam,Fa,No,0,0,TA,721.0,0.0,0.0,Unf,Unf,Y,Feedr,Norm,SBrkr,24.0,Fa,Fa,Wd Sdng,AsbShng,NA,NA,0,CBlock,1,Typ,294.0,1,TA,Unf,TA,CarPort,841.0,6.734591659972948,0,GasA,Gd,1Story,1,TA,Lvl,Gtl,8400.0,14.68470426970406,Inside,Reg,0.0,020,RH,0.0,None,NA,0.0,9,SawyerW,0.0,4,4,N,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,4,1.0,721.0,274.0,1562.0,16.762371023178833,AllPub,250.0,1950,1950,2009,82000.0,11.314474526246391 554,531479020,784.0,6.664409020350408,0.0,0.0,NA,2,1Fam,Fa,No,0,0,Fa,784.0,0.0,0.0,Unf,Unf,N,Norm,Norm,FuseA,91.0,TA,TA,Wd Sdng,Wd Sdng,NA,NA,0,BrkTil,1,Typ,360.0,2,Fa,Unf,Fa,Detchd,784.0,6.664409020350408,0,GasA,TA,1.5Unf,1,TA,Lvl,Gtl,9000.0,14.855599984056148,Corner,Reg,0.0,045,RH,0.0,None,NA,0.0,10,SawyerW,0.0,3,6,N,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,5,1.0,784.0,91.0,1568.0,16.7790642448278,AllPub,0.0,1928,1950,2009,76000.0,11.238488619268468 555,532353020,980.0,6.887552571664617,0.0,0.0,NA,3,1Fam,TA,No,1,0,TA,28.0,68.0,884.0,LwQ,BLQ,Y,Norm,Norm,SBrkr,0.0,TA,TA,HdBoard,Plywood,MnPrv,NA,0,CBlock,1,Typ,400.0,2,TA,Unf,TA,Detchd,980.0,6.887552571664617,0,GasA,Gd,1Story,1,TA,Lvl,Gtl,9750.0,15.055349293727405,Inside,IR1,0.0,020,RL,0.0,None,NA,0.0,11,Sawyer,28.0,5,5,Y,0.0,NA,CompShg,Hip,Normal,WD,0.0,Pave,5,2.0,980.0,28.0,1960.0,17.773050992818334,AllPub,0.0,1962,1962,2009,110000.0,11.608235644774552 556,532353130,980.0,6.887552571664617,0.0,0.0,NA,3,1Fam,TA,No,0,0,TA,420.0,560.0,0.0,BLQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,Plywood,Plywood,NA,NA,0,CBlock,1,Typ,484.0,2,TA,Unf,TA,Detchd,980.0,6.887552571664617,0,GasA,TA,1Story,1,TA,Lvl,Gtl,7064.0,14.260797286621031,Inside,Reg,0.0,020,RL,153.0,BrkFace,NA,0.0,7,Sawyer,0.0,6,5,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,6,1.0,980.0,192.0,1960.0,17.773050992818334,AllPub,192.0,1977,1977,2009,135000.0,11.813030057420567 @@ -948,7 +948,7 @@ Order,PID,1st Flr SF,1st Flr SF (box-cox-0),2nd Flr SF,3Ssn Porch,Alley,Bedroom 954,914476380,1217.0,7.104144092987527,0.0,0.0,NA,3,1Fam,TA,Av,1,0,Gd,577.0,611.0,0.0,GLQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,HdBoard,HdBoard,GdPrv,NA,0,PConc,2,Typ,497.0,2,TA,Unf,TA,Attchd,1217.0,7.104144092987527,0,GasA,Ex,SLvl,1,Gd,Lvl,Gtl,9947.0,15.105519458517929,CulDSac,IR1,0.0,080,RL,0.0,None,NA,0.0,6,Mitchel,27.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,6,3.0,1188.0,195.0,2405.0,18.724278876442806,AllPub,168.0,1990,1991,2009,173000.0,12.061046873479915 955,914476430,1595.0,7.374629015218945,0.0,0.0,NA,2,1Fam,TA,No,1,0,Gd,1527.0,55.0,0.0,BLQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,HdBoard,HdBoard,NA,NA,0,PConc,2,Typ,672.0,2,TA,Unf,TA,Detchd,1595.0,7.374629015218945,0,GasA,TA,1Story,1,TA,Lvl,Gtl,11070.0,15.375508981989565,Inside,Reg,0.0,020,RL,0.0,None,NA,0.0,4,Mitchel,0.0,5,5,Y,0.0,NA,CompShg,Gable,Abnorml,COD,0.0,Pave,5,3.0,1582.0,0.0,3177.0,20.082651686134287,AllPub,0.0,1991,1991,2009,152000.0,11.931635799828413 956,916176030,1344.0,7.203405521083095,0.0,0.0,NA,3,1Fam,TA,No,0,1,TA,354.0,111.0,354.0,GLQ,Rec,Y,Norm,Norm,FuseA,0.0,TA,TA,HdBoard,HdBoard,NA,Gd,1,CBlock,1,Typ,525.0,2,TA,RFn,TA,Basment,1344.0,7.203405521083095,0,GasA,Gd,SLvl,1,Gd,Lvl,Gtl,14375.0,16.047184443127506,CulDSac,IR1,0.0,020,RL,541.0,BrkFace,NA,0.0,1,Timber,118.0,6,6,Y,0.0,NA,CompShg,Gable,Abnorml,COD,233.0,Pave,7,1.5,819.0,351.0,2163.0,18.226368292983384,NoSeWa,0.0,1958,1958,2009,137500.0,11.831379196088763 -957,916176125,2036.0,7.618742377670413,0.0,0.0,NA,3,1Fam,TA,Gd,2,0,Gd,80.0,1236.0,820.0,ALQ,Rec,Y,Norm,Norm,SBrkr,0.0,TA,TA,BrkFace,BrkFace,NA,Gd,2,CBlock,2,Typ,513.0,2,TA,RFn,TA,Attchd,2036.0,7.618742377670413,0,GasW,TA,1Story,1,TA,Low,Sev,215245.0,24.142341911893194,Inside,IR3,0.0,020,RL,0.0,None,NA,0.0,6,Timber,0.0,5,7,Y,0.0,NA,CompShg,Hip,Normal,WD,0.0,Pave,8,4.0,2136.0,0.0,4172.0,21.487371590601576,AllPub,0.0,1965,1965,2009,375000.0,12.834681304952548 +957,916176125,2036.0,7.618742377670413,0.0,0.0,NA,3,1Fam,TA,Gd,2,0,Gd,80.0,1236.0,820.0,ALQ,Rec,Y,Norm,Norm,SBrkr,0.0,TA,TA,BrkFace,BrkFace,NA,Gd,2,CBlock,2,Typ,513.0,2,TA,RFn,TA,Attchd,2036.0,7.618742377670413,0,GasW,TA,1Story,1,TA,Low,Sev,215245.0,24.14234191189319,Inside,IR3,0.0,020,RL,0.0,None,NA,0.0,6,Timber,0.0,5,7,Y,0.0,NA,CompShg,Hip,Normal,WD,0.0,Pave,8,4.0,2136.0,0.0,4172.0,21.487371590601576,AllPub,0.0,1965,1965,2009,375000.0,12.834681304952548 958,916380070,1620.0,7.3901814282264295,0.0,0.0,NA,2,1Fam,TA,Gd,1,0,Ex,598.0,1022.0,0.0,GLQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,Gd,VinylSd,VinylSd,NA,Ex,1,PConc,2,Typ,912.0,3,TA,Fin,TA,Attchd,1620.0,7.3901814282264295,0,GasA,Ex,1Story,1,Ex,HLS,Gtl,12898.0,15.766310574459004,Inside,IR1,0.0,020,RL,70.0,Stone,NA,0.0,9,Timber,0.0,5,9,Y,0.0,NA,CompShg,Hip,Normal,WD,0.0,Pave,6,3.0,1620.0,228.0,3240.0,20.18134982456163,AllPub,228.0,2007,2008,2009,315500.0,12.661913960963405 959,916382010,846.0,6.740519359606223,846.0,0.0,NA,3,1Fam,TA,Av,0,0,Ex,846.0,0.0,0.0,Unf,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,VinylSd,VinylSd,NA,NA,0,PConc,2,Typ,650.0,2,TA,RFn,TA,Attchd,1692.0,7.433666540166168,1,GasA,Gd,2Story,1,Gd,HLS,Gtl,13159.0,15.817981703423513,Corner,IR1,0.0,060,RL,0.0,None,NA,0.0,7,Timber,114.0,5,7,Y,0.0,NA,CompShg,Gable,Partial,New,0.0,Pave,6,2.5,846.0,322.0,2538.0,18.981057361211253,AllPub,208.0,2009,2009,2009,224500.0,12.321630986164447 960,916382100,2036.0,7.618742377670413,0.0,0.0,NA,3,1Fam,TA,Gd,1,0,Ex,432.0,1758.0,0.0,GLQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,Ex,CemntBd,CemntBd,NA,Ex,1,CBlock,2,Typ,780.0,3,TA,Fin,TA,Attchd,2036.0,7.618742377670413,0,GasA,Ex,1Story,1,Ex,HLS,Gtl,13438.0,15.872206187914584,Corner,IR1,0.0,020,RL,246.0,Stone,NA,0.0,7,Timber,154.0,5,9,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,9,3.0,2190.0,244.0,4226.0,21.55558682405044,AllPub,90.0,2008,2008,2009,410000.0,12.92391243868049 @@ -1607,7 +1607,7 @@ Order,PID,1st Flr SF,1st Flr SF (box-cox-0),2nd Flr SF,3Ssn Porch,Alley,Bedroom 1623,527161090,947.0,6.853299093186078,767.0,0.0,NA,3,1Fam,TA,No,1,0,Gd,52.0,871.0,0.0,ALQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,VinylSd,VinylSd,NA,TA,1,PConc,2,Typ,451.0,2,TA,Fin,TA,Attchd,1714.0,7.446585099157725,1,GasA,Gd,2Story,1,TA,Lvl,Gtl,8637.0,14.753481627067941,Inside,IR1,0.0,060,RL,0.0,None,NA,0.0,4,Gilbert,48.0,5,6,Y,0.0,NA,CompShg,Gable,Abnorml,WD,0.0,Pave,7,3.5,923.0,304.0,2637.0,19.16529105486511,AllPub,256.0,1999,2000,2007,180000.0,12.100712129872347 1624,527162080,691.0,6.53813982376767,862.0,0.0,NA,3,1Fam,TA,No,0,0,Gd,277.0,414.0,0.0,Rec,Unf,Y,Norm,Norm,SBrkr,0.0,TA,Gd,HdBoard,HdBoard,NA,NA,0,PConc,2,Typ,420.0,2,TA,Fin,TA,Attchd,1553.0,7.347943823148687,1,GasA,Gd,2Story,1,Gd,Lvl,Gtl,7875.0,14.525905820919508,Inside,Reg,0.0,060,RL,0.0,None,NA,0.0,8,Gilbert,44.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,6,2.5,691.0,44.0,2244.0,18.397775781250722,AllPub,0.0,1996,1996,2007,178750.0,12.093743460556254 1625,527162090,1253.0,7.133295954896068,0.0,0.0,NA,3,1Fam,Gd,No,0,0,Gd,1237.0,0.0,0.0,Unf,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,HdBoard,HdBoard,NA,TA,1,PConc,2,Typ,402.0,2,TA,Fin,TA,Attchd,1253.0,7.133295954896068,0,GasA,Gd,1Story,1,TA,Lvl,Gtl,7875.0,14.525905820919508,Inside,Reg,0.0,020,RL,38.0,BrkFace,NA,0.0,6,Gilbert,21.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,6,2.0,1237.0,241.0,2490.0,18.88965476782098,AllPub,220.0,1995,1996,2007,176000.0,12.078239274020289 -1626,527162140,957.0,6.863803391452954,1342.0,0.0,NA,5,1Fam,TA,No,0,0,Gd,938.0,0.0,0.0,Unf,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,VinylSd,VinylSd,NA,TA,1,PConc,3,Typ,482.0,2,TA,Fin,TA,Attchd,2299.0,7.740229524763182,1,GasA,Ex,2Story,1,TA,Lvl,Gtl,7500.0,14.406534966757283,Inside,Reg,0.0,060,RL,0.0,None,NA,0.0,8,Gilbert,30.0,5,6,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,7,3.5,938.0,218.0,3237.0,20.176684883555122,AllPub,188.0,1999,2003,2007,204000.0,12.225875272826354 +1626,527162140,957.0,6.863803391452954,1342.0,0.0,NA,5,1Fam,TA,No,0,0,Gd,938.0,0.0,0.0,Unf,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,VinylSd,VinylSd,NA,TA,1,PConc,3,Typ,482.0,2,TA,Fin,TA,Attchd,2299.0,7.740229524763182,1,GasA,Ex,2Story,1,TA,Lvl,Gtl,7500.0,14.406534966757283,Inside,Reg,0.0,060,RL,0.0,None,NA,0.0,8,Gilbert,30.0,5,6,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,7,3.5,938.0,218.0,3237.0,20.17668488355512,AllPub,188.0,1999,2003,2007,204000.0,12.225875272826354 1627,527163080,1187.0,7.079184394609668,0.0,0.0,NA,3,1Fam,TA,No,0,0,Gd,1168.0,0.0,0.0,Unf,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,HdBoard,HdBoard,NA,NA,0,PConc,2,Typ,420.0,2,TA,RFn,TA,Attchd,1187.0,7.079184394609668,0,GasA,Gd,1Story,1,Gd,Lvl,Gtl,9556.0,15.005043482926363,Corner,IR1,0.0,020,RL,52.0,BrkFace,NA,0.0,8,Gilbert,21.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,6,2.0,1168.0,21.0,2355.0,18.62480250396189,AllPub,0.0,1992,1993,2007,160000.0,11.982929094215963 1628,527165020,802.0,6.687108607866515,670.0,0.0,NA,3,1Fam,TA,No,0,0,Gd,384.0,0.0,0.0,Unf,Unf,Y,Norm,Norm,SBrkr,0.0,TA,Gd,HdBoard,HdBoard,NA,TA,1,PConc,2,Typ,402.0,2,TA,RFn,TA,Attchd,1472.0,7.294377299288821,1,GasA,Gd,SLvl,1,Gd,Lvl,Gtl,10784.0,15.309174951796374,FR2,IR1,0.0,080,RL,76.0,BrkFace,NA,0.0,5,Gilbert,0.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,7,2.5,384.0,164.0,1856.0,17.526078784323257,AllPub,164.0,1991,1992,2007,160000.0,11.982929094215963 1629,527165100,812.0,6.699500340161678,670.0,0.0,NA,3,1Fam,TA,No,0,0,Gd,384.0,0.0,0.0,Unf,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,HdBoard,HdBoard,NA,TA,1,PConc,2,Typ,392.0,2,TA,Fin,TA,Attchd,1482.0,7.301147805856032,1,GasA,Gd,SLvl,1,Gd,Lvl,Gtl,9125.0,14.889907769270682,Inside,IR1,0.0,080,RL,170.0,BrkFace,NA,0.0,7,Gilbert,25.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,7,2.5,384.0,125.0,1866.0,17.550300430394216,AllPub,100.0,1992,1992,2007,163900.0,12.00701176473192 @@ -2326,7 +2326,7 @@ Order,PID,1st Flr SF,1st Flr SF (box-cox-0),2nd Flr SF,3Ssn Porch,Alley,Bedroom 2352,527356060,811.0,6.698268054115413,741.0,0.0,NA,3,1Fam,TA,No,1,0,Gd,163.0,550.0,0.0,ALQ,Unf,Y,RRAn,Norm,SBrkr,0.0,TA,TA,VinylSd,VinylSd,MnPrv,TA,1,CBlock,2,Typ,434.0,2,TA,RFn,TA,Attchd,1552.0,7.347299700743164,1,GasA,TA,2Story,1,TA,Lvl,Gtl,11475.0,15.466852293432254,Inside,Reg,0.0,060,RL,0.0,None,NA,0.0,2,NWAmes,208.0,6,6,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,6,3.5,713.0,417.0,2265.0,18.441405394566303,AllPub,209.0,1975,1975,2006,179900.0,12.100156419938624 2353,527358090,1083.0,6.9874902470009905,0.0,0.0,NA,2,1Fam,TA,Gd,1,0,Ex,42.0,1005.0,0.0,GLQ,Unf,Y,Norm,Norm,SBrkr,40.0,TA,Gd,VinylSd,WdShing,NA,Fa,1,CBlock,1,Typ,596.0,2,TA,RFn,TA,Attchd,1083.0,6.9874902470009905,0,GasA,TA,SFoyer,1,TA,Lvl,Gtl,9927.0,15.10046702787839,Inside,IR1,0.0,085,RL,252.0,Stone,NA,0.0,7,NWAmes,0.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,5,2.0,1047.0,484.0,2130.0,18.155060764405075,AllPub,444.0,1976,1976,2006,172000.0,12.05524975579559 2354,527365010,960.0,6.866933284461882,1358.0,0.0,NA,3,1Fam,TA,No,1,0,Gd,172.0,788.0,0.0,ALQ,Unf,Y,RRAn,Norm,SBrkr,0.0,TA,Gd,VinylSd,VinylSd,NA,Ex,1,PConc,2,Typ,541.0,2,TA,Fin,TA,BuiltIn,2318.0,7.748460023899697,1,GasA,Ex,2Story,1,Gd,Lvl,Gtl,9512.0,14.99350614262242,Inside,IR1,0.0,060,FV,0.0,None,NA,0.0,6,Somerst,246.0,5,7,Y,0.0,NA,CompShg,Gable,Partial,New,0.0,Pave,8,3.5,960.0,246.0,3278.0,20.240142016334854,AllPub,0.0,2005,2006,2006,294323.0,12.592433082713933 -2355,527375160,1109.0,7.011213987350367,766.0,0.0,NA,3,1Fam,Fa,No,0,0,TA,127.0,548.0,0.0,ALQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,Plywood,Plywood,NA,TA,1,CBlock,3,Typ,485.0,2,TA,RFn,TA,Attchd,1875.0,7.536363938404511,0,GasA,TA,SLvl,1,Gd,Lvl,Gtl,10530.0,15.248921792104442,Inside,Reg,0.0,080,RL,248.0,BrkFace,NA,0.0,6,NWAmes,28.0,6,6,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,8,3.0,675.0,76.0,2550.0,19.003691717103283,AllPub,48.0,1975,2000,2006,184500.0,12.125404742462718 +2355,527375160,1109.0,7.011213987350367,766.0,0.0,NA,3,1Fam,Fa,No,0,0,TA,127.0,548.0,0.0,ALQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,Plywood,Plywood,NA,TA,1,CBlock,3,Typ,485.0,2,TA,RFn,TA,Attchd,1875.0,7.536363938404511,0,GasA,TA,SLvl,1,Gd,Lvl,Gtl,10530.0,15.248921792104442,Inside,Reg,0.0,080,RL,248.0,BrkFace,NA,0.0,6,NWAmes,28.0,6,6,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,8,3.0,675.0,76.0,2550.0,19.00369171710328,AllPub,48.0,1975,2000,2006,184500.0,12.125404742462718 2356,527376090,1074.0,6.97914527506881,0.0,0.0,NA,3,1Fam,TA,No,1,0,Gd,268.0,788.0,0.0,ALQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,HdBoard,HdBoard,MnPrv,NA,0,CBlock,1,Typ,495.0,2,TA,RFn,TA,Attchd,1074.0,6.97914527506881,1,GasA,Ex,1Story,1,TA,Lvl,Gtl,10140.0,15.153811121425997,Inside,Reg,0.0,020,RL,0.0,None,NA,0.0,7,NWAmes,88.0,6,5,Y,0.0,NA,CompShg,Gable,Normal,WD,0.0,Pave,6,2.5,1056.0,88.0,2130.0,18.155060764405075,AllPub,0.0,1975,1975,2006,153500.0,11.941455846009388 2357,527376110,832.0,6.723832440821209,832.0,0.0,NA,4,1Fam,TA,No,0,0,Gd,638.0,194.0,0.0,GLQ,Unf,Y,Norm,Norm,SBrkr,0.0,TA,TA,HdBoard,HdBoard,GdWo,TA,1,PConc,2,Typ,528.0,2,TA,RFn,TA,Attchd,1664.0,7.416979621381154,1,GasA,TA,2Story,1,TA,Lvl,Gtl,10140.0,15.153811121425997,Inside,Reg,0.0,060,RL,0.0,None,NA,0.0,3,NWAmes,28.0,5,7,Y,0.0,NA,CompShg,Gable,Normal,WD,259.0,Pave,8,2.5,832.0,287.0,2496.0,18.901156773521873,AllPub,0.0,1976,1976,2006,162900.0,12.000891794590137 2358,527377030,1309.0,7.1770187659099,0.0,0.0,NA,3,1Fam,TA,No,1,0,TA,0.0,663.0,377.0,ALQ,LwQ,Y,Norm,Norm,SBrkr,0.0,TA,TA,HdBoard,HdBoard,GdPrv,Fa,1,CBlock,1,Typ,484.0,2,TA,RFn,TA,Attchd,1309.0,7.1770187659099,1,GasA,Fa,1Story,1,Gd,Lvl,Gtl,10140.0,15.153811121425997,Inside,Reg,0.0,020,RL,99.0,BrkFace,NA,0.0,1,NWAmes,0.0,6,6,Y,648.0,Fa,CompShg,Hip,Normal,WD,0.0,Pave,5,2.5,1040.0,265.0,2349.0,18.61275210110533,AllPub,265.0,1974,1999,2006,181000.0,12.106252310247962 diff --git a/data/data_clean_with_transformations_and_factors.csv b/data/data_clean_with_transformations_and_factors.csv index eecf2a8..1fff8a9 100644 --- a/data/data_clean_with_transformations_and_factors.csv +++ b/data/data_clean_with_transformations_and_factors.csv @@ -350,7 +350,7 @@ Order,PID,1st Flr SF,1st Flr SF (box-cox-0),2nd Flr SF,3Ssn Porch,Bedroom AbvGr, 352,527132090,1478.0,7.298445101508147,0.0,0.0,2,TA,Av,1,0,Gd,1077.0,341.0,0.0,GLQ,Unf,SBrkr,0.0,NA,NA,0,2,Typ,495.0,2,TA,Fin,TA,1478.0,7.298445101508147,0,1,TA,Gtl,7380.0,14.367200464938653,IR1,0.0,0.0,0.0,7,43.0,5,8,Y,0.0,NA,0.0,5,3.0,1418.0,211.0,2896.0,19.622362214685307,AllPub,168.0,0,1,1,0,0,0,0,1,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,11,11,240000.0,12.388394202324129 353,527146010,1734.0,7.458186157340487,0.0,0.0,2,TA,No,1,0,Gd,846.0,741.0,0.0,GLQ,Unf,SBrkr,0.0,NA,NA,0,2,Typ,528.0,2,TA,RFn,TA,1734.0,7.458186157340487,0,1,Gd,Gtl,8013.0,14.56854934744058,IR1,0.0,0.0,0.0,9,50.0,5,8,Y,0.0,NA,0.0,6,3.0,1587.0,102.0,3321.0,20.306016067856913,AllPub,52.0,0,1,0,0,1,0,0,1,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,14,13,239500.0,12.386308695833106 354,527161040,751.0,6.621405651764134,631.0,0.0,3,TA,No,0,0,Gd,195.0,189.0,0.0,GLQ,Unf,SBrkr,0.0,NA,TA,1,2,Typ,396.0,2,TA,Fin,TA,1382.0,7.231287004327616,1,1,TA,Gtl,8923.0,14.834252319425625,IR1,0.0,0.0,0.0,2,0.0,5,7,Y,0.0,NA,0.0,7,2.5,384.0,256.0,1766.0,17.303249574220334,AllPub,256.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,11,11,177500.0,12.086725887897607 -355,527162110,885.0,6.785587645007929,833.0,0.0,3,TA,No,0,0,Gd,832.0,0.0,0.0,Unf,Unf,SBrkr,0.0,NA,TA,1,2,Typ,427.0,2,TA,Fin,TA,1718.0,7.4489161025442,1,1,TA,Gtl,10141.0,15.15405917561631,IR1,0.0,40.0,0.0,12,94.0,5,7,Y,0.0,NA,291.0,7,2.5,832.0,385.0,2550.0,19.003691717103283,AllPub,0.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,11,11,185000.0,12.128111104060462 +355,527162110,885.0,6.785587645007929,833.0,0.0,3,TA,No,0,0,Gd,832.0,0.0,0.0,Unf,Unf,SBrkr,0.0,NA,TA,1,2,Typ,427.0,2,TA,Fin,TA,1718.0,7.4489161025442,1,1,TA,Gtl,10141.0,15.15405917561631,IR1,0.0,40.0,0.0,12,94.0,5,7,Y,0.0,NA,291.0,7,2.5,832.0,385.0,2550.0,19.00369171710328,AllPub,0.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,11,11,185000.0,12.128111104060462 356,527162120,952.0,6.858565034791365,684.0,0.0,3,TA,No,1,0,Gd,476.0,476.0,0.0,GLQ,Unf,SBrkr,0.0,NA,TA,1,2,Typ,440.0,2,TA,Fin,TA,1636.0,7.400009517162692,1,1,TA,Gtl,7500.0,14.406534966757283,Reg,0.0,0.0,0.0,10,84.0,5,6,Y,0.0,NA,0.0,7,3.5,952.0,84.0,2588.0,19.07480946817217,AllPub,0.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,11,10,191000.0,12.160028707028767 357,527163040,799.0,6.683360945766275,772.0,0.0,3,TA,No,0,0,Gd,799.0,0.0,0.0,Unf,Unf,SBrkr,0.0,NA,TA,1,2,Typ,380.0,2,TA,RFn,TA,1571.0,7.359467638255621,1,1,TA,Gtl,7837.0,14.51404532104361,IR1,0.0,0.0,0.0,5,40.0,7,6,Y,0.0,NA,0.0,7,2.5,799.0,40.0,2370.0,18.654821409606946,AllPub,0.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,16,15,178000.0,12.089538829274222 358,527163070,680.0,6.522092798170152,790.0,0.0,3,Gd,No,0,0,Gd,370.0,310.0,0.0,ALQ,Unf,SBrkr,0.0,NA,TA,1,2,Typ,420.0,2,TA,Fin,TA,1470.0,7.293017679772782,1,1,TA,Gtl,9765.0,15.059201296829725,IR2,0.0,68.0,480.0,4,63.0,8,6,Y,0.0,NA,0.0,6,2.5,680.0,295.0,2150.0,18.198382041699816,AllPub,232.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,16,16,185000.0,12.128111104060462 @@ -543,7 +543,7 @@ Order,PID,1st Flr SF,1st Flr SF (box-cox-0),2nd Flr SF,3Ssn Porch,Bedroom AbvGr, 550,531452260,754.0,6.625392368007956,786.0,0.0,3,TA,No,1,0,Gd,122.0,36.0,596.0,LwQ,GLQ,SBrkr,0.0,NA,NA,0,2,Typ,495.0,2,TA,RFn,TA,1540.0,7.3395376954076745,1,1,Gd,Gtl,9109.0,14.885540064062317,Reg,0.0,0.0,0.0,10,32.0,5,7,Y,0.0,NA,0.0,6,3.5,754.0,172.0,2294.0,18.50112687133047,AllPub,140.0,0,1,1,0,0,0,0,1,1,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,15,15,184000.0,12.122691036591123 551,531453100,698.0,6.548219102762372,702.0,0.0,3,TA,No,0,0,Gd,345.0,331.0,0.0,Rec,Unf,SBrkr,0.0,NA,NA,0,2,Typ,465.0,2,TA,RFn,TA,1400.0,7.24422751560335,1,1,TA,Gtl,10274.0,15.186855822557384,IR1,0.0,141.0,0.0,7,48.0,7,6,Y,0.0,NA,0.0,6,2.5,676.0,48.0,2076.0,18.036445788849743,AllPub,0.0,0,1,1,0,0,0,1,0,1,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,23,23,162000.0,11.99535161421452 552,531475220,964.0,6.871091294610546,918.0,0.0,4,NA,NA,0,0,NA,0.0,0.0,0.0,NA,NA,SBrkr,0.0,NA,TA,2,2,Typ,612.0,2,TA,Unf,TA,1882.0,7.540090320145325,0,2,TA,Gtl,8250.0,14.64026616916342,Reg,0.0,0.0,0.0,5,0.0,7,6,Y,0.0,NA,0.0,8,2.0,0.0,0.0,1882.0,17.588839942548756,AllPub,0.0,0,1,0,1,0,0,0,0,1,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,28,28,160000.0,11.982929094215963 -553,531477020,841.0,6.734591659972948,0.0,0.0,2,Fa,No,0,0,TA,721.0,0.0,0.0,Unf,Unf,SBrkr,24.0,NA,NA,0,1,Typ,294.0,1,TA,Unf,TA,841.0,6.734591659972948,0,1,TA,Gtl,8400.0,14.68470426970406,Reg,0.0,0.0,0.0,9,0.0,4,4,N,0.0,NA,0.0,4,1.0,721.0,274.0,1562.0,16.762371023178837,AllPub,250.0,0,1,1,0,0,0,1,0,0,1,0,1,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,59,59,82000.0,11.314474526246391 +553,531477020,841.0,6.734591659972948,0.0,0.0,2,Fa,No,0,0,TA,721.0,0.0,0.0,Unf,Unf,SBrkr,24.0,NA,NA,0,1,Typ,294.0,1,TA,Unf,TA,841.0,6.734591659972948,0,1,TA,Gtl,8400.0,14.68470426970406,Reg,0.0,0.0,0.0,9,0.0,4,4,N,0.0,NA,0.0,4,1.0,721.0,274.0,1562.0,16.762371023178833,AllPub,250.0,0,1,1,0,0,0,1,0,0,1,0,1,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,59,59,82000.0,11.314474526246391 554,531479020,784.0,6.664409020350408,0.0,0.0,2,Fa,No,0,0,Fa,784.0,0.0,0.0,Unf,Unf,FuseA,91.0,NA,NA,0,1,Typ,360.0,2,Fa,Unf,Fa,784.0,6.664409020350408,0,1,TA,Gtl,9000.0,14.855599984056148,Reg,0.0,0.0,0.0,10,0.0,3,6,N,0.0,NA,0.0,5,1.0,784.0,91.0,1568.0,16.7790642448278,AllPub,0.0,0,0,1,0,0,1,0,0,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,81,59,76000.0,11.238488619268468 555,532353020,980.0,6.887552571664617,0.0,0.0,3,TA,No,1,0,TA,28.0,68.0,884.0,LwQ,BLQ,SBrkr,0.0,MnPrv,NA,0,1,Typ,400.0,2,TA,Unf,TA,980.0,6.887552571664617,0,1,TA,Gtl,9750.0,15.055349293727405,IR1,0.0,0.0,0.0,11,28.0,5,5,Y,0.0,NA,0.0,5,2.0,980.0,28.0,1960.0,17.773050992818334,AllPub,0.0,0,1,1,0,0,0,1,0,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,47,47,110000.0,11.608235644774552 556,532353130,980.0,6.887552571664617,0.0,0.0,3,TA,No,0,0,TA,420.0,560.0,0.0,BLQ,Unf,SBrkr,0.0,NA,NA,0,1,Typ,484.0,2,TA,Unf,TA,980.0,6.887552571664617,0,1,TA,Gtl,7064.0,14.260797286621031,Reg,0.0,153.0,0.0,7,0.0,6,5,Y,0.0,NA,0.0,6,1.0,980.0,192.0,1960.0,17.773050992818334,AllPub,192.0,0,1,1,0,0,0,1,0,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,32,32,135000.0,11.813030057420567 @@ -943,7 +943,7 @@ Order,PID,1st Flr SF,1st Flr SF (box-cox-0),2nd Flr SF,3Ssn Porch,Bedroom AbvGr, 954,914476380,1217.0,7.104144092987527,0.0,0.0,3,TA,Av,1,0,Gd,577.0,611.0,0.0,GLQ,Unf,SBrkr,0.0,GdPrv,NA,0,2,Typ,497.0,2,TA,Unf,TA,1217.0,7.104144092987527,0,1,Gd,Gtl,9947.0,15.105519458517929,IR1,0.0,0.0,0.0,6,27.0,5,7,Y,0.0,NA,0.0,6,3.0,1188.0,195.0,2405.0,18.724278876442806,AllPub,168.0,0,1,1,0,0,0,0,1,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,19,18,173000.0,12.061046873479915 955,914476430,1595.0,7.374629015218945,0.0,0.0,2,TA,No,1,0,Gd,1527.0,55.0,0.0,BLQ,Unf,SBrkr,0.0,NA,NA,0,2,Typ,672.0,2,TA,Unf,TA,1595.0,7.374629015218945,0,1,TA,Gtl,11070.0,15.375508981989565,Reg,0.0,0.0,0.0,4,0.0,5,5,Y,0.0,NA,0.0,5,3.0,1582.0,0.0,3177.0,20.082651686134287,AllPub,0.0,1,1,1,0,0,0,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,18,18,152000.0,11.931635799828413 956,916176030,1344.0,7.203405521083095,0.0,0.0,3,TA,No,0,1,TA,354.0,111.0,354.0,GLQ,Rec,FuseA,0.0,NA,Gd,1,1,Typ,525.0,2,TA,RFn,TA,1344.0,7.203405521083095,0,1,Gd,Gtl,14375.0,16.047184443127506,IR1,0.0,541.0,0.0,1,118.0,6,6,Y,0.0,NA,233.0,7,1.5,819.0,351.0,2163.0,18.226368292983384,NoSeWa,0.0,1,1,1,0,0,0,1,0,0,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,51,51,137500.0,11.831379196088763 -957,916176125,2036.0,7.618742377670413,0.0,0.0,3,TA,Gd,2,0,Gd,80.0,1236.0,820.0,ALQ,Rec,SBrkr,0.0,NA,Gd,2,2,Typ,513.0,2,TA,RFn,TA,2036.0,7.618742377670413,0,1,TA,Sev,215245.0,24.142341911893194,IR3,0.0,0.0,0.0,6,0.0,5,7,Y,0.0,NA,0.0,8,4.0,2136.0,0.0,4172.0,21.487371590601576,AllPub,0.0,0,1,1,0,0,0,1,0,0,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,44,44,375000.0,12.834681304952548 +957,916176125,2036.0,7.618742377670413,0.0,0.0,3,TA,Gd,2,0,Gd,80.0,1236.0,820.0,ALQ,Rec,SBrkr,0.0,NA,Gd,2,2,Typ,513.0,2,TA,RFn,TA,2036.0,7.618742377670413,0,1,TA,Sev,215245.0,24.14234191189319,IR3,0.0,0.0,0.0,6,0.0,5,7,Y,0.0,NA,0.0,8,4.0,2136.0,0.0,4172.0,21.487371590601576,AllPub,0.0,0,1,1,0,0,0,1,0,0,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,44,44,375000.0,12.834681304952548 958,916380070,1620.0,7.3901814282264295,0.0,0.0,2,TA,Gd,1,0,Ex,598.0,1022.0,0.0,GLQ,Unf,SBrkr,0.0,NA,Ex,1,2,Typ,912.0,3,TA,Fin,TA,1620.0,7.3901814282264295,0,1,Ex,Gtl,12898.0,15.766310574459004,IR1,0.0,70.0,0.0,9,0.0,5,9,Y,0.0,NA,0.0,6,3.0,1620.0,228.0,3240.0,20.18134982456163,AllPub,228.0,0,1,1,0,0,0,0,1,0,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,1,2,1,315500.0,12.661913960963405 959,916382010,846.0,6.740519359606223,846.0,0.0,3,TA,Av,0,0,Ex,846.0,0.0,0.0,Unf,Unf,SBrkr,0.0,NA,NA,0,2,Typ,650.0,2,TA,RFn,TA,1692.0,7.433666540166168,1,1,Gd,Gtl,13159.0,15.817981703423513,IR1,0.0,0.0,0.0,7,114.0,5,7,Y,0.0,NA,0.0,6,2.5,846.0,322.0,2538.0,18.981057361211253,AllPub,208.0,0,1,1,0,0,0,0,1,1,1,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,1,1,0,0,0,224500.0,12.321630986164447 960,916382100,2036.0,7.618742377670413,0.0,0.0,3,TA,Gd,1,0,Ex,432.0,1758.0,0.0,GLQ,Unf,SBrkr,0.0,NA,Ex,1,2,Typ,780.0,3,TA,Fin,TA,2036.0,7.618742377670413,0,1,Ex,Gtl,13438.0,15.872206187914584,IR1,0.0,246.0,0.0,7,154.0,5,9,Y,0.0,NA,0.0,9,3.0,2190.0,244.0,4226.0,21.55558682405044,AllPub,90.0,0,1,1,0,0,0,1,0,0,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,1,1,410000.0,12.92391243868049 @@ -1600,7 +1600,7 @@ Order,PID,1st Flr SF,1st Flr SF (box-cox-0),2nd Flr SF,3Ssn Porch,Bedroom AbvGr, 1623,527161090,947.0,6.853299093186078,767.0,0.0,3,TA,No,1,0,Gd,52.0,871.0,0.0,ALQ,Unf,SBrkr,0.0,NA,TA,1,2,Typ,451.0,2,TA,Fin,TA,1714.0,7.446585099157725,1,1,TA,Gtl,8637.0,14.753481627067941,IR1,0.0,0.0,0.0,4,48.0,5,6,Y,0.0,NA,0.0,7,3.5,923.0,304.0,2637.0,19.16529105486511,AllPub,256.0,1,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,8,7,180000.0,12.100712129872347 1624,527162080,691.0,6.53813982376767,862.0,0.0,3,TA,No,0,0,Gd,277.0,414.0,0.0,Rec,Unf,SBrkr,0.0,NA,NA,0,2,Typ,420.0,2,TA,Fin,TA,1553.0,7.347943823148687,1,1,Gd,Gtl,7875.0,14.525905820919508,Reg,0.0,0.0,0.0,8,44.0,5,7,Y,0.0,NA,0.0,6,2.5,691.0,44.0,2244.0,18.397775781250722,AllPub,0.0,0,1,1,0,0,0,0,1,1,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,11,11,178750.0,12.093743460556254 1625,527162090,1253.0,7.133295954896068,0.0,0.0,3,Gd,No,0,0,Gd,1237.0,0.0,0.0,Unf,Unf,SBrkr,0.0,NA,TA,1,2,Typ,402.0,2,TA,Fin,TA,1253.0,7.133295954896068,0,1,TA,Gtl,7875.0,14.525905820919508,Reg,0.0,38.0,0.0,6,21.0,5,7,Y,0.0,NA,0.0,6,2.0,1237.0,241.0,2490.0,18.88965476782098,AllPub,220.0,0,1,1,0,0,0,0,1,0,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,12,11,176000.0,12.078239274020289 -1626,527162140,957.0,6.863803391452954,1342.0,0.0,5,TA,No,0,0,Gd,938.0,0.0,0.0,Unf,Unf,SBrkr,0.0,NA,TA,1,3,Typ,482.0,2,TA,Fin,TA,2299.0,7.740229524763182,1,1,TA,Gtl,7500.0,14.406534966757283,Reg,0.0,0.0,0.0,8,30.0,5,6,Y,0.0,NA,0.0,7,3.5,938.0,218.0,3237.0,20.176684883555122,AllPub,188.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,8,4,204000.0,12.225875272826354 +1626,527162140,957.0,6.863803391452954,1342.0,0.0,5,TA,No,0,0,Gd,938.0,0.0,0.0,Unf,Unf,SBrkr,0.0,NA,TA,1,3,Typ,482.0,2,TA,Fin,TA,2299.0,7.740229524763182,1,1,TA,Gtl,7500.0,14.406534966757283,Reg,0.0,0.0,0.0,8,30.0,5,6,Y,0.0,NA,0.0,7,3.5,938.0,218.0,3237.0,20.17668488355512,AllPub,188.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,8,4,204000.0,12.225875272826354 1627,527163080,1187.0,7.079184394609668,0.0,0.0,3,TA,No,0,0,Gd,1168.0,0.0,0.0,Unf,Unf,SBrkr,0.0,NA,NA,0,2,Typ,420.0,2,TA,RFn,TA,1187.0,7.079184394609668,0,1,Gd,Gtl,9556.0,15.005043482926363,IR1,0.0,52.0,0.0,8,21.0,5,7,Y,0.0,NA,0.0,6,2.0,1168.0,21.0,2355.0,18.62480250396189,AllPub,0.0,0,1,1,0,0,0,0,1,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,15,14,160000.0,11.982929094215963 1628,527165020,802.0,6.687108607866515,670.0,0.0,3,TA,No,0,0,Gd,384.0,0.0,0.0,Unf,Unf,SBrkr,0.0,NA,TA,1,2,Typ,402.0,2,TA,RFn,TA,1472.0,7.294377299288821,1,1,Gd,Gtl,10784.0,15.309174951796374,IR1,0.0,76.0,0.0,5,0.0,5,7,Y,0.0,NA,0.0,7,2.5,384.0,164.0,1856.0,17.526078784323257,AllPub,164.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,16,15,160000.0,11.982929094215963 1629,527165100,812.0,6.699500340161678,670.0,0.0,3,TA,No,0,0,Gd,384.0,0.0,0.0,Unf,Unf,SBrkr,0.0,NA,TA,1,2,Typ,392.0,2,TA,Fin,TA,1482.0,7.301147805856032,1,1,Gd,Gtl,9125.0,14.889907769270682,IR1,0.0,170.0,0.0,7,25.0,5,7,Y,0.0,NA,0.0,7,2.5,384.0,125.0,1866.0,17.550300430394216,AllPub,100.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,15,15,163900.0,12.00701176473192 @@ -2313,7 +2313,7 @@ Order,PID,1st Flr SF,1st Flr SF (box-cox-0),2nd Flr SF,3Ssn Porch,Bedroom AbvGr, 2352,527356060,811.0,6.698268054115413,741.0,0.0,3,TA,No,1,0,Gd,163.0,550.0,0.0,ALQ,Unf,SBrkr,0.0,MnPrv,TA,1,2,Typ,434.0,2,TA,RFn,TA,1552.0,7.347299700743164,1,1,TA,Gtl,11475.0,15.466852293432254,Reg,0.0,0.0,0.0,2,208.0,6,6,Y,0.0,NA,0.0,6,3.5,713.0,417.0,2265.0,18.441405394566303,AllPub,209.0,0,1,1,0,0,0,1,0,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,31,31,179900.0,12.100156419938624 2353,527358090,1083.0,6.9874902470009905,0.0,0.0,2,TA,Gd,1,0,Ex,42.0,1005.0,0.0,GLQ,Unf,SBrkr,40.0,NA,Fa,1,1,Typ,596.0,2,TA,RFn,TA,1083.0,6.9874902470009905,0,1,TA,Gtl,9927.0,15.10046702787839,IR1,0.0,252.0,0.0,7,0.0,5,7,Y,0.0,NA,0.0,5,2.0,1047.0,484.0,2130.0,18.155060764405075,AllPub,444.0,0,1,1,0,0,0,1,0,0,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,30,30,172000.0,12.05524975579559 2354,527365010,960.0,6.866933284461882,1358.0,0.0,3,TA,No,1,0,Gd,172.0,788.0,0.0,ALQ,Unf,SBrkr,0.0,NA,Ex,1,2,Typ,541.0,2,TA,Fin,TA,2318.0,7.748460023899697,1,1,Gd,Gtl,9512.0,14.99350614262242,IR1,0.0,0.0,0.0,6,246.0,5,7,Y,0.0,NA,0.0,8,3.5,960.0,246.0,3278.0,20.240142016334854,AllPub,0.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,1,1,1,1,0,294323.0,12.592433082713933 -2355,527375160,1109.0,7.011213987350367,766.0,0.0,3,Fa,No,0,0,TA,127.0,548.0,0.0,ALQ,Unf,SBrkr,0.0,NA,TA,1,3,Typ,485.0,2,TA,RFn,TA,1875.0,7.536363938404511,0,1,Gd,Gtl,10530.0,15.248921792104442,Reg,0.0,248.0,0.0,6,28.0,6,6,Y,0.0,NA,0.0,8,3.0,675.0,76.0,2550.0,19.003691717103283,AllPub,48.0,0,1,1,0,0,0,1,0,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,31,6,184500.0,12.125404742462718 +2355,527375160,1109.0,7.011213987350367,766.0,0.0,3,Fa,No,0,0,TA,127.0,548.0,0.0,ALQ,Unf,SBrkr,0.0,NA,TA,1,3,Typ,485.0,2,TA,RFn,TA,1875.0,7.536363938404511,0,1,Gd,Gtl,10530.0,15.248921792104442,Reg,0.0,248.0,0.0,6,28.0,6,6,Y,0.0,NA,0.0,8,3.0,675.0,76.0,2550.0,19.00369171710328,AllPub,48.0,0,1,1,0,0,0,1,0,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,31,6,184500.0,12.125404742462718 2356,527376090,1074.0,6.97914527506881,0.0,0.0,3,TA,No,1,0,Gd,268.0,788.0,0.0,ALQ,Unf,SBrkr,0.0,MnPrv,NA,0,1,Typ,495.0,2,TA,RFn,TA,1074.0,6.97914527506881,1,1,TA,Gtl,10140.0,15.153811121425997,Reg,0.0,0.0,0.0,7,88.0,6,5,Y,0.0,NA,0.0,6,2.5,1056.0,88.0,2130.0,18.155060764405075,AllPub,0.0,0,1,1,0,0,0,1,0,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,31,31,153500.0,11.941455846009388 2357,527376110,832.0,6.723832440821209,832.0,0.0,4,TA,No,0,0,Gd,638.0,194.0,0.0,GLQ,Unf,SBrkr,0.0,GdWo,TA,1,2,Typ,528.0,2,TA,RFn,TA,1664.0,7.416979621381154,1,1,TA,Gtl,10140.0,15.153811121425997,Reg,0.0,0.0,0.0,3,28.0,5,7,Y,0.0,NA,259.0,8,2.5,832.0,287.0,2496.0,18.901156773521873,AllPub,0.0,0,1,1,0,0,0,0,1,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,30,30,162900.0,12.000891794590137 2358,527377030,1309.0,7.1770187659099,0.0,0.0,3,TA,No,1,0,TA,0.0,663.0,377.0,ALQ,LwQ,SBrkr,0.0,GdPrv,Fa,1,1,Typ,484.0,2,TA,RFn,TA,1309.0,7.1770187659099,1,1,Gd,Gtl,10140.0,15.153811121425997,Reg,0.0,99.0,0.0,1,0.0,6,6,Y,648.0,Fa,0.0,5,2.5,1040.0,265.0,2349.0,18.61275210110533,AllPub,265.0,0,1,1,0,0,0,1,0,0,1,1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,32,7,181000.0,12.106252310247962