{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import numpy as np\n", "import pandas as pd\n", "import matplotlib.pyplot as plt\n", "from sklearn.model_selection import train_test_split\n", "from sklearn.model_selection import StratifiedShuffleSplit" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Project Goals\n", "The goal is to create a model that predicts median house values in Californian districts, given a number of features from these districts." ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Get the data" ] }, { "cell_type": "code", "execution_count": 125, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "median_house_value | \n", "ocean_proximity | \n", "
---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "-122.23 | \n", "37.88 | \n", "41.0 | \n", "880.0 | \n", "129.0 | \n", "322.0 | \n", "126.0 | \n", "8.3252 | \n", "452600.0 | \n", "NEAR BAY | \n", "
1 | \n", "-122.22 | \n", "37.86 | \n", "21.0 | \n", "7099.0 | \n", "1106.0 | \n", "2401.0 | \n", "1138.0 | \n", "8.3014 | \n", "358500.0 | \n", "NEAR BAY | \n", "
2 | \n", "-122.24 | \n", "37.85 | \n", "52.0 | \n", "1467.0 | \n", "190.0 | \n", "496.0 | \n", "177.0 | \n", "7.2574 | \n", "352100.0 | \n", "NEAR BAY | \n", "
3 | \n", "-122.25 | \n", "37.85 | \n", "52.0 | \n", "1274.0 | \n", "235.0 | \n", "558.0 | \n", "219.0 | \n", "5.6431 | \n", "341300.0 | \n", "NEAR BAY | \n", "
4 | \n", "-122.25 | \n", "37.85 | \n", "52.0 | \n", "1627.0 | \n", "280.0 | \n", "565.0 | \n", "259.0 | \n", "3.8462 | \n", "342200.0 | \n", "NEAR BAY | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "median_house_value | \n", "
---|---|---|---|---|---|---|---|---|---|
count | \n", "20640.000000 | \n", "20640.000000 | \n", "20640.000000 | \n", "20640.000000 | \n", "20433.000000 | \n", "20640.000000 | \n", "20640.000000 | \n", "20640.000000 | \n", "20640.000000 | \n", "
mean | \n", "-119.569704 | \n", "35.631861 | \n", "28.639486 | \n", "2635.763081 | \n", "537.870553 | \n", "1425.476744 | \n", "499.539680 | \n", "3.870671 | \n", "206855.816909 | \n", "
std | \n", "2.003532 | \n", "2.135952 | \n", "12.585558 | \n", "2181.615252 | \n", "421.385070 | \n", "1132.462122 | \n", "382.329753 | \n", "1.899822 | \n", "115395.615874 | \n", "
min | \n", "-124.350000 | \n", "32.540000 | \n", "1.000000 | \n", "2.000000 | \n", "1.000000 | \n", "3.000000 | \n", "1.000000 | \n", "0.499900 | \n", "14999.000000 | \n", "
25% | \n", "-121.800000 | \n", "33.930000 | \n", "18.000000 | \n", "1447.750000 | \n", "296.000000 | \n", "787.000000 | \n", "280.000000 | \n", "2.563400 | \n", "119600.000000 | \n", "
50% | \n", "-118.490000 | \n", "34.260000 | \n", "29.000000 | \n", "2127.000000 | \n", "435.000000 | \n", "1166.000000 | \n", "409.000000 | \n", "3.534800 | \n", "179700.000000 | \n", "
75% | \n", "-118.010000 | \n", "37.710000 | \n", "37.000000 | \n", "3148.000000 | \n", "647.000000 | \n", "1725.000000 | \n", "605.000000 | \n", "4.743250 | \n", "264725.000000 | \n", "
max | \n", "-114.310000 | \n", "41.950000 | \n", "52.000000 | \n", "39320.000000 | \n", "6445.000000 | \n", "35682.000000 | \n", "6082.000000 | \n", "15.000100 | \n", "500001.000000 | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "median_house_value | \n", "ocean_proximity | \n", "
---|---|---|---|---|---|---|---|---|---|---|
17875 | \n", "-121.99 | \n", "37.40 | \n", "35.0 | \n", "1845.0 | \n", "325.0 | \n", "1343.0 | \n", "317.0 | \n", "5.3912 | \n", "235300.0 | \n", "<1H OCEAN | \n", "
9360 | \n", "-122.53 | \n", "37.95 | \n", "22.0 | \n", "7446.0 | \n", "1979.0 | \n", "2980.0 | \n", "1888.0 | \n", "3.5838 | \n", "271300.0 | \n", "NEAR BAY | \n", "
4338 | \n", "-118.31 | \n", "34.08 | \n", "26.0 | \n", "1609.0 | \n", "534.0 | \n", "1868.0 | \n", "497.0 | \n", "2.7038 | \n", "227100.0 | \n", "<1H OCEAN | \n", "
986 | \n", "-121.85 | \n", "37.72 | \n", "43.0 | \n", "228.0 | \n", "40.0 | \n", "83.0 | \n", "42.0 | \n", "10.3203 | \n", "400000.0 | \n", "INLAND | \n", "
8129 | \n", "-118.17 | \n", "33.80 | \n", "26.0 | \n", "1589.0 | \n", "380.0 | \n", "883.0 | \n", "366.0 | \n", "3.5313 | \n", "187500.0 | \n", "NEAR OCEAN | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "median_house_value | \n", "ocean_proximity | \n", "
---|---|---|---|---|---|---|---|---|---|---|
15722 | \n", "-122.46 | \n", "37.78 | \n", "47.0 | \n", "1682.0 | \n", "379.0 | \n", "837.0 | \n", "375.0 | \n", "5.2806 | \n", "400000.0 | \n", "NEAR BAY | \n", "
19685 | \n", "-121.61 | \n", "39.14 | \n", "44.0 | \n", "2035.0 | \n", "476.0 | \n", "1030.0 | \n", "453.0 | \n", "1.4661 | \n", "65200.0 | \n", "INLAND | \n", "
6989 | \n", "-118.04 | \n", "33.97 | \n", "29.0 | \n", "2376.0 | \n", "700.0 | \n", "1968.0 | \n", "680.0 | \n", "2.6082 | \n", "162500.0 | \n", "<1H OCEAN | \n", "
5804 | \n", "-118.25 | \n", "34.15 | \n", "13.0 | \n", "1107.0 | \n", "479.0 | \n", "616.0 | \n", "443.0 | \n", "0.8185 | \n", "187500.0 | \n", "<1H OCEAN | \n", "
5806 | \n", "-118.26 | \n", "34.14 | \n", "29.0 | \n", "3431.0 | \n", "1222.0 | \n", "4094.0 | \n", "1205.0 | \n", "2.2614 | \n", "248100.0 | \n", "<1H OCEAN | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "median_house_value | \n", "rooms_per_household | \n", "bedrooms_per_room | \n", "population_per_household | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|
count | \n", "16512.000000 | \n", "16512.000000 | \n", "16512.000000 | \n", "16512.000000 | \n", "16354.000000 | \n", "16512.000000 | \n", "16512.000000 | \n", "16512.000000 | \n", "16512.000000 | \n", "16512.000000 | \n", "16354.000000 | \n", "16512.000000 | \n", "
mean | \n", "-119.575834 | \n", "35.639577 | \n", "28.653101 | \n", "2622.728319 | \n", "534.973890 | \n", "1419.790819 | \n", "497.060380 | \n", "3.875589 | \n", "206990.920724 | \n", "5.440341 | \n", "0.212878 | \n", "3.096437 | \n", "
std | \n", "2.001860 | \n", "2.138058 | \n", "12.574726 | \n", "2138.458419 | \n", "412.699041 | \n", "1115.686241 | \n", "375.720845 | \n", "1.904950 | \n", "115703.014830 | \n", "2.611712 | \n", "0.057379 | \n", "11.584826 | \n", "
min | \n", "-124.350000 | \n", "32.540000 | \n", "1.000000 | \n", "6.000000 | \n", "2.000000 | \n", "3.000000 | \n", "2.000000 | \n", "0.499900 | \n", "14999.000000 | \n", "1.130435 | \n", "0.100000 | \n", "0.692308 | \n", "
25% | \n", "-121.800000 | \n", "33.940000 | \n", "18.000000 | \n", "1443.000000 | \n", "295.000000 | \n", "784.000000 | \n", "279.000000 | \n", "2.566775 | \n", "119800.000000 | \n", "4.442040 | \n", "0.175304 | \n", "2.431287 | \n", "
50% | \n", "-118.510000 | \n", "34.260000 | \n", "29.000000 | \n", "2119.500000 | \n", "433.000000 | \n", "1164.000000 | \n", "408.000000 | \n", "3.540900 | \n", "179500.000000 | \n", "5.232284 | \n", "0.203031 | \n", "2.817653 | \n", "
75% | \n", "-118.010000 | \n", "37.720000 | \n", "37.000000 | \n", "3141.000000 | \n", "644.000000 | \n", "1719.250000 | \n", "602.000000 | \n", "4.744475 | \n", "263900.000000 | \n", "6.056361 | \n", "0.239831 | \n", "3.281420 | \n", "
max | \n", "-114.310000 | \n", "41.950000 | \n", "52.000000 | \n", "39320.000000 | \n", "6210.000000 | \n", "35682.000000 | \n", "5358.000000 | \n", "15.000100 | \n", "500001.000000 | \n", "141.909091 | \n", "1.000000 | \n", "1243.333333 | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity | \n", "
---|---|---|---|---|---|---|---|---|---|
4629 | \n", "-118.30 | \n", "34.07 | \n", "18.0 | \n", "3759.0 | \n", "NaN | \n", "3296.0 | \n", "1462.0 | \n", "2.2708 | \n", "<1H OCEAN | \n", "
6068 | \n", "-117.86 | \n", "34.01 | \n", "16.0 | \n", "4632.0 | \n", "NaN | \n", "3038.0 | \n", "727.0 | \n", "5.1762 | \n", "<1H OCEAN | \n", "
17923 | \n", "-121.97 | \n", "37.35 | \n", "30.0 | \n", "1955.0 | \n", "NaN | \n", "999.0 | \n", "386.0 | \n", "4.6328 | \n", "<1H OCEAN | \n", "
13656 | \n", "-117.30 | \n", "34.05 | \n", "6.0 | \n", "2155.0 | \n", "NaN | \n", "1039.0 | \n", "391.0 | \n", "1.6675 | \n", "INLAND | \n", "
19252 | \n", "-122.79 | \n", "38.48 | \n", "7.0 | \n", "6837.0 | \n", "NaN | \n", "3468.0 | \n", "1405.0 | \n", "3.1662 | \n", "<1H OCEAN | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity | \n", "
---|
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity | \n", "
---|---|---|---|---|---|---|---|---|
4629 | \n", "-118.30 | \n", "34.07 | \n", "18.0 | \n", "3759.0 | \n", "3296.0 | \n", "1462.0 | \n", "2.2708 | \n", "<1H OCEAN | \n", "
6068 | \n", "-117.86 | \n", "34.01 | \n", "16.0 | \n", "4632.0 | \n", "3038.0 | \n", "727.0 | \n", "5.1762 | \n", "<1H OCEAN | \n", "
17923 | \n", "-121.97 | \n", "37.35 | \n", "30.0 | \n", "1955.0 | \n", "999.0 | \n", "386.0 | \n", "4.6328 | \n", "<1H OCEAN | \n", "
13656 | \n", "-117.30 | \n", "34.05 | \n", "6.0 | \n", "2155.0 | \n", "1039.0 | \n", "391.0 | \n", "1.6675 | \n", "INLAND | \n", "
19252 | \n", "-122.79 | \n", "38.48 | \n", "7.0 | \n", "6837.0 | \n", "3468.0 | \n", "1405.0 | \n", "3.1662 | \n", "<1H OCEAN | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity | \n", "
---|---|---|---|---|---|---|---|---|---|
4629 | \n", "-118.30 | \n", "34.07 | \n", "18.0 | \n", "3759.0 | \n", "433.0 | \n", "3296.0 | \n", "1462.0 | \n", "2.2708 | \n", "<1H OCEAN | \n", "
6068 | \n", "-117.86 | \n", "34.01 | \n", "16.0 | \n", "4632.0 | \n", "433.0 | \n", "3038.0 | \n", "727.0 | \n", "5.1762 | \n", "<1H OCEAN | \n", "
17923 | \n", "-121.97 | \n", "37.35 | \n", "30.0 | \n", "1955.0 | \n", "433.0 | \n", "999.0 | \n", "386.0 | \n", "4.6328 | \n", "<1H OCEAN | \n", "
13656 | \n", "-117.30 | \n", "34.05 | \n", "6.0 | \n", "2155.0 | \n", "433.0 | \n", "1039.0 | \n", "391.0 | \n", "1.6675 | \n", "INLAND | \n", "
19252 | \n", "-122.79 | \n", "38.48 | \n", "7.0 | \n", "6837.0 | \n", "433.0 | \n", "3468.0 | \n", "1405.0 | \n", "3.1662 | \n", "<1H OCEAN | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "
---|---|---|---|---|---|---|---|---|
17606 | \n", "-121.89 | \n", "37.29 | \n", "38.0 | \n", "1568.0 | \n", "351.0 | \n", "710.0 | \n", "339.0 | \n", "2.7042 | \n", "
18632 | \n", "-121.93 | \n", "37.05 | \n", "14.0 | \n", "679.0 | \n", "108.0 | \n", "306.0 | \n", "113.0 | \n", "6.4214 | \n", "
14650 | \n", "-117.20 | \n", "32.77 | \n", "31.0 | \n", "1952.0 | \n", "471.0 | \n", "936.0 | \n", "462.0 | \n", "2.8621 | \n", "
3230 | \n", "-119.61 | \n", "36.31 | \n", "25.0 | \n", "1847.0 | \n", "371.0 | \n", "1460.0 | \n", "353.0 | \n", "1.8839 | \n", "
3555 | \n", "-118.59 | \n", "34.23 | \n", "17.0 | \n", "6592.0 | \n", "1525.0 | \n", "4459.0 | \n", "1463.0 | \n", "3.0347 | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "
---|---|---|---|---|---|---|---|---|
4629 | \n", "-118.30 | \n", "34.07 | \n", "18.0 | \n", "3759.0 | \n", "433.0 | \n", "3296.0 | \n", "1462.0 | \n", "2.2708 | \n", "
6068 | \n", "-117.86 | \n", "34.01 | \n", "16.0 | \n", "4632.0 | \n", "433.0 | \n", "3038.0 | \n", "727.0 | \n", "5.1762 | \n", "
17923 | \n", "-121.97 | \n", "37.35 | \n", "30.0 | \n", "1955.0 | \n", "433.0 | \n", "999.0 | \n", "386.0 | \n", "4.6328 | \n", "
13656 | \n", "-117.30 | \n", "34.05 | \n", "6.0 | \n", "2155.0 | \n", "433.0 | \n", "1039.0 | \n", "391.0 | \n", "1.6675 | \n", "
19252 | \n", "-122.79 | \n", "38.48 | \n", "7.0 | \n", "6837.0 | \n", "433.0 | \n", "3468.0 | \n", "1405.0 | \n", "3.1662 | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "
---|---|---|---|---|---|---|---|---|
0 | \n", "-121.89 | \n", "37.29 | \n", "38.0 | \n", "1568.0 | \n", "351.0 | \n", "710.0 | \n", "339.0 | \n", "2.7042 | \n", "
1 | \n", "-121.93 | \n", "37.05 | \n", "14.0 | \n", "679.0 | \n", "108.0 | \n", "306.0 | \n", "113.0 | \n", "6.4214 | \n", "
2 | \n", "-117.20 | \n", "32.77 | \n", "31.0 | \n", "1952.0 | \n", "471.0 | \n", "936.0 | \n", "462.0 | \n", "2.8621 | \n", "
3 | \n", "-119.61 | \n", "36.31 | \n", "25.0 | \n", "1847.0 | \n", "371.0 | \n", "1460.0 | \n", "353.0 | \n", "1.8839 | \n", "
4 | \n", "-118.59 | \n", "34.23 | \n", "17.0 | \n", "6592.0 | \n", "1525.0 | \n", "4459.0 | \n", "1463.0 | \n", "3.0347 | \n", "
\n", " | ocean_proximity | \n", "
---|---|
17606 | \n", "<1H OCEAN | \n", "
18632 | \n", "<1H OCEAN | \n", "
14650 | \n", "NEAR OCEAN | \n", "
3230 | \n", "INLAND | \n", "
3555 | \n", "<1H OCEAN | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity | \n", "rooms_per_household | \n", "population_per_household | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "-121.89 | \n", "37.29 | \n", "38 | \n", "1568 | \n", "351 | \n", "710 | \n", "339 | \n", "2.7042 | \n", "<1H OCEAN | \n", "4.62537 | \n", "2.0944 | \n", "
1 | \n", "-121.93 | \n", "37.05 | \n", "14 | \n", "679 | \n", "108 | \n", "306 | \n", "113 | \n", "6.4214 | \n", "<1H OCEAN | \n", "6.00885 | \n", "2.70796 | \n", "
2 | \n", "-117.2 | \n", "32.77 | \n", "31 | \n", "1952 | \n", "471 | \n", "936 | \n", "462 | \n", "2.8621 | \n", "NEAR OCEAN | \n", "4.22511 | \n", "2.02597 | \n", "
3 | \n", "-119.61 | \n", "36.31 | \n", "25 | \n", "1847 | \n", "371 | \n", "1460 | \n", "353 | \n", "1.8839 | \n", "INLAND | \n", "5.23229 | \n", "4.13598 | \n", "
4 | \n", "-118.59 | \n", "34.23 | \n", "17 | \n", "6592 | \n", "1525 | \n", "4459 | \n", "1463 | \n", "3.0347 | \n", "<1H OCEAN | \n", "4.50581 | \n", "3.04785 | \n", "
\n", " | Labels | \n", "Predictions | \n", "
---|---|---|
0 | \n", "286600.0 | \n", "210644.604593 | \n", "
1 | \n", "340600.0 | \n", "317768.806972 | \n", "
2 | \n", "196900.0 | \n", "210956.433312 | \n", "
3 | \n", "46300.0 | \n", "59218.988868 | \n", "
4 | \n", "254500.0 | \n", "189747.558499 | \n", "
\n", " | Labels | \n", "Predictions | \n", "
---|---|---|
0 | \n", "286600.0 | \n", "286600.0 | \n", "
1 | \n", "340600.0 | \n", "340600.0 | \n", "
2 | \n", "196900.0 | \n", "196900.0 | \n", "
3 | \n", "46300.0 | \n", "46300.0 | \n", "
4 | \n", "254500.0 | \n", "254500.0 | \n", "
\n", " | mean_fit_time | \n", "mean_score_time | \n", "mean_test_score | \n", "mean_train_score | \n", "param_bootstrap | \n", "param_max_features | \n", "param_n_estimators | \n", "params | \n", "rank_test_score | \n", "split0_test_score | \n", "... | \n", "split2_test_score | \n", "split2_train_score | \n", "split3_test_score | \n", "split3_train_score | \n", "split4_test_score | \n", "split4_train_score | \n", "std_fit_time | \n", "std_score_time | \n", "std_test_score | \n", "std_train_score | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
11 | \n", "3.354504 | \n", "0.053489 | \n", "-2.468326e+09 | \n", "-3.810330e+08 | \n", "NaN | \n", "8 | \n", "30 | \n", "{'n_estimators': 30, 'max_features': 8} | \n", "1 | \n", "-2.357390e+09 | \n", "... | \n", "-2.591972e+09 | \n", "-3.773239e+08 | \n", "-2.318617e+09 | \n", "-3.882250e+08 | \n", "-2.527022e+09 | \n", "-3.810005e+08 | \n", "0.172000 | \n", "0.009551 | \n", "1.091647e+08 | \n", "4.871017e+06 | \n", "
8 | \n", "2.525017 | \n", "0.050918 | \n", "-2.514668e+09 | \n", "-3.841296e+08 | \n", "NaN | \n", "6 | \n", "30 | \n", "{'n_estimators': 30, 'max_features': 6} | \n", "2 | \n", "-2.370010e+09 | \n", "... | \n", "-2.607703e+09 | \n", "-3.805218e+08 | \n", "-2.350953e+09 | \n", "-3.856095e+08 | \n", "-2.661059e+09 | \n", "-3.901917e+08 | \n", "0.221924 | \n", "0.002579 | \n", "1.285063e+08 | \n", "3.617057e+06 | \n", "
5 | \n", "1.784167 | \n", "0.058159 | \n", "-2.537877e+09 | \n", "-3.879289e+08 | \n", "NaN | \n", "4 | \n", "30 | \n", "{'n_estimators': 30, 'max_features': 4} | \n", "3 | \n", "-2.387153e+09 | \n", "... | \n", "-2.666426e+09 | \n", "-3.790867e+08 | \n", "-2.398071e+09 | \n", "-4.040957e+08 | \n", "-2.649316e+09 | \n", "-3.845520e+08 | \n", "0.122772 | \n", "0.017129 | \n", "1.214603e+08 | \n", "8.571233e+06 | \n", "
17 | \n", "0.976491 | \n", "0.028234 | \n", "-2.601971e+09 | \n", "-3.028238e-03 | \n", "False | \n", "4 | \n", "10 | \n", "{'n_estimators': 10, 'max_features': 4, 'boots... | \n", "4 | \n", "-2.525578e+09 | \n", "... | \n", "-2.609100e+09 | \n", "-0.000000e+00 | \n", "-2.439607e+09 | \n", "-0.000000e+00 | \n", "-2.725548e+09 | \n", "-0.000000e+00 | \n", "0.295675 | \n", "0.007139 | \n", "1.088031e+08 | \n", "6.056477e-03 | \n", "
10 | \n", "1.112599 | \n", "0.019048 | \n", "-2.674037e+09 | \n", "-4.923911e+08 | \n", "NaN | \n", "8 | \n", "10 | \n", "{'n_estimators': 10, 'max_features': 8} | \n", "5 | \n", "-2.571970e+09 | \n", "... | \n", "-2.842317e+09 | \n", "-4.730979e+08 | \n", "-2.460258e+09 | \n", "-5.155367e+08 | \n", "-2.776666e+09 | \n", "-4.985555e+08 | \n", "0.100974 | \n", "0.002301 | \n", "1.392720e+08 | \n", "1.459294e+07 | \n", "
7 | \n", "0.827751 | \n", "0.020989 | \n", "-2.704640e+09 | \n", "-5.013349e+08 | \n", "NaN | \n", "6 | \n", "10 | \n", "{'n_estimators': 10, 'max_features': 6} | \n", "6 | \n", "-2.549663e+09 | \n", "... | \n", "-2.762720e+09 | \n", "-4.994664e+08 | \n", "-2.521134e+09 | \n", "-4.990325e+08 | \n", "-2.907667e+09 | \n", "-5.055542e+08 | \n", "0.077836 | \n", "0.006335 | \n", "1.471542e+08 | \n", "3.100456e+06 | \n", "
15 | \n", "0.675495 | \n", "0.022814 | \n", "-2.779927e+09 | \n", "-5.272080e+00 | \n", "False | \n", "3 | \n", "10 | \n", "{'n_estimators': 10, 'max_features': 3, 'boots... | \n", "7 | \n", "-2.757999e+09 | \n", "... | \n", "-2.830927e+09 | \n", "-0.000000e+00 | \n", "-2.672765e+09 | \n", "-0.000000e+00 | \n", "-2.786190e+09 | \n", "-5.465556e+00 | \n", "0.073931 | \n", "0.001319 | \n", "6.286611e+07 | \n", "8.093117e+00 | \n", "
4 | \n", "0.558351 | \n", "0.021956 | \n", "-2.781611e+09 | \n", "-5.163863e+08 | \n", "NaN | \n", "4 | \n", "10 | \n", "{'n_estimators': 10, 'max_features': 4} | \n", "8 | \n", "-2.666283e+09 | \n", "... | \n", "-2.892276e+09 | \n", "-4.962893e+08 | \n", "-2.616813e+09 | \n", "-5.436192e+08 | \n", "-2.948207e+09 | \n", "-5.160297e+08 | \n", "0.039796 | \n", "0.008723 | \n", "1.268562e+08 | \n", "1.542862e+07 | \n", "
2 | \n", "1.151661 | \n", "0.052023 | \n", "-2.849913e+09 | \n", "-4.394734e+08 | \n", "NaN | \n", "2 | \n", "30 | \n", "{'n_estimators': 30, 'max_features': 2} | \n", "9 | \n", "-2.689185e+09 | \n", "... | \n", "-2.948330e+09 | \n", "-4.371702e+08 | \n", "-2.619995e+09 | \n", "-4.376955e+08 | \n", "-2.970968e+09 | \n", "-4.452654e+08 | \n", "0.144397 | \n", "0.002657 | \n", "1.626879e+08 | \n", "2.966320e+06 | \n", "
13 | \n", "0.611461 | \n", "0.023005 | \n", "-2.987513e+09 | \n", "-6.056027e-01 | \n", "False | \n", "2 | \n", "10 | \n", "{'n_estimators': 10, 'max_features': 2, 'boots... | \n", "10 | \n", "-2.810721e+09 | \n", "... | \n", "-3.131187e+09 | \n", "-0.000000e+00 | \n", "-2.788537e+09 | \n", "-0.000000e+00 | \n", "-3.099347e+09 | \n", "-2.967449e+00 | \n", "0.043821 | \n", "0.000978 | \n", "1.539231e+08 | \n", "1.181156e+00 | \n", "
1 | \n", "0.373621 | \n", "0.023403 | \n", "-3.094381e+09 | \n", "-5.818785e+08 | \n", "NaN | \n", "2 | \n", "10 | \n", "{'n_estimators': 10, 'max_features': 2} | \n", "11 | \n", "-3.047771e+09 | \n", "... | \n", "-3.130196e+09 | \n", "-5.776964e+08 | \n", "-2.865188e+09 | \n", "-5.716332e+08 | \n", "-3.173856e+09 | \n", "-5.802501e+08 | \n", "0.079333 | \n", "0.005578 | \n", "1.327046e+08 | \n", "7.345821e+06 | \n", "
16 | \n", "0.253212 | \n", "0.007124 | \n", "-3.305171e+09 | \n", "0.000000e+00 | \n", "False | \n", "4 | \n", "3 | \n", "{'n_estimators': 3, 'max_features': 4, 'bootst... | \n", "12 | \n", "-3.134040e+09 | \n", "... | \n", "-3.440422e+09 | \n", "-0.000000e+00 | \n", "-3.053647e+09 | \n", "-0.000000e+00 | \n", "-3.338344e+09 | \n", "-0.000000e+00 | \n", "0.097383 | \n", "0.000550 | \n", "1.879203e+08 | \n", "0.000000e+00 | \n", "
9 | \n", "0.280610 | \n", "0.006559 | \n", "-3.348851e+09 | \n", "-8.883545e+08 | \n", "NaN | \n", "8 | \n", "3 | \n", "{'n_estimators': 3, 'max_features': 8} | \n", "13 | \n", "-3.353504e+09 | \n", "... | \n", "-3.402843e+09 | \n", "-8.603321e+08 | \n", "-3.129307e+09 | \n", "-8.881964e+08 | \n", "-3.510047e+09 | \n", "-9.151287e+08 | \n", "0.043096 | \n", "0.000172 | \n", "1.241864e+08 | \n", "2.750227e+07 | \n", "
6 | \n", "0.129712 | \n", "0.006625 | \n", "-3.441447e+09 | \n", "-9.023976e+08 | \n", "NaN | \n", "6 | \n", "3 | \n", "{'n_estimators': 3, 'max_features': 6} | \n", "14 | \n", "-3.119657e+09 | \n", "... | \n", "-3.592772e+09 | \n", "-9.353135e+08 | \n", "-3.328934e+09 | \n", "-9.009801e+08 | \n", "-3.579607e+09 | \n", "-8.624664e+08 | \n", "0.020992 | \n", "0.000224 | \n", "1.893141e+08 | \n", "2.591445e+07 | \n", "
14 | \n", "0.216452 | \n", "0.007962 | \n", "-3.536728e+09 | \n", "-1.214568e+01 | \n", "False | \n", "3 | \n", "3 | \n", "{'n_estimators': 3, 'max_features': 3, 'bootst... | \n", "15 | \n", "-3.618324e+09 | \n", "... | \n", "-3.554815e+09 | \n", "-0.000000e+00 | \n", "-3.619116e+09 | \n", "-0.000000e+00 | \n", "-3.449864e+09 | \n", "-6.072840e+01 | \n", "0.081226 | \n", "0.000395 | \n", "7.795196e+07 | \n", "2.429136e+01 | \n", "
3 | \n", "0.143291 | \n", "0.007133 | \n", "-3.716852e+09 | \n", "-9.848396e+08 | \n", "NaN | \n", "4 | \n", "3 | \n", "{'n_estimators': 3, 'max_features': 4} | \n", "16 | \n", "-3.730181e+09 | \n", "... | \n", "-3.734515e+09 | \n", "-9.169425e+08 | \n", "-3.418747e+09 | \n", "-1.037400e+09 | \n", "-3.913907e+09 | \n", "-9.707739e+08 | \n", "0.027455 | \n", "0.001225 | \n", "1.631421e+08 | \n", "4.084607e+07 | \n", "
12 | \n", "0.137781 | \n", "0.007999 | \n", "-3.955792e+09 | \n", "0.000000e+00 | \n", "False | \n", "2 | \n", "3 | \n", "{'n_estimators': 3, 'max_features': 2, 'bootst... | \n", "17 | \n", "-3.785816e+09 | \n", "... | \n", "-4.061751e+09 | \n", "-0.000000e+00 | \n", "-3.675704e+09 | \n", "-0.000000e+00 | \n", "-4.089667e+09 | \n", "-0.000000e+00 | \n", "0.022286 | \n", "0.000159 | \n", "1.900966e+08 | \n", "0.000000e+00 | \n", "
0 | \n", "0.177232 | \n", "0.007945 | \n", "-4.053749e+09 | \n", "-1.105559e+09 | \n", "NaN | \n", "2 | \n", "3 | \n", "{'n_estimators': 3, 'max_features': 2} | \n", "18 | \n", "-3.837622e+09 | \n", "... | \n", "-4.196408e+09 | \n", "-1.116550e+09 | \n", "-3.903319e+09 | \n", "-1.112342e+09 | \n", "-4.184325e+09 | \n", "-1.129650e+09 | \n", "0.034350 | \n", "0.001114 | \n", "1.519609e+08 | \n", "2.220402e+07 | \n", "
18 rows × 23 columns
\n", "\n", " | feature_importances | \n", "
---|---|
attributes | \n", "\n", " |
median_income | \n", "0.366159 | \n", "
INLAND | \n", "0.164781 | \n", "
pop_per_hhold | \n", "0.108793 | \n", "
longitude | \n", "0.073344 | \n", "
latitude | \n", "0.062909 | \n", "
rooms_per_hhold | \n", "0.056419 | \n", "
bedrooms_per_room | \n", "0.053351 | \n", "
housing_median_age | \n", "0.041144 | \n", "
population | \n", "0.014874 | \n", "
total_rooms | \n", "0.014673 | \n", "
households | \n", "0.014258 | \n", "
total_bedrooms | \n", "0.014106 | \n", "
<1H OCEAN | \n", "0.010311 | \n", "
NEAR OCEAN | \n", "0.002856 | \n", "
NEAR BAY | \n", "0.001960 | \n", "
ISLAND | \n", "0.000060 | \n", "