From 867c5a6fcf74a7925eba64f86c09a4f71678f076 Mon Sep 17 00:00:00 2001 From: annnieglez Date: Sun, 23 Mar 2025 13:45:09 +0100 Subject: [PATCH] lab done --- your-code/main.ipynb | 7571 +++++++++++++++++++++++++++++++++++++++++- 1 file changed, 7489 insertions(+), 82 deletions(-) diff --git a/your-code/main.ipynb b/your-code/main.ipynb index 68b3762..be93c36 100644 --- a/your-code/main.ipynb +++ b/your-code/main.ipynb @@ -12,11 +12,15 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ - "#Import your libraries\n" + "#Import your libraries\n", + "import pandas as pd\n", + "\n", + "# Set display options for Pandas to show all columns\n", + "pd.set_option('display.max_columns', None)" ] }, { @@ -38,11 +42,12 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 8, "metadata": {}, "outputs": [], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin = pd.read_csv('austin_weather.csv')\n" ] }, { @@ -57,29 +62,695 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 9, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "Date object\n", + "TempHighF int64\n", + "TempAvgF int64\n", + "TempLowF int64\n", + "DewPointHighF object\n", + "DewPointAvgF object\n", + "DewPointLowF object\n", + "HumidityHighPercent object\n", + "HumidityAvgPercent object\n", + "HumidityLowPercent object\n", + "SeaLevelPressureHighInches object\n", + "SeaLevelPressureAvgInches object\n", + "SeaLevelPressureLowInches object\n", + "VisibilityHighMiles object\n", + "VisibilityAvgMiles object\n", + "VisibilityLowMiles object\n", + "WindHighMPH object\n", + "WindAvgMPH object\n", + "WindGustMPH object\n", + "PrecipitationSumInches object\n", + "Events object\n", + "dtype: object" + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin.dtypes\n" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 7, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "application/vnd.microsoft.datawrangler.viewer.v0+json": { + "columns": [ + { + "name": "index", + "rawType": "object", + "type": "string" + }, + { + "name": "count", + "rawType": "float64", + "type": "float" + }, + { + "name": "mean", + "rawType": "float64", + "type": "float" + }, + { + "name": "std", + "rawType": "float64", + "type": "float" + }, + { + "name": "min", + "rawType": "float64", + "type": "float" + }, + { + "name": "25%", + "rawType": "float64", + "type": "float" + }, + { + "name": "50%", + "rawType": "float64", + "type": "float" + }, + { + "name": "75%", + "rawType": "float64", + "type": "float" + }, + { + "name": "max", + "rawType": "float64", + "type": "float" + } + ], + "conversionMethod": "pd.DataFrame", + "ref": "76a567b7-50c2-4c41-b3b9-21752308a6b1", + "rows": [ + [ + "TempHighF", + "1319.0", + "80.86277482941622", + "14.766522914053354", + "32.0", + "72.0", + "83.0", + "92.0", + "107.0" + ], + [ + "TempAvgF", + "1319.0", + "70.6429112964367", + "14.045903804052708", + "29.0", + "62.0", + "73.0", + "83.0", + "93.0" + ], + [ + "TempLowF", + "1319.0", + "59.902956785443514", + "14.190647994086149", + "19.0", + "49.0", + "63.0", + "73.0", + "81.0" + ] + ], + "shape": { + "columns": 8, + "rows": 3 + } + }, + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
countmeanstdmin25%50%75%max
TempHighF1319.080.86277514.76652332.072.083.092.0107.0
TempAvgF1319.070.64291114.04590429.062.073.083.093.0
TempLowF1319.059.90295714.19064819.049.063.073.081.0
\n", + "
" + ], + "text/plain": [ + " count mean std min 25% 50% 75% max\n", + "TempHighF 1319.0 80.862775 14.766523 32.0 72.0 83.0 92.0 107.0\n", + "TempAvgF 1319.0 70.642911 14.045904 29.0 62.0 73.0 83.0 93.0\n", + "TempLowF 1319.0 59.902957 14.190648 19.0 49.0 63.0 73.0 81.0" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin.describe().T\n" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 10, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "application/vnd.microsoft.datawrangler.viewer.v0+json": { + "columns": [ + { + "name": "index", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Date", + "rawType": "object", + "type": "string" + }, + { + "name": "TempHighF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempAvgF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempLowF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "DewPointHighF", + "rawType": "object", + "type": "string" + }, + { + "name": "DewPointAvgF", + "rawType": "object", + "type": "string" + }, + { + "name": "DewPointLowF", + "rawType": "object", + "type": "string" + }, + { + "name": "HumidityHighPercent", + "rawType": "object", + "type": "string" + }, + { + "name": "HumidityAvgPercent", + "rawType": "object", + "type": "string" + }, + { + "name": "HumidityLowPercent", + "rawType": "object", + "type": "string" + }, + { + "name": "SeaLevelPressureHighInches", + "rawType": "object", + "type": "string" + }, + { + "name": "SeaLevelPressureAvgInches", + "rawType": "object", + "type": "string" + }, + { + "name": "SeaLevelPressureLowInches", + "rawType": "object", + "type": "string" + }, + { + "name": "VisibilityHighMiles", + "rawType": "object", + "type": "string" + }, + { + "name": "VisibilityAvgMiles", + "rawType": "object", + "type": "string" + }, + { + "name": "VisibilityLowMiles", + "rawType": "object", + "type": "string" + }, + { + "name": "WindHighMPH", + "rawType": "object", + "type": "string" + }, + { + "name": "WindAvgMPH", + "rawType": "object", + "type": "string" + }, + { + "name": "WindGustMPH", + "rawType": "object", + "type": "string" + }, + { + "name": "PrecipitationSumInches", + "rawType": "object", + "type": "string" + }, + { + "name": "Events", + "rawType": "object", + "type": "string" + } + ], + "conversionMethod": "pd.DataFrame", + "ref": "6cce6158-ef62-4530-8b68-bbe216169f7c", + "rows": [ + [ + "0", + "2013-12-21", + "74", + "60", + "45", + "67", + "49", + "43", + "93", + "75", + "57", + "29.86", + "29.68", + "29.59", + "10", + "7", + "2", + "20", + "4", + "31", + "0.46", + "Rain , Thunderstorm" + ], + [ + "1", + "2013-12-22", + "56", + "48", + "39", + "43", + "36", + "28", + "93", + "68", + "43", + "30.41", + "30.13", + "29.87", + "10", + "10", + "5", + "16", + "6", + "25", + "0", + " " + ], + [ + "2", + "2013-12-23", + "58", + "45", + "32", + "31", + "27", + "23", + "76", + "52", + "27", + "30.56", + "30.49", + "30.41", + "10", + "10", + "10", + "8", + "3", + "12", + "0", + " " + ], + [ + "3", + "2013-12-24", + "61", + "46", + "31", + "36", + "28", + "21", + "89", + "56", + "22", + "30.56", + "30.45", + "30.3", + "10", + "10", + "7", + "12", + "4", + "20", + "0", + " " + ], + [ + "4", + "2013-12-25", + "58", + "50", + "41", + "44", + "40", + "36", + "86", + "71", + "56", + "30.41", + "30.33", + "30.27", + "10", + "10", + "7", + "10", + "2", + "16", + "T", + " " + ] + ], + "shape": { + "columns": 21, + "rows": 5 + } + }, + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
DateTempHighFTempAvgFTempLowFDewPointHighFDewPointAvgFDewPointLowFHumidityHighPercentHumidityAvgPercentHumidityLowPercentSeaLevelPressureHighInchesSeaLevelPressureAvgInchesSeaLevelPressureLowInchesVisibilityHighMilesVisibilityAvgMilesVisibilityLowMilesWindHighMPHWindAvgMPHWindGustMPHPrecipitationSumInchesEvents
02013-12-2174604567494393755729.8629.6829.591072204310.46Rain , Thunderstorm
12013-12-2256483943362893684330.4130.1329.8710105166250
22013-12-2358453231272376522730.5630.4930.4110101083120
32013-12-2461463136282189562230.5630.4530.310107124200
42013-12-2558504144403686715630.4130.3330.271010710216T
\n", + "
" + ], + "text/plain": [ + " Date TempHighF TempAvgF TempLowF DewPointHighF DewPointAvgF \\\n", + "0 2013-12-21 74 60 45 67 49 \n", + "1 2013-12-22 56 48 39 43 36 \n", + "2 2013-12-23 58 45 32 31 27 \n", + "3 2013-12-24 61 46 31 36 28 \n", + "4 2013-12-25 58 50 41 44 40 \n", + "\n", + " DewPointLowF HumidityHighPercent HumidityAvgPercent HumidityLowPercent \\\n", + "0 43 93 75 57 \n", + "1 28 93 68 43 \n", + "2 23 76 52 27 \n", + "3 21 89 56 22 \n", + "4 36 86 71 56 \n", + "\n", + " SeaLevelPressureHighInches SeaLevelPressureAvgInches \\\n", + "0 29.86 29.68 \n", + "1 30.41 30.13 \n", + "2 30.56 30.49 \n", + "3 30.56 30.45 \n", + "4 30.41 30.33 \n", + "\n", + " SeaLevelPressureLowInches VisibilityHighMiles VisibilityAvgMiles \\\n", + "0 29.59 10 7 \n", + "1 29.87 10 10 \n", + "2 30.41 10 10 \n", + "3 30.3 10 10 \n", + "4 30.27 10 10 \n", + "\n", + " VisibilityLowMiles WindHighMPH WindAvgMPH WindGustMPH \\\n", + "0 2 20 4 31 \n", + "1 5 16 6 25 \n", + "2 10 8 3 12 \n", + "3 7 12 4 20 \n", + "4 7 10 2 16 \n", + "\n", + " PrecipitationSumInches Events \n", + "0 0.46 Rain , Thunderstorm \n", + "1 0 \n", + "2 0 \n", + "3 0 \n", + "4 T " + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin.head()" ] }, { @@ -95,9 +766,9 @@ "source": [ "#### Your Insights:\n", "\n", - "1. There are 21 variables in the dataset. 3 of them are numeric and the rest contain some text.\n", + "1. There are 21 variables in the dataset. 3 of them are int and the rest are saved as object.\n", "\n", - "2. The average temperature in Austin ranged between around 70 degrees F and around 93 degrees F. The highest temperature observed during this period was 107 degrees F and the lowest was 19 degrees F.\n", + "2. The average temperature in Austin ranged between around 56 degrees F and around 93 degrees F. The highest temperature observed during this period was 107 degrees F and the lowest was 19 degrees F.\n", "\n", "3. When we look at the head function, we see that a lot of variables contain numeric data even though these columns are of object type. This means we might have to do some data cleansing.\n" ] @@ -113,20 +784,38 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 14, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "array(['67', '43', '31', '36', '44', '39', '41', '49', '51', '37', '55',\n", + " '54', '15', '29', '60', '64', '58', '28', '42', '22', '38', '45',\n", + " '19', '59', '62', '40', '17', '53', '34', '48', '52', '61', '63',\n", + " '33', '57', '65', '46', '32', '50', '27', '56', '47', '68', '69',\n", + " '66', '70', '73', '71', '76', '72', '75', '74', '-', '77', '23',\n", + " '35', '30', '79', '78', '80', '26', '18', '25', '13'], dtype=object)" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin[\"DewPointHighF\"].unique()\n" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 15, "metadata": {}, "outputs": [], "source": [ - "# Your observation here\n" + "# Your observation here\n", + "# There is a value of '-' in the DewPointHighF column. This is an incorrect value and might need to be removed, the rest are numerical values, so the column should be of type int or float." ] }, { @@ -140,7 +829,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 16, "metadata": {}, "outputs": [], "source": [ @@ -153,11 +842,12 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 17, "metadata": {}, "outputs": [], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin[wrong_type_columns] = austin[wrong_type_columns].apply(pd.to_numeric, errors='coerce')\n" ] }, { @@ -169,11 +859,44 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 18, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "Date object\n", + "TempHighF int64\n", + "TempAvgF int64\n", + "TempLowF int64\n", + "DewPointHighF float64\n", + "DewPointAvgF float64\n", + "DewPointLowF float64\n", + "HumidityHighPercent float64\n", + "HumidityAvgPercent float64\n", + "HumidityLowPercent float64\n", + "SeaLevelPressureHighInches float64\n", + "SeaLevelPressureAvgInches float64\n", + "SeaLevelPressureLowInches float64\n", + "VisibilityHighMiles float64\n", + "VisibilityAvgMiles float64\n", + "VisibilityLowMiles float64\n", + "WindHighMPH float64\n", + "WindAvgMPH float64\n", + "WindGustMPH float64\n", + "PrecipitationSumInches float64\n", + "Events object\n", + "dtype: object" + ] + }, + "execution_count": 18, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin.dtypes\n" ] }, { @@ -200,11 +923,1821 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 19, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "0 False\n", + "1 False\n", + "2 False\n", + "3 False\n", + "4 True\n", + " ... \n", + "1314 False\n", + "1315 False\n", + "1316 False\n", + "1317 False\n", + "1318 False\n", + "Length: 1319, dtype: bool" + ] + }, + "execution_count": 19, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "austin.isnull().any(axis=1)" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Date 0\n", + "TempHighF 0\n", + "TempAvgF 0\n", + "TempLowF 0\n", + "DewPointHighF 7\n", + "DewPointAvgF 7\n", + "DewPointLowF 7\n", + "HumidityHighPercent 2\n", + "HumidityAvgPercent 2\n", + "HumidityLowPercent 2\n", + "SeaLevelPressureHighInches 3\n", + "SeaLevelPressureAvgInches 3\n", + "SeaLevelPressureLowInches 3\n", + "VisibilityHighMiles 12\n", + "VisibilityAvgMiles 12\n", + "VisibilityLowMiles 12\n", + "WindHighMPH 2\n", + "WindAvgMPH 2\n", + "WindGustMPH 4\n", + "PrecipitationSumInches 124\n", + "Events 0\n", + "dtype: int64" + ] + }, + "execution_count": 20, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin.isnull().sum()" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "metadata": {}, + "outputs": [ + { + "data": { + "application/vnd.microsoft.datawrangler.viewer.v0+json": { + "columns": [ + { + "name": "index", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Date", + "rawType": "object", + "type": "string" + }, + { + "name": "TempHighF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempAvgF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempLowF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "DewPointHighF", + "rawType": "float64", + "type": "float" + }, + { + "name": "DewPointAvgF", + "rawType": "float64", + "type": "float" + }, + { + "name": "DewPointLowF", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityHighPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityAvgPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityLowPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureHighInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureAvgInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureLowInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityHighMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityAvgMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityLowMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindHighMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindAvgMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindGustMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "PrecipitationSumInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "Events", + "rawType": "object", + "type": "string" + } + ], + "conversionMethod": "pd.DataFrame", + "ref": "d8489bac-fb1c-4e06-87a5-b5ea754894af", + "rows": [ + [ + "4", + "2013-12-25", + "58", + "50", + "41", + "44.0", + "40.0", + "36.0", + "86.0", + "71.0", + "56.0", + "30.41", + "30.33", + "30.27", + "10.0", + "10.0", + "7.0", + "10.0", + "2.0", + "16.0", + null, + " " + ], + [ + "6", + "2013-12-27", + "60", + "53", + "45", + "41.0", + "39.0", + "37.0", + "83.0", + "65.0", + "47.0", + "30.46", + "30.39", + "30.34", + "10.0", + "9.0", + "7.0", + "7.0", + "1.0", + "11.0", + null, + " " + ], + [ + "7", + "2013-12-28", + "62", + "51", + "40", + "43.0", + "39.0", + "33.0", + "92.0", + "64.0", + "36.0", + "30.33", + "30.17", + "30.04", + "10.0", + "10.0", + "7.0", + "10.0", + "2.0", + "14.0", + null, + " " + ], + [ + "42", + "2014-02-01", + "76", + "66", + "55", + "62.0", + "59.0", + "41.0", + "81.0", + "71.0", + "60.0", + "29.91", + "29.81", + "29.75", + "10.0", + "10.0", + "9.0", + "14.0", + "6.0", + "26.0", + null, + "Rain" + ], + [ + "51", + "2014-02-10", + "60", + "48", + "35", + "49.0", + "36.0", + "30.0", + "82.0", + "74.0", + "66.0", + "30.23", + "30.15", + "30.02", + "10.0", + "8.0", + "4.0", + "15.0", + "9.0", + "23.0", + null, + "Rain" + ], + [ + "66", + "2014-02-25", + "71", + "62", + "52", + "65.0", + "60.0", + "47.0", + "93.0", + "85.0", + "77.0", + "30.06", + "30.01", + "29.95", + "10.0", + "4.0", + "1.0", + "12.0", + "5.0", + "20.0", + null, + "Rain" + ], + [ + "95", + "2014-03-26", + "66", + "60", + "54", + "55.0", + "47.0", + "30.0", + "78.0", + "57.0", + "36.0", + "30.2", + "30.08", + "29.95", + "10.0", + "10.0", + "6.0", + "22.0", + "10.0", + "33.0", + null, + "Rain" + ], + [ + "102", + "2014-04-02", + "82", + "76", + "70", + "69.0", + "67.0", + "63.0", + "97.0", + "78.0", + "58.0", + "29.9", + "29.8", + "29.69", + "10.0", + "9.0", + "4.0", + "16.0", + "9.0", + "30.0", + null, + "Rain" + ], + [ + "103", + "2014-04-03", + "82", + "77", + "71", + "69.0", + "67.0", + "66.0", + "90.0", + "74.0", + "58.0", + "29.81", + "29.74", + "29.66", + "10.0", + "8.0", + "5.0", + "14.0", + "7.0", + "25.0", + null, + " " + ], + [ + "104", + "2014-04-04", + "74", + "64", + "54", + "69.0", + "35.0", + "28.0", + "93.0", + "58.0", + "22.0", + "30.14", + "30.03", + "29.82", + "10.0", + "10.0", + "5.0", + "17.0", + "8.0", + "28.0", + null, + "Rain" + ], + [ + "105", + "2014-04-05", + "65", + "60", + "54", + "46.0", + "38.0", + "33.0", + "60.0", + "48.0", + "36.0", + "30.08", + "29.99", + "29.88", + "10.0", + "10.0", + "10.0", + "10.0", + "4.0", + "17.0", + null, + " " + ], + [ + "113", + "2014-04-13", + "78", + "73", + "68", + "68.0", + "66.0", + "61.0", + "90.0", + "79.0", + "67.0", + "29.85", + "29.76", + "29.62", + "10.0", + "9.0", + "8.0", + "18.0", + "7.0", + "29.0", + null, + " " + ], + [ + "126", + "2014-04-26", + "86", + "77", + "68", + "69.0", + "66.0", + "62.0", + "90.0", + "73.0", + "55.0", + "29.87", + "29.78", + "29.64", + "10.0", + "6.0", + "2.0", + "16.0", + "8.0", + "28.0", + null, + "Rain" + ], + [ + "139", + "2014-05-09", + "86", + "76", + "66", + "71.0", + "68.0", + "58.0", + "87.0", + "69.0", + "50.0", + "29.96", + "29.89", + "29.77", + "10.0", + "5.0", + "1.0", + "20.0", + "5.0", + "39.0", + null, + "Rain , Thunderstorm" + ], + [ + "152", + "2014-05-22", + "87", + "79", + "70", + "68.0", + "65.0", + "61.0", + "90.0", + "70.0", + "50.0", + "30.11", + "30.05", + "29.96", + "10.0", + "10.0", + "7.0", + "15.0", + "7.0", + "25.0", + null, + " " + ], + [ + "154", + "2014-05-24", + "86", + "78", + "70", + "70.0", + "68.0", + "66.0", + "97.0", + "79.0", + "61.0", + "30.06", + "29.99", + "29.89", + "10.0", + "9.0", + "7.0", + "15.0", + "7.0", + "23.0", + null, + " " + ], + [ + "155", + "2014-05-25", + "87", + "80", + "72", + "67.0", + "66.0", + "63.0", + "84.0", + "66.0", + "48.0", + "30.07", + "29.98", + "29.89", + "10.0", + "10.0", + "10.0", + "15.0", + "6.0", + "24.0", + null, + "Thunderstorm" + ], + [ + "164", + "2014-06-03", + "90", + "83", + "75", + "72.0", + "70.0", + "68.0", + "82.0", + "67.0", + "52.0", + "30.03", + "29.96", + "29.88", + "10.0", + "10.0", + "10.0", + "10.0", + "6.0", + "17.0", + null, + " " + ], + [ + "169", + "2014-06-08", + "90", + "83", + "76", + "72.0", + "70.0", + "64.0", + "87.0", + "67.0", + "46.0", + "29.99", + "29.88", + "29.76", + "10.0", + "10.0", + "5.0", + "16.0", + "7.0", + "27.0", + null, + "Rain" + ], + [ + "174", + "2014-06-13", + "89", + "79", + "68", + null, + null, + null, + "95.0", + "75.0", + "55.0", + "30.01", + "29.95", + "29.87", + null, + null, + null, + "15.0", + "4.0", + "22.0", + "0.0", + " " + ], + [ + "175", + "2014-06-14", + "87", + "92", + "73", + null, + null, + null, + "95.0", + "77.0", + "59.0", + "29.99", + "29.93", + "29.84", + null, + null, + null, + "15.0", + "6.0", + "22.0", + "0.0", + " " + ], + [ + "176", + "2014-06-15", + "91", + "83", + "74", + null, + null, + null, + null, + null, + null, + "29.98", + "29.9", + "29.87", + null, + null, + null, + "14.0", + "9.0", + "23.0", + "0.0", + " " + ], + [ + "177", + "2014-06-16", + "92", + "84", + "75", + null, + null, + null, + "94.0", + "72.0", + "49.0", + "30.05", + "29.99", + "29.93", + null, + null, + null, + "12.0", + "8.0", + "24.0", + null, + " " + ], + [ + "182", + "2014-06-21", + "92", + "84", + "75", + "74.0", + "72.0", + "68.0", + "94.0", + "72.0", + "49.0", + "30.07", + "29.99", + "29.87", + "10.0", + "10.0", + "8.0", + "15.0", + "6.0", + "21.0", + null, + " " + ], + [ + "183", + "2014-06-22", + "90", + "83", + "76", + "74.0", + "72.0", + "68.0", + "85.0", + "70.0", + "55.0", + "29.96", + "29.9", + "29.82", + "10.0", + "9.0", + "8.0", + "13.0", + "8.0", + "22.0", + null, + " " + ], + [ + "188", + "2014-06-27", + "91", + "83", + "75", + "74.0", + "72.0", + "70.0", + "88.0", + "69.0", + "49.0", + "29.93", + "29.87", + "29.79", + "10.0", + "10.0", + "8.0", + "17.0", + "8.0", + "32.0", + null, + " " + ], + [ + "189", + "2014-06-28", + "93", + "86", + "78", + "74.0", + "73.0", + "71.0", + "85.0", + "69.0", + "52.0", + "29.97", + "29.88", + "29.83", + "10.0", + "10.0", + "8.0", + "16.0", + "9.0", + "27.0", + null, + " " + ], + [ + "248", + "2014-08-26", + "101", + "89", + "77", + "71.0", + "68.0", + "62.0", + "71.0", + "52.0", + "33.0", + "29.98", + "29.93", + "29.89", + "10.0", + "10.0", + "8.0", + "14.0", + "4.0", + "23.0", + null, + "Rain , Thunderstorm" + ], + [ + "278", + "2014-09-25", + "83", + "73", + "62", + "66.0", + "62.0", + "57.0", + "90.0", + "74.0", + "58.0", + "30.14", + "30.1", + "30.07", + "10.0", + "10.0", + "8.0", + "13.0", + "3.0", + "20.0", + null, + " " + ], + [ + "280", + "2014-09-27", + "80", + "74", + "68", + "69.0", + "66.0", + "64.0", + "93.0", + "78.0", + "62.0", + "30.05", + "30.0", + "29.95", + "10.0", + "10.0", + "8.0", + "9.0", + "2.0", + "14.0", + null, + "Rain" + ], + [ + "292", + "2014-10-09", + "92", + "84", + "75", + "73.0", + "71.0", + "66.0", + "94.0", + "69.0", + "44.0", + "30.01", + "29.93", + "29.83", + "10.0", + "10.0", + "9.0", + "14.0", + "7.0", + "22.0", + null, + "Rain" + ], + [ + "305", + "2014-10-22", + "83", + "72", + "61", + "62.0", + "59.0", + "56.0", + "84.0", + "67.0", + "49.0", + "30.12", + "30.06", + "30.03", + "10.0", + "10.0", + "10.0", + "9.0", + "2.0", + "14.0", + null, + "Rain" + ], + [ + "306", + "2014-10-23", + "83", + "75", + "66", + "62.0", + "59.0", + "57.0", + "81.0", + "64.0", + "46.0", + "30.14", + "30.09", + "30.04", + "10.0", + "10.0", + "10.0", + "8.0", + "2.0", + "11.0", + null, + "Rain" + ], + [ + "313", + "2014-10-30", + "82", + "73", + "63", + "61.0", + "59.0", + "54.0", + "93.0", + "72.0", + "51.0", + "30.18", + "30.1", + "30.03", + "10.0", + "10.0", + "9.0", + "8.0", + "2.0", + "10.0", + null, + "Rain" + ], + [ + "317", + "2014-11-03", + "76", + "68", + "59", + "63.0", + "59.0", + "52.0", + "84.0", + "72.0", + "60.0", + "30.18", + "30.12", + "30.07", + "10.0", + "10.0", + "10.0", + "14.0", + "6.0", + "23.0", + null, + " " + ], + [ + "356", + "2014-12-12", + "71", + "65", + "59", + "58.0", + "57.0", + "56.0", + "90.0", + "78.0", + "66.0", + "30.3", + "30.23", + "30.18", + "10.0", + "10.0", + "9.0", + "12.0", + "5.0", + "17.0", + null, + "Rain" + ], + [ + "362", + "2014-12-18", + "60", + "55", + "49", + "56.0", + "51.0", + "48.0", + "100.0", + "92.0", + "84.0", + "30.14", + "30.1", + "30.06", + "10.0", + "4.0", + "1.0", + "12.0", + "3.0", + "17.0", + null, + " " + ], + [ + "367", + "2014-12-23", + "59", + "51", + "43", + "44.0", + "40.0", + "34.0", + "77.0", + "66.0", + "55.0", + "30.02", + "29.81", + "29.63", + "10.0", + "10.0", + "10.0", + "18.0", + "8.0", + "31.0", + null, + "Rain" + ], + [ + "375", + "2014-12-31", + "42", + "39", + "36", + "31.0", + "29.0", + "27.0", + "76.0", + "70.0", + "64.0", + "30.57", + "30.48", + "30.41", + "10.0", + "10.0", + "9.0", + "14.0", + "8.0", + "21.0", + null, + " " + ], + [ + "383", + "2015-01-08", + "36", + "30", + "23", + "23.0", + "12.0", + "5.0", + "56.0", + "48.0", + "39.0", + "30.79", + "30.54", + "30.3", + "10.0", + "10.0", + "10.0", + "15.0", + "5.0", + "23.0", + null, + "Rain" + ], + [ + "404", + "2015-01-29", + "79", + "66", + "52", + "55.0", + "49.0", + "34.0", + "100.0", + "68.0", + "35.0", + "30.39", + "30.22", + "30.12", + "10.0", + "10.0", + "6.0", + "16.0", + "4.0", + "25.0", + null, + " " + ], + [ + "405", + "2015-01-30", + "58", + "53", + "48", + "39.0", + "36.0", + "33.0", + "63.0", + "52.0", + "40.0", + "30.46", + "30.37", + "30.28", + "10.0", + "10.0", + "10.0", + "14.0", + "6.0", + "23.0", + null, + "Rain" + ], + [ + "411", + "2015-02-05", + "52", + "45", + "38", + "48.0", + "35.0", + "31.0", + "92.0", + "77.0", + "62.0", + "30.48", + "30.38", + "30.22", + "10.0", + "10.0", + "5.0", + "16.0", + "7.0", + "26.0", + null, + " " + ], + [ + "421", + "2015-02-15", + "68", + "63", + "57", + "62.0", + "58.0", + "52.0", + "87.0", + "80.0", + "73.0", + "30.15", + "30.02", + "29.88", + "10.0", + "10.0", + "7.0", + "10.0", + "5.0", + "19.0", + null, + " " + ], + [ + "441", + "2015-03-07", + "60", + "49", + "38", + "37.0", + "30.0", + "24.0", + "82.0", + "56.0", + "29.0", + "30.5", + "30.4", + "30.27", + "10.0", + "10.0", + "10.0", + "10.0", + "2.0", + "13.0", + null, + " " + ], + [ + "466", + "2015-04-01", + "83", + "76", + "68", + "67.0", + "65.0", + "61.0", + "90.0", + "71.0", + "51.0", + "29.98", + "29.92", + "29.83", + "10.0", + "9.0", + "4.0", + "14.0", + "7.0", + "25.0", + null, + "Rain" + ], + [ + "473", + "2015-04-08", + "79", + "74", + "69", + "69.0", + "67.0", + "65.0", + "90.0", + "81.0", + "71.0", + "30.0", + "29.92", + "29.83", + "10.0", + "9.0", + "6.0", + "16.0", + "8.0", + "29.0", + null, + " " + ], + [ + "476", + "2015-04-11", + "70", + "65", + "59", + "66.0", + "62.0", + "53.0", + "100.0", + "86.0", + "72.0", + "30.12", + "30.04", + "29.96", + "10.0", + "5.0", + "1.0", + "7.0", + "3.0", + "12.0", + null, + "Rain" + ], + [ + "487", + "2015-04-22", + "81", + "74", + "67", + "68.0", + "65.0", + "63.0", + "93.0", + "79.0", + "64.0", + "29.95", + "29.89", + "29.81", + "10.0", + "10.0", + "7.0", + "16.0", + "7.0", + "23.0", + null, + " " + ], + [ + "514", + "2015-05-19", + "89", + "82", + "74", + "75.0", + "72.0", + "69.0", + "87.0", + "73.0", + "59.0", + "30.06", + "29.99", + "29.86", + "10.0", + "8.0", + "5.0", + "17.0", + "8.0", + "28.0", + null, + "Rain" + ] + ], + "shape": { + "columns": 21, + "rows": 136 + } + }, + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
DateTempHighFTempAvgFTempLowFDewPointHighFDewPointAvgFDewPointLowFHumidityHighPercentHumidityAvgPercentHumidityLowPercentSeaLevelPressureHighInchesSeaLevelPressureAvgInchesSeaLevelPressureLowInchesVisibilityHighMilesVisibilityAvgMilesVisibilityLowMilesWindHighMPHWindAvgMPHWindGustMPHPrecipitationSumInchesEvents
42013-12-2558504144.040.036.086.071.056.030.4130.3330.2710.010.07.010.02.016.0NaN
62013-12-2760534541.039.037.083.065.047.030.4630.3930.3410.09.07.07.01.011.0NaN
72013-12-2862514043.039.033.092.064.036.030.3330.1730.0410.010.07.010.02.014.0NaN
422014-02-0176665562.059.041.081.071.060.029.9129.8129.7510.010.09.014.06.026.0NaNRain
512014-02-1060483549.036.030.082.074.066.030.2330.1530.0210.08.04.015.09.023.0NaNRain
..................................................................
12692017-06-1294857572.068.062.087.062.036.029.9629.8929.8110.010.02.015.07.022.0NaNRain
12882017-07-0198897976.072.066.085.062.038.030.1330.0229.9210.09.06.015.07.024.0NaN
13042017-07-1798887775.071.066.088.063.038.029.9429.9029.8410.010.010.016.03.023.0NaNRain , Thunderstorm
13082017-07-21104917774.068.061.085.056.027.030.0129.9529.8610.010.010.014.05.024.0NaN
13132017-07-26103917875.070.061.091.058.025.030.1330.0329.9310.010.010.015.06.027.0NaN
\n", + "

136 rows × 21 columns

\n", + "
" + ], + "text/plain": [ + " Date TempHighF TempAvgF TempLowF DewPointHighF DewPointAvgF \\\n", + "4 2013-12-25 58 50 41 44.0 40.0 \n", + "6 2013-12-27 60 53 45 41.0 39.0 \n", + "7 2013-12-28 62 51 40 43.0 39.0 \n", + "42 2014-02-01 76 66 55 62.0 59.0 \n", + "51 2014-02-10 60 48 35 49.0 36.0 \n", + "... ... ... ... ... ... ... \n", + "1269 2017-06-12 94 85 75 72.0 68.0 \n", + "1288 2017-07-01 98 89 79 76.0 72.0 \n", + "1304 2017-07-17 98 88 77 75.0 71.0 \n", + "1308 2017-07-21 104 91 77 74.0 68.0 \n", + "1313 2017-07-26 103 91 78 75.0 70.0 \n", + "\n", + " DewPointLowF HumidityHighPercent HumidityAvgPercent \\\n", + "4 36.0 86.0 71.0 \n", + "6 37.0 83.0 65.0 \n", + "7 33.0 92.0 64.0 \n", + "42 41.0 81.0 71.0 \n", + "51 30.0 82.0 74.0 \n", + "... ... ... ... \n", + "1269 62.0 87.0 62.0 \n", + "1288 66.0 85.0 62.0 \n", + "1304 66.0 88.0 63.0 \n", + "1308 61.0 85.0 56.0 \n", + "1313 61.0 91.0 58.0 \n", + "\n", + " HumidityLowPercent SeaLevelPressureHighInches \\\n", + "4 56.0 30.41 \n", + "6 47.0 30.46 \n", + "7 36.0 30.33 \n", + "42 60.0 29.91 \n", + "51 66.0 30.23 \n", + "... ... ... \n", + "1269 36.0 29.96 \n", + "1288 38.0 30.13 \n", + "1304 38.0 29.94 \n", + "1308 27.0 30.01 \n", + "1313 25.0 30.13 \n", + "\n", + " SeaLevelPressureAvgInches SeaLevelPressureLowInches \\\n", + "4 30.33 30.27 \n", + "6 30.39 30.34 \n", + "7 30.17 30.04 \n", + "42 29.81 29.75 \n", + "51 30.15 30.02 \n", + "... ... ... \n", + "1269 29.89 29.81 \n", + "1288 30.02 29.92 \n", + "1304 29.90 29.84 \n", + "1308 29.95 29.86 \n", + "1313 30.03 29.93 \n", + "\n", + " VisibilityHighMiles VisibilityAvgMiles VisibilityLowMiles \\\n", + "4 10.0 10.0 7.0 \n", + "6 10.0 9.0 7.0 \n", + "7 10.0 10.0 7.0 \n", + "42 10.0 10.0 9.0 \n", + "51 10.0 8.0 4.0 \n", + "... ... ... ... \n", + "1269 10.0 10.0 2.0 \n", + "1288 10.0 9.0 6.0 \n", + "1304 10.0 10.0 10.0 \n", + "1308 10.0 10.0 10.0 \n", + "1313 10.0 10.0 10.0 \n", + "\n", + " WindHighMPH WindAvgMPH WindGustMPH PrecipitationSumInches \\\n", + "4 10.0 2.0 16.0 NaN \n", + "6 7.0 1.0 11.0 NaN \n", + "7 10.0 2.0 14.0 NaN \n", + "42 14.0 6.0 26.0 NaN \n", + "51 15.0 9.0 23.0 NaN \n", + "... ... ... ... ... \n", + "1269 15.0 7.0 22.0 NaN \n", + "1288 15.0 7.0 24.0 NaN \n", + "1304 16.0 3.0 23.0 NaN \n", + "1308 14.0 5.0 24.0 NaN \n", + "1313 15.0 6.0 27.0 NaN \n", + "\n", + " Events \n", + "4 \n", + "6 \n", + "7 \n", + "42 Rain \n", + "51 Rain \n", + "... ... \n", + "1269 Rain \n", + "1288 \n", + "1304 Rain , Thunderstorm \n", + "1308 \n", + "1313 \n", + "\n", + "[136 rows x 21 columns]" + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "missing_values = austin[austin.isnull().any(axis=1)]\n", + "missing_values" ] }, { @@ -233,11 +2766,22 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 22, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "1319\n", + "136\n" + ] + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "print(austin.shape[0])\n", + "print(missing_values.shape[0])\n" ] }, { @@ -249,11 +2793,24 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 23, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "0.10310841546626232" + ] + }, + "execution_count": 23, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "ratio_missing_values = missing_values.shape[0] / austin.shape[0]\n", + "ratio_missing_values\n" ] }, { @@ -267,11 +2824,45 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 24, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "Date 0\n", + "TempHighF 0\n", + "TempAvgF 0\n", + "TempLowF 0\n", + "DewPointHighF 7\n", + "DewPointAvgF 7\n", + "DewPointLowF 7\n", + "HumidityHighPercent 2\n", + "HumidityAvgPercent 2\n", + "HumidityLowPercent 2\n", + "SeaLevelPressureHighInches 3\n", + "SeaLevelPressureAvgInches 3\n", + "SeaLevelPressureLowInches 3\n", + "VisibilityHighMiles 12\n", + "VisibilityAvgMiles 12\n", + "VisibilityLowMiles 12\n", + "WindHighMPH 2\n", + "WindAvgMPH 2\n", + "WindGustMPH 4\n", + "PrecipitationSumInches 124\n", + "Events 0\n", + "dtype: int64" + ] + }, + "execution_count": 24, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "\n", + "austin.isna().sum()\n" ] }, { @@ -283,11 +2874,24 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 25, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "np.float64(0.09401061410159212)" + ] + }, + "execution_count": 25, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "ratio_missing_values_precip = austin['PrecipitationSumInches'].isna().sum() / austin.shape[0]\n", + "ratio_missing_values_precip\n" ] }, { @@ -309,12 +2913,1668 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 26, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "application/vnd.microsoft.datawrangler.viewer.v0+json": { + "columns": [ + { + "name": "index", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Date", + "rawType": "object", + "type": "string" + }, + { + "name": "TempHighF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempAvgF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempLowF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "DewPointHighF", + "rawType": "float64", + "type": "float" + }, + { + "name": "DewPointAvgF", + "rawType": "float64", + "type": "float" + }, + { + "name": "DewPointLowF", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityHighPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityAvgPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityLowPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureHighInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureAvgInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureLowInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityHighMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityAvgMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityLowMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindHighMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindAvgMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindGustMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "Events", + "rawType": "object", + "type": "string" + } + ], + "conversionMethod": "pd.DataFrame", + "ref": "48ee801a-7650-4576-92ee-d0e0a8b865f8", + "rows": [ + [ + "0", + "2013-12-21", + "74", + "60", + "45", + "67.0", + "49.0", + "43.0", + "93.0", + "75.0", + "57.0", + "29.86", + "29.68", + "29.59", + "10.0", + "7.0", + "2.0", + "20.0", + "4.0", + "31.0", + "Rain , Thunderstorm" + ], + [ + "1", + "2013-12-22", + "56", + "48", + "39", + "43.0", + "36.0", + "28.0", + "93.0", + "68.0", + "43.0", + "30.41", + "30.13", + "29.87", + "10.0", + "10.0", + "5.0", + "16.0", + "6.0", + "25.0", + " " + ], + [ + "2", + "2013-12-23", + "58", + "45", + "32", + "31.0", + "27.0", + "23.0", + "76.0", + "52.0", + "27.0", + "30.56", + "30.49", + "30.41", + "10.0", + "10.0", + "10.0", + "8.0", + "3.0", + "12.0", + " " + ], + [ + "3", + "2013-12-24", + "61", + "46", + "31", + "36.0", + "28.0", + "21.0", + "89.0", + "56.0", + "22.0", + "30.56", + "30.45", + "30.3", + "10.0", + "10.0", + "7.0", + "12.0", + "4.0", + "20.0", + " " + ], + [ + "4", + "2013-12-25", + "58", + "50", + "41", + "44.0", + "40.0", + "36.0", + "86.0", + "71.0", + "56.0", + "30.41", + "30.33", + "30.27", + "10.0", + "10.0", + "7.0", + "10.0", + "2.0", + "16.0", + " " + ], + [ + "5", + "2013-12-26", + "57", + "48", + "39", + "39.0", + "36.0", + "33.0", + "79.0", + "63.0", + "47.0", + "30.47", + "30.4", + "30.34", + "10.0", + "9.0", + "7.0", + "12.0", + "3.0", + "17.0", + " " + ], + [ + "6", + "2013-12-27", + "60", + "53", + "45", + "41.0", + "39.0", + "37.0", + "83.0", + "65.0", + "47.0", + "30.46", + "30.39", + "30.34", + "10.0", + "9.0", + "7.0", + "7.0", + "1.0", + "11.0", + " " + ], + [ + "7", + "2013-12-28", + "62", + "51", + "40", + "43.0", + "39.0", + "33.0", + "92.0", + "64.0", + "36.0", + "30.33", + "30.17", + "30.04", + "10.0", + "10.0", + "7.0", + "10.0", + "2.0", + "14.0", + " " + ], + [ + "8", + "2013-12-29", + "64", + "50", + "36", + "49.0", + "41.0", + "28.0", + "92.0", + "76.0", + "60.0", + "30.31", + "30.1", + "29.99", + "10.0", + "10.0", + "4.0", + "17.0", + "5.0", + "24.0", + " " + ], + [ + "9", + "2013-12-30", + "44", + "40", + "35", + "31.0", + "26.0", + "21.0", + "75.0", + "60.0", + "45.0", + "30.44", + "30.33", + "30.26", + "10.0", + "10.0", + "10.0", + "13.0", + "5.0", + "21.0", + " " + ], + [ + "10", + "2013-12-31", + "55", + "46", + "36", + "31.0", + "28.0", + "23.0", + "76.0", + "54.0", + "32.0", + "30.49", + "30.39", + "30.27", + "10.0", + "10.0", + "10.0", + "8.0", + "1.0", + "12.0", + " " + ], + [ + "11", + "2014-01-01", + "69", + "54", + "39", + "51.0", + "42.0", + "30.0", + "83.0", + "68.0", + "52.0", + "30.25", + "30.11", + "30.01", + "10.0", + "10.0", + "8.0", + "13.0", + "4.0", + "22.0", + " " + ], + [ + "12", + "2014-01-02", + "55", + "44", + "33", + "39.0", + "26.0", + "19.0", + "83.0", + "55.0", + "26.0", + "30.49", + "30.37", + "30.15", + "10.0", + "10.0", + "9.0", + "21.0", + "8.0", + "31.0", + " " + ], + [ + "13", + "2014-01-03", + "58", + "43", + "28", + "37.0", + "22.0", + "18.0", + "75.0", + "49.0", + "22.0", + "30.48", + "30.35", + "30.14", + "10.0", + "10.0", + "10.0", + "14.0", + "4.0", + "21.0", + " " + ], + [ + "14", + "2014-01-04", + "71", + "57", + "42", + "55.0", + "48.0", + "38.0", + "89.0", + "68.0", + "47.0", + "30.12", + "29.95", + "29.81", + "10.0", + "10.0", + "8.0", + "16.0", + "7.0", + "28.0", + " " + ], + [ + "15", + "2014-01-05", + "59", + "47", + "34", + "54.0", + "32.0", + "15.0", + "87.0", + "59.0", + "31.0", + "30.48", + "30.08", + "29.79", + "10.0", + "10.0", + "4.0", + "21.0", + "10.0", + "34.0", + " " + ], + [ + "16", + "2014-01-06", + "36", + "29", + "22", + "15.0", + "8.0", + "2.0", + "50.0", + "38.0", + "26.0", + "30.8", + "30.68", + "30.5", + "10.0", + "10.0", + "10.0", + "17.0", + "7.0", + "27.0", + " " + ], + [ + "17", + "2014-01-07", + "48", + "35", + "22", + "29.0", + "11.0", + "4.0", + "68.0", + "43.0", + "17.0", + "30.66", + "30.52", + "30.36", + "10.0", + "10.0", + "10.0", + "13.0", + "5.0", + "22.0", + " " + ], + [ + "18", + "2014-01-08", + "53", + "47", + "40", + "51.0", + "45.0", + "30.0", + "93.0", + "75.0", + "57.0", + "30.33", + "30.2", + "30.12", + "10.0", + "2.0", + "1.0", + "12.0", + "1.0", + "18.0", + "Rain" + ], + [ + "19", + "2014-01-09", + "70", + "62", + "53", + "60.0", + "55.0", + "50.0", + "93.0", + "80.0", + "66.0", + "30.18", + "30.11", + "30.0", + "10.0", + "4.0", + "0.0", + "12.0", + "3.0", + "19.0", + "Fog" + ], + [ + "20", + "2014-01-10", + "72", + "65", + "57", + "64.0", + "61.0", + "54.0", + "93.0", + "81.0", + "68.0", + "29.97", + "29.87", + "29.75", + "10.0", + "8.0", + "1.0", + "13.0", + "6.0", + "21.0", + "Rain" + ], + [ + "21", + "2014-01-11", + "75", + "62", + "48", + "54.0", + "37.0", + "20.0", + "93.0", + "53.0", + "13.0", + "30.16", + "30.06", + "29.87", + "10.0", + "9.0", + "5.0", + "12.0", + "3.0", + "19.0", + " " + ], + [ + "22", + "2014-01-12", + "67", + "57", + "46", + "58.0", + "47.0", + "33.0", + "84.0", + "68.0", + "52.0", + "30.12", + "30.01", + "29.9", + "10.0", + "10.0", + "10.0", + "15.0", + "4.0", + "24.0", + "Rain" + ], + [ + "23", + "2014-01-13", + "71", + "57", + "43", + "60.0", + "36.0", + "17.0", + "87.0", + "51.0", + "14.0", + "30.16", + "30.01", + "29.86", + "10.0", + "9.0", + "7.0", + "17.0", + "7.0", + "29.0", + " " + ], + [ + "24", + "2014-01-14", + "76", + "57", + "37", + "31.0", + "25.0", + "20.0", + "70.0", + "41.0", + "12.0", + "30.34", + "30.13", + "30.01", + "10.0", + "10.0", + "10.0", + "16.0", + "5.0", + "29.0", + " " + ], + [ + "25", + "2014-01-15", + "64", + "52", + "40", + "29.0", + "23.0", + "16.0", + "49.0", + "35.0", + "21.0", + "30.47", + "30.33", + "30.17", + "10.0", + "10.0", + "10.0", + "14.0", + "4.0", + "21.0", + " " + ], + [ + "26", + "2014-01-16", + "72", + "56", + "40", + "31.0", + "27.0", + "23.0", + "55.0", + "38.0", + "20.0", + "30.21", + "30.13", + "30.06", + "10.0", + "10.0", + "10.0", + "14.0", + "4.0", + "20.0", + " " + ], + [ + "27", + "2014-01-17", + "64", + "54", + "43", + "31.0", + "20.0", + "15.0", + "45.0", + "31.0", + "17.0", + "30.37", + "30.29", + "30.21", + "10.0", + "10.0", + "9.0", + "14.0", + "5.0", + "21.0", + " " + ], + [ + "28", + "2014-01-18", + "70", + "54", + "37", + "41.0", + "33.0", + "23.0", + "59.0", + "45.0", + "31.0", + "30.26", + "30.19", + "30.1", + "10.0", + "10.0", + "10.0", + "12.0", + "2.0", + "19.0", + " " + ], + [ + "29", + "2014-01-19", + "72", + "59", + "45", + "41.0", + "30.0", + "18.0", + "64.0", + "39.0", + "14.0", + "30.35", + "30.22", + "30.12", + "10.0", + "10.0", + "10.0", + "9.0", + "3.0", + "16.0", + " " + ], + [ + "30", + "2014-01-20", + "82", + "64", + "46", + "51.0", + "36.0", + "23.0", + "71.0", + "44.0", + "17.0", + "30.16", + "30.0", + "29.85", + "10.0", + "10.0", + "10.0", + "16.0", + "5.0", + "26.0", + " " + ], + [ + "31", + "2014-01-21", + "63", + "51", + "38", + "28.0", + "23.0", + "19.0", + "59.0", + "39.0", + "19.0", + "30.43", + "30.31", + "30.19", + "10.0", + "10.0", + "10.0", + "15.0", + "6.0", + "25.0", + " " + ], + [ + "32", + "2014-01-22", + "70", + "54", + "37", + "39.0", + "27.0", + "24.0", + "70.0", + "45.0", + "19.0", + "30.23", + "30.11", + "30.01", + "10.0", + "10.0", + "10.0", + "12.0", + "4.0", + "18.0", + " " + ], + [ + "33", + "2014-01-23", + "56", + "42", + "27", + "42.0", + "29.0", + "20.0", + "78.0", + "64.0", + "50.0", + "30.73", + "30.47", + "30.06", + "10.0", + "8.0", + "2.0", + "20.0", + "9.0", + "31.0", + "Rain , Snow" + ], + [ + "34", + "2014-01-24", + "40", + "33", + "26", + "22.0", + "17.0", + "10.0", + "81.0", + "60.0", + "39.0", + "30.76", + "30.63", + "30.4", + "10.0", + "9.0", + "3.0", + "16.0", + "5.0", + "24.0", + " " + ], + [ + "35", + "2014-01-25", + "70", + "48", + "26", + "38.0", + "27.0", + "22.0", + "85.0", + "53.0", + "20.0", + "30.38", + "30.19", + "30.02", + "10.0", + "10.0", + "8.0", + "8.0", + "1.0", + "14.0", + " " + ], + [ + "36", + "2014-01-26", + "76", + "60", + "43", + "45.0", + "39.0", + "33.0", + "76.0", + "52.0", + "27.0", + "30.0", + "29.84", + "29.69", + "10.0", + "10.0", + "10.0", + "12.0", + "3.0", + "20.0", + " " + ], + [ + "37", + "2014-01-27", + "60", + "47", + "34", + "43.0", + "23.0", + "5.0", + "66.0", + "44.0", + "21.0", + "30.28", + "30.09", + "29.81", + "10.0", + "10.0", + "10.0", + "21.0", + "9.0", + "32.0", + "Rain" + ], + [ + "38", + "2014-01-28", + "39", + "33", + "27", + "19.0", + "14.0", + "7.0", + "69.0", + "48.0", + "27.0", + "30.51", + "30.4", + "30.27", + "10.0", + "10.0", + "10.0", + "15.0", + "6.0", + "23.0", + "Rain" + ], + [ + "39", + "2014-01-29", + "49", + "38", + "27", + "19.0", + "13.0", + "9.0", + "63.0", + "42.0", + "21.0", + "30.52", + "30.41", + "30.29", + "10.0", + "10.0", + "10.0", + "15.0", + "5.0", + "23.0", + " " + ], + [ + "40", + "2014-01-30", + "65", + "48", + "31", + "51.0", + "36.0", + "20.0", + "80.0", + "64.0", + "48.0", + "30.26", + "30.06", + "29.9", + "10.0", + "10.0", + "10.0", + "15.0", + "7.0", + "27.0", + " " + ], + [ + "41", + "2014-01-31", + "80", + "68", + "55", + "59.0", + "54.0", + "51.0", + "86.0", + "64.0", + "42.0", + "29.96", + "29.87", + "29.79", + "10.0", + "10.0", + "9.0", + "14.0", + "9.0", + "25.0", + " " + ], + [ + "42", + "2014-02-01", + "76", + "66", + "55", + "62.0", + "59.0", + "41.0", + "81.0", + "71.0", + "60.0", + "29.91", + "29.81", + "29.75", + "10.0", + "10.0", + "9.0", + "14.0", + "6.0", + "26.0", + "Rain" + ], + [ + "43", + "2014-02-02", + "55", + "45", + "35", + "40.0", + "33.0", + "27.0", + "79.0", + "69.0", + "59.0", + "30.27", + "30.09", + "29.9", + "10.0", + "8.0", + "4.0", + "18.0", + "11.0", + "29.0", + "Rain" + ], + [ + "44", + "2014-02-03", + "46", + "40", + "34", + "38.0", + "33.0", + "28.0", + "82.0", + "74.0", + "65.0", + "30.28", + "30.17", + "29.98", + "10.0", + "6.0", + "3.0", + "13.0", + "6.0", + "17.0", + " " + ], + [ + "45", + "2014-02-04", + "64", + "53", + "42", + "45.0", + "41.0", + "39.0", + "89.0", + "68.0", + "46.0", + "30.11", + "29.95", + "29.87", + "10.0", + "6.0", + "2.0", + "10.0", + "2.0", + "18.0", + "Rain" + ], + [ + "46", + "2014-02-05", + "48", + "40", + "31", + "42.0", + "26.0", + "16.0", + "80.0", + "60.0", + "39.0", + "30.5", + "30.37", + "30.13", + "10.0", + "10.0", + "10.0", + "16.0", + "10.0", + "24.0", + " " + ], + [ + "47", + "2014-02-06", + "32", + "29", + "26", + "17.0", + "15.0", + "13.0", + "58.0", + "54.0", + "49.0", + "30.57", + "30.48", + "30.42", + "10.0", + "10.0", + "10.0", + "15.0", + "8.0", + "23.0", + " " + ], + [ + "48", + "2014-02-07", + "38", + "34", + "29", + "29.0", + "24.0", + "17.0", + "78.0", + "68.0", + "58.0", + "30.41", + "30.32", + "30.24", + "10.0", + "7.0", + "2.0", + "8.0", + "3.0", + "12.0", + " " + ], + [ + "49", + "2014-02-08", + "65", + "51", + "37", + "42.0", + "36.0", + "29.0", + "85.0", + "63.0", + "40.0", + "30.26", + "30.17", + "30.03", + "10.0", + "7.0", + "3.0", + "14.0", + "5.0", + "21.0", + " " + ] + ], + "shape": { + "columns": 20, + "rows": 1319 + } + }, + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
DateTempHighFTempAvgFTempLowFDewPointHighFDewPointAvgFDewPointLowFHumidityHighPercentHumidityAvgPercentHumidityLowPercentSeaLevelPressureHighInchesSeaLevelPressureAvgInchesSeaLevelPressureLowInchesVisibilityHighMilesVisibilityAvgMilesVisibilityLowMilesWindHighMPHWindAvgMPHWindGustMPHEvents
02013-12-2174604567.049.043.093.075.057.029.8629.6829.5910.07.02.020.04.031.0Rain , Thunderstorm
12013-12-2256483943.036.028.093.068.043.030.4130.1329.8710.010.05.016.06.025.0
22013-12-2358453231.027.023.076.052.027.030.5630.4930.4110.010.010.08.03.012.0
32013-12-2461463136.028.021.089.056.022.030.5630.4530.3010.010.07.012.04.020.0
42013-12-2558504144.040.036.086.071.056.030.4130.3330.2710.010.07.010.02.016.0
...............................................................
13142017-07-27103897571.067.061.082.054.025.030.0429.9729.8810.010.010.012.05.021.0
13152017-07-28105917671.064.055.087.054.020.029.9729.9029.8110.010.010.014.05.020.0
13162017-07-29107927772.064.055.082.051.019.029.9129.8629.7910.010.010.012.04.017.0
13172017-07-30106937970.068.063.069.048.027.029.9629.9129.8710.010.010.013.04.020.0
13182017-07-3199887766.061.054.064.043.022.030.0429.9729.9110.010.010.012.04.020.0
\n", + "

1319 rows × 20 columns

\n", + "
" + ], + "text/plain": [ + " Date TempHighF TempAvgF TempLowF DewPointHighF DewPointAvgF \\\n", + "0 2013-12-21 74 60 45 67.0 49.0 \n", + "1 2013-12-22 56 48 39 43.0 36.0 \n", + "2 2013-12-23 58 45 32 31.0 27.0 \n", + "3 2013-12-24 61 46 31 36.0 28.0 \n", + "4 2013-12-25 58 50 41 44.0 40.0 \n", + "... ... ... ... ... ... ... \n", + "1314 2017-07-27 103 89 75 71.0 67.0 \n", + "1315 2017-07-28 105 91 76 71.0 64.0 \n", + "1316 2017-07-29 107 92 77 72.0 64.0 \n", + "1317 2017-07-30 106 93 79 70.0 68.0 \n", + "1318 2017-07-31 99 88 77 66.0 61.0 \n", + "\n", + " DewPointLowF HumidityHighPercent HumidityAvgPercent \\\n", + "0 43.0 93.0 75.0 \n", + "1 28.0 93.0 68.0 \n", + "2 23.0 76.0 52.0 \n", + "3 21.0 89.0 56.0 \n", + "4 36.0 86.0 71.0 \n", + "... ... ... ... \n", + "1314 61.0 82.0 54.0 \n", + "1315 55.0 87.0 54.0 \n", + "1316 55.0 82.0 51.0 \n", + "1317 63.0 69.0 48.0 \n", + "1318 54.0 64.0 43.0 \n", + "\n", + " HumidityLowPercent SeaLevelPressureHighInches \\\n", + "0 57.0 29.86 \n", + "1 43.0 30.41 \n", + "2 27.0 30.56 \n", + "3 22.0 30.56 \n", + "4 56.0 30.41 \n", + "... ... ... \n", + "1314 25.0 30.04 \n", + "1315 20.0 29.97 \n", + "1316 19.0 29.91 \n", + "1317 27.0 29.96 \n", + "1318 22.0 30.04 \n", + "\n", + " SeaLevelPressureAvgInches SeaLevelPressureLowInches \\\n", + "0 29.68 29.59 \n", + "1 30.13 29.87 \n", + "2 30.49 30.41 \n", + "3 30.45 30.30 \n", + "4 30.33 30.27 \n", + "... ... ... \n", + "1314 29.97 29.88 \n", + "1315 29.90 29.81 \n", + "1316 29.86 29.79 \n", + "1317 29.91 29.87 \n", + "1318 29.97 29.91 \n", + "\n", + " VisibilityHighMiles VisibilityAvgMiles VisibilityLowMiles \\\n", + "0 10.0 7.0 2.0 \n", + "1 10.0 10.0 5.0 \n", + "2 10.0 10.0 10.0 \n", + "3 10.0 10.0 7.0 \n", + "4 10.0 10.0 7.0 \n", + "... ... ... ... \n", + "1314 10.0 10.0 10.0 \n", + "1315 10.0 10.0 10.0 \n", + "1316 10.0 10.0 10.0 \n", + "1317 10.0 10.0 10.0 \n", + "1318 10.0 10.0 10.0 \n", + "\n", + " WindHighMPH WindAvgMPH WindGustMPH Events \n", + "0 20.0 4.0 31.0 Rain , Thunderstorm \n", + "1 16.0 6.0 25.0 \n", + "2 8.0 3.0 12.0 \n", + "3 12.0 4.0 20.0 \n", + "4 10.0 2.0 16.0 \n", + "... ... ... ... ... \n", + "1314 12.0 5.0 21.0 \n", + "1315 14.0 5.0 20.0 \n", + "1316 12.0 4.0 17.0 \n", + "1317 13.0 4.0 20.0 \n", + "1318 12.0 4.0 20.0 \n", + "\n", + "[1319 rows x 20 columns]" + ] + }, + "execution_count": 26, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# Your code here \n", - "\n", + "austin.drop('PrecipitationSumInches', axis=1, inplace=True)\n", "\n", "# Print `austin` to confirm the column is indeed removed\n", "\n", @@ -336,11 +4596,15 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 28, "metadata": {}, "outputs": [], "source": [ - "# Your code here\n" + "# Your code here\n", + "\n", + "austin_numeric = austin.select_dtypes(include=['number'])\n", + "austin_fixed = austin.copy()\n", + "austin_fixed[austin_numeric.columns] = austin_numeric.interpolate(method='linear')" ] }, { @@ -352,11 +4616,83 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 29, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "Date 0\n", + "TempHighF 0\n", + "TempAvgF 0\n", + "TempLowF 0\n", + "DewPointHighF 7\n", + "DewPointAvgF 7\n", + "DewPointLowF 7\n", + "HumidityHighPercent 2\n", + "HumidityAvgPercent 2\n", + "HumidityLowPercent 2\n", + "SeaLevelPressureHighInches 3\n", + "SeaLevelPressureAvgInches 3\n", + "SeaLevelPressureLowInches 3\n", + "VisibilityHighMiles 12\n", + "VisibilityAvgMiles 12\n", + "VisibilityLowMiles 12\n", + "WindHighMPH 2\n", + "WindAvgMPH 2\n", + "WindGustMPH 4\n", + "Events 0\n", + "dtype: int64" + ] + }, + "execution_count": 29, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin.isna().sum()" + ] + }, + { + "cell_type": "code", + "execution_count": 30, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Date 0\n", + "TempHighF 0\n", + "TempAvgF 0\n", + "TempLowF 0\n", + "DewPointHighF 0\n", + "DewPointAvgF 0\n", + "DewPointLowF 0\n", + "HumidityHighPercent 0\n", + "HumidityAvgPercent 0\n", + "HumidityLowPercent 0\n", + "SeaLevelPressureHighInches 0\n", + "SeaLevelPressureAvgInches 0\n", + "SeaLevelPressureLowInches 0\n", + "VisibilityHighMiles 0\n", + "VisibilityAvgMiles 0\n", + "VisibilityLowMiles 0\n", + "WindHighMPH 0\n", + "WindAvgMPH 0\n", + "WindGustMPH 0\n", + "Events 0\n", + "dtype: int64" + ] + }, + "execution_count": 30, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "austin_fixed.isna().sum()" ] }, { @@ -377,11 +4713,33 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 33, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "Events\n", + " 903\n", + "Rain 192\n", + "Rain , Thunderstorm 137\n", + "Fog , Rain , Thunderstorm 33\n", + "Fog 21\n", + "Thunderstorm 17\n", + "Fog , Rain 14\n", + "Rain , Snow 1\n", + "Fog , Thunderstorm 1\n", + "Name: count, dtype: int64" + ] + }, + "execution_count": 33, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here:\n" + "# Your code here:\n", + "austin_fixed[\"Events\"].value_counts()\n" ] }, { @@ -397,9 +4755,20 @@ "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "3\n" + ] + } + ], "source": [ - "# Your answer:\n" + "# Your answer:\n", + "\n", + "max_events_in_a_day = austin_fixed['Events'].str.split(',').apply(len).max()\n", + "print(max_events_in_a_day)" ] }, { @@ -415,14 +4784,1952 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 35, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "application/vnd.microsoft.datawrangler.viewer.v0+json": { + "columns": [ + { + "name": "index", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Date", + "rawType": "object", + "type": "string" + }, + { + "name": "TempHighF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempAvgF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempLowF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "DewPointHighF", + "rawType": "float64", + "type": "float" + }, + { + "name": "DewPointAvgF", + "rawType": "float64", + "type": "float" + }, + { + "name": "DewPointLowF", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityHighPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityAvgPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityLowPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureHighInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureAvgInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureLowInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityHighMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityAvgMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityLowMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindHighMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindAvgMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindGustMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "Events", + "rawType": "object", + "type": "string" + }, + { + "name": "Snow", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Fog", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Rain", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Thunderstorm", + "rawType": "int64", + "type": "integer" + } + ], + "conversionMethod": "pd.DataFrame", + "ref": "4eb91254-76f1-4cde-8352-9b25e5f4e109", + "rows": [ + [ + "0", + "2013-12-21", + "74", + "60", + "45", + "67.0", + "49.0", + "43.0", + "93.0", + "75.0", + "57.0", + "29.86", + "29.68", + "29.59", + "10.0", + "7.0", + "2.0", + "20.0", + "4.0", + "31.0", + "Rain , Thunderstorm", + "0", + "0", + "0", + "0" + ], + [ + "1", + "2013-12-22", + "56", + "48", + "39", + "43.0", + "36.0", + "28.0", + "93.0", + "68.0", + "43.0", + "30.41", + "30.13", + "29.87", + "10.0", + "10.0", + "5.0", + "16.0", + "6.0", + "25.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "2", + "2013-12-23", + "58", + "45", + "32", + "31.0", + "27.0", + "23.0", + "76.0", + "52.0", + "27.0", + "30.56", + "30.49", + "30.41", + "10.0", + "10.0", + "10.0", + "8.0", + "3.0", + "12.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "3", + "2013-12-24", + "61", + "46", + "31", + "36.0", + "28.0", + "21.0", + "89.0", + "56.0", + "22.0", + "30.56", + "30.45", + "30.3", + "10.0", + "10.0", + "7.0", + "12.0", + "4.0", + "20.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "4", + "2013-12-25", + "58", + "50", + "41", + "44.0", + "40.0", + "36.0", + "86.0", + "71.0", + "56.0", + "30.41", + "30.33", + "30.27", + "10.0", + "10.0", + "7.0", + "10.0", + "2.0", + "16.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "5", + "2013-12-26", + "57", + "48", + "39", + "39.0", + "36.0", + "33.0", + "79.0", + "63.0", + "47.0", + "30.47", + "30.4", + "30.34", + "10.0", + "9.0", + "7.0", + "12.0", + "3.0", + "17.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "6", + "2013-12-27", + "60", + "53", + "45", + "41.0", + "39.0", + "37.0", + "83.0", + "65.0", + "47.0", + "30.46", + "30.39", + "30.34", + "10.0", + "9.0", + "7.0", + "7.0", + "1.0", + "11.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "7", + "2013-12-28", + "62", + "51", + "40", + "43.0", + "39.0", + "33.0", + "92.0", + "64.0", + "36.0", + "30.33", + "30.17", + "30.04", + "10.0", + "10.0", + "7.0", + "10.0", + "2.0", + "14.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "8", + "2013-12-29", + "64", + "50", + "36", + "49.0", + "41.0", + "28.0", + "92.0", + "76.0", + "60.0", + "30.31", + "30.1", + "29.99", + "10.0", + "10.0", + "4.0", + "17.0", + "5.0", + "24.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "9", + "2013-12-30", + "44", + "40", + "35", + "31.0", + "26.0", + "21.0", + "75.0", + "60.0", + "45.0", + "30.44", + "30.33", + "30.26", + "10.0", + "10.0", + "10.0", + "13.0", + "5.0", + "21.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "10", + "2013-12-31", + "55", + "46", + "36", + "31.0", + "28.0", + "23.0", + "76.0", + "54.0", + "32.0", + "30.49", + "30.39", + "30.27", + "10.0", + "10.0", + "10.0", + "8.0", + "1.0", + "12.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "11", + "2014-01-01", + "69", + "54", + "39", + "51.0", + "42.0", + "30.0", + "83.0", + "68.0", + "52.0", + "30.25", + "30.11", + "30.01", + "10.0", + "10.0", + "8.0", + "13.0", + "4.0", + "22.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "12", + "2014-01-02", + "55", + "44", + "33", + "39.0", + "26.0", + "19.0", + "83.0", + "55.0", + "26.0", + "30.49", + "30.37", + "30.15", + "10.0", + "10.0", + "9.0", + "21.0", + "8.0", + "31.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "13", + "2014-01-03", + "58", + "43", + "28", + "37.0", + "22.0", + "18.0", + "75.0", + "49.0", + "22.0", + "30.48", + "30.35", + "30.14", + "10.0", + "10.0", + "10.0", + "14.0", + "4.0", + "21.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "14", + "2014-01-04", + "71", + "57", + "42", + "55.0", + "48.0", + "38.0", + "89.0", + "68.0", + "47.0", + "30.12", + "29.95", + "29.81", + "10.0", + "10.0", + "8.0", + "16.0", + "7.0", + "28.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "15", + "2014-01-05", + "59", + "47", + "34", + "54.0", + "32.0", + "15.0", + "87.0", + "59.0", + "31.0", + "30.48", + "30.08", + "29.79", + "10.0", + "10.0", + "4.0", + "21.0", + "10.0", + "34.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "16", + "2014-01-06", + "36", + "29", + "22", + "15.0", + "8.0", + "2.0", + "50.0", + "38.0", + "26.0", + "30.8", + "30.68", + "30.5", + "10.0", + "10.0", + "10.0", + "17.0", + "7.0", + "27.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "17", + "2014-01-07", + "48", + "35", + "22", + "29.0", + "11.0", + "4.0", + "68.0", + "43.0", + "17.0", + "30.66", + "30.52", + "30.36", + "10.0", + "10.0", + "10.0", + "13.0", + "5.0", + "22.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "18", + "2014-01-08", + "53", + "47", + "40", + "51.0", + "45.0", + "30.0", + "93.0", + "75.0", + "57.0", + "30.33", + "30.2", + "30.12", + "10.0", + "2.0", + "1.0", + "12.0", + "1.0", + "18.0", + "Rain", + "0", + "0", + "0", + "0" + ], + [ + "19", + "2014-01-09", + "70", + "62", + "53", + "60.0", + "55.0", + "50.0", + "93.0", + "80.0", + "66.0", + "30.18", + "30.11", + "30.0", + "10.0", + "4.0", + "0.0", + "12.0", + "3.0", + "19.0", + "Fog", + "0", + "0", + "0", + "0" + ], + [ + "20", + "2014-01-10", + "72", + "65", + "57", + "64.0", + "61.0", + "54.0", + "93.0", + "81.0", + "68.0", + "29.97", + "29.87", + "29.75", + "10.0", + "8.0", + "1.0", + "13.0", + "6.0", + "21.0", + "Rain", + "0", + "0", + "0", + "0" + ], + [ + "21", + "2014-01-11", + "75", + "62", + "48", + "54.0", + "37.0", + "20.0", + "93.0", + "53.0", + "13.0", + "30.16", + "30.06", + "29.87", + "10.0", + "9.0", + "5.0", + "12.0", + "3.0", + "19.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "22", + "2014-01-12", + "67", + "57", + "46", + "58.0", + "47.0", + "33.0", + "84.0", + "68.0", + "52.0", + "30.12", + "30.01", + "29.9", + "10.0", + "10.0", + "10.0", + "15.0", + "4.0", + "24.0", + "Rain", + "0", + "0", + "0", + "0" + ], + [ + "23", + "2014-01-13", + "71", + "57", + "43", + "60.0", + "36.0", + "17.0", + "87.0", + "51.0", + "14.0", + "30.16", + "30.01", + "29.86", + "10.0", + "9.0", + "7.0", + "17.0", + "7.0", + "29.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "24", + "2014-01-14", + "76", + "57", + "37", + "31.0", + "25.0", + "20.0", + "70.0", + "41.0", + "12.0", + "30.34", + "30.13", + "30.01", + "10.0", + "10.0", + "10.0", + "16.0", + "5.0", + "29.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "25", + "2014-01-15", + "64", + "52", + "40", + "29.0", + "23.0", + "16.0", + "49.0", + "35.0", + "21.0", + "30.47", + "30.33", + "30.17", + "10.0", + "10.0", + "10.0", + "14.0", + "4.0", + "21.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "26", + "2014-01-16", + "72", + "56", + "40", + "31.0", + "27.0", + "23.0", + "55.0", + "38.0", + "20.0", + "30.21", + "30.13", + "30.06", + "10.0", + "10.0", + "10.0", + "14.0", + "4.0", + "20.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "27", + "2014-01-17", + "64", + "54", + "43", + "31.0", + "20.0", + "15.0", + "45.0", + "31.0", + "17.0", + "30.37", + "30.29", + "30.21", + "10.0", + "10.0", + "9.0", + "14.0", + "5.0", + "21.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "28", + "2014-01-18", + "70", + "54", + "37", + "41.0", + "33.0", + "23.0", + "59.0", + "45.0", + "31.0", + "30.26", + "30.19", + "30.1", + "10.0", + "10.0", + "10.0", + "12.0", + "2.0", + "19.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "29", + "2014-01-19", + "72", + "59", + "45", + "41.0", + "30.0", + "18.0", + "64.0", + "39.0", + "14.0", + "30.35", + "30.22", + "30.12", + "10.0", + "10.0", + "10.0", + "9.0", + "3.0", + "16.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "30", + "2014-01-20", + "82", + "64", + "46", + "51.0", + "36.0", + "23.0", + "71.0", + "44.0", + "17.0", + "30.16", + "30.0", + "29.85", + "10.0", + "10.0", + "10.0", + "16.0", + "5.0", + "26.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "31", + "2014-01-21", + "63", + "51", + "38", + "28.0", + "23.0", + "19.0", + "59.0", + "39.0", + "19.0", + "30.43", + "30.31", + "30.19", + "10.0", + "10.0", + "10.0", + "15.0", + "6.0", + "25.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "32", + "2014-01-22", + "70", + "54", + "37", + "39.0", + "27.0", + "24.0", + "70.0", + "45.0", + "19.0", + "30.23", + "30.11", + "30.01", + "10.0", + "10.0", + "10.0", + "12.0", + "4.0", + "18.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "33", + "2014-01-23", + "56", + "42", + "27", + "42.0", + "29.0", + "20.0", + "78.0", + "64.0", + "50.0", + "30.73", + "30.47", + "30.06", + "10.0", + "8.0", + "2.0", + "20.0", + "9.0", + "31.0", + "Rain , Snow", + "0", + "0", + "0", + "0" + ], + [ + "34", + "2014-01-24", + "40", + "33", + "26", + "22.0", + "17.0", + "10.0", + "81.0", + "60.0", + "39.0", + "30.76", + "30.63", + "30.4", + "10.0", + "9.0", + "3.0", + "16.0", + "5.0", + "24.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "35", + "2014-01-25", + "70", + "48", + "26", + "38.0", + "27.0", + "22.0", + "85.0", + "53.0", + "20.0", + "30.38", + "30.19", + "30.02", + "10.0", + "10.0", + "8.0", + "8.0", + "1.0", + "14.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "36", + "2014-01-26", + "76", + "60", + "43", + "45.0", + "39.0", + "33.0", + "76.0", + "52.0", + "27.0", + "30.0", + "29.84", + "29.69", + "10.0", + "10.0", + "10.0", + "12.0", + "3.0", + "20.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "37", + "2014-01-27", + "60", + "47", + "34", + "43.0", + "23.0", + "5.0", + "66.0", + "44.0", + "21.0", + "30.28", + "30.09", + "29.81", + "10.0", + "10.0", + "10.0", + "21.0", + "9.0", + "32.0", + "Rain", + "0", + "0", + "0", + "0" + ], + [ + "38", + "2014-01-28", + "39", + "33", + "27", + "19.0", + "14.0", + "7.0", + "69.0", + "48.0", + "27.0", + "30.51", + "30.4", + "30.27", + "10.0", + "10.0", + "10.0", + "15.0", + "6.0", + "23.0", + "Rain", + "0", + "0", + "0", + "0" + ], + [ + "39", + "2014-01-29", + "49", + "38", + "27", + "19.0", + "13.0", + "9.0", + "63.0", + "42.0", + "21.0", + "30.52", + "30.41", + "30.29", + "10.0", + "10.0", + "10.0", + "15.0", + "5.0", + "23.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "40", + "2014-01-30", + "65", + "48", + "31", + "51.0", + "36.0", + "20.0", + "80.0", + "64.0", + "48.0", + "30.26", + "30.06", + "29.9", + "10.0", + "10.0", + "10.0", + "15.0", + "7.0", + "27.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "41", + "2014-01-31", + "80", + "68", + "55", + "59.0", + "54.0", + "51.0", + "86.0", + "64.0", + "42.0", + "29.96", + "29.87", + "29.79", + "10.0", + "10.0", + "9.0", + "14.0", + "9.0", + "25.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "42", + "2014-02-01", + "76", + "66", + "55", + "62.0", + "59.0", + "41.0", + "81.0", + "71.0", + "60.0", + "29.91", + "29.81", + "29.75", + "10.0", + "10.0", + "9.0", + "14.0", + "6.0", + "26.0", + "Rain", + "0", + "0", + "0", + "0" + ], + [ + "43", + "2014-02-02", + "55", + "45", + "35", + "40.0", + "33.0", + "27.0", + "79.0", + "69.0", + "59.0", + "30.27", + "30.09", + "29.9", + "10.0", + "8.0", + "4.0", + "18.0", + "11.0", + "29.0", + "Rain", + "0", + "0", + "0", + "0" + ], + [ + "44", + "2014-02-03", + "46", + "40", + "34", + "38.0", + "33.0", + "28.0", + "82.0", + "74.0", + "65.0", + "30.28", + "30.17", + "29.98", + "10.0", + "6.0", + "3.0", + "13.0", + "6.0", + "17.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "45", + "2014-02-04", + "64", + "53", + "42", + "45.0", + "41.0", + "39.0", + "89.0", + "68.0", + "46.0", + "30.11", + "29.95", + "29.87", + "10.0", + "6.0", + "2.0", + "10.0", + "2.0", + "18.0", + "Rain", + "0", + "0", + "0", + "0" + ], + [ + "46", + "2014-02-05", + "48", + "40", + "31", + "42.0", + "26.0", + "16.0", + "80.0", + "60.0", + "39.0", + "30.5", + "30.37", + "30.13", + "10.0", + "10.0", + "10.0", + "16.0", + "10.0", + "24.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "47", + "2014-02-06", + "32", + "29", + "26", + "17.0", + "15.0", + "13.0", + "58.0", + "54.0", + "49.0", + "30.57", + "30.48", + "30.42", + "10.0", + "10.0", + "10.0", + "15.0", + "8.0", + "23.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "48", + "2014-02-07", + "38", + "34", + "29", + "29.0", + "24.0", + "17.0", + "78.0", + "68.0", + "58.0", + "30.41", + "30.32", + "30.24", + "10.0", + "7.0", + "2.0", + "8.0", + "3.0", + "12.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "49", + "2014-02-08", + "65", + "51", + "37", + "42.0", + "36.0", + "29.0", + "85.0", + "63.0", + "40.0", + "30.26", + "30.17", + "30.03", + "10.0", + "7.0", + "3.0", + "14.0", + "5.0", + "21.0", + " ", + "0", + "0", + "0", + "0" + ] + ], + "shape": { + "columns": 24, + "rows": 1319 + } + }, + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
DateTempHighFTempAvgFTempLowFDewPointHighFDewPointAvgFDewPointLowFHumidityHighPercentHumidityAvgPercentHumidityLowPercentSeaLevelPressureHighInchesSeaLevelPressureAvgInchesSeaLevelPressureLowInchesVisibilityHighMilesVisibilityAvgMilesVisibilityLowMilesWindHighMPHWindAvgMPHWindGustMPHEventsSnowFogRainThunderstorm
02013-12-2174604567.049.043.093.075.057.029.8629.6829.5910.07.02.020.04.031.0Rain , Thunderstorm0000
12013-12-2256483943.036.028.093.068.043.030.4130.1329.8710.010.05.016.06.025.00000
22013-12-2358453231.027.023.076.052.027.030.5630.4930.4110.010.010.08.03.012.00000
32013-12-2461463136.028.021.089.056.022.030.5630.4530.3010.010.07.012.04.020.00000
42013-12-2558504144.040.036.086.071.056.030.4130.3330.2710.010.07.010.02.016.00000
...........................................................................
13142017-07-27103897571.067.061.082.054.025.030.0429.9729.8810.010.010.012.05.021.00000
13152017-07-28105917671.064.055.087.054.020.029.9729.9029.8110.010.010.014.05.020.00000
13162017-07-29107927772.064.055.082.051.019.029.9129.8629.7910.010.010.012.04.017.00000
13172017-07-30106937970.068.063.069.048.027.029.9629.9129.8710.010.010.013.04.020.00000
13182017-07-3199887766.061.054.064.043.022.030.0429.9729.9110.010.010.012.04.020.00000
\n", + "

1319 rows × 24 columns

\n", + "
" + ], + "text/plain": [ + " Date TempHighF TempAvgF TempLowF DewPointHighF DewPointAvgF \\\n", + "0 2013-12-21 74 60 45 67.0 49.0 \n", + "1 2013-12-22 56 48 39 43.0 36.0 \n", + "2 2013-12-23 58 45 32 31.0 27.0 \n", + "3 2013-12-24 61 46 31 36.0 28.0 \n", + "4 2013-12-25 58 50 41 44.0 40.0 \n", + "... ... ... ... ... ... ... \n", + "1314 2017-07-27 103 89 75 71.0 67.0 \n", + "1315 2017-07-28 105 91 76 71.0 64.0 \n", + "1316 2017-07-29 107 92 77 72.0 64.0 \n", + "1317 2017-07-30 106 93 79 70.0 68.0 \n", + "1318 2017-07-31 99 88 77 66.0 61.0 \n", + "\n", + " DewPointLowF HumidityHighPercent HumidityAvgPercent \\\n", + "0 43.0 93.0 75.0 \n", + "1 28.0 93.0 68.0 \n", + "2 23.0 76.0 52.0 \n", + "3 21.0 89.0 56.0 \n", + "4 36.0 86.0 71.0 \n", + "... ... ... ... \n", + "1314 61.0 82.0 54.0 \n", + "1315 55.0 87.0 54.0 \n", + "1316 55.0 82.0 51.0 \n", + "1317 63.0 69.0 48.0 \n", + "1318 54.0 64.0 43.0 \n", + "\n", + " HumidityLowPercent SeaLevelPressureHighInches \\\n", + "0 57.0 29.86 \n", + "1 43.0 30.41 \n", + "2 27.0 30.56 \n", + "3 22.0 30.56 \n", + "4 56.0 30.41 \n", + "... ... ... \n", + "1314 25.0 30.04 \n", + "1315 20.0 29.97 \n", + "1316 19.0 29.91 \n", + "1317 27.0 29.96 \n", + "1318 22.0 30.04 \n", + "\n", + " SeaLevelPressureAvgInches SeaLevelPressureLowInches \\\n", + "0 29.68 29.59 \n", + "1 30.13 29.87 \n", + "2 30.49 30.41 \n", + "3 30.45 30.30 \n", + "4 30.33 30.27 \n", + "... ... ... \n", + "1314 29.97 29.88 \n", + "1315 29.90 29.81 \n", + "1316 29.86 29.79 \n", + "1317 29.91 29.87 \n", + "1318 29.97 29.91 \n", + "\n", + " VisibilityHighMiles VisibilityAvgMiles VisibilityLowMiles \\\n", + "0 10.0 7.0 2.0 \n", + "1 10.0 10.0 5.0 \n", + "2 10.0 10.0 10.0 \n", + "3 10.0 10.0 7.0 \n", + "4 10.0 10.0 7.0 \n", + "... ... ... ... \n", + "1314 10.0 10.0 10.0 \n", + "1315 10.0 10.0 10.0 \n", + "1316 10.0 10.0 10.0 \n", + "1317 10.0 10.0 10.0 \n", + "1318 10.0 10.0 10.0 \n", + "\n", + " WindHighMPH WindAvgMPH WindGustMPH Events Snow Fog \\\n", + "0 20.0 4.0 31.0 Rain , Thunderstorm 0 0 \n", + "1 16.0 6.0 25.0 0 0 \n", + "2 8.0 3.0 12.0 0 0 \n", + "3 12.0 4.0 20.0 0 0 \n", + "4 10.0 2.0 16.0 0 0 \n", + "... ... ... ... ... ... ... \n", + "1314 12.0 5.0 21.0 0 0 \n", + "1315 14.0 5.0 20.0 0 0 \n", + "1316 12.0 4.0 17.0 0 0 \n", + "1317 13.0 4.0 20.0 0 0 \n", + "1318 12.0 4.0 20.0 0 0 \n", + "\n", + " Rain Thunderstorm \n", + "0 0 0 \n", + "1 0 0 \n", + "2 0 0 \n", + "3 0 0 \n", + "4 0 0 \n", + "... ... ... \n", + "1314 0 0 \n", + "1315 0 0 \n", + "1316 0 0 \n", + "1317 0 0 \n", + "1318 0 0 \n", + "\n", + "[1319 rows x 24 columns]" + ] + }, + "execution_count": 35, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "event_list = ['Snow', 'Fog', 'Rain', 'Thunderstorm']\n", "\n", "# Your code here\n", - "\n", + "for event in event_list:\n", + " austin_fixed[event] = 0\n", "\n", "# Print your new dataframe to check whether new columns have been created:\n", "\n", @@ -446,11 +6753,15 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 36, "metadata": {}, "outputs": [], "source": [ - "# Your code here\n" + "# Your code here\n", + "for event in event_list:\n", + " # Check if the event is present in the 'Events' column and assign 1 where it happens\n", + " austin_fixed.loc[austin_fixed['Events'].str.contains(event, case=False, na=False), event] = 1\n", + "\n" ] }, { @@ -462,11 +6773,527 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 42, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "application/vnd.microsoft.datawrangler.viewer.v0+json": { + "columns": [ + { + "name": "index", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Date", + "rawType": "object", + "type": "string" + }, + { + "name": "TempHighF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempAvgF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempLowF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "DewPointHighF", + "rawType": "float64", + "type": "float" + }, + { + "name": "DewPointAvgF", + "rawType": "float64", + "type": "float" + }, + { + "name": "DewPointLowF", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityHighPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityAvgPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityLowPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureHighInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureAvgInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureLowInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityHighMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityAvgMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityLowMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindHighMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindAvgMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindGustMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "Events", + "rawType": "object", + "type": "string" + }, + { + "name": "Snow", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Fog", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Rain", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Thunderstorm", + "rawType": "int64", + "type": "integer" + } + ], + "conversionMethod": "pd.DataFrame", + "ref": "6ea762d9-637a-4853-b9ac-bfb4294d7ad1", + "rows": [ + [ + "300", + "2014-10-17", + "87", + "74", + "61", + "64.0", + "60.0", + "54.0", + "97.0", + "69.0", + "40.0", + "29.95", + "29.9", + "29.86", + "10.0", + "10.0", + "10.0", + "13.0", + "3.0", + "17.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "612", + "2015-08-25", + "101", + "89", + "77", + "71.0", + "68.0", + "65.0", + "79.0", + "56.0", + "33.0", + "30.06", + "30.01", + "29.97", + "10.0", + "10.0", + "10.0", + "12.0", + "3.0", + "23.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "821", + "2016-03-21", + "68", + "52", + "35", + "39.0", + "34.0", + "30.0", + "82.0", + "57.0", + "32.0", + "30.47", + "30.37", + "30.24", + "10.0", + "10.0", + "10.0", + "12.0", + "4.0", + "20.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "1313", + "2017-07-26", + "103", + "91", + "78", + "75.0", + "70.0", + "61.0", + "91.0", + "58.0", + "25.0", + "30.13", + "30.03", + "29.93", + "10.0", + "10.0", + "10.0", + "15.0", + "6.0", + "27.0", + " ", + "0", + "0", + "0", + "0" + ], + [ + "133", + "2014-05-03", + "94", + "76", + "58", + "42.0", + "35.0", + "26.0", + "44.0", + "27.0", + "10.0", + "30.06", + "30.0", + "29.95", + "10.0", + "10.0", + "10.0", + "13.0", + "4.0", + "20.0", + " ", + "0", + "0", + "0", + "0" + ] + ], + "shape": { + "columns": 24, + "rows": 5 + } + }, + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
DateTempHighFTempAvgFTempLowFDewPointHighFDewPointAvgFDewPointLowFHumidityHighPercentHumidityAvgPercentHumidityLowPercentSeaLevelPressureHighInchesSeaLevelPressureAvgInchesSeaLevelPressureLowInchesVisibilityHighMilesVisibilityAvgMilesVisibilityLowMilesWindHighMPHWindAvgMPHWindGustMPHEventsSnowFogRainThunderstorm
3002014-10-1787746164.060.054.097.069.040.029.9529.9029.8610.010.010.013.03.017.00000
6122015-08-25101897771.068.065.079.056.033.030.0630.0129.9710.010.010.012.03.023.00000
8212016-03-2168523539.034.030.082.057.032.030.4730.3730.2410.010.010.012.04.020.00000
13132017-07-26103917875.070.061.091.058.025.030.1330.0329.9310.010.010.015.06.027.00000
1332014-05-0394765842.035.026.044.027.010.030.0630.0029.9510.010.010.013.04.020.00000
\n", + "
" + ], + "text/plain": [ + " Date TempHighF TempAvgF TempLowF DewPointHighF DewPointAvgF \\\n", + "300 2014-10-17 87 74 61 64.0 60.0 \n", + "612 2015-08-25 101 89 77 71.0 68.0 \n", + "821 2016-03-21 68 52 35 39.0 34.0 \n", + "1313 2017-07-26 103 91 78 75.0 70.0 \n", + "133 2014-05-03 94 76 58 42.0 35.0 \n", + "\n", + " DewPointLowF HumidityHighPercent HumidityAvgPercent \\\n", + "300 54.0 97.0 69.0 \n", + "612 65.0 79.0 56.0 \n", + "821 30.0 82.0 57.0 \n", + "1313 61.0 91.0 58.0 \n", + "133 26.0 44.0 27.0 \n", + "\n", + " HumidityLowPercent SeaLevelPressureHighInches \\\n", + "300 40.0 29.95 \n", + "612 33.0 30.06 \n", + "821 32.0 30.47 \n", + "1313 25.0 30.13 \n", + "133 10.0 30.06 \n", + "\n", + " SeaLevelPressureAvgInches SeaLevelPressureLowInches \\\n", + "300 29.90 29.86 \n", + "612 30.01 29.97 \n", + "821 30.37 30.24 \n", + "1313 30.03 29.93 \n", + "133 30.00 29.95 \n", + "\n", + " VisibilityHighMiles VisibilityAvgMiles VisibilityLowMiles \\\n", + "300 10.0 10.0 10.0 \n", + "612 10.0 10.0 10.0 \n", + "821 10.0 10.0 10.0 \n", + "1313 10.0 10.0 10.0 \n", + "133 10.0 10.0 10.0 \n", + "\n", + " WindHighMPH WindAvgMPH WindGustMPH Events Snow Fog Rain \\\n", + "300 13.0 3.0 17.0 0 0 0 \n", + "612 12.0 3.0 23.0 0 0 0 \n", + "821 12.0 4.0 20.0 0 0 0 \n", + "1313 15.0 6.0 27.0 0 0 0 \n", + "133 13.0 4.0 20.0 0 0 0 \n", + "\n", + " Thunderstorm \n", + "300 0 \n", + "612 0 \n", + "821 0 \n", + "1313 0 \n", + "133 0 " + ] + }, + "execution_count": 42, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin_fixed.sample(5)\n" ] }, { @@ -478,11 +7305,47 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 43, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "Date 0\n", + "TempHighF 0\n", + "TempAvgF 0\n", + "TempLowF 0\n", + "DewPointHighF 0\n", + "DewPointAvgF 0\n", + "DewPointLowF 0\n", + "HumidityHighPercent 0\n", + "HumidityAvgPercent 0\n", + "HumidityLowPercent 0\n", + "SeaLevelPressureHighInches 0\n", + "SeaLevelPressureAvgInches 0\n", + "SeaLevelPressureLowInches 0\n", + "VisibilityHighMiles 0\n", + "VisibilityAvgMiles 0\n", + "VisibilityLowMiles 0\n", + "WindHighMPH 0\n", + "WindAvgMPH 0\n", + "WindGustMPH 0\n", + "Events 903\n", + "Snow 0\n", + "Fog 0\n", + "Rain 0\n", + "Thunderstorm 0\n", + "dtype: int64" + ] + }, + "execution_count": 43, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin_fixed.eq(\" \").sum()\n" ] }, { @@ -500,11 +7363,13 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 44, "metadata": {}, "outputs": [], "source": [ - "# Your code here\n" + "# Your code here\n", + "austin_fixed['Date'] = pd.to_datetime(austin_fixed['Date'], errors='coerce')\n", + "austin_fixed['Date_Ordinal'] = austin_fixed['Date'].apply(lambda x: x.toordinal() if pd.notnull(x) else None)\n" ] }, { @@ -516,9 +7381,533 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 45, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "application/vnd.microsoft.datawrangler.viewer.v0+json": { + "columns": [ + { + "name": "index", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Date", + "rawType": "datetime64[ns]", + "type": "datetime" + }, + { + "name": "TempHighF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempAvgF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "TempLowF", + "rawType": "int64", + "type": "integer" + }, + { + "name": "DewPointHighF", + "rawType": "float64", + "type": "float" + }, + { + "name": "DewPointAvgF", + "rawType": "float64", + "type": "float" + }, + { + "name": "DewPointLowF", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityHighPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityAvgPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "HumidityLowPercent", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureHighInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureAvgInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "SeaLevelPressureLowInches", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityHighMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityAvgMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "VisibilityLowMiles", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindHighMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindAvgMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "WindGustMPH", + "rawType": "float64", + "type": "float" + }, + { + "name": "Events", + "rawType": "object", + "type": "string" + }, + { + "name": "Snow", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Fog", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Rain", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Thunderstorm", + "rawType": "int64", + "type": "integer" + }, + { + "name": "Date_Ordinal", + "rawType": "int64", + "type": "integer" + } + ], + "conversionMethod": "pd.DataFrame", + "ref": "4f5fe993-7195-4264-9b03-4d03e8498679", + "rows": [ + [ + "0", + "2013-12-21 00:00:00", + "74", + "60", + "45", + "67.0", + "49.0", + "43.0", + "93.0", + "75.0", + "57.0", + "29.86", + "29.68", + "29.59", + "10.0", + "7.0", + "2.0", + "20.0", + "4.0", + "31.0", + "Rain , Thunderstorm", + "0", + "0", + "1", + "1", + "735223" + ], + [ + "1", + "2013-12-22 00:00:00", + "56", + "48", + "39", + "43.0", + "36.0", + "28.0", + "93.0", + "68.0", + "43.0", + "30.41", + "30.13", + "29.87", + "10.0", + "10.0", + "5.0", + "16.0", + "6.0", + "25.0", + " ", + "0", + "0", + "0", + "0", + "735224" + ], + [ + "2", + "2013-12-23 00:00:00", + "58", + "45", + "32", + "31.0", + "27.0", + "23.0", + "76.0", + "52.0", + "27.0", + "30.56", + "30.49", + "30.41", + "10.0", + "10.0", + "10.0", + "8.0", + "3.0", + "12.0", + " ", + "0", + "0", + "0", + "0", + "735225" + ], + [ + "3", + "2013-12-24 00:00:00", + "61", + "46", + "31", + "36.0", + "28.0", + "21.0", + "89.0", + "56.0", + "22.0", + "30.56", + "30.45", + "30.3", + "10.0", + "10.0", + "7.0", + "12.0", + "4.0", + "20.0", + " ", + "0", + "0", + "0", + "0", + "735226" + ], + [ + "4", + "2013-12-25 00:00:00", + "58", + "50", + "41", + "44.0", + "40.0", + "36.0", + "86.0", + "71.0", + "56.0", + "30.41", + "30.33", + "30.27", + "10.0", + "10.0", + "7.0", + "10.0", + "2.0", + "16.0", + " ", + "0", + "0", + "0", + "0", + "735227" + ] + ], + "shape": { + "columns": 25, + "rows": 5 + } + }, + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
DateTempHighFTempAvgFTempLowFDewPointHighFDewPointAvgFDewPointLowFHumidityHighPercentHumidityAvgPercentHumidityLowPercentSeaLevelPressureHighInchesSeaLevelPressureAvgInchesSeaLevelPressureLowInchesVisibilityHighMilesVisibilityAvgMilesVisibilityLowMilesWindHighMPHWindAvgMPHWindGustMPHEventsSnowFogRainThunderstormDate_Ordinal
02013-12-2174604567.049.043.093.075.057.029.8629.6829.5910.07.02.020.04.031.0Rain , Thunderstorm0011735223
12013-12-2256483943.036.028.093.068.043.030.4130.1329.8710.010.05.016.06.025.00000735224
22013-12-2358453231.027.023.076.052.027.030.5630.4930.4110.010.010.08.03.012.00000735225
32013-12-2461463136.028.021.089.056.022.030.5630.4530.3010.010.07.012.04.020.00000735226
42013-12-2558504144.040.036.086.071.056.030.4130.3330.2710.010.07.010.02.016.00000735227
\n", + "
" + ], + "text/plain": [ + " Date TempHighF TempAvgF TempLowF DewPointHighF DewPointAvgF \\\n", + "0 2013-12-21 74 60 45 67.0 49.0 \n", + "1 2013-12-22 56 48 39 43.0 36.0 \n", + "2 2013-12-23 58 45 32 31.0 27.0 \n", + "3 2013-12-24 61 46 31 36.0 28.0 \n", + "4 2013-12-25 58 50 41 44.0 40.0 \n", + "\n", + " DewPointLowF HumidityHighPercent HumidityAvgPercent HumidityLowPercent \\\n", + "0 43.0 93.0 75.0 57.0 \n", + "1 28.0 93.0 68.0 43.0 \n", + "2 23.0 76.0 52.0 27.0 \n", + "3 21.0 89.0 56.0 22.0 \n", + "4 36.0 86.0 71.0 56.0 \n", + "\n", + " SeaLevelPressureHighInches SeaLevelPressureAvgInches \\\n", + "0 29.86 29.68 \n", + "1 30.41 30.13 \n", + "2 30.56 30.49 \n", + "3 30.56 30.45 \n", + "4 30.41 30.33 \n", + "\n", + " SeaLevelPressureLowInches VisibilityHighMiles VisibilityAvgMiles \\\n", + "0 29.59 10.0 7.0 \n", + "1 29.87 10.0 10.0 \n", + "2 30.41 10.0 10.0 \n", + "3 30.30 10.0 10.0 \n", + "4 30.27 10.0 10.0 \n", + "\n", + " VisibilityLowMiles WindHighMPH WindAvgMPH WindGustMPH \\\n", + "0 2.0 20.0 4.0 31.0 \n", + "1 5.0 16.0 6.0 25.0 \n", + "2 10.0 8.0 3.0 12.0 \n", + "3 7.0 12.0 4.0 20.0 \n", + "4 7.0 10.0 2.0 16.0 \n", + "\n", + " Events Snow Fog Rain Thunderstorm Date_Ordinal \n", + "0 Rain , Thunderstorm 0 0 1 1 735223 \n", + "1 0 0 0 0 735224 \n", + "2 0 0 0 0 735225 \n", + "3 0 0 0 0 735226 \n", + "4 0 0 0 0 735227 " + ] + }, + "execution_count": 45, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "austin_fixed.head(5)" ] @@ -577,11 +7966,18 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 46, "metadata": {}, "outputs": [], "source": [ - "# Your code here:\n" + "# Your code here:\n", + "\n", + "X = austin_fixed[['Date', 'TempHighF', 'TempLowF', 'DewPointHighF', 'DewPointAvgF', \n", + " 'DewPointLowF', 'HumidityHighPercent', 'HumidityAvgPercent', 'HumidityLowPercent',\n", + " 'SeaLevelPressureHighInches', 'SeaLevelPressureAvgInches', 'SeaLevelPressureLowInches',\n", + " 'VisibilityHighMiles', 'VisibilityAvgMiles', 'VisibilityLowMiles', \n", + " 'WindHighMPH', 'WindAvgMPH', 'WindGustMPH', 'Snow', 'Fog', 'Rain', 'Thunderstorm']]\n", + "y = austin_fixed['TempAvgF']\n" ] }, { @@ -593,11 +7989,12 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 47, "metadata": {}, "outputs": [], "source": [ - "#Your code here:\n" + "#Your code here:\n", + "from sklearn.model_selection import train_test_split\n" ] }, { @@ -612,11 +8009,12 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 48, "metadata": {}, "outputs": [], "source": [ - "#Your code here:\n" + "#Your code here:\n", + "X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)\n" ] }, { @@ -641,11 +8039,15 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 49, "metadata": {}, "outputs": [], "source": [ - "# Your code here:\n" + "# Your code here:\n", + "import numpy as np\n", + "\n", + "total_rows = len(austin_fixed)\n", + "ts_rows = np.ceil(0.8 * total_rows).astype(int)\n" ] }, { @@ -657,11 +8059,13 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 50, "metadata": {}, "outputs": [], "source": [ - "# Your code here:\n" + "# Your code here:\n", + "X_ts_train = X.iloc[:ts_rows]\n", + "X_ts_test = X.iloc[ts_rows:]" ] }, { @@ -673,11 +8077,14 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 51, "metadata": {}, "outputs": [], "source": [ - "# Your code here:\n" + "# Your code here:\n", + "\n", + "y_ts_train = y.iloc[:ts_rows]\n", + "y_ts_test = y.iloc[ts_rows:]" ] } ], @@ -697,7 +8104,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.6.9" + "version": "3.13.2" } }, "nbformat": 4,