# Day 25 - Working with CSV Data and the Pandas Library

## Reading CSV Data in Python

In [13]:
# Method 1: plain file I/O.
# Each line of the file comes back as one raw string (line endings kept),
# so the comma-separated columns are NOT split apart for us.

with open("weather_data.csv") as data_file:
    data = list(data_file)  # iterating a text file yields its lines

print(data)

['day,temp,condition\n', 'Monday,12,Sunny\n', 'Tuesday,14,Rain\n', 'Wednesday,15,Rain\n', 'Thursday,14,Cloudy\n', 'Friday,21,Sunny\n', 'Saturday,22,Sunny\n', 'Sunday,24,Sunny']


In [14]:
# Method 2: the csv module.
# csv.reader splits every line on commas and hands back a list of strings
# per row (the header row included; numbers are still text at this point).

import csv

# newline="" is what the csv documentation asks for when opening a file for
# csv.reader: it leaves newline handling to the csv module so that line breaks
# embedded inside quoted fields are parsed correctly.
with open("weather_data.csv", newline="") as data_file:
    data = csv.reader(data_file)
    for row in data:
        print(row)


['day', 'temp', 'condition']
['Monday', '12', 'Sunny']
['Tuesday', '14', 'Rain']
['Wednesday', '15', 'Rain']
['Thursday', '14', 'Cloudy']
['Friday', '21', 'Sunny']
['Saturday', '22', 'Sunny']
['Sunday', '24', 'Sunny']


In [15]:
# Challenge: collect every temperature into a list of integers.

import csv

# newline="" lets the csv module do its own newline handling, as its
# documentation recommends for files passed to csv.reader.
with open("weather_data.csv", newline="") as data_file:
    data = csv.reader(data_file)
    # Skip the header row by position instead of comparing a cell with the
    # text "temp"; the None default keeps an empty file from raising.
    next(data, None)
    # csv.reader yields [] for blank lines, so `if row` avoids an IndexError
    # on row[1]. Column 1 holds the temperature as text -> convert to int.
    temperatures = [int(row[1]) for row in data if row]

print(temperatures)

[12, 14, 15, 14, 21, 22, 24]


In [16]:
import pandas as pd

# Let pandas parse the file: the header line becomes the column labels and
# every remaining line becomes one row of the DataFrame.
data = pd.read_csv(filepath_or_buffer="weather_data.csv")
print(data)
# A single column can be pulled out by label, e.g. data["temp"].

         day  temp condition
0     Monday    12     Sunny
1    Tuesday    14      Rain
2  Wednesday    15      Rain
3   Thursday    14    Cloudy
4     Friday    21     Sunny
5   Saturday    22     Sunny
6     Sunday    24     Sunny


## Dataframes & Series: Working with Rows & Columns

In [17]:
# Select rows with a boolean mask: comparing a column against a value gives
# one True/False per row, and .loc keeps only the rows marked True.

# The row whose day is Monday.
print(data.loc[data["day"] == "Monday"])

# The row(s) whose temperature equals the highest temperature in the column.
print(data.loc[data["temp"] == data["temp"].max()])

      day  temp condition
0  Monday    12     Sunny
      day  temp condition
6  Sunday    24     Sunny


In [18]:
# Build a DataFrame from scratch: each dictionary key becomes a column label
# and each list supplies that column's values.

data_dict = {
    "students": ["Amy", "James", "Angela"],
    "scores": [76, 56, 65],
}

# NOTE: this rebinds `data`, replacing the weather DataFrame that the earlier
# cells stored under the same name.
data = pd.DataFrame(data=data_dict)

# Save the frame to disk; with the default settings the row index is written
# as well.
data.to_csv(path_or_buf="new_data.csv")

print(data)

  students  scores
0      Amy      76
1    James      56
2   Angela      65


## The Great Squirrel Census Data Analysis (with Pandas)

In [19]:
# Tally the squirrels by primary fur colour and save the totals to a CSV file.
csv_data = pd.read_csv(filepath_or_buffer="2018_Central_Park_Squirrel_Census_-_Squirrel_Data.csv")
fur_color = csv_data["Primary Fur Color"]  # look the column up once, reuse below

# The length of each filtered frame is the number of rows with that colour.
grey_squirrels_count = len(csv_data.loc[fur_color == "Gray"])
red_squirrels_count = len(csv_data.loc[fur_color == "Cinnamon"])  # "red" counts the Cinnamon label
black_squirrels_count = len(csv_data.loc[fur_color == "Black"])

# One count per line, in the order Gray, Cinnamon, Black.
print(grey_squirrels_count, red_squirrels_count, black_squirrels_count, sep="\n")

# Column-oriented summary: one label list and one matching list of counts.
data_dict = {
    "Fur Color": ["Gray", "Cinnamon", "Black"],
    "Count": [grey_squirrels_count, red_squirrels_count, black_squirrels_count],
}

df = pd.DataFrame(data=data_dict)
df.to_csv(path_or_buf="squirrel_count.csv")

2473
392
103


## Project - U.S. States Game