FIRST FILE

Importing the Required Library

In [1]:
import pandas as pd

Defining the convert_to_float Function

In [2]:
def convert_to_float(coord):
    """Convert a hemisphere-suffixed coordinate such as '13.14E' to a signed float.

    The final character is the hemisphere letter: 'N' and 'E' give a positive
    value, 'S' and 'W' give a negative one. Surrounding whitespace is ignored
    and the hemisphere letter may be upper or lower case.

    Args:
        coord: Coordinate string made of a number followed by one of N/S/E/W.

    Returns:
        The numeric part as a float, negated for 'S' and 'W'.

    Raises:
        TypeError: If coord is not a string (for example a NaN from an empty cell).
        ValueError: If coord has no hemisphere suffix or its numeric part is
            not a valid number.
    """
    if not isinstance(coord, str):
        raise TypeError(
            f"Coordinate must be a string, got {type(coord).__name__}: {coord!r}"
        )

    text = coord.strip()

    # Only the last character decides the sign. A substring test would misread
    # values whose numeric part itself contains a letter, e.g. '1E2S'.
    # text[-1:] (a slice) is used so an empty string yields '' instead of raising.
    sign = {'N': 1.0, 'E': 1.0, 'S': -1.0, 'W': -1.0}.get(text[-1:].upper())
    if sign is None:
        raise ValueError(f"Unexpected coordinate format: {coord}")

    try:
        return sign * float(text[:-1])
    except ValueError:
        # Report a malformed numeric part with the same message as a bad suffix.
        raise ValueError(f"Unexpected coordinate format: {coord}") from None

Defining the load_data Function

In [3]:
def load_data(filepath):
    """Load a temperature CSV and prepare the columns used for analysis.

    The file must contain the columns 'dt', 'AverageTemperature', 'Latitude'
    and 'Longitude'. The returned frame has:

    * a 'Year' column extracted from 'dt',
    * 'AverageTemperature' converted to numeric,
    * rows without a usable year or temperature removed,
    * 'Latitude' and 'Longitude' converted from strings like '13.14E' to
      signed floats via convert_to_float.

    Args:
        filepath: Path (or any object accepted by pandas.read_csv) of the CSV.

    Returns:
        A new, cleaned pandas DataFrame; the original row index labels of the
        kept rows are preserved.

    Raises:
        KeyError: If one of the required columns is missing from the file.
        ValueError: If a coordinate string is not in the expected format.
    """
    raw = pd.read_csv(filepath)

    # errors='coerce' turns unparseable dates into NaT and non-numeric
    # temperatures into NaN, so both kinds of bad rows are removed together below.
    parsed = raw.assign(
        Year=pd.to_datetime(raw['dt'], errors='coerce').dt.year,
        AverageTemperature=pd.to_numeric(raw['AverageTemperature'], errors='coerce'),
    )
    cleaned = parsed.dropna(subset=['AverageTemperature', 'Year'])

    # na_action='ignore' leaves missing coordinates as NaN instead of passing
    # them to convert_to_float, which only accepts strings and would otherwise
    # abort the whole load on a single empty cell.
    return cleaned.assign(
        Latitude=cleaned['Latitude'].map(convert_to_float, na_action='ignore'),
        Longitude=cleaned['Longitude'].map(convert_to_float, na_action='ignore'),
    )

 Defining the filter_data_by_year Function

In [4]:
def filter_data_by_year(data, year):
    """Return only the rows of `data` whose 'Year' column equals `year`."""
    # Boolean mask: True for every row recorded in the requested year.
    is_requested_year = data['Year'] == year
    return data.loc[is_requested_year]