## In this notebook we will be gathering and adding PAR data to our Covariate dataset

To do this we will use the [Seaflow-sfl GitHub repository](https://github.com/seaflow-uw/seaflow-sfl/tree/master), as it has ship PAR values for most cruises that have the Seaflow machine on board.

In [None]:
import os
import requests
import pandas as pd

def download_data(dataset, *, output_directory='./downloaded_data', timeout=30):
    """Download the curated ``.sfl`` file for every cruise named in *dataset*.

    For each unique, non-missing value in ``dataset['cruisename']`` the file
    ``<cruisename>_751.sfl`` is requested from the ``curated`` folder of the
    seaflow-uw/seaflow-sfl GitHub repository and written to
    *output_directory*. The download is best-effort: a cruise whose file
    cannot be fetched is reported on stdout and skipped, and the remaining
    cruises are still processed.

    Args:
        dataset: Object supporting ``dataset['cruisename']`` that yields a
            pandas Series of cruise names (e.g. a DataFrame).
        output_directory: Directory the files are saved to; created if it
            does not exist.
        timeout: Seconds to wait for the server before giving up on a file.

    Returns:
        None. Progress is printed, and files are written to disk.
    """
    base_url = 'https://github.com/seaflow-uw/seaflow-sfl/raw/master/curated/'

    # Create the output directory if it doesn't exist
    os.makedirs(output_directory, exist_ok=True)

    # Missing cruise names (NaN/None) cannot form a file name, so drop them
    # before de-duplicating.
    cruisenames = dataset['cruisename'].dropna().unique()

    for cruisename in cruisenames:
        # NOTE(review): the "_751" suffix is hard-coded; presumably it
        # identifies the instrument -- confirm against the repository layout.
        file_name = f"{cruisename}_751.sfl"
        file_url = base_url + file_name

        try:
            # Without a timeout a stalled connection would block forever.
            response = requests.get(file_url, timeout=timeout)
        except requests.RequestException as exc:
            # Network-level failure: report it and move on to the next cruise
            # instead of aborting the whole batch.
            print(f"Failed to download {file_name}: {exc}")
            continue

        if response.status_code != 200:
            print(f"Failed to download {file_name}")
            continue

        output_path = os.path.join(output_directory, file_name)
        with open(output_path, 'wb') as f:
            f.write(response.content)
        # Report success only after the file has been flushed and closed.
        print(f"Downloaded {file_name}")
