# Subset Canada Reference Hydrometric Basin Network (RHBN) 2020 stations
Retains only those stations in the metadata file that are part of the RHBN 2020 set. The filtered table is written back over the original metadata file.

See (last access: 2022-08-23): https://www.canada.ca/en/environment-climate-change/services/water-overview/quantity/monitoring/survey/data-products-services/reference-hydrometric-basin-network.html

In [1]:
import sys
from pathlib import Path
sys.path.append(str(Path().absolute().parent))
import python_cs_functions as cs
import pandas as pd

### Config handling

In [2]:
# Location of the config file; a relative path, so it is resolved against the
# current working directory when the file is opened
config_file = '../0_config/config.txt'

In [3]:
# Look up the three settings this notebook needs. Each read_from_config call
# hands back a pair; only its first element is used, the second is discarded.
data_path, _ = cs.read_from_config(config_file, 'data_path')
shps_path, _ = cs.read_from_config(config_file, 'ref_shps_path')
file_url, _ = cs.read_from_config(config_file, 'can_rhbn_meta_url')

### Define file location

In [7]:
# Build the folder that holds the RHBN files: <data_path>/<shps_path>/RHBN-CAN
download_folder = Path(data_path).joinpath(shps_path, 'RHBN-CAN')

In [4]:
# Derive the local file name from the URL: take the text after the final '/',
# trim surrounding whitespace, then swap 'xlsx' for 'csv'.
# NOTE: str.replace swaps every 'xlsx' occurrence in the name, not only the extension.
file_name = file_url.rsplit('/', 1)[-1].strip().replace('xlsx', 'csv')

### Process file

In [9]:
# Load the metadata table from the CSV file into a DataFrame
df = pd.read_csv(download_folder / file_name)

In [12]:
# Keep only the rows whose Evaluation_Year equals 2020
df = df.loc[df.Evaluation_Year == 2020]

In [14]:
# Save the filtered table to <download_folder>/<file_name> as UTF-8 CSV,
# leaving out the DataFrame index column
df.to_csv(download_folder / file_name, index=False, encoding='utf-8')