In [1]:
import sys
# Colab-only bootstrap: when the notebook runs inside Google Colab (detected by
# the 'google.colab' module being loaded), clone the delaware repository into
# ./delaware and install obspy with pip. Outside Colab this cell does nothing.
if 'google.colab' in sys.modules:
    # NOTE(review): re-running this cell attempts the clone again into the same
    # ./delaware directory -- confirm that is acceptable.
    !git clone  https://github.com/ecastillot/delaware.git ./delaware
    !pip install obspy

In [1]:
import sys
import os

# Name of the dated sub-directory of the delaware checkout to import from.
version = "10102024"

# Resolve the checkout location: /content/delaware when running on Google
# Colab, otherwise the local development checkout.
if 'google.colab' in sys.modules:
    dw_path = os.path.join("/content/delaware", version)
else:
    dw_path = os.path.join("/home/emmanuel/ecastillo/dev/delaware", version)

# Register the directory only once: this cell is frequently re-executed and an
# unconditional append would keep adding duplicate entries to sys.path.
if dw_path not in sys.path:
    sys.path.append(dw_path)

In [2]:
from delaware.core.read import EQPicks
from delaware.core.eqviewer import Stations
from delaware.loc.inv import prepare_cat2vps
import pandas as pd
import os
from itertools import combinations
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import pandas as pd
from itertools import combinations
from typing import Tuple, List, Dict
from scipy.stats import mode

def load_stations(stations_path: str, proj: str) -> object:
    """
    Load station data and return a Stations object.

    Only the network, station, latitude, longitude and elevation columns are
    kept, and a ``station_index`` column holding each row's index in the
    loaded CSV is added.

    Args:
        stations_path (str): Path to the stations CSV file.
        proj (str): EPSG projection for the station data (passed to
            ``Stations`` as ``xy_epsg``).

    Returns:
        Stations: An object containing station data.

    Raises:
        KeyError: If one of the required columns is missing from the CSV.
    """
    stations_columns = ["network", "station", "latitude", "longitude", "elevation"]
    raw_stations = pd.read_csv(stations_path)
    # Work on an explicit copy of the column subset: adding a column to the
    # bare selection is what triggers pandas' SettingWithCopyWarning.
    stations = raw_stations[stations_columns].copy()
    stations["station_index"] = stations.index
    return Stations(data=stations, xy_epsg=proj)

def get_single_station(stations: object, station_name: str) -> pd.Series:
    """
    Extract information for a single station by name.

    If several rows share the same station name, the first one is returned.

    Args:
        stations (object): Stations object containing station data in its
            ``data`` attribute (a DataFrame with a "station" column).
        station_name (str): Name of the station to extract.

    Returns:
        pd.Series: Data for the specified station.

    Raises:
        IndexError: If no row matches ``station_name``.
    """
    matches = stations.data[stations.data["station"] == station_name]
    if matches.empty:
        # Same exception type that a bare ``.iloc[0]`` raises on an empty
        # selection, but with a message that names the missing station.
        raise IndexError(f"Station '{station_name}' not found in stations data")
    return matches.iloc[0]

def load_eqpicks(root: str, author: str, proj: str, catalog_path: str, picks_path: str,
                 catalog_header_line=1) -> object:
    """
    Build the EQPicks reader for one catalog and its picks database.

    Args:
        root (str): Root directory for the data (first positional argument
            of EQPicks).
        author (str): Author name for the picks.
        proj (str): EPSG projection, forwarded as ``xy_epsg``.
        catalog_path (str): Path to the catalog CSV file.
        picks_path (str): Path to the picks database file.
        catalog_header_line: Forwarded unchanged to EQPicks under the same
            keyword. Defaults to 1.

    Returns:
        EQPicks: An object containing earthquake picks data.
    """
    eqpicks_options = {
        "author": author,
        "xy_epsg": proj,
        "catalog_header_line": catalog_header_line,
        "catalog_path": catalog_path,
        "picks_path": picks_path,
    }
    return EQPicks(root, **eqpicks_options)

def process_catalog_and_picks(eq_picks: object, single_station: pd.Series,
                              stations: Stations,r) -> Tuple[pd.DataFrame, pd.DataFrame]:
    """
    Select the events and picks associated with one station.

    The catalog and picks are first queried around the station location,
    then passed through ``prepare_cat2vps``, and finally restricted to the
    picks recorded at the station and the events that have such a pick.

    Args:
        eq_picks (object): EQPicks object containing picks and catalog data.
        single_station (pd.Series): Data for a single station; its
            ``latitude``, ``longitude`` and ``station`` fields are used.
        stations (Stations): Stations object whose ``data`` is handed to
            ``prepare_cat2vps``.
        r: Third element of the ``region_from_src`` tuple given to
            ``get_catalog_with_picks`` -- presumably a search radius around
            the station; confirm units against EQPicks.

    Returns:
        Tuple[pd.DataFrame, pd.DataFrame]: Processed catalog and picks data.
    """
    region = (single_station.latitude, single_station.longitude, r, None)
    catalog_obj, picks_obj = eq_picks.get_catalog_with_picks(region_from_src=region)
    catalog_df, picks_df = prepare_cat2vps(catalog_obj.data, picks_obj.data, stations.data)

    # Keep only the picks recorded at the requested station ...
    recorded_here = picks_df["station"] == single_station.station
    station_picks = picks_df[recorded_here]

    # ... and only the events that still have at least one of those picks.
    has_station_pick = catalog_df['ev_id'].isin(station_picks['ev_id'])
    station_catalog = catalog_df[has_station_pick]
    return station_catalog, station_picks

def preprocess_picks(picks: pd.DataFrame, catalog: pd.DataFrame) -> pd.DataFrame:
    """
    Preprocess picks data by merging with catalog and calculating arrival times.

    After the merge, ``arrival_time_P`` and ``arrival_time_S`` are replaced
    by the elapsed time, in seconds, between ``origin_time`` and the
    respective arrival.

    Args:
        picks (pd.DataFrame): Picks data with ``ev_id``, ``arrival_time_P``
            and ``arrival_time_S`` columns.
        catalog (pd.DataFrame): Catalog data with ``ev_id`` and
            ``origin_time`` columns.

    Returns:
        pd.DataFrame: Preprocessed picks data (inner merge on ``ev_id``) with
        both arrival columns expressed as float seconds after origin.
    """
    picks_data = pd.merge(picks, catalog, on=["ev_id"])

    # Parse the origin time once; it is shared by both phases.
    origin_time = pd.to_datetime(picks_data['origin_time'])

    for phase_column in ('arrival_time_P', 'arrival_time_S'):
        travel_time = pd.to_datetime(picks_data[phase_column]) - origin_time
        # Vectorized conversion; also yields a float column for empty input.
        picks_data[phase_column] = travel_time.dt.total_seconds()

    return picks_data

def calculate_vij(picks_data: pd.DataFrame) -> pd.DataFrame:
    """
    Calculate v_ij for all combinations of picks.

    For every unordered pair of rows (i, j), with i before j, the ratio

        v_ij = (tS_i - tS_j) / (tP_i - tP_j)

    is computed from the ``arrival_time_S`` and ``arrival_time_P`` columns.
    A pair is "good" when the P difference is non-zero and v_ij is strictly
    positive; every other pair (zero P difference, non-positive or NaN
    ratio) is counted as "bad" and dropped. The good/bad counts are printed.

    Args:
        picks_data (pd.DataFrame): Preprocessed picks data with ``ev_id``,
            ``station``, ``arrival_time_P`` and ``arrival_time_S`` columns.

    Returns:
        pd.DataFrame: One row per good pair with columns ``ev_i``, ``ev_j``,
        ``station`` (station of row i) and ``v_ij``. The columns are present
        even when there is no good pair.
    """
    columns = ["ev_i", "ev_j", "station", "v_ij"]

    n_picks = len(picks_data)
    if n_picks < 2:
        # No pair can be formed; keep the output schema stable anyway.
        print(f"Good: {0}, Bad: {0}")
        return pd.DataFrame(columns=columns)

    t_s = picks_data['arrival_time_S'].to_numpy(dtype=float, na_value=np.nan)
    t_p = picks_data['arrival_time_P'].to_numpy(dtype=float, na_value=np.nan)

    # Positions of all pairs (i < j), in the same order that
    # itertools.combinations would produce. Working on positions also makes
    # the result independent of the DataFrame's index labels.
    first, second = np.triu_indices(n_picks, k=1)
    delta_t_S = t_s[first] - t_s[second]
    delta_t_P = t_p[first] - t_p[second]

    # Pairs with a zero P difference are left as NaN and end up as "bad".
    v_ij = np.full(delta_t_S.shape, np.nan)
    with np.errstate(divide="ignore", invalid="ignore"):
        np.divide(delta_t_S, delta_t_P, out=v_ij, where=delta_t_P != 0)
        good = v_ij > 0

    n_good = int(good.sum())
    n_bad = int(good.size - n_good)

    good_first, good_second = first[good], second[good]
    ev_id = picks_data["ev_id"]
    results = pd.DataFrame(
        {
            "ev_i": ev_id.iloc[good_first].reset_index(drop=True),
            "ev_j": ev_id.iloc[good_second].reset_index(drop=True),
            "station": picks_data["station"].iloc[good_first].reset_index(drop=True),
            "v_ij": v_ij[good],
        },
        columns=columns,
    )

    print(f"Good: {n_good}, Bad: {n_bad}")
    return results


In [6]:
# --- Input data -------------------------------------------------------------
# Catalog and picks both live under the same dataset root.
root = "/home/emmanuel/ecastillo/dev/delaware/10102024/data/eq/aoi/growclust_and_sheng"
catalog_path = os.path.join(root, "origin.csv")
picks_path = os.path.join(root, "picks.db")
author = "growclust"
proj = "EPSG:3857"
stations_path = "/home/emmanuel/ecastillo/dev/delaware/02032024/data_git/stations/delaware_onlystations_160824.csv"
# stations_path = "/home/emmanuel/ecastillo/dev/delaware/10102024/data_git/stations/standard_stations.csv"

# --- Parameters -------------------------------------------------------------
r = 25 #in km
# bins = np.arange(1, 3.02, 0.1)
station_list = ["PB04","PB16"]

# Per-station colours; only referenced by the commented-out alternative
# station_list below.
custom_palette = {"PB35": "#26fafa", 
                  "PB36": "#2dfa26", 
                  "PB28": "#ad16db", 
                  "PB37": "#1a3be3", 
                  "WB03": "#ffffff", 
                  "SA02": "#f1840f", 
                  "PB24": "#0ea024", 
                  }
# station_list = list(custom_palette.keys())

# --- Output -----------------------------------------------------------------
# One CSV per station is written here; create the directory up front so that
# to_csv does not fail on a missing folder.
output_dir = "/home/emmanuel/ecastillo/dev/delaware/02032024/project/vpvs/stations"
os.makedirs(output_dir, exist_ok=True)

for station_name in station_list:
    print(station_name)

    stations = load_stations(stations_path, proj)
    print(stations)
    single_station = get_single_station(stations, station_name)

    # Load EQPicks
    eq_picks = load_eqpicks(root, author, proj, catalog_path, picks_path,catalog_header_line=0)

    # Process catalog and picks
    catalog, picks = process_catalog_and_picks(eq_picks, single_station,
                                               stations=stations,
                                               r=r)

    # Preprocess picks
    picks_data = preprocess_picks(picks, catalog)

    # Calculate v_ij
    results_df = calculate_vij(picks_data)

    # Persist the pairwise results as <station>_<r>.csv
    path = os.path.join(output_dir, f"{station_name}_{r}.csv")
    results_df.to_csv(path,index=False)
    # Q1 = results_df['v_ij'].quantile(0.10)
    # Q3 = results_df['v_ij'].quantile(0.90)
    # iqr_results_df = results_df[(results_df['v_ij'] >= Q1) & (results_df['v_ij'] <= Q3)]
    # print(iqr_results_df.describe())
    # plot_vij_histogram(iqr_results_df,station_name,bins=bins,output=output_fig)


PB04
Station | 265 stations
['texnet2017cobl', 'texnet2017cqbk', 'texnet2017cqhr', 'texnet2017cwhc', 'texnet2017cxvs', 'texnet2017czqk', 'texnet2017dcct', 'texnet2017ddcv', 'texnet2017ddfo', 'texnet2017demh', 'texnet2017dgwa', 'texnet2017djhy', 'texnet2017djjz', 'texnet2017djrd', 'texnet2017djsm', 'texnet2017dnka', 'texnet2017dott', 'texnet2017dozs', 'texnet2017dpfl', 'texnet2017duxt', 'texnet2017dwwe', 'texnet2017eaib', 'texnet2017eaou', 'texnet2017eclx', 'texnet2017edgt', 'texnet2017eeio', 'texnet2017egil', 'texnet2017ehte', 'texnet2017ejyh', 'texnet2017emqo', 'texnet2017enva', 'texnet2017enwh', 'texnet2017enyb', 'texnet2017enza', 'texnet2017epjr', 'texnet2017eqtt', 'texnet2017etuh', 'texnet2017eukt', 'texnet2017eurl', 'texnet2017euuz', 'texnet2017fcup', 'texnet2017fgec', 'texnet2017fhgt', 'texnet2017fhjr', 'texnet2017fhzu', 'texnet2017fjtj', 'texnet2017fldz', 'texnet2017fmlj', 'texnet2017fnmr', 'texnet2017fnpz', 'texnet2017fnsy', 'texnet2017fqno', 'texnet2017fqnv', 'texnet2017fqsz',

  df = pd.concat(all_dataframes, ignore_index=True)


Good: 10297, Bad: 729
PB16
Station | 265 stations
['texnet2017cobl', 'texnet2017cqbk', 'texnet2017cqhr', 'texnet2017cwhc', 'texnet2017cxvs', 'texnet2017czqk', 'texnet2017dcct', 'texnet2017demh', 'texnet2017dgwa', 'texnet2017djhy', 'texnet2017djjz', 'texnet2017djrd', 'texnet2017djsm', 'texnet2017dnka', 'texnet2017dott', 'texnet2017dozs', 'texnet2017dpfl', 'texnet2017duxt', 'texnet2017dwwe', 'texnet2017eaib', 'texnet2017eclx', 'texnet2017edgt', 'texnet2017ejyh', 'texnet2017emqo', 'texnet2017enwh', 'texnet2017enyb', 'texnet2017enza', 'texnet2017epjr', 'texnet2017eqtt', 'texnet2017etuh', 'texnet2017eukt', 'texnet2017eurl', 'texnet2017euuz', 'texnet2017fcup', 'texnet2017fdkf', 'texnet2017fgec', 'texnet2017fhgt', 'texnet2017fhjr', 'texnet2017fhzu', 'texnet2017fjtj', 'texnet2017fkxu', 'texnet2017fldz', 'texnet2017fmlj', 'texnet2017fnmr', 'texnet2017fnpz', 'texnet2017fnsy', 'texnet2017fqno', 'texnet2017fxay', 'texnet2017gayk', 'texnet2017gfmd', 'texnet2017ggdk', 'texnet2017ghlo', 'texnet2017gk