# CC Scheme

In [1]:
%load_ext autoreload
%autoreload 2

import warnings
warnings.simplefilter(action='ignore', category=FutureWarning)

import numpy as np
import pandas as pd
import xarray as xr
import matplotlib.pyplot as plt
from obspy import UTCDateTime, read_inventory
import os
import ccf

In [2]:
# Select the interactive "notebook" matplotlib backend for the figures below.
%matplotlib notebook

In [3]:
# Root directory handed to the ccf clients as `sds_root`.
# Set the CCF_SDS_ROOT environment variable to point at your own archive;
# the fallback is the original author's machine-specific path.
ccf.clients.set(
    sds_root=os.environ.get(
        'CCF_SDS_ROOT',
        '/Users/psmets/Documents/Research/_data/WaveformArchive',
    )
)

In [4]:
# General parameters shared by every ccf.init_dataset call in this notebook.
sampling_rate = 50.0
window_length = 24 * 3600.0           # 24 h written out in seconds (86400.)
window_overlap = 21.0 / 24.0          # 21 h of every 24 h overlap -> 3 h shift
clip_lag = pd.to_timedelta((0, 6), unit='h')   # lag limits of 0 h and 6 h
title_prefix = 'Monowai Volcanic Centre'

# Point of interest, passed to ccf.init_dataset as `stationary_poi`.
poi = dict(
    name='MVC',
    latitude=-25.887,
    longitude=-177.188,
    elevation=0.0,
    local_depth=132.0,
)

# Stream preprocess operations, keyed by channel code.
# The order inside every list matters: the steps are applied sequentially.
# The pieces shared between channels come from small factories so that every
# channel still gets its own, independent tuples and option dicts.

def _pp_head():
    """Opening steps common to all channels: merge, 0.05 highpass, demean."""
    return [
        ('merge', {'method': 1, 'fill_value': 'interpolate', 'interpolation_samples': 0}),
        ('filter', {'type': 'highpass', 'freq': .05}),
        ('detrend', {'type': 'demean'}),
    ]


def _pp_band_and_resample():
    """3. highpass, Lanczos interpolation to 50, then 20. lowpass (BH* channels)."""
    return [
        ('filter', {'type': 'highpass', 'freq': 3.}),
        ('interpolate', {'sampling_rate': 50, 'method': 'lanczos', 'a': 20}),
        ('filter', {'type': 'lowpass', 'freq': 20.}),
    ]


def _pp_tail():
    """Closing steps common to all channels: trim, demean, cosine taper."""
    return [
        ('trim', {}),
        ('detrend', {'type': 'demean'}),
        ('taper', {'type': 'cosine', 'max_percentage': 0.05, 'max_length': 30.}),
    ]


preprocess = {
    # vertical component: response removed to velocity
    'BHZ': (
        _pp_head()
        + [('remove_response', {'output': 'VEL'})]
        + _pp_band_and_resample()
        + _pp_tail()
    ),
    # radial component: rotate to ZNE, then NE->RT, and keep only BHR
    'BHR': (
        _pp_head()
        + [
            ('remove_response', {'output': 'VEL'}),
            ('rotate', {'method': '->ZNE'}),
            ('rotate', {'method': 'NE->RT', 'back_azimuth': 250.39}),
            ('select', {'channel': 'BHR'}),
        ]
        + _pp_band_and_resample()
        + _pp_tail()
    ),
    # EDH channel: sensitivity removed, bandpassed, decimated by 5
    'EDH': (
        _pp_head()
        + [
            ('remove_sensitivity', {}),
            ('filter', {'type': 'bandpass', 'freqmin': 3., 'freqmax': 20.}),
            ('decimate', {'factor': 5}),
        ]
        + _pp_tail()
    ),
}

In [5]:
# Receiver pairs to cross-correlate; each entry joins two channel ids with '-'.
pairs = [
    'IM.H10N1..EDH-IU.RAR.10.BHZ',
    'IM.H10N1..EDH-IU.RAR.10.BHR',
]

# One time stamp per day, 2015-01-15 through 2015-02-20 (both included).
times = pd.date_range(start='2015-01-15', end='2015-02-20', freq='1D')

# Station metadata, read from a StationXML file next to the notebook and
# drawn on a local map projection.
inv = read_inventory('Monowai.xml')
fig = inv.plot(projection='local', color=0.)

<IPython.core.display.Javascript object>

## Get waveforms

In [None]:
# Fetch the IU.RAR.10.BHZ stream for 2015-01-01T12:00 and run the
# preprocessing recipe on it (verbose output enabled).
BHZ = ccf.clients.get_preprocessed_stream(
    receiver='IU.RAR.10.BHZ',
    time=pd.Timestamp('2015-01-01T12:00'),
    inventory=inv,
    operations=preprocess,
    verbose=True,
)

In [None]:
# Plot the preprocessed BHZ stream returned by the previous cell.
BHZ.plot()

In [None]:
# Fetch the IU.RAR.10.BHR stream for 2015-01-01T12:00 and run the
# preprocessing recipe on it (verbose output enabled).
BHR = ccf.clients.get_preprocessed_stream(
    receiver='IU.RAR.10.BHR',
    time=pd.Timestamp('2015-01-01T12:00'),
    inventory=inv,
    operations=preprocess,
    verbose=True,
)

In [None]:
# Plot the preprocessed BHR stream returned by the previous cell.
BHR.plot()

## Cross-correlate one day of data

In [6]:
# Work on the first pair and the first day for the single-day example.
pair, time = pairs[0], times[0]

In [7]:
# Initialise the dataset for one pair and one day (`time` up to `time` plus
# one DateOffset step), using the general parameters and the preprocessing
# recipe defined earlier in the notebook.
ds = ccf.init_dataset(
    pair=pair,
    starttime=time,
    endtime=time + pd.offsets.DateOffset(1),
    inventory=inv,
    stationary_poi=poi,
    preprocess=preprocess,
    sampling_rate=sampling_rate,
    window_length=window_length,
    window_overlap=window_overlap,
    clip_lag=clip_lag,
    unbiased=False,
    title_prefix=title_prefix,
)

In [8]:
# Display the freshly initialised dataset.
ds

In [9]:
# Display the dataset's `distance` entry.
# NOTE(review): presumably derived from the receiver pair and/or the
# stationary_poi handed to init_dataset — confirm against ccf.
ds.distance

In [10]:
# Run the cross-correlation for the dataset; one progress line is printed per
# time window. The return value is not kept, so `ds` is presumably filled in
# place (the `ds.cc` plot below relies on that) — confirm against ccf.
ccf.cc_dataset( ds, inventory = inv )

IM.H10N1..EDH-IU.RAR.10.BHZ 2015-01-15T00:00:00. Waveforms. CC. Done.
IM.H10N1..EDH-IU.RAR.10.BHZ 2015-01-15T03:00:00. Waveforms. CC. Done.
IM.H10N1..EDH-IU.RAR.10.BHZ 2015-01-15T06:00:00. Waveforms. CC. Done.
IM.H10N1..EDH-IU.RAR.10.BHZ 2015-01-15T09:00:00. Waveforms. CC. Done.
IM.H10N1..EDH-IU.RAR.10.BHZ 2015-01-15T12:00:00. Waveforms. CC. Done.
IM.H10N1..EDH-IU.RAR.10.BHZ 2015-01-15T15:00:00. Waveforms. CC. Done.
IM.H10N1..EDH-IU.RAR.10.BHZ 2015-01-15T18:00:00. Waveforms. CC. Done.
IM.H10N1..EDH-IU.RAR.10.BHZ 2015-01-15T21:00:00. Waveforms. CC. Done.


In [11]:
# Display the dataset again, now that cc_dataset has been run on it.
ds

Save the dataset to a NetCDF file in a safe way (the write is first cached in a temporary file).

In [None]:
# ccf.write_dataset(ds, 'test.nc')

In [12]:
# Plot the cross-correlations against lag, one line per time step;
# the last time step is left out of the selection.
plt.figure(figsize=(9, 4))
ds.cc.sel(time=ds.time[:-1]).plot.line(x='lag', add_legend=False)

<IPython.core.display.Javascript object>

[<matplotlib.lines.Line2D at 0x11c8cf850>,
 <matplotlib.lines.Line2D at 0x11c8b2090>,
 <matplotlib.lines.Line2D at 0x11c8b2910>,
 <matplotlib.lines.Line2D at 0x11c8b2ad0>,
 <matplotlib.lines.Line2D at 0x11c8b2c90>,
 <matplotlib.lines.Line2D at 0x11c8b2e50>,
 <matplotlib.lines.Line2D at 0x11c8b2fd0>]

In [13]:
# Apply the bias correction to the dataset. `unbiased_var='cc_w'` names the
# variable that is read back as `ds.cc_w` in the comparison plot below
# (presumably the corrected result is stored there — confirm against ccf).
ccf.bias_correct_dataset(ds,unbiased_var='cc_w')

In [14]:
# Display the dataset again, now that bias_correct_dataset has been run on it.
ds

In [15]:
# Compare `cc_w` (orange) with `cc` (blue) for the second time step.
plt.figure(figsize=(9, 4))
ds['cc_w'].sel(time=ds.time[1]).plot.line(x='lag', color='orange', add_legend=False)
ds['cc'].sel(time=ds.time[1]).plot.line(x='lag', color='blue', add_legend=False)

<IPython.core.display.Javascript object>

[<matplotlib.lines.Line2D at 0x127e784d0>]

### Cross-correlate a whole period

In [None]:
def filename(pair: str, time: pd.Timestamp) -> str:
    """Return the NetCDF file name for one pair and one day.

    Parameters
    ----------
    pair : str
        Pair identifier; used verbatim as the file-name prefix.
    time : pd.Timestamp
        Time stamp of the day; only its ``year`` and ``dayofyear``
        attributes are read.

    Returns
    -------
    str
        ``'<pair>.<YYYY>.<DDD>.nc'`` with the year zero-padded to four digits
        and the day of year zero-padded to three digits.
    """
    # `pd.datetime` was removed from pandas, and annotations are evaluated when
    # the function is defined, so the annotation uses pd.Timestamp instead.
    return '{pair}.{y:04d}.{d:03d}.nc'.format(pair=pair, y=time.year, d=time.dayofyear)


# Destination root for the output files: the current working directory.
# (`pwd` is not a Python name; os.getcwd() gives the directory explicitly.)
dest = os.getcwd()

In [None]:
# NOTE: this silences *all* warnings from here on, for the rest of the
# kernel session, not only the duplicate-inventory ones.
warnings.filterwarnings('ignore') # no warnings of duplicate inventory items

# Cross-correlate every pair for every day in `times`. Each (pair, day) result
# goes to <dest>/<pair>/<pair>.<YYYY>.<DDD>.nc. Days whose stored file has
# status == 1 everywhere are skipped; other existing files are reloaded and
# processed again with retry_missing=True.
for pair in pairs:
    print('---------------------------')
    print(pair)
    print('---------------------------')
    for time in times:
        day_end = time + pd.offsets.DateOffset(1)
        ncfile = os.path.join(dest, pair, filename(pair, time))
        if os.path.isfile(ncfile):
            # Open lazily so a finished day only costs a look at `status`.
            # The context manager closes the file on every path, so no handle
            # is left open on a file that is rewritten below.
            with xr.open_dataset(ncfile) as stored:
                if np.all(stored.status.values == 1):
                    continue
                # Pull the data into memory before the file is closed.
                ds = stored.load()
        else:
            ds = ccf.init_dataset(
                pair=pair,
                starttime=time,
                endtime=day_end,
                preprocess=preprocess,
                sampling_rate=sampling_rate,
                window_length=window_length,
                window_overlap=window_overlap,
                title_prefix=title_prefix,
                clip_lag=clip_lag,
                unbiased=False,
                inventory=inv,
                stationary_poi=poi,
            )
        try:
            ccf.cc_dataset(
                ds,
                inventory=inv.select(
                    starttime=UTCDateTime(time),
                    endtime=UTCDateTime(day_end),
                ),
                retry_missing=True,
            )
        except Exception as e:
            # Deliberate best effort: report the problem, then still save
            # whatever is in `ds` and move on to the next day.
            # KeyboardInterrupt / SystemExit are not Exception subclasses, so
            # they propagate without an explicit re-raise clause.
            print('An error occurred. Save and continue next timestep.')
            print('Error:')
            print(e)
        # Make sure the per-pair output directory exists before writing
        # (harmless if ccf.write_dataset already takes care of it).
        os.makedirs(os.path.dirname(ncfile), exist_ok=True)
        ccf.write_dataset(ds, ncfile)