By default, data is processed and stored year by year. This may be
excessive in some cases, especially for short time ranges that span the turn of the year. In such cases, you may set
`ignore_years=True`. Below is an example.

Note, however, that this can be very costly if data is
available for only a few of the wildcarded network/station/channel (nsc)
combinations and if the time range is too generous.

In [None]:
from glob import glob
from datetime import datetime, timezone
import os
import numpy as np

from obspy.clients.filesystem.sds import Client
from obspy.clients.fdsn import RoutingClient
from obspy.core import UTCDateTime as UTC
from obspy.signal import util

In [None]:
from data_quality_control import processing

In [None]:
from importlib import reload

In [None]:
# Stream selection by network, station and channel code; '*' is a wildcard.
network = 'G*'
station = 'BF*'
channel = 'HHZ'

# Processing parameters, passed to processor.process() further below.
# Units are presumably seconds for overlap/proclen and Hz for fmin/fmax
# -- TODO confirm against data_quality_control.processing.
overlap = 60  # alternative value that was tried: 3600
fmin, fmax = 4, 14
nperseg = 2048
winlen_in_s = 3600
proclen = 24 * 3600

# Input: root of the local SDS archive and the routing service used for
# station metadata.
sds_root = os.path.abspath('../sample_sds/')
inventory_routing_type = "eida-routing"

# Output directory handed to processor.process().
outdir = '../data/'

# Stand-alone clients built from the same settings as the processor.
# The routing type is taken from `inventory_routing_type` rather than being
# repeated as a literal, so both stay in sync when the setting is changed.
sdsclient = Client(sds_root)
invclient = RoutingClient(inventory_routing_type)

In [None]:
# Re-import the module so that edits to its source are picked up without
# restarting the kernel.
reload(processing)

# Processor for the wildcarded network/station/channel selection, reading
# from the SDS archive at `sds_root`.
processor = processing.RawDataProcessor(
    network=network,
    station=station,
    channel=channel,
    sds_root=sds_root,
    inventory_routing_type=inventory_routing_type,
)

In [None]:
# Short time range that spans the turn of the year (2020 -> 2021), i.e. the
# situation `ignore_years=True` is meant for.
startdate, enddate = UTC("2020-12-20"), UTC("2021-01-15")

In [None]:
%%time
#it -n1 -r7
processor.process(startdate, enddate, outdir,
                  ignore_years=True,
                        overlap=overlap, 
            winlen_in_s=winlen_in_s,
        nperseg=nperseg, proclen=proclen,
                 amplitude_frequencies=(fmin, fmax))
print("Time of execution:", datetime.now())

In [None]:
# Show size and timestamp of an HDF5 file in the output directory
# (presumably the file written by the processing call above).
# NOTE(review): the dates in the file name (2020-12-25 to 2021-01-09) differ
# from startdate/enddate (2020-12-20 to 2021-01-15); presumably they reflect
# the data actually available -- confirm.
%ls -lh ../data/GR.BFO..HHZ_2020-12-25_2021-01-09.hdf5