# Stumpy Tutorial Dataset Backups

This notebook reproduces the dataset download steps used in the active tutorials of the Stumpy docs and then exports each dataset as a CSV file to a local directory.

The CSVs are subsequently uploaded to the Stumpy community on [Zenodo](https://zenodo.org/communities/stumpy/?page=1&size=20).

In [1]:
import io
import os
import ssl
import urllib
import urllib.request  # `import urllib` alone does not load the `request` submodule

import pandas as pd
from scipy.io import loadmat

# Certificate verification is deliberately skipped (for simplicity) when
# fetching the public datasets below. An explicit protocol is passed because
# calling ``ssl.SSLContext()`` with no argument is deprecated since Python 3.10.
context = ssl.SSLContext(ssl.PROTOCOL_TLS_CLIENT)
# PROTOCOL_TLS_CLIENT turns verification on by default, so switch it off again;
# check_hostname must be cleared before verify_mode can be set to CERT_NONE.
context.check_hostname = False
context.verify_mode = ssl.CERT_NONE

## Steamgen 

In [2]:
# Column labels applied to the whitespace-separated fields of steamgen.dat.
colnames = [
    'drum pressure',
    'excess oxygen',
    'water level',
    'steam flow',
]

url = 'https://www.cs.ucr.edu/~eamonn/iSAX/steamgen.dat'
# Use a context manager so the HTTP response is closed as soon as it is read.
with urllib.request.urlopen(url, context=context) as response:
    raw_bytes = response.read()
data = io.BytesIO(raw_bytes)

# The file has no header row; columns are split on runs of whitespace.
steam_df = pd.read_csv(data, header=None, sep=r"\s+")
# Assigning the labels afterwards raises if the column count does not match.
steam_df.columns = colnames

# Export without the positional index so the CSV holds only the data columns.
steam_df.to_csv('./STUMPY_Basics_steamgen.csv', index=False)

## Taxi

In [3]:
# Source repository: https://github.com/stanford-futuredata/ASAP
# pandas fetches the comma-separated file directly from the raw GitHub URL.
taxi_url = "https://raw.githubusercontent.com/stanford-futuredata/ASAP/master/Taxi.csv"
taxi_df = pd.read_csv(taxi_url)

# Write the frame back out unchanged, omitting the positional index.
taxi_df.to_csv('./STUMPY_Basics_Taxi.csv', index=False)


## Kohls

In [4]:
url = 'https://sites.google.com/site/timeserieschain/home/Kohls_data.mat?attredirects=0&revision=1'
# Use a context manager so the HTTP response is closed as soon as it is read.
with urllib.request.urlopen(url, context=context) as response:
    raw_bytes = response.read()
data = io.BytesIO(raw_bytes)

# Parse the MATLAB file from memory and pull out the 'VarName1' array.
mat = loadmat(data)
mdata = mat['VarName1']
mdtype = mdata.dtype

# Keep the array's own dtype and expose it as a single 'volume' column.
df = pd.DataFrame(mdata, dtype=mdtype, columns=['volume'])

df.to_csv('./Time_Series_Chains_Kohls_data.csv', index=False)

## TiltABP

In [5]:
url = 'https://sites.google.com/site/timeserieschain/home/TiltABP_210_25000.txt'
# Use a context manager so the HTTP response is closed as soon as it is read.
with urllib.request.urlopen(url, context=context) as response:
    raw_bytes = response.read()
data = io.BytesIO(raw_bytes)

# No header row in the file, so pandas labels the data column 0.
df = pd.read_csv(data, header=None)
# Turn the positional row index into an explicit 'time' column and name the
# data column 'abp'.
df = df.reset_index().rename({'index': 'time', 0: 'abp'}, axis='columns')

df.to_csv('./Semantic_Segmentation_TiltABP.csv', index=False)

## Robot Dog

In [6]:
T_url = 'https://www.cs.unm.edu/~mueen/robot_dog.txt'
# Use a context manager so the HTTP response is closed as soon as it is read.
with urllib.request.urlopen(T_url, context=context) as T_response:
    T_raw_bytes = T_response.read()
T_data = io.BytesIO(T_raw_bytes)

# Raw string for the regex separator: '\s' in a normal string literal is an
# invalid escape sequence and triggers a warning on recent Python versions.
T_df = pd.read_csv(T_data, header=None, sep=r'\s+', names=['Acceleration'])

T_df.to_csv('Fast_Pattern_Searching_robot_dog.csv', index=False)

## Carpet query

In [7]:
Q_url = 'https://www.cs.unm.edu/~mueen/carpet_query.txt'
# Use a context manager so the HTTP response is closed as soon as it is read.
with urllib.request.urlopen(Q_url, context=context) as Q_response:
    Q_raw_bytes = Q_response.read()
Q_data = io.BytesIO(Q_raw_bytes)

# Raw string for the regex separator: '\s' in a normal string literal is an
# invalid escape sequence and triggers a warning on recent Python versions.
Q_df = pd.read_csv(Q_data, header=None, sep=r'\s+', names=['Acceleration'])

Q_df.to_csv('./carpet_query.csv', index=False)