# Query SunPower datasets 

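Note: you need an API key to run this notebook. Request one by registering at https://pvdb.slacgismo.org and emailing slacgismotutorials@gmail.com with your information and use case. The notebook reads the key from the `REDSHIFT_API_KEY` environment variable, so set that variable before starting the kernel.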

In [1]:
import os
from solardatatools.dataio import load_redshift_data
from solardatatools.data_handler import DataHandler
from solardatatools.time_axis_manipulation import make_time_series

In [2]:
# Read the API key from the environment so it is never stored in the notebook.
api_key = os.environ.get('REDSHIFT_API_KEY')
if not api_key:
    # Fail here with an actionable message instead of sending a request
    # with a missing (None or empty) key.
    raise RuntimeError(
        "REDSHIFT_API_KEY is not set; export your API key in the environment "
        "before starting the notebook kernel."
    )

# Keyword arguments forwarded to load_redshift_data.
query = {
    'siteid': 'TABJC1027159',  # alternate site id: 'TAAI01129193'
    'api_key': api_key,
    'sensor': 0,
}

# Run the query; the resulting frame is previewed in the next cell.
df = load_redshift_data(**query)

In [3]:
# Preview the first five rows of the queried frame (5 is the pandas default).
df.head(n=5)

Unnamed: 0,site,meas_name,ts,sensor,meas_val_f
0,TABJC1027159,ac_power,2016-03-28 20:40:00,1913101452_SMA-SB-5000TL-US-22,1.1394
1,TABJC1027159,ac_power,2016-03-28 20:45:00,1913101452_SMA-SB-5000TL-US-22,1.4464
2,TABJC1027159,ac_power,2016-03-28 20:50:00,1913101452_SMA-SB-5000TL-US-22,1.193
3,TABJC1027159,ac_power,2016-03-28 20:55:00,1913101452_SMA-SB-5000TL-US-22,2.1952
4,TABJC1027159,ac_power,2016-03-28 21:00:00,1913101452_SMA-SB-5000TL-US-22,1.4514


# Create DataHandler

In [4]:
# Build the handler directly from the queried frame.
# NOTE(review): convert_to_ts=True presumably makes the handler perform the
# time-series conversion itself; the later cells do that step manually with
# make_time_series and then omit this flag. Confirm against DataHandler.
dh = DataHandler(df, convert_to_ts=True)

In [5]:
# Run the processing pipeline, then print the summary. The recorded output
# below shows a timing breakdown followed by a data set report.
dh.run_pipeline()
dh.report()

total time: 22.85 seconds
--------------------------------
Breakdown
--------------------------------
Preprocessing              6.68s
Cleaning                   0.35s
Filtering/Summarizing      15.82s
    Data quality           0.22s
    Clear day detect       0.40s
    Clipping detect        7.37s
    Capacity change detect 7.83s


-----------------
DATA SET REPORT
-----------------
length               3.23 years
capacity estimate    3.79 kW
data sampling        5 minutes
quality score        0.96
clearness score      0.52
inverter clipping    False
clipped fraction     0.01
capacity changes     True
time shift errors    False
time zone errors     False
            


### Or convert to a time series manually before creating the DataHandler

In [6]:
# Convert the queried frame manually; the second return value is discarded.
# NOTE(review): this rebinds `df`, so re-running this cell (or re-running the
# earlier DataHandler(df, convert_to_ts=True) cell afterwards) would operate on
# the already-converted frame. Run the notebook top to bottom on a fresh kernel.
df, _ = make_time_series(df)

In [7]:
# convert_to_ts is not passed here because `df` was already converted by
# make_time_series in the previous cell.
dh = DataHandler(df)
# Same pipeline run and summary as above; the recorded report output matches
# the one produced with convert_to_ts=True.
dh.run_pipeline()
dh.report()

total time: 23.33 seconds
--------------------------------
Breakdown
--------------------------------
Preprocessing              6.73s
Cleaning                   0.40s
Filtering/Summarizing      16.20s
    Data quality           0.23s
    Clear day detect       0.42s
    Clipping detect        6.90s
    Capacity change detect 8.66s


-----------------
DATA SET REPORT
-----------------
length               3.23 years
capacity estimate    3.79 kW
data sampling        5 minutes
quality score        0.96
clearness score      0.52
inverter clipping    False
clipped fraction     0.01
capacity changes     True
time shift errors    False
time zone errors     False
            
