# Analysis of Original Data
Initial analysis of the 30-minute-interval USB data.
## Prerequisites

In [1]:
import toml
from sqlalchemy import create_engine
import pandas as pd

# Read the project configuration and select the local database settings.
conf = toml.load('../../conf.toml')
db = conf['database']['local']

# Fill the connection URL from the settings (user, password, host, port,
# database name, in that order) and open a connection through psycopg2.
conn = create_engine(
    'postgresql+psycopg2://{}:{}@{}:{}/{}'.format(
        *(db[field] for field in ('user', 'password', 'host', 'port', 'name'))
    )
).connect()

# Load the complete pv_org table into a DataFrame and show its column dtypes.
pv = pd.read_sql('SELECT * FROM pv_org', conn)
pv.dtypes

date                       object
time                       object
inverter_no                 int64
device_type                 int64
periode_s                 float64
energy_positiv_ws         float64
reactive_energy_l_vars    float64
reactive_energy_c_vars    float64
uac_l1_v                  float64
iac_l1_a                  float64
udc_mppt1_v               float64
idc_mppt1_a               float64
udc_mppt2_v               float64
idc_mppt2_a               float64
description                object
dtype: object

## Explanation of Columns
### date and time
- Night: about every 90 minutes, 4 observations
- Day: every 30 minutes, 1 observation

### inverter_no
- all observations are 1

### device_type
- all observations are 76

### periode_s
- number of seconds between observations
- at night NaN
- at day 1800 (30 minutes)

### energy_positiv_ws
- Ws: watt seconds
- at night NaN
- Energy produced in last half hour

### reactive_energy_l_vars and reactive_energy_c_vars
- VAR: volt-ampere reactive
- at night NaN
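- 1 VAR has the same dimension as 1 W (1 V·A), but it measures reactive power instead of real power
- electrical energy that is not available as useful work (it oscillates between source and load)
- occurs in AC circuits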
- inductive (l), capacitive (c) load

### uac_l1_v
- V: Volt
- at night NaN
- voltage at output
- about 230 V, as in the German electricity grid

### iac_l1_a
- A: Ampere
- at night NaN
- current at output

### udc_mppt1_v and udc_mppt2_v
- at night NaN
- voltage at input
- 2 inputs

### idc_mppt1_a and idc_mppt2_a
- at night NaN
- current at input
- 2 inputs

### description
- at day NaN
- at night: about every 90 minutes 4 observations

In [2]:
# Display the loaded frame; the rendered output shows only the first and last rows.
pv

Unnamed: 0,date,time,inverter_no,device_type,periode_s,energy_positiv_ws,reactive_energy_l_vars,reactive_energy_c_vars,uac_l1_v,iac_l1_a,udc_mppt1_v,idc_mppt1_a,udc_mppt2_v,idc_mppt2_a,description
0,2020-10-12,21:53:33,1,76,,,,,,,,,,,Display Information
1,2020-10-12,21:53:33,1,76,,,,,,,,,,,V0.3.23 Build 0
2,2020-10-12,21:53:33,1,76,,,,,,,,,,,"12.10.2020 20:30:55 Info 017, Counter 2302"
3,2020-10-12,21:53:33,1,76,,,,,,,,,,,Logging Start
4,2020-10-12,23:17:36,1,76,,,,,,,,,,,Display Information
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5784,2020-12-18,18:37:48,1,76,,,,,,,,,,,Logging Start
5785,2020-12-18,20:01:56,1,76,,,,,,,,,,,Display Information
5786,2020-12-18,20:01:56,1,76,,,,,,,,,,,V0.3.23 Build 0
5787,2020-12-18,20:01:56,1,76,,,,,,,,,,,"18.12.2020 18:39:18 Info 017, Counter 3447"


In [3]:
# Summary statistics (count, mean, std, min, quartiles, max) for the numeric columns.
pv.describe()

Unnamed: 0,inverter_no,device_type,periode_s,energy_positiv_ws,reactive_energy_l_vars,reactive_energy_c_vars,uac_l1_v,iac_l1_a,udc_mppt1_v,idc_mppt1_a,udc_mppt2_v,idc_mppt2_a
count,5789.0,5789.0,1205.0,1205.0,1205.0,1205.0,1205.0,1205.0,1205.0,1205.0,1205.0,1205.0
mean,1.0,76.0,1800.13112,1212920.0,19525.678838,3102.26639,219.718091,2.875253,156.083983,1.947768,158.164315,2.000423
std,0.0,0.0,4.725108,1739445.0,20898.856762,1859.573549,55.462679,4.072522,43.246186,2.655767,43.659544,2.7295
min,1.0,76.0,1799.0,0.0,0.0,0.0,0.0,0.0,60.8,0.0,61.3,0.0
25%,1.0,76.0,1800.0,37915.0,8220.0,1820.0,232.3,0.14,118.0,0.29,120.3,0.29
50%,1.0,76.0,1800.0,407469.0,10807.0,2832.0,233.6,0.97,180.3,0.73,182.6,0.71
75%,1.0,76.0,1800.0,1680593.0,23523.0,4251.0,234.9,3.99,190.2,2.42,191.5,2.62
max,1.0,76.0,1964.0,8146009.0,105401.0,11302.0,239.7,19.14,213.4,13.92,206.6,13.83
