In [1]:
import numpy as np
import pandas as pd
import re
from sklearn.ensemble import RandomForestRegressor
from sklearn.model_selection import train_test_split
from scipy.stats import norm, lognorm, anderson, kstest
from sklearn import metrics
from rf_functions import data_setup, run_rf
import matplotlib.pyplot as plt
import seaborn as sns
from datetime import datetime
import warnings
# Session-wide settings: both statements below change global state for every
# later cell in the notebook.
# Silence all RuntimeWarning messages.
warnings.filterwarnings("ignore", category=RuntimeWarning)
# Disable pandas' chained-assignment (SettingWithCopy) check entirely.
pd.options.mode.chained_assignment = None

In [2]:
# Input tables, the output folder, and the file prefix later passed to run_rf.
s1_fp, stats_fp, moran_fp = (
    'input_data/s1_zonal_data.csv',
    'output/stats/scale_shape_both_dates.csv',
    'input_data/moran_max.csv',
)
output_d = 'output/'
out_file_prefix = 'func_test_dB'

targets, predictors = data_setup(
    s1_fp, stats_fp, moran_fp, s1_units='dB', date=None
)

# Split the target columns by the date token embedded in their names.
# NOTE(review): the `0302` variables select on the '0304' token -- confirm
# which label is the intended one.
cols_0219 = [col for col in targets.columns if '0219' in col]
cols_0302 = [col for col in targets.columns if '0304' in col]

# Everything without a date token is shared by both dates, except the two
# columns dropped here (a missing one raises ValueError).
cols_misc = [
    col for col in targets.columns
    if not ('0219' in col or '0304' in col)
]
cols_misc.remove('Point_ID')
cols_misc.remove('moran_p')

cols_0219.extend(cols_misc)
cols_0302.extend(cols_misc)

# One target frame per date, keeping only rows with no missing values.
targets_0219 = targets.loc[:, cols_0219].dropna()
targets_0302 = targets.loc[:, cols_0302].dropna()

# Per-date runs, currently disabled:
# run_rf(targets_0219, predictors.loc[targets_0219.index], n_runs=100, 
#        rf_type='single_target', output_dir=output_d, out_file_prefix=out_file_prefix)
# run_rf(targets_0302, predictors.loc[targets_0302.index], n_runs=100, 
#        rf_type='single_target', output_dir=output_d, out_file_prefix=out_file_prefix)


In [4]:
def remove_date(col, dates=('0219', '0304')):
    """Return ``col`` with its date token and one adjoining separator removed.

    The first entry of ``dates`` that occurs in ``col`` is cut out together
    with the single character that follows it. When the token is the last
    thing in the name there is no following character, so a preceding ``'_'``
    is dropped instead; this avoids a dangling separator
    (``'scale_0219'`` -> ``'scale'``). Afterwards the first ``'_1_'`` in the
    result is collapsed to ``'_'``.

    Parameters
    ----------
    col : str
        Column name to clean.
    dates : iterable of str, optional
        Date tokens to look for, tried in the given order. Empty tokens are
        ignored. Defaults to the two tokens used in this notebook.

    Returns
    -------
    str
        The cleaned name, or ``col`` unchanged when it contains no token.
    """
    token = next((d for d in dates if d and d in col), None)
    if token is None:
        return col

    date_start = col.index(token)
    date_end = date_start + len(token)
    head = col[:date_start]
    # Skip the token plus the one character right after it.
    tail = col[date_end + 1:]
    if date_end == len(col) and head.endswith('_'):
        # Token closes the name: remove the separator in front of it instead.
        head = head[:-1]
    new_col = head + tail

    if '_1_' in new_col:
        # Drop the '_1' part of the first '_1_' so a single '_' remains.
        ind = new_col.index('_1_')
        new_col = new_col[:ind] + new_col[ind + 2:]
    return new_col

# Strip the date tokens so both per-date frames expose the same target names.
cols_0219_new = [remove_date(c) for c in cols_0219]
cols_0302_new = [remove_date(c) for c in cols_0302]

targets_0219.columns = cols_0219_new
targets_0302.columns = cols_0302_new

# Stack the two dates row-wise into one target table. Index labels are kept
# as they are, so a label present in both frames appears twice in the result.
targets_all = pd.concat([targets_0219, targets_0302])

# NOTE(review): `predictors` is passed whole and is not subset or re-indexed
# to match the rows of `targets_all` -- confirm run_rf aligns them itself.
run_rf(targets_all, predictors, n_runs=100, rf_type='single_target', 
       output_dir=output_d, out_file_prefix=out_file_prefix)

here
2022-07-05 18:11:07 -- Starting single target RF regression (91 targets total).
2022-07-05 18:11:07 -- Starting target zonal_5m_p95_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 18:33:31 -- Starting target zonal_5m_p95_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 18:55:28 -- Starting target zonal_5m_p95_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 19:17:58 -- Starting target zonal_5m_p5_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 19:40:27 -- Starting target zonal_5m_p5_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 20:02:53 -- Starting target zonal_5m_p5_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 20:25:12 -- Starting target zonal_5m_max_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 20:47:34 -- Starting target zonal_5m_max_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 21:09:42 -- Starting target zonal_5m_med_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 21:32:05 -- Starting target zonal_5m_med_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 21:55:12 -- Starting target zonal_5m_med_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 22:17:49 -- Starting target zonal_5m_min_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 22:40:18 -- Starting target zonal_5m_min_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 23:02:18 -- Starting target zonal_5m_range_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 23:24:28 -- Starting target zonal_5m_range_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-05 23:46:52 -- Starting target zonal_5m_range_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 00:08:33 -- Starting target zonal_2m_max_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 00:29:07 -- Starting target zonal_2m_max_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 00:49:36 -- Starting target zonal_2m_med_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 01:09:55 -- Starting target zonal_2m_med_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 01:30:32 -- Starting target zonal_2m_med_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 01:50:56 -- Starting target zonal_2m_min_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 02:11:18 -- Starting target zonal_2m_min_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 02:31:38 -- Starting target zonal_2m_range_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 02:52:08 -- Starting target zonal_2m_range_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 03:12:43 -- Starting target zonal_2m_range_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 03:33:22 -- Starting target zonal_2m_p5_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 03:53:47 -- Starting target zonal_2m_p5_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 04:14:22 -- Starting target zonal_2m_p5_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 04:34:45 -- Starting target zonal_2m_p95_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 04:55:15 -- Starting target zonal_2m_p95_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 05:15:47 -- Starting target zonal_2m_p95_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 05:36:14 -- Starting target zonal_1m_max_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 05:56:55 -- Starting target zonal_1m_max_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 06:17:24 -- Starting target zonal_1m_med_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 06:38:03 -- Starting target zonal_1m_med_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 06:59:05 -- Starting target zonal_1m_med_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 07:20:09 -- Starting target zonal_1m_min_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 07:41:33 -- Starting target zonal_1m_min_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 08:01:52 -- Starting target zonal_1m_range_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 08:22:22 -- Starting target zonal_1m_range_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 08:42:59 -- Starting target zonal_1m_range_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 09:03:54 -- Starting target zonal_1m_p5_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 09:24:55 -- Starting target zonal_1m_p5_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 09:47:35 -- Starting target zonal_1m_p5_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 10:09:57 -- Starting target zonal_1m_p95_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 10:32:08 -- Starting target zonal_1m_p95_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 10:54:45 -- Starting target zonal_1m_p95_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 11:18:23 -- Starting target zonal_50cm_max_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 11:41:34 -- Starting target zonal_50cm_max_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 12:04:21 -- Starting target zonal_50cm_med_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 12:28:12 -- Starting target zonal_50cm_med_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 12:51:54 -- Starting target zonal_50cm_med_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 13:13:52 -- Starting target zonal_50cm_min_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 13:37:03 -- Starting target zonal_50cm_min_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 13:59:41 -- Starting target zonal_50cm_range_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 14:22:04 -- Starting target zonal_50cm_range_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 14:44:22 -- Starting target zonal_50cm_range_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 15:06:24 -- Starting target zonal_50cm_p5_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 15:28:37 -- Starting target zonal_50cm_p5_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 15:51:47 -- Starting target zonal_50cm_p5_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 16:14:11 -- Starting target zonal_50cm_p95_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 16:36:55 -- Starting target zonal_50cm_p95_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 16:59:49 -- Starting target zonal_50cm_p95_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 17:22:08 -- Starting target zonal_25cm_max_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 17:44:28 -- Starting target zonal_25cm_max_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 18:06:28 -- Starting target zonal_25cm_med_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 18:28:35 -- Starting target zonal_25cm_med_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 18:50:35 -- Starting target zonal_25cm_med_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 19:11:35 -- Starting target zonal_25cm_min_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 19:32:59 -- Starting target zonal_25cm_min_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 19:54:04 -- Starting target zonal_25cm_range_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 20:15:03 -- Starting target zonal_25cm_range_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 20:36:16 -- Starting target zonal_25cm_range_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 20:57:09 -- Starting target zonal_25cm_p95_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 21:18:11 -- Starting target zonal_25cm_p95_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 21:39:24 -- Starting target zonal_25cm_p95_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 22:00:17 -- Starting target zonal_25cm_p5_max


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 22:21:21 -- Starting target zonal_25cm_p5_min


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 22:43:37 -- Starting target zonal_25cm_p5_mean


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 23:05:10 -- Starting target roughness_p5


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 23:27:14 -- Starting target roughness_p25


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-06 23:49:14 -- Starting target roughness_p75


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-07 00:11:09 -- Starting target roughness_p95


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-07 00:32:58 -- Starting target iqr


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-07 00:53:45 -- Starting target p95-p5


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-07 01:14:45 -- Starting target scale


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-07 01:35:35 -- Starting target shape


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-07 01:56:19 -- Starting target ks


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-07 02:17:01 -- Starting target moran


  0%|          | 0/100 [00:00<?, ?it/s]

2022-07-07 02:38:01 -- Starting target moran_z


  0%|          | 0/100 [00:00<?, ?it/s]