# Import

In [1]:
from IPython.core.interactiveshell import InteractiveShell
InteractiveShell.ast_node_interactivity = "all"

In [2]:
import numpy as np
import pandas as pd
# import dask
import dask.dataframe as dd
import geopandas as gpd

from pathlib import Path
import sys
import os
import glob
import multiprocessing as mp
from datetime import date

from tqdm.notebook import tqdm

pd.options.mode.chained_assignment = None  # default='warn'

# Data

In [3]:
%%time
# Folders
repository = Path.cwd()
dataFolder = repository.parent.parent / 'InOutRepoData' / 'FFE'
folder = repository / 'data' / 'comparison_arcpy'

CPU times: user 177 µs, sys: 0 ns, total: 177 µs
Wall time: 171 µs


In [14]:
%%time
# Data

wind_data = pd.read_csv(repository / 'data' / 'Copy_of_GD_wind.csv')

edgelist = pd.read_parquet(repository / 'data' / 'Copy_of_edge_data.parquet', engine='pyarrow')

CPU times: user 179 ms, sys: 124 ms, total: 302 ms
Wall time: 248 ms


**data from the scenario HikWgtnMin_pfour_1-100     
scenario1 initial ignition BLDG_ID : 217, 686, 32, 166, 15, 937, 46 which translate into edge_id 216, 685, 31, 165, 14, 936, 45 (because based on index)**

**Wind speed - critical distance 45m
Wind direction NW**

**18min processing time**

In [6]:
rngdata = {'source':[216, 685, 31, 165, 14, 936, 45], 'IgnProb_bl':[1, 1, 1, 1, 1, 1, 1]} 
rngFile = pd.DataFrame(rngdata)

## Parallel computing set up

## Functions

In [10]:
# %%px

def wind_scenario(wind_data):
      import numpy as np
      i = np.random.randint(0, wind_data.values.shape[0])
      w = wind_data.values[i, 2]
      dist = wind_data.values[i, 1]
      b = wind_data.values[i, 3]
      bear_max = b + 45  # wind direction
      bear_min = b - 45
      if b == 360:
          bear_max = 45
      if b <= 0:  # should not be necessary
          bear_min = 0
      if b == 999:
          bear_max = 999
          bear_min = 0
      return bear_max, bear_min, dist # wind characteristics, bearing and distance


def ignition(rngList=rngFile, edges=edgelist):
    import numpy as np
    import pandas as pd
    rngList['rng'] = np.random.uniform(0, 1, size=rngList.values.shape[0])
    rngList = rngList[rngList['rng'] < rngList['IgnProb_bl']]
    initialIgnitions = len(rngList)
    NewActiveEdges = edges[edges['source'].isin(rngList['source'])]
    return NewActiveEdges, initialIgnitions


def mask(t, activeEdges_d, listActivatedSources_d, w_b_max, w_b_min, w_d):
    import numpy as np
    if t==0: # special case at time=0
        return activeEdges_d
    else:
        mask = (activeEdges_d.bearing.values < w_b_max) & (activeEdges_d.bearing.values < w_b_min) & (activeEdges_d.distance < w_d)
        NewActiveEdges = activeEdges_d[mask]
        NewActiveEdges = NewActiveEdges[~NewActiveEdges.source.isin(listActivatedSources_d)]
        return NewActiveEdges


def propagation(activeEdges_d, edges=edgelist):
    import numpy as np
    import pandas as pd
    NewActiveEdges = edges[edges.source.isin(activeEdges_d.target)]
    return NewActiveEdges

In [20]:
# @dview.parallel(block = False) # The @parallel decorator breaks up elementwise operations and distributes them.
def ffe_runs(n):
    import numpy as np
    import pandas as pd
    from datetime import date
    for scenario in n:
        # initial setup
        listActivatedSources = []
        listScenarioDataframes = []
        condition = True
        time = 0 
        # wind conditions
        w_bearing_max, w_bearing_min, w_distance = wind_scenario(wind_data)
        # ignition / initial state and edges selection
        ActiveEdges, numberIgnitions = ignition()
        if ActiveEdges.empty:
            print(f"no ignitions {numberIgnitions}")
            condition = False
            continue
        while condition: # spread burn zone
            ActiveEdges = mask(time, ActiveEdges, listActivatedSources, w_bearing_max, w_bearing_min, w_distance)
            if ActiveEdges.empty: #no more buildings to burn
                break
            burns = ActiveEdges.drop_duplicates(['source'], inplace=False)
#             print(f"Active edges {len(ActiveEdges)} / no duplicate = {len(burns)}")
            burns['time'] = time
            listScenarioDataframes.append(burns)
            listActivatedSources.extend(ActiveEdges.source.values)
            ActiveEdges = propagation(ActiveEdges)
            time += 1
        
        print(f'finishing scenario --- {scenario} time ---- {time} \n started with {numberIgnitions} ignitions ')

        Activations = pd.concat(listScenarioDataframes)
        Activations["scenario"] = scenario
        Activations["InitialIgnitions"] = numberIgnitions
        Activations.to_parquet(folder / f'scenario{scenario}_{str(date.today())}.parquet', engine='auto', compression="GZIP")

# Run

In [21]:
%%time
ffe_runs(range(1))

finishing scenario --- 0 time ---- 83 
 started with 7 ignitions 
CPU times: user 10.1 s, sys: 2.38 s, total: 12.4 s
Wall time: 12.5 s



### Post processing and comparison

In [7]:
comparisonFolder = Path('/home/alexd/InOutRepoData/FFE/ProbaScenariosInput/comparisonArcPyResults')

In [13]:
testNetScenario = pd.read_parquet(comparisonFolder / 'scenario0_2020-09-04.parquet')
testArc = gpd.read_file(comparisonFolder / 'HikWgtnMin_pfourARCPY.shp')
testArcScenario = testArc.iloc[:,:9]

testArcScenario
testNetScenario

Unnamed: 0,OBJECTID,Replacemen,Combustibl,FloorArea,BLDG_ID,SA2_ID,NightOccup,IgnProbBld,Ignited1
0,1.0,271128.0,1,156.0,1,67,3.0,0.000069,0
1,2.0,66044.0,1,38.0,2,75,1.0,0.000085,0
2,3.0,56944.0,1,21.0,3,23,0.0,0.000107,0
3,4.0,307626.0,1,177.0,4,38,3.0,0.000063,38
4,5.0,342386.0,1,197.0,5,60,3.0,0.000103,0
...,...,...,...,...,...,...,...,...,...
73730,73731.0,330220.0,1,190.0,73731,33,3.0,0.000069,0
73731,73732.0,357378.0,1,132.0,73732,63,2.0,0.000085,0
73732,73733.0,939420.0,1,340.0,73733,23,5.0,0.000107,0
73733,73734.0,307626.0,1,177.0,73734,64,3.0,0.000285,0


Unnamed: 0,source,target,distance,bearing,IgnProb_bl,time,scenario,InitialIgnitions
515,14,3033,75.748970,224.277611,0.000326,0,0,7
1238,31,28,23.863988,44.646598,0.000352,0,0,7
1934,45,46,75.747227,231.780053,0.000476,0,0,7
7080,165,24118,60.728622,277.114749,0.000167,0,0,7
9296,216,29015,15.098701,207.438212,0.000234,0,0,7
...,...,...,...,...,...,...,...,...
1620224,35699,34856,9.052844,55.727160,0.000362,81,0,7
1620274,35700,34856,5.491216,25.324895,0.000362,81,0,7
1567686,34847,34868,33.237173,26.008368,0.000362,82,0,7
1568107,34856,35150,0.557125,19.652963,0.000362,82,0,7


In [15]:
# merge geometry to scenario
# merge each line / source with geometry 
shape = gpd.read_file('data/shapefile/BuildingFootprints.shp')
shape = shape[['BLDG_ID', 'geometry']]
ScenarioARC = pd.merge(testArcScenario, shape, how='left', left_on='BLDG_ID', right_index=True)
ScenarioNET = pd.merge(, shape, how='left', left_on='BLDG_ID', right_index=True)

#### Create Gif for comparisons 

In [71]:
def save_png(df, path):
    gdf = gpd.GeoDataFrame(df, geometry=df.geometry)
    mapShape = gpd.read_file(path / 'WellWHV_Buildings.shp')
    for t in tqdm(range(max(gdf.time))):
        gdfT = gdf[gdf.time<=t]
        # plot
        fig, ax = plt.subplots(figsize = (20,16)) 
        gdfT.plot(color="red", edgecolor=None, ax=ax)
        mapShape.geometry.boundary.plot(color=None,edgecolor='k',linewidth = 0.1,ax=ax)
        # savefig
        plt.savefig(os.path.join(str(pathShapefile), 'gif', f'{t}.png'), dpi=70)
        plt.close()

In [72]:
save_png(worstScenario, path=pathShapefile)

HBox(children=(FloatProgress(value=0.0, max=145.0), HTML(value='')))


