In [1]:
import gpw_queries as gpw
from river_inputs_loader import load_river_inputs
import geometry_helper as gh

# Filter data

In [2]:
# Fetch the site records for the country under study via the gpw query helper.
COUNTRY_NAME = "india"
data = gpw.get_sites_by_country(COUNTRY_NAME)

In [3]:
# List the column labels available on the returned frame.
data.columns

Index(['geometry', 'Distance to Waterway (m)', 'Drainage Direction',
       'Elevation', 'Fine Earth Density (kg / m^3)',
       'Height Above Nearest Drainage (m)', 'Landform Type',
       'Nearest Water Type', 'Population - 1 km', 'Population - 10 km',
       'Population - 5 km', 'Slope (degrees)', 'Soil Clay Fraction',
       'Soil Great Group', 'Soil Sand Fraction',
       'Upstream Drainage Area (km^2)', 'area', 'area (km^2)', 'country', 'id',
       'place_name', 'risk'],
      dtype='object')

In [4]:
# Preview the first five rows to sanity-check the columns and value formats.
data.head(n=5)

Unnamed: 0,geometry,Distance to Waterway (m),Drainage Direction,Elevation,Fine Earth Density (kg / m^3),Height Above Nearest Drainage (m),Landform Type,Nearest Water Type,Population - 1 km,Population - 10 km,...,Soil Clay Fraction,Soil Great Group,Soil Sand Fraction,Upstream Drainage Area (km^2),area,area (km^2),country,id,place_name,risk
0,POINT (77.43796 9.94385),1871.306840842308,east,353,143,21.39999389648437,Upper slope (warm),reservoir,1861,236418,...,0.28,0,0.5,0.0252659060060977,1994.3882920761755,0.0019943882920761,India,8f603571132eb30,"Veerapandi - Seeppalakottai Road, Theni, Theni...",0.1713068804547574
1,POINT (74.99707 23.35251),739.0126046637928,west,476,154,8.100006103515625,Lower slope (flat),river,1056,287216,...,0.46,0,0.26,0.0157201029360294,5852.5284566601495,0.0058525284566601,India,8f42c92d04d554c,"Junwaniya, Ratlam Nagar Tahsil, Ratlam, Madhya...",0.1467348507525438
2,POINT (74.94934 28.31923),1378.338405725306,northwest,287,147,2.899993896484375,Lower slope (flat),water,2759,108979,...,0.25,0,0.5,0.0075418390333652,1997.3005165642269,0.0019973005165642,India,8f3da4446642a21,"Gajsar, Churu Tehsil, Churu, Rajasthan, 331001...",0.2029740094501775
3,POINT (70.21870 21.79124),508.6261516453608,southeast,54,159,0.0,Lower slope (flat),river,3848,120337,...,0.35,0,0.32,4.847708702087402,10409.84764771634,0.0104098476477163,India,8f42c2146d43646,"Upleta Taluka, Rajkot, Gujarat, India",0.24046623006271
4,POINT (73.48358 22.49636),210.26582578754727,northwest,115,159,4.0,Lower slope (flat),river,6343,206876,...,0.32,1,0.43,0.0158179905265569,16298.18846145113,0.0162981884614511,India,8f42cab439852a4,"Halol Bypass SH-05, Halol, Halol Taluka, Panch...",0.3084192893633979


In [5]:
# Inspect the distance column on its own; its dtype matters for the filtering below.
data.loc[:, 'Distance to Waterway (m)']

0       1871.306840842308
1       739.0126046637928
2       1378.338405725306
3      508.62615164536084
4      210.26582578754727
              ...        
685    336.87317224562213
686    295.26655669173886
687    3170.4405343611684
688    246.84113671488052
689    1105.2848079475004
Name: Distance to Waterway (m), Length: 690, dtype: object

In [6]:
# Narrow the sites down to those close to a waterway of an accepted type.
#
# 'Distance to Waterway (m)' is stored with dtype=object, so it has to be cast
# before any numeric comparison. float64 is used instead of float32: in float32
# a distance marginally above the cut-off (e.g. 500.00001) rounds onto 500.0
# and would wrongly pass the `<=` test.
DISTANCE_COLUMN = 'Distance to Waterway (m)'
MAX_DISTANCE_TO_WATERWAY_M = 500.0
# Rows whose distance equals this value are dropped explicitly below;
# presumably it marks "no distance available" -- TODO confirm with the data source.
MISSING_DISTANCE_SENTINEL = -1
ACCEPTED_WATER_TYPES = ['water', 'stream', 'river', 'coastline', 'drain', 'canal']

# Step 1: within the maximum distance of a waterway.
filtered_by_water_proximity = data[
    data[DISTANCE_COLUMN].astype('float64') <= MAX_DISTANCE_TO_WATERWAY_M
]

# Step 2: nearest water body is one of the accepted types.
filtered_by_watertype = filtered_by_water_proximity[
    filtered_by_water_proximity['Nearest Water Type'].isin(ACCEPTED_WATER_TYPES)
]

# Step 3: discard sentinel distances (they also satisfy the `<=` test in step 1).
filtered = filtered_by_watertype[
    filtered_by_watertype[DISTANCE_COLUMN].astype('float64') != MISSING_DISTANCE_SENTINEL
]
print(len(filtered))

204


In [7]:
# Rank the candidates: highest risk first, then closest to water, then smallest area.
#
# 'Distance to Waterway (m)' is displayed above with dtype=object and needs an
# explicit cast before it can be compared numerically. Sorting such a column
# as-is would order string values lexicographically (e.g. "101.3" before "20.5").
# The `key` casts each sort column to float64 for ordering purposes only; the
# values stored in the frame are left untouched.
# NOTE(review): 'risk' and 'area (km^2)' are assumed to be castable to float
# as well -- confirm against the data source.
filtered = filtered.sort_values(
    by=['risk', 'Distance to Waterway (m)', 'area (km^2)'],
    ascending=[False, True, True],
    key=lambda column: column.astype('float64'),
)


# Enhance GPW data with other datasets

In [8]:
# Load the river inputs shapefile; the relative path is handed to the loader as-is.
RIVER_INPUTS_PATH = "river_inputs/PlasticRiverInputs.shp"
river_inputs_gdf = load_river_inputs(RIVER_INPUTS_PATH)

In [9]:
# Pair each filtered site with a river-input point, keep only the pairs whose
# 'dist' is at most 0.5, and list the largest 'm_out_max' values first.
cross_df = (
    gh.ckd_nearest_point_to_point(filtered, river_inputs_gdf)
    .loc[lambda matched: matched['dist'].astype('float32') <= 0.5]
    .sort_values(by="m_out_max", ascending=False)
)

In [10]:
# Report how many matched sites remain, then preview the top-ranked rows.
print(cross_df.shape[0])
cross_df.head(n=5)

79


Unnamed: 0,geometry,Distance to Waterway (m),Drainage Direction,Elevation,Fine Earth Density (kg / m^3),Height Above Nearest Drainage (m),Landform Type,Nearest Water Type,Population - 1 km,Population - 10 km,...,m_out_jul,m_out_aug,m_out_sep,m_out_oct,m_out_nov,m_out_dec,area,mpw,m_out_max,dist
187,POINT (88.33540 22.66677),442.1206350423517,south,5,127,0.0,Valley,river,3329,4137416.0,...,404580500.0,1246114000.0,1079263000.0,347070800.0,32172280.0,5919650.0,29721300000.0,98736400.0,1246114000.0,0.430054
13,POINT (73.11779 19.25087),101.34313832744114,west,3,147,3.299999952316284,Lower slope (flat),river,17824,2026968.0,...,236288300.0,215478900.0,101026400.0,7588453.0,204193.4,29738.24,4555700000.0,14350400.0,236288300.0,0.208528
197,POINT (73.12484 19.27815),332.34778015490525,northwest,6,148,8.100000381469727,Lower slope (flat),water,3784,1813954.0,...,236288300.0,215478900.0,101026400.0,7588453.0,204193.4,29738.24,4555700000.0,14350400.0,236288300.0,0.212544
116,POINT (72.82799 19.23437),466.33569222405686,southeast,6,102,3.700000047683716,Lower slope (warm),river,40916,3896986.0,...,47292230.0,26237170.0,13819680.0,1328835.0,184904.6,62023.1,55900000.0,3112740.0,47292230.0,0.003343
29,POINT (72.93513 19.06160),208.91423138532335,south,6,144,7.0,Lower slope (flat),water,76615,5339669.0,...,41633580.0,24181220.0,12130290.0,1041626.0,134103.6,44328.32,59200000.0,2928760.0,41633580.0,0.02738
