# Prepare Google Earth Engine Dataset

Author: Ivan Zvonkov

Last modified: June 25, 2024

Description: Takes the processed CSV files from `data/datasets` and converts them into simplified CSV files that can be uploaded as GEE table assets.



In [1]:
import pandas as pd

In [9]:
# Read the five processed dataset CSVs; the order of the paths below
# matches the order of the names on the left-hand side.
df1, df2, df3, df4, df5 = (
    pd.read_csv(csv_path)
    for csv_path in (
        "../../data/datasets/Hawaii_CEO_2020.csv",
        "../../data/datasets/HawaiiAgriculturalLandUse2020.csv",
        "../../data/datasets/HawaiiAgriculturalLandUse2020Subset.csv",
        "../../data/datasets/HawaiiCorrective2020.csv",
        "../../data/datasets/HawaiiCorrectiveGuided2020.csv",
    )
)

In [10]:
# Give every frame the same column names before filtering and export.
# DataFrame.rename skips labels that a frame does not have (default
# errors="ignore"), so one mapping can be applied to all five frames.
renames = {
    "class_probability": "is_crop",
    "lat": "latitude",
    "lon": "longitude",
}
for df in (df1, df2, df3, df4, df5):
    # In-place so the existing df1..df5 names see the renamed columns.
    df.rename(renames, axis="columns", inplace=True)

In [11]:
# Keep only df1 rows whose is_crop value is not exactly 0.5 and that have
# more than one labeler.
# NOTE(review): presumably 0.5 marks a tie between labelers — confirm.
df1 = df1.loc[df1["is_crop"].ne(0.5) & df1["num_labelers"].gt(1)]

In [21]:
# Preview the subset frame after the column renames; pandas truncates the
# middle rows of a long frame in the rendered output.
df3

Unnamed: 0,objectid,crops_2020,island,acreage,st_areasha,st_perimet,geometry,start_date,end_date,latitude,longitude,subset,is_crop,eo_status,eo_data,eo_lat,eo_lon,eo_file
0,3603,Macadamia Nuts,Big Island,74.251099,3.009922e+05,2493.443380,POLYGON ((-155.48163800219658 19.2501737246023...,2020-01-01,2021-12-31,19.246651,-155.478457,training,1.0,eo_data_complete,"[[-10.722673840989376, -16.00940534093112, 891...",19.246630,-155.478478,min_lat=19.2459_min_lon=-155.4792_max_lat=19.2...
1,534,Diversified Crop,Big Island,5.286180,2.141438e+04,776.452401,POLYGON ((-155.6856571491883 20.01503428014222...,2020-01-01,2021-12-31,20.015103,-155.685940,training,1.0,eo_data_complete,"[[-8.725794581725804, -14.326780156285752, 891...",20.015138,-155.685899,min_lat=20.0144_min_lon=-155.6867_max_lat=20.0...
2,667,Macadamia Nuts,Big Island,5.012700,2.029946e+04,601.945311,POLYGON ((-155.80039286358922 20.2220171318779...,2020-01-01,2021-12-31,20.222997,-155.800529,training,1.0,eo_data_complete,"[[-11.246407877966822, -17.39068462501195, 934...",20.223008,-155.800524,min_lat=20.2223_min_lon=-155.8013_max_lat=20.2...
3,4630,Diversified Crop,Oahu,7.672060,3.084165e+04,700.092454,POLYGON ((-158.09106890904232 21.5366251785891...,2020-01-01,2021-12-31,21.536440,-158.089887,training,1.0,eo_data_complete,"[[-9.661015311449251, -14.91925380361867, 1013...",21.536435,-158.089881,min_lat=21.5357_min_lon=-158.0907_max_lat=21.5...
4,2049,Banana,Big Island,2.363230,9.591609e+03,456.477891,"POLYGON ((-155.1010169799786 19.8448752701613,...",2020-01-01,2021-12-31,19.844294,-155.101180,training,1.0,eo_data_complete,"[[-2.496108260734728, -12.64099781026996, 928....",19.844279,-155.101186,min_lat=19.8436_min_lon=-155.1019_max_lat=19.8...
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
324,2613,Macadamia Nuts,Big Island,74.481201,3.015362e+05,4541.133044,POLYGON ((-155.87706622087327 19.4260830277771...,2020-01-01,2021-12-31,19.423378,-155.876224,training,1.0,eo_data_complete,"[[-11.05321712725342, -15.104622713257791, 741...",19.423418,-155.876252,min_lat=19.4227_min_lon=-155.877_max_lat=19.42...
325,2320,Diversified Crop,Big Island,42.515499,1.725014e+05,2147.460583,POLYGON ((-155.20195491459984 19.9541256475104...,2020-01-01,2021-12-31,19.954389,-155.200474,training,1.0,eo_data_complete,"[[-8.09734605030693, -14.13202783099192, 1066....",19.954412,-155.200449,min_lat=19.9537_min_lon=-155.2012_max_lat=19.9...
326,2257,Pasture,Big Island,4863.270020,1.973283e+07,36291.822574,POLYGON ((-155.18463196245165 19.9350945456247...,2020-01-01,2021-12-31,19.914885,-155.190268,training,1.0,eo_data_complete,"[[-4.374754888392252, -12.005911387399252, 842...",19.914886,-155.190298,min_lat=19.9142_min_lon=-155.191_max_lat=19.91...
327,2669,Coffee,Big Island,2.989330,1.210244e+04,481.842392,POLYGON ((-155.87237324345375 19.4302840532736...,2020-01-01,2021-12-31,19.430577,-155.871562,training,1.0,eo_data_complete,"[[-8.753316229223827, -16.630732275651, 852.0,...",19.430605,-155.871581,min_lat=19.4299_min_lon=-155.8723_max_lat=19.4...


In [22]:
# Columns shared by every exported table.
keep_columns = ["latitude", "longitude", "subset", "is_crop"]


def _write_table(frame, columns, filename):
    """Write the selected ``columns`` of ``frame`` to ``filename`` as CSV, omitting the index."""
    frame[columns].to_csv(filename, index=False)


# Output files are written to the current working directory.
# NOTE(review): df3 is loaded and renamed but never exported — confirm this is intended.
# NOTE(review): df4/df5 are read from "HawaiiCorrective*" files but written as
# "MauiCorrective*" — confirm the naming is deliberate.
_write_table(df1, keep_columns, "HawaiiCEO2020.csv")
_write_table(
    df2,
    keep_columns + ["crops_2020", "island", "acreage"],
    "HawaiiAgriculturalLandUse2020.csv",
)
_write_table(df4, keep_columns, "MauiCorrective2020.csv")
_write_table(df5, keep_columns, "MauiCorrectiveGuided2020.csv")