In [None]:
import numpy as np
import IPython.display as disp
import geopandas as gpd
from geemap import geopandas_to_ee
import pandas as pd
import logging
import ee
import numpy as np
from pygeosys.util.dataframe import chunk_dataframe
import folium
import time
from tqdm import tqdm
from functools import reduce

In [None]:
import os

# Run the notebook from the repository root so that the relative paths used in
# later cells (e.g. 'data/00_external/...') resolve.
# The location can be overridden with the TILLAGE_DETECTION_DIR environment
# variable; when it is unset the original hard-coded directory is used, so
# existing setups keep working unchanged.
PROJECT_DIR = os.environ.get(
    'TILLAGE_DETECTION_DIR',
    r'C:/Users/lwh/OneDrive - GEOSYS/Bureau/Documents/PROJECTS/tillage_detection/tillage-detection',
)
os.chdir(PROJECT_DIR)


In [None]:
    # -------------------------------------------------------------------------

    # GEE logging & initialization
    # -------------------------------------------------------------------------

# Root logger shared by the processing cells for their progress messages.
logger = logging.getLogger()

# Initialise the Earth Engine client; no explicit credentials are passed here.
# Service-account variant, kept for reference:
# service_account = 'aubin-allies-sandbox@earthengine-185413.iam.gserviceaccount.com'
# credentials = ee.ServiceAccountCredentials(service_account, '/home/lwh/Documents/aubin-allies-sandbox-earthengine-185413-d486e9739448.json')
ee.Initialize()
    # 

In [None]:
# -----------------------------------------------------------------------------
# Define input parameters
# -----------------------------------------------------------------------------
# Vector file holding the field geometries (path relative to the working directory).
input_filepath = 'data/00_external/Demo_account/Fields_demo_Account_US_only.geojson'
# Chunk size handed to chunk_dataframe in the task-launch cells; adjust it to
# the size of the input file. None disables chunking: the whole dataset is then
# processed as one single chunk.
chunk_size = None


# Load the input vector dataset with geopandas.
geometry_collection = gpd.read_file(input_filepath)

# Sentinel-2

## Functions and parameters

In [None]:
# Constants
# -----------------------------------------------------------------------------

# Parameters for cloud masking
# Upper bound on the CLOUDY_PIXEL_PERCENTAGE image property; images above it
# are dropped in get_s2_sr_cld_col.
CLOUD_FILTER = 60
# s2cloudless 'probability' values strictly greater than this are flagged as
# cloud in add_cloud_bands.
CLD_PRB_THRESH = 50
# B8 (NIR) threshold; it is multiplied by 1e4 in add_shadow_bands and pixels
# below the result are treated as potential cloud shadow.
NIR_DRK_THRESH = 0.15
# Multiplied by 10 and passed as the maximum distance of the directional
# distance transform that projects shadows from clouds.
# NOTE(review): unit of the resulting distance is not visible here - confirm.
CLD_PRJ_DIST = 1
# Dilation of the cloud/shadow mask: used as BUFFER*2/20 for the focalMax radius
# in add_cld_shdw_mask (presumably metres on the 20 m grid - TODO confirm).
BUFFER = 50



In [None]:
# S2 collection with cloud probability
def get_s2_sr_cld_col(aoi, start_date, end_date):
    """Pair Sentinel-2 SR images with their s2cloudless counterpart.

    Args:
        aoi: geometry used to spatially filter both collections.
        start_date: start of the date filter.
        end_date: end of the date filter.

    Returns:
        ee.ImageCollection of 'COPERNICUS/S2_SR' images whose
        CLOUDY_PIXEL_PERCENTAGE is at most CLOUD_FILTER; the join stores the
        matching 'COPERNICUS/S2_CLOUD_PROBABILITY' image under the
        's2cloudless' property of each image.
    """
    # Scene-level cloudiness filter applied to the SR collection only.
    cloudiness_ok = ee.Filter.lte('CLOUDY_PIXEL_PERCENTAGE', CLOUD_FILTER)

    surface_reflectance = (
        ee.ImageCollection('COPERNICUS/S2_SR')
        .filterBounds(aoi)
        .filterDate(start_date, end_date)
        .filter(cloudiness_ok)
    )

    cloud_probability = (
        ee.ImageCollection('COPERNICUS/S2_CLOUD_PROBABILITY')
        .filterBounds(aoi)
        .filterDate(start_date, end_date)
    )

    # Both collections are matched on their 'system:index' property.
    same_index = ee.Filter.equals(
        leftField='system:index',
        rightField='system:index',
    )
    joined = ee.Join.saveFirst('s2cloudless').apply(
        primary=surface_reflectance,
        secondary=cloud_probability,
        condition=same_index,
    )
    return ee.ImageCollection(joined)

In [None]:
# Add clouds band
def add_cloud_bands(img):
    """Append the cloud probability and a binary 'clouds' band to ``img``.

    Args:
        img: image carrying its s2cloudless image in the 's2cloudless' property.

    Returns:
        ``img`` with two extra bands: 'probability' and 'clouds', the latter
        being 1 where probability exceeds CLD_PRB_THRESH.
    """
    s2cloudless_img = ee.Image(img.get('s2cloudless'))
    probability = s2cloudless_img.select('probability')

    # Threshold the probability to get the cloud flag.
    cloud_flag = probability.gt(CLD_PRB_THRESH).rename('clouds')

    extra_bands = ee.Image([probability, cloud_flag])
    return img.addBands(extra_bands)

In [None]:
# Add clouds shadows band
def add_shadow_bands(img):
    """Append 'dark_pixels', 'cloud_transform' and 'shadows' bands to ``img``.

    Args:
        img: image that already has a 'clouds' band plus the 'SCL' and 'B8'
            bands and the MEAN_SOLAR_AZIMUTH_ANGLE property.

    Returns:
        ``img`` with the three shadow-related bands added.
    """
    sr_band_scale = 1e4
    nir_dark_limit = NIR_DRK_THRESH * sr_band_scale

    # Dark NIR pixels that are not water (SCL class 6) are shadow candidates.
    not_water = img.select('SCL').neq(6)
    is_dark_nir = img.select('B8').lt(nir_dark_limit)
    dark_pixels = is_dark_nir.multiply(not_water).rename('dark_pixels')

    # Direction in which clouds cast their shadow (assumes UTM projection).
    solar_azimuth = ee.Number(img.get('MEAN_SOLAR_AZIMUTH_ANGLE'))
    shadow_azimuth = ee.Number(90).subtract(solar_azimuth)

    # Project the clouds along that direction, up to CLD_PRJ_DIST*10.
    first_band_projection = img.select(0).projection()
    cloud_distance = img.select('clouds').directionalDistanceTransform(
        shadow_azimuth, CLD_PRJ_DIST*10)
    cld_proj = (
        cloud_distance
        .reproject(crs=first_band_projection, scale=100)
        .select('distance')
        .mask()
        .rename('cloud_transform')
    )

    # A shadow is a dark pixel lying inside the projected cloud footprint.
    shadows = cld_proj.multiply(dark_pixels).rename('shadows')

    shadow_bands = ee.Image([dark_pixels, cld_proj, shadows])
    return img.addBands(shadow_bands)

In [None]:
def add_cld_shdw_mask(img):
    """Add the cloud and shadow component bands plus a combined 'cloudmask' band.

    Args:
        img: image accepted by add_cloud_bands / add_shadow_bands.

    Returns:
        The image with all component bands and a 'cloudmask' band that is 1
        on cloud or shadow and 0 elsewhere.
    """
    # Cloud bands first: the shadow step reads the 'clouds' band.
    with_components = add_shadow_bands(add_cloud_bands(img))

    clouds = with_components.select('clouds')
    shadows = with_components.select('shadows')
    cloud_or_shadow = clouds.add(shadows).gt(0)

    # focalMin drops small patches, focalMax then grows what is left by BUFFER.
    # Working at 20 m scale is for speed; clouds are assumed not to need 10 m.
    without_small_patches = cloud_or_shadow.focalMin(2)
    buffered = without_small_patches.focalMax(BUFFER*2/20)
    cloudmask = (
        buffered
        .reproject(crs=img.select([0]).projection(), scale=20)
        .rename('cloudmask')
    )

    return with_components.addBands(cloudmask)

In [None]:
def apply_cld_shdw_mask(img):
    """Mask the reflectance bands of ``img`` with its 'cloudmask' band.

    Args:
        img: image holding a 'cloudmask' band (1 on cloud/shadow, else 0).

    Returns:
        Only the bands matching 'B.*', masked wherever 'cloudmask' is set.
    """
    # Inverted mask: 1 on clear pixels, 0 on cloud/shadow.
    clear_pixels = img.select('cloudmask').Not()
    reflectance = img.select('B.*')
    return reflectance.updateMask(clear_pixels)

In [None]:
# Functions GEE display with folium
# -----------------------------------------------------------------------------
def add_ee_layer(self, ee_image_object, vis_params, name, show=True, opacity=1, min_zoom=0):
    """Add an Earth Engine image to a folium map as a tile overlay.

    Args:
        self: the folium map receiving the layer.
        ee_image_object: object wrapped with ee.Image before rendering.
        vis_params: visualisation parameters passed to getMapId.
        name: layer name.
        show: forwarded to the TileLayer ``show`` argument.
        opacity: forwarded to the TileLayer ``opacity`` argument.
        min_zoom: forwarded to the TileLayer ``min_zoom`` argument.
    """
    tile_url = ee.Image(ee_image_object).getMapId(vis_params)['tile_fetcher'].url_format
    layer = folium.raster_layers.TileLayer(
        tiles=tile_url,
        attr='Map Data © <a href="https://earthengine.google.com/">Google Earth Engine</a>',
        name=name,
        show=show,
        opacity=opacity,
        min_zoom=min_zoom,
        overlay=True,
        control=True,
    )
    layer.add_to(self)


# Expose the helper as a method of every folium map.
folium.Map.add_ee_layer = add_ee_layer

In [None]:
def NDVI(image):
    """Return ``image`` with an extra 'NDVI' band.

    The band is the normalized difference of bands 'B8' and 'B4'.
    """
    ndvi_band = image.normalizedDifference(['B8', 'B4']).rename('NDVI')
    return image.addBands(ndvi_band)
def NBR2(image):
    """Return ``image`` with an extra 'NBR2' band.

    The band is the normalized difference of bands 'B11' and 'B12'.
    """
    nbr2_band = image.normalizedDifference(['B11', 'B12']).rename('NBR2')
    return image.addBands(nbr2_band)

## Tasks launch

In [None]:
# Launch one Cloud Storage export of the daily median NDVI per Sentinel-2
# acquisition day, for every chunk of the input dataset.

# Split the input into chunks; a single chunk holds everything when chunk_size
# is None.
if chunk_size is None:
    geometry_collections = [geometry_collection]
else:
    geometry_collections = list(chunk_dataframe(geometry_collection, chunk_size))
logger.info(f'Chunks: {len(geometry_collections)}')
filename_prefixes = []

output_folder='data/04_features/'
year=2020

# Folder (object prefix) of the exported files inside the bucket.
output_filename = "tillage/"
SECONDS_PER_DAY = 86400

# loop on chunks
for chunk_id, gc in enumerate(geometry_collections):
    logger.info(
        f'Processing chunk {chunk_id + 1} / {len(geometry_collections)}')
    logger.info(
        f'Uploading FeatureCollection ({len(gc)} Features) on server side')
    feature_collection_ee = geopandas_to_ee(gc)

    logger.info('Creating Task')

    # NOTE(review): only the first feature of the chunk drives the image search
    # and the export region - confirm this is intended for multi-field inputs.
    feature = feature_collection_ee.first()

    s2_sr_cld_col = get_s2_sr_cld_col(feature.geometry(), f'{year}-01-01', f'{year}-12-31')
    s2_sr_cld_col = s2_sr_cld_col.map(add_cld_shdw_mask).map(apply_cld_shdw_mask).map(NDVI)

    # Retrieve the acquisition days. 'system:time_start' is the timestamp
    # filterDate works on; the product GENERATION_TIME can fall on another day
    # and would then select an empty one-day window.
    acq_times = s2_sr_cld_col.aggregate_array('system:time_start').getInfo()
    # Timestamps are epoch milliseconds: reduce them to unique, sorted UTC days
    # so that several images of the same day start a single task.
    acq_days = sorted({int(acq_time // 1000 // SECONDS_PER_DAY) for acq_time in acq_times})
    # (start, end) of each one-day window as ISO dates. The end is computed on
    # the epoch day, so month and year roll-overs stay valid dates, and the
    # explicit format does not depend on the locale the way '%x' does.
    list_date = [
        (time.strftime('%Y-%m-%d', time.gmtime(day * SECONDS_PER_DAY)),
         time.strftime('%Y-%m-%d', time.gmtime((day + 1) * SECONDS_PER_DAY)))
        for day in acq_days
    ]

    for date_reformat, date_reformat_2 in tqdm(list_date):
        # Median NDVI of the images acquired that day over the chunk.
        Im_final = ee.Image(
            s2_sr_cld_col
            .filterDate(date_reformat, date_reformat_2)
            .filterBounds(feature_collection_ee)
            .select('NDVI')
            .median()
        )
        fullName = f"S2_image_NDVI_{date_reformat}"
        task = ee.batch.Export.image.toCloudStorage(
            image=Im_final,
            description=fullName,
            bucket='gri_geosys',
            fileNamePrefix=output_filename + fullName,
            scale=10,
            region=feature.geometry(),
            maxPixels=15000000000,
            skipEmptyTiles=True,
        )
        task.start()
    


# Sentinel-1

In [None]:
# Sentinel-1 search window: first and last day of the processed year.
year = 2020
date_start = f'{year}-01-01'
date_end = f'{year}-12-31'

# None keeps the whole dataset in one chunk; otherwise split it by chunk_size.
chunk_size = None
geometry_collections = (
    [geometry_collection]
    if chunk_size is None
    else list(chunk_dataframe(geometry_collection, chunk_size))
)

print(f'Chunks: {len(geometry_collections)}')
filename_prefixes = []
for chunk_id, gc in enumerate(geometry_collections):
    print(f'Processing chunk {chunk_id+1} / {len(geometry_collections)}')
    print(f'Uploading FeatureCollection ({len(gc)} Features) on server side')
    # `table` is replaced on every pass, so only the last chunk is kept below.
    table = geopandas_to_ee(gc)


# Geometry of the uploaded collection and of its first feature.
aoi = table.geometry()
aoi_sub = table.first().geometry()

In [None]:
# Export every ascending-pass Sentinel-1 GRD image (VV and VH bands) over the
# first field to Cloud Storage, one task per image.
dataset = ee.ImageCollection('COPERNICUS/S1_GRD')
im_coll = (
    dataset
    .filterBounds(aoi_sub)
    .filterDate(ee.Date(date_start), ee.Date(date_end))
    .filter(ee.Filter.eq('orbitProperties_pass', 'ASCENDING'))
    .sort('system:time_start')
)
# Built once: the list does not change between iterations.
im_list = im_coll.toList(im_coll.size())
acq_times = im_coll.aggregate_array('system:time_start').getInfo()
# Timestamps are epoch milliseconds. An explicit ISO format is used because
# '%x' depends on the locale and cannot be sliced safely into month and day.
dates = [time.strftime('%Y-%m-%d', time.gmtime(acq_time / 1000)) for acq_time in acq_times]

# Folder (object prefix) of the exported files inside the bucket.
output_filename = "tillage/"

# `dates` and `im_list` share the collection order, so the position in `dates`
# is the index of the matching image.
# NOTE(review): two images acquired on the same day get the same export name -
# confirm whether they should be mosaicked or named apart.
for cpt, date_reformat in enumerate(tqdm(dates)):
    im_final = ee.Image(im_list.get(cpt)).select('VV', 'VH').clip(aoi_sub)
    fullName = f"S1_image_{date_reformat}"
    task = ee.batch.Export.image.toCloudStorage(
        image=im_final,
        description=fullName,
        bucket='gri_geosys',
        fileNamePrefix=output_filename + fullName,
        scale=10,
        # Use this section's own AOI rather than `feature`, which only exists
        # if the Sentinel-2 cell was run beforehand.
        region=aoi_sub,
        maxPixels=15000000000,
        skipEmptyTiles=True,
    )
    task.start()