In [None]:
# !pip install geemap

# Machine Learning with Earth Engine - Supervised Classification

## Supervised classification algorithms available in Earth Engine

Source: https://developers.google.com/earth-engine/classification

The `Classifier` package handles supervised classification by traditional ML algorithms running in Earth Engine. These classifiers include CART, RandomForest, NaiveBayes and SVM. The general workflow for classification is:

1. Collect training data. Assemble features which have a property that stores the known class label and properties storing numeric values for the predictors.
2. Instantiate a classifier. Set its parameters if necessary.
3. Train the classifier using the training data.
4. Classify an image or feature collection.
5. Estimate classification error with independent validation data.

The training data is a `FeatureCollection` with a property storing the class label and properties storing predictor variables. Class labels should be consecutive, integers starting from 0. If necessary, use remap() to convert class values to consecutive integers. The predictors should be numeric.

# Import libraries

In [1]:
import ee
import geemap

### Prepare Train Dataset

In [2]:
Map = geemap.Map()
#Map

In [3]:
point = ee.Geometry.Point([-122.4439, 37.7538])
point2 = ee.Geometry.Point([-87.7719, 41.8799])

image = ee.ImageCollection('LANDSAT/LC08/C01/T1_SR') \
    .filterBounds(point) \
    .filterDate('2016-01-01', '2016-12-31') \
    .sort('CLOUD_COVER') \
    .first() \
    .select('B[1-7]')

vis_params = {
    'min': 0,
    'max': 3000,
    'bands': ['B4', 'B3', 'B2']
}

Map.centerObject(point, 8)
Map.addLayer(image, vis_params, "Landsat-8-Train")
Map

Map(center=[37.75379999999999, -122.44390000000001], controls=(WidgetControl(options=['position', 'transparent…

In [216]:
image2 = ee.ImageCollection('LANDSAT/LC08/C01/T1_SR') \
    .filterBounds(point2) \
    .filterDate('2016-01-01', '2016-12-31') \
    .sort('CLOUD_COVER') \
    .first() \
    .select('B[1-7]')

vis_params = {
    'min': 0,
    'max': 3000,
    'bands': ['B4', 'B3', 'B2']
}

#Map.centerObject(point2, 8)
Map.addLayer(image2, vis_params, "Landsat-8-Test")
Map

Map(center=[37.75379999999999, -122.44390000000001], controls=(WidgetControl(options=['position', 'transparent…

# Add data to the map

### Check image properties

In [217]:
ee.Date(image.get('system:time_start')).format('YYYY-MM-dd').getInfo()

'2016-11-18'

In [218]:
image.get('CLOUD_COVER').getInfo()

0.08

In [219]:
ee.Date(image2.get('system:time_start')).format('YYYY-MM-dd').getInfo()

'2016-06-17'

In [220]:
image2.get('CLOUD_COVER').getInfo()

0.03

# Make training dataset

There are several ways you can create a region for generating the training dataset.

- Draw a shape (e.g., rectangle) on the map and the use `region = Map.user_roi`
- Define a geometry, such as `region = ee.Geometry.Rectangle([-122.6003, 37.4831, -121.8036, 37.8288])`
- Create a buffer zone around a point, such as `region = ee.Geometry.Point([-122.4439, 37.7538]).buffer(10000)`
- If you don't define a region, it will use the image footprint by default

In [221]:
# region = Map.user_roi
# region = ee.Geometry.Rectangle([-122.6003, 37.4831, -121.8036, 37.8288])
# region = ee.Geometry.Point([-122.4439, 37.7538]).buffer(10000)

In this example, we are going to use the [USGS National Land Cover Database (NLCD)](https://developers.google.com/earth-engine/datasets/catalog/USGS_NLCD) to create label dataset for training


![](https://i.imgur.com/7QoRXxu.png)

In [222]:
nlcd = ee.Image('USGS/NLCD/NLCD2016').select('landcover').clip(image.geometry())
Map.addLayer(nlcd, {}, 'NLCD')
Map

Map(bottom=25636.0, center=[37.75379999999999, -122.44390000000001], controls=(WidgetControl(options=['positio…

In [223]:
# Make the training dataset.
points = nlcd.sample(**{
    'region': image.geometry(),
    'scale': 30,
    'numPixels': 5000,
    'seed': 0,
    'geometries': True  # Set this to False to ignore geometries
})

Map.addLayer(points, {}, 'training', False)

In [224]:
print(points.size().getInfo())

3640


In [225]:
print(points.first().getInfo())

{'type': 'Feature', 'geometry': {'type': 'Point', 'coordinates': [-122.25798986874739, 38.2706212827936]}, 'id': '0', 'properties': {'landcover': 31}}


# Train the classifier

In [226]:
# Use these bands for prediction.
bands = ['B1', 'B2', 'B3', 'B4', 'B5', 'B6', 'B7']

# This property of the table stores the land cover labels.
label = 'landcover'

# Overlay the points on the imagery to get training.
training = image.select(bands).sampleRegions(**{
  'collection': points,
  'properties': [label],
  'scale': 30
})

## Model

In [227]:
# Train a CART classifier with default parameters.
trained = ee.Classifier.smileCart().train(training, label, bands)

In [228]:
print(training.first().getInfo())

{'type': 'Feature', 'geometry': None, 'id': '0_0', 'properties': {'B1': 575, 'B2': 814, 'B3': 1312, 'B4': 1638, 'B5': 1980, 'B6': 2091, 'B7': 1967, 'landcover': 31}}


# Predict

In [229]:
# Classify the image with the same bands used for training.
result = image.select(bands).classify(trained)

# # Display the clusters with random colors.
Map.addLayer(result.randomVisualizer(), {}, 'classfied')
Map

Map(bottom=25636.0, center=[37.75379999999999, -122.44390000000001], controls=(WidgetControl(options=['positio…

# Predict Popayan

In [197]:
# https://sites.google.com/site/seriescol/shapes
shape = ee.FeatureCollection('users/dsrestrepo/mpio')

# Cauca = shape.filter(ee.Filter.eq('DPTO_CCDGO', 19))
# region = shape.filter(ee.Filter.eq('MPIO_CCNCT	', 19001))
# Medellin = ee.FeatureCollection('users/dsrestrepo/Medellin')

region = shape.filter(ee.Filter.eq('MPIOS', '19001'))
Map.addLayer(region, {}, "Popayan")

In [198]:
collection = ee.ImageCollection('LANDSAT/LC08/C01/T1') \
    .filterBounds(region) \
    .filterDate('2016-01-01', '2016-12-31') \
    #.select('B[1-7]')
 
    
image =  ee.Algorithms.Landsat.simpleComposite(collection,
                                                   percentile=20,
                                                   cloudScoreRange=5,
                                                   asFloat=True).clipToCollection(region).select('B[1-7]').multiply(10000)

Map.centerObject(region, 12)
Map.addLayer(image, vis_params, "Landsat-8-Popayan")

### With random colors

In [199]:
# Classify the image with the same bands used for training.
result = image.select(bands).classify(trained)

# # Display the clusters with random colors.
Map.addLayer(result.randomVisualizer(), {}, 'popayan_classfied')
Map

Map(bottom=517372.0, center=[2.476705214936409, -76.64337627568842], controls=(WidgetControl(options=['positio…

# Convert to actual values and colors

To render a categorical map, we can set two image properties: `landcover_class_values` and `landcover_class_palette`. We can use the same style as the NLCD so that it is easy to compare the two maps. 

In [204]:
class_values = nlcd.get('landcover_class_values').getInfo()
class_values

[11,
 12,
 21,
 22,
 23,
 24,
 31,
 41,
 42,
 43,
 51,
 52,
 71,
 72,
 73,
 74,
 81,
 82,
 90,
 95]

In [205]:
class_palette = nlcd.get('landcover_class_palette').getInfo()
class_palette

['476ba1',
 'd1defa',
 'decaca',
 'd99482',
 'ee0000',
 'ab0000',
 'b3aea3',
 '68ab63',
 '1c6330',
 'b5ca8f',
 'a68c30',
 'ccba7d',
 'e3e3c2',
 'caca78',
 '99c247',
 '78ae94',
 'dcd93d',
 'ab7028',
 'bad9eb',
 '70a3ba']

In [206]:
landcover = result.set('classification_class_values', class_values)
landcover = landcover.set('classification_class_palette', class_palette)

In [207]:
Map.addLayer(landcover, {}, 'Land cover')
Map

Map(bottom=258775.0, center=[2.518490969060616, -76.6674041748047], controls=(WidgetControl(options=['position…

### Visualize the result

In [208]:
print('Change layer opacity:')
cluster_layer = Map.layers[-1]
cluster_layer.interact(opacity=(0, 1, 0.1))

Change layer opacity:


Box(children=(FloatSlider(value=1.0, description='opacity', max=1.0),))

### Add a legend to the map

In [209]:
Map.add_legend(builtin_legend='NLCD')
Map

Map(bottom=258775.0, center=[2.518490969060616, -76.6674041748047], controls=(WidgetControl(options=['position…

### Export the result

Export the result directly to your computer:

In [210]:
import os
out_dir = os.path.join(os.path.expanduser('~'), 'Downloads')
out_file = os.path.join(out_dir, 'landcover.tif')

In [211]:
geemap.ee_export_image(landcover, filename=out_file, scale=900)

Generating URL ...
An error occurred while downloading.
Image.clipToBoundsAndScale: The geometry for image clipping must be bounded.


Export the result to Google Drive:

In [212]:
geemap.ee_export_image_to_drive(landcover, description='landcover', folder='export', scale=900)

Exporting landcover ...
