# This notebook explores the SCAR GeoMAP dataset released in 2019
## Cox S.C., Smith Lyttle B. and the GeoMAP team (2019). Lower Hutt, New Zealand. GNS Science. Release v.201907.
### [Data Available Here](https://data.gns.cri.nz/ata_geomap/index.html?content=/mapservice/Content/antarctica/www/index.html)

## Configure packages, paths, and load data

In [2]:
# Standard library, then third-party packages used throughout the notebook.
import os
import geopandas as gpd
# NOTE(review): this binds the top-level `matplotlib` package to `plt`; the
# conventional `plt` alias is `matplotlib.pyplot`. Calls such as `plt.subplots()`
# would fail with this import — confirm how `plt` is used further down.
import matplotlib as plt

In [5]:
# Build the geodatabase path from the current working directory and echo it
# so the reader can confirm which file is about to be loaded.
geol_path = os.getcwd() + "/data/ATA_SCAR_GeoMAP_geology.gdb"
print(geol_path)

/home/sam/geomap/data/ATA_SCAR_GeoMAP_geology.gdb


In [6]:
# Read the geology geodatabase at `geol_path` into `data` with geopandas.
# NOTE(review): no `layer=` is given, so presumably the reader's default layer
# is loaded — confirm the .gdb contains only the layer intended here.
data = gpd.read_file(geol_path)

## Metadata exploration

In [16]:
# List every column name, tab-separated, three names per printed row.
pieces = []
for position, column_name in enumerate(data.columns, start=1):
    pieces.append(f'{column_name}\t')
    # Break the line after every third column name.
    if position % 3 == 0:
        pieces.append('\n')
cols = "".join(pieces)
print(cols)


SOURCECODE	MAPSYMBOL	PLOTSYMBOL	
NAME	DESCR	POLYGTYPE	
MBREQUIV	FMNEQUIV	SBGRPEQUIV	
GRPEQUIV	SPGRPEQUIV	TERREQUIV	
STRATRANK	TYPENAME	TYPE_URI	
GEOLHIST	REPAGE_URI	YNGAGE_URI	
OLDAGE_URI	ABSMIN_MA	ABSMAX_MA	
AGECODE	LITHCODE	LITHOLOGY	
REPLITH_URI	OBSMETHOD	CONFIDENCE	
POSACC_M	SOURCE	METADATA	
RESSCALE	CAPTSCALE	CAPTDATE	
MODDATE	FEATUREID	SPEC_URI	
SYMBOL	DATASET	REGION	
Shape_Length	Shape_Area	geometry	



In [34]:
# Frequency table (most common value first) for each categorical column of
# interest; one result per name on the left, in the same order as the columns.
symbols, poly_types, obs_method, datasets, regions, lithology = (
    data[column_name].value_counts(ascending=False)
    for column_name in (
        "MAPSYMBOL",
        "POLYGTYPE",
        "OBSMETHOD",
        "DATASET",
        "REGION",
        "LITHOLOGY",
    )
)

In [35]:
# Show all six frequency tables one after another, each on its own line(s).
print(
    symbols,
    poly_types,
    obs_method,
    datasets,
    regions,
    lithology,
    sep="\n",
)

JKg    6608
EOg    4707
?      4654
CTw    4479
EOs    4015
       ... 
Pzq       2
Dn        2
Et        1
Rzh       1
JKj       1
Name: MAPSYMBOL, Length: 173, dtype: int64
rock       86144
moraine     6481
ice         2536
Name: POLYGTYPE, dtype: int64
synthesis from multiple sources                  74836
polygon unit inferred from regional-scale map    11513
remotely sensed data                              4889
digital conversion from published source          3168
outcrop observation                                755
Name: OBSMETHOD, dtype: int64
ATA_PEN_geological_units     37951
ATA_NVL_geological_units     14100
ATA_CTAM_geological_units    11341
ATA_WAAT_geological_units     9602
ATA_DML_geological_units      8539
ATA_SVL_geological_units      6488
ATA_EM_geological_units       2808
ATA_MBL_geological_units      2312
ATA_QEL_geological_units      2020
Name: DATASET, dtype: int64
East Antarctica    52090
West Antarctica    43071
Name: REGION, dtype: int64
unknown            

## Basic descriptive statistics