## Surface Observation Data Processing

In [11]:
# import required packages
import pandas as pd
import os
import pickle
import sys
pd.options.display.width=None
pd.options.display.max_columns=None


if sys.version_info >= (3, 6):
    from zipfile import ZipFile as zipfile
else:
    import zipfile36 as zipfile
    
url = "https://unearthed-exploresa.s3-ap-southeast-2.amazonaws.com/Unearthed_5_SARIG_Data_Package.zip" 
# enter the directory to save data
data_loc = './data'
file_name = 'Unearthed_5_SARIG_Data_Package.zip'

if os.path.isfile(os.path.join(data_loc, file_name)):
    print ("File exist")
    pass
else:
    # open and save the zip file onto computer
    url = urlopen(URL)
    output = open('./data/Unearthed_5_SARIG_Data_Package.zip', 'wb')    # note the flag:  "wb"        
    output.write(url.read())
    output.close()
    
files_in_dataset = []
file_name = 'Unearthed_5_SARIG_Data_Package.zip'
for file in zipfile(os.path.join(data_loc, file_name),'r').filelist:
    files_in_dataset.append(file.filename)
    
files_in_dataset



File exist


['SARIG_Data_Package/sarig_dh_core_exp.csv',
 'SARIG_Data_Package/sarig_dh_details_exp.csv',
 'SARIG_Data_Package/sarig_dh_litho_exp.csv',
 'SARIG_Data_Package/sarig_dh_petrophys_exp.csv',
 'SARIG_Data_Package/sarig_dh_reference_exp.csv',
 'SARIG_Data_Package/sarig_dh_strat_exp.csv',
 'SARIG_Data_Package/sarig_fieldobs_exp.csv',
 'SARIG_Data_Package/sarig_fieldobs_litho_exp.csv',
 'SARIG_Data_Package/sarig_fieldobs_note_exp.csv',
 'SARIG_Data_Package/sarig_fieldobs_struct_exp.csv',
 'SARIG_Data_Package/sarig_md_commodity_exp.csv',
 'SARIG_Data_Package/sarig_md_details_exp.csv',
 'SARIG_Data_Package/sarig_md_mineralogy_exp.csv',
 'SARIG_Data_Package/sarig_md_reference_exp.csv',
 'SARIG_Data_Package/sarig_md_zone_hr_lith_exp.csv',
 'SARIG_Data_Package/sarig_md_zone_lith_exp.csv',
 'SARIG_Data_Package/sarig_rs_biostr_analys_exp.csv',
 'SARIG_Data_Package/sarig_rs_biostr_results_exp.csv',
 'SARIG_Data_Package/sarig_rs_chem_exp.csv',
 'SARIG_Data_Package/sarig_rs_chem_isotope_exp.csv',
 'SA

For this part of data cleaning, we will only use the following files: 
 - 'SARIG_Data_Package/sarig_fieldobs_exp.csv',
 - 'SARIG_Data_Package/sarig_fieldobs_litho_exp.csv',
 - 'SARIG_Data_Package/sarig_fieldobs_note_exp.csv',
 - 'SARIG_Data_Package/sarig_fieldobs_struct_exp.csv'

### Load Field Observation Data

In [12]:
# load the field observation summary data
sarig_fieldobs_exp = pd.read_csv(
    zipfile(os.path.join(data_loc, file_name),'r').open('SARIG_Data_Package/sarig_fieldobs_exp.csv','r'), 
    sep=',', encoding='latin1')
sarig_fieldobs_exp.sample(5)

  interactivity=interactivity, compiler=compiler, result=result)


Unnamed: 0,SITE_NO,FIELD_ID,OBSERVER,OBSERVATION_DATE,FIELD_NOTE,LITHOLOGY,STRUCTURE,ROCK_SAMPLE,IMAGE,LANDFORM_CODE,LANDFORM_DESC,MAP_250000,MAP_100000,MAP_50000,EASTING_GDA2020,NORTHING_GDA2020,ZONE_GDA2020,LONGITUDE_GDA2020,LATITUDE_GDA2020,LONGITUDE_GDA94,LATITUDE_GDA94,HORIZ_ACCRCY_M,ELEVATION_M,VERT_ACCRCY_M,SURVEY_METHOD_CODE,SURVEY_METHOD,COMMENTS
43076,1848898,SG-00053,"MCAVANEY, S.O.",01/02/2013,N,Y,N,N,Y,,,SI5304 PORT AUGUSTA,6432 Cultana,1,779614.26,6378462.89,53,137.982473,-32.696157,137.982463,-32.696143,5.0,160.7,10.0,GPSSN,GPS Standalone Navigational,
27905,226993,0241201271072,,,N,Y,Y,N,N,,,SI5405 BURRA,6731 Caroona,4,334453.63,6341646.33,54,139.226947,-33.051141,139.226937,-33.051127,,,,,,
86714,228224,0241300121005,,,N,Y,Y,N,N,,,SI5405 BURRA,6731 Caroona,1,345629.98,6325552.91,54,139.343882,-33.19789,139.343872,-33.197876,,,,,,
3395,208770,0073601261021,"MAJOR, R.B.",,Y,N,N,N,N,,,SG5313 EVERARD,5443 Etitinna,3,273904.28,6975794.69,53,132.714959,-27.322313,132.71495,-27.322299,,,,,,
75138,1807636,TRUS036,"RUSAK, T.M.",04/09/2011,Y,Y,N,N,N,,,SG5310 ABMINGA,5645 Tieyon,4,372949.68,7119921.88,53,133.73018,-26.034099,133.730171,-26.034085,5.0,476.9,,GPSSN,GPS Standalone Navigational,


In [13]:
interested_fieldobs_exp = sarig_fieldobs_exp[['SITE_NO', 'FIELD_ID', 
       'LANDFORM_CODE', 'MAP_250000', 'MAP_100000', 'MAP_50000',
       'EASTING_GDA2020', 'NORTHING_GDA2020', 'ZONE_GDA2020',
       'LONGITUDE_GDA2020', 'LATITUDE_GDA2020', 'LONGITUDE_GDA94',
       'LATITUDE_GDA94', 'HORIZ_ACCRCY_M', 'ELEVATION_M', 'VERT_ACCRCY_M',
       'SURVEY_METHOD_CODE']]
interested_fieldobs_exp.sample(5)

Unnamed: 0,SITE_NO,FIELD_ID,LANDFORM_CODE,MAP_250000,MAP_100000,MAP_50000,EASTING_GDA2020,NORTHING_GDA2020,ZONE_GDA2020,LONGITUDE_GDA2020,LATITUDE_GDA2020,LONGITUDE_GDA94,LATITUDE_GDA94,HORIZ_ACCRCY_M,ELEVATION_M,VERT_ACCRCY_M,SURVEY_METHOD_CODE
73978,460033,0355300541011,,SI5405 BURRA,6631 Jamestown,4,277928.66,6341358.85,54,138.621872,-33.043661,138.621862,-33.043647,,,,PHOTO
31192,267993,0355601651196,,SI5405 BURRA,6630 Clare,4,288597.32,6269379.75,54,138.719166,-33.694515,138.719156,-33.6945,,,,PHOTO
70319,1970747,ALMP00050,FACF,SG5309 ALBERGA,5545 Alcurra,1,342922.49,7100060.52,53,133.427753,-26.210425,133.427744,-26.210411,10.0,449.1,20.0,GPSSN
73387,266358,0355601141135,,SI5405 BURRA,6630 Clare,1,307433.0,6272978.16,54,138.923043,-33.665664,138.923033,-33.66565,,,,PHOTO
75698,2008372,BN_RP00275,MLPT,SI5303 YARDEA,6132 Buckleboo,1,629446.71,6386861.75,53,136.380198,-32.648286,136.380188,-32.648272,10.0,294.0,20.0,GPSSN


In [14]:
sarig_fieldobs_exp.columns

Index(['SITE_NO', 'FIELD_ID', 'OBSERVER', 'OBSERVATION_DATE', 'FIELD_NOTE',
       'LITHOLOGY', 'STRUCTURE', 'ROCK_SAMPLE', 'IMAGE', 'LANDFORM_CODE',
       'LANDFORM_DESC', 'MAP_250000', 'MAP_100000', 'MAP_50000',
       'EASTING_GDA2020', 'NORTHING_GDA2020', 'ZONE_GDA2020',
       'LONGITUDE_GDA2020', 'LATITUDE_GDA2020', 'LONGITUDE_GDA94',
       'LATITUDE_GDA94', 'HORIZ_ACCRCY_M', 'ELEVATION_M', 'VERT_ACCRCY_M',
       'SURVEY_METHOD_CODE', 'SURVEY_METHOD', 'COMMENTS'],
      dtype='object')

In [15]:
sarig_fieldobs_exp.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 88221 entries, 0 to 88220
Data columns (total 27 columns):
SITE_NO               88221 non-null int64
FIELD_ID              63727 non-null object
OBSERVER              70938 non-null object
OBSERVATION_DATE      19638 non-null object
FIELD_NOTE            88221 non-null object
LITHOLOGY             88221 non-null object
STRUCTURE             88221 non-null object
ROCK_SAMPLE           88221 non-null object
IMAGE                 88221 non-null object
LANDFORM_CODE         6208 non-null object
LANDFORM_DESC         6208 non-null object
MAP_250000            88221 non-null object
MAP_100000            88221 non-null object
MAP_50000             88221 non-null int64
EASTING_GDA2020       88221 non-null float64
NORTHING_GDA2020      88221 non-null float64
ZONE_GDA2020          88221 non-null int64
LONGITUDE_GDA2020     88221 non-null float64
LATITUDE_GDA2020      88221 non-null float64
LONGITUDE_GDA94       88221 non-null float64
LATITUDE_GD

This data table includes the summary of the contents of the field observation dataset. 

### Load the Field Observation Lithology Data

In [16]:
sarig_fieldobs_litho_exp = pd.read_csv(
    zipfile(os.path.join(data_loc, file_name),'r').open('SARIG_Data_Package/sarig_fieldobs_litho_exp.csv','r'), 
    sep=',', encoding='latin1')
sarig_fieldobs_litho_exp['STRAT_UNIT_NO'] = sarig_fieldobs_litho_exp['STRAT_UNIT_NO'].astype('Int64')
sarig_fieldobs_litho_exp['OBSERVATION_DATE'] = pd.to_datetime(sarig_fieldobs_litho_exp['OBSERVATION_DATE'])
sarig_fieldobs_litho_exp.sample(5)

Unnamed: 0,SITE_NO,LITHOLOGY_NO,MAP_SYMBOL,GIS_CODE,STRAT_UNIT_NO,STRAT_CONF,STRAT_NAME,STRAT_DESCRIPTION,ROCK_GROUP_CODE,ROCK_GROUP,LITHO_CODE,LITHO_CONFIDENCE,LITHOLOGY_NAME,LITHO_MODIFIER,LITHO_COMMENTS,OBSERVATION_DATE,EASTING_GDA2020,NORTHING_GDA2020,ZONE_GDA2020,LONGITUDE_GDA2020,LATITUDE_GDA2020,LONGITUDE_GDA94,LATITUDE_GDA94
10844,227828,17239,,,,,,,N,No Information,XXXX,,No Information,,,NaT,340872.74,6304714.96,54,139.289201,-33.385073,139.289191,-33.385059
44616,2012025,75665,Maym,M-a--ym,6348.0,,Moonaree Dacite Member,"Dacite, massive, red, commonly columnar jointe...",IFE,Igneous Felsic Extrusive,DACT,,Dacite,"porphyritic, Feldspar, moderate reddish brown",,2015-10-28,538674.81,6416416.12,53,135.411193,-32.388592,135.411183,-32.388578
41578,1131186,59632,Lweo,L-wceo,5551.0,,Tommie Wattie Formation,"Psammite, in lower part; grades up to pelite, ...",MS,Metasediment,QTZT,,Quartzite,,,NaT,414441.71,6460596.55,54,140.094333,-31.987455,140.094323,-31.987441
60986,1993881,72246,,,,,,,G,General/Miscellaneous,QZRU,,Quartz Rock (Undiff. Origin),quartz,Purple-grey siliceous rock brecciated and ceme...,2014-03-11,702711.27,6396141.77,53,137.158965,-32.553616,137.158955,-32.553602
57842,237091,22883,Nds,N-wbds,4127.0,,Saddleworth Formation,"Mudstone; siltstone; shale, partly carbonaceous.",SSL,Sediment Siliciclastic Lutite,SLST,,Siltstone,Cleaved.,"Blue-grey, purple weathering; occurs to E of l...",1994-01-20,323854.24,6259684.44,54,139.097424,-33.788348,139.097414,-33.788333


In [17]:
sarig_fieldobs_litho_exp.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 66212 entries, 0 to 66211
Data columns (total 23 columns):
SITE_NO              66212 non-null int64
LITHOLOGY_NO         66212 non-null int64
MAP_SYMBOL           46529 non-null object
GIS_CODE             46529 non-null object
STRAT_UNIT_NO        46587 non-null Int64
STRAT_CONF           3710 non-null object
STRAT_NAME           46587 non-null object
STRAT_DESCRIPTION    46586 non-null object
ROCK_GROUP_CODE      66212 non-null object
ROCK_GROUP           66212 non-null object
LITHO_CODE           66212 non-null object
LITHO_CONFIDENCE     1114 non-null object
LITHOLOGY_NAME       66212 non-null object
LITHO_MODIFIER       30038 non-null object
LITHO_COMMENTS       24365 non-null object
OBSERVATION_DATE     41456 non-null datetime64[ns]
EASTING_GDA2020      66212 non-null float64
NORTHING_GDA2020     66212 non-null float64
ZONE_GDA2020         66212 non-null int64
LONGITUDE_GDA2020    66212 non-null float64
LATITUDE_GDA2020     66212

In [18]:
interested_fieldobs_litho_exp = sarig_fieldobs_litho_exp[
    ['SITE_NO', 'LITHOLOGY_NO', 'MAP_SYMBOL', 'GIS_CODE', 'STRAT_UNIT_NO', 
     'ROCK_GROUP_CODE', 'LITHO_CODE', 'LITHO_CONFIDENCE', 'LITHO_MODIFIER']]
interested_fieldobs_litho_exp.sample(5)

Unnamed: 0,SITE_NO,LITHOLOGY_NO,MAP_SYMBOL,GIS_CODE,STRAT_UNIT_NO,ROCK_GROUP_CODE,LITHO_CODE,LITHO_CONFIDENCE,LITHO_MODIFIER
31290,303049,34269,Qp\ca,I-----ca,4429.0,RPDC,CALC,,
32604,309190,36621,Nli,N-wbli,3825.0,SSL,SLST,,
62782,271319,29673,Novs,N-wbovs,6226.0,SSL,SLST,,"Fine sandy, micromicaceous, with faint laminat..."
33934,311917,38534,Nli,N-wbli,3825.0,SSL,SLST,,
52041,1993807,72164,,,,G,QZRU,,quartz


### Load Field Observation Notes

In [19]:
sarig_fieldobs_note_exp = pd.read_csv(
    zipfile(os.path.join(data_loc, file_name),'r').open('SARIG_Data_Package/sarig_fieldobs_note_exp.csv','r'), 
    sep=',', encoding='latin1')
sarig_fieldobs_litho_exp['OBSERVATION_DATE'] = pd.to_datetime(sarig_fieldobs_litho_exp['OBSERVATION_DATE'])
sarig_fieldobs_note_exp.sample(5)

Unnamed: 0,SITE_NO,FIELD_NOTE_NO,FIELD_NOTES,OBSERVATION_DATE,EASTING_GDA2020,NORTHING_GDA2020,ZONE_GDA2020,LONGITUDE_GDA2020,LATITUDE_GDA2020,LONGITUDE_GDA94,LATITUDE_GDA94
4169,154001,5117,Interbedded shales and thin conglomerate lense...,,726535.05,6059182.38,53,137.500204,-35.585179,137.500194,-35.585165
12580,474732,16678,Mylonitisation as ?D2 feature.,20/10/2000,416713.65,6451807.47,54,140.11762,-32.066909,140.11761,-32.066895
23401,1971863,32690,Dolerite geochem sample. Photo: 8016-19.,27/06/2013,308885.56,7063021.82,53,133.08169,-26.540547,133.081681,-26.540533
7204,234601,8633,NOT RECORDED,,694635.07,7082580.83,52,130.950655,-26.363566,130.950646,-26.363552
18487,1841610,29182,This site lies within gradational contact betw...,13/10/2012,781094.12,6392921.27,53,137.993896,-32.565532,137.993885,-32.565518


The FIELD_NOTES are words, which might require text mining, while these FIELD_NOTES does not give too much insight into the ores. So, we ignore this table. 

### Load Field Observation Geological Structure Data 

In [20]:
sarig_fieldobs_struct_exp = pd.read_csv(
    zipfile(os.path.join(data_loc, file_name),'r').open('SARIG_Data_Package/sarig_fieldobs_struct_exp.csv','r'), 
    sep=',', encoding='latin1')
sarig_fieldobs_struct_exp.sample(5)

Unnamed: 0,SITE_NO,LITHOLOGY_NO,ROCK_GROUP_CODE,ROCK_GROUP,LITHOLOGY_CODE,LITHOLOGY_NAME,MAP_SYMBOL,STRUCTURE_NO,STRUCTRE_CODE,STRUCTURE_NAME,STRUCTURE_CONF,LOCAL_GENERATION,OROGENY,REGIONAL_GENERATION,AZIMUTH,AZIMUTH_ACCURACY,AZIMUTH_MEASUREMENT_TYPE,INCLINATION,INCLINATION_ACCURACY,YOUNGING,OBSERVATION_DATE,EASTING_GDA2020,NORTHING_GDA2020,ZONE_GDA2020,LONGITUDE_GDA2020,LATITUDE_GDA2020,LONGITUDE_GDA94,LATITUDE_GDA94
68304,2122901,77612.0,IFI,Igneous Felsic Intrusive,GRNT,Granite,,80879,STS,Tectonic foliation,,,,,321.0,2.0,M,85.0,2.0,,29/09/2018,388041.0,6652298.71,53,133.836217,-30.255779,133.836208,-30.255765
68064,457744,,,,,,,61903,SPSH,Originally horizontal sedimentary bedding,,0.0,,,259.0,2.0,M,85.0,2.0,,15/09/1999,278296.34,6295601.26,54,138.614623,-33.456114,138.614613,-33.456099
12090,242157,25557.0,MG,Metamorphic General,PHYL,Phyllite,Nob,18355,SPSH,Originally horizontal sedimentary bedding,,0.0,,0.0,70.0,10.0,M,45.0,5.0,,10/03/1992,264994.97,6257617.53,54,138.461604,-33.795535,138.461594,-33.795521
28400,281563,,,,,,,26300,SPSH,Originally horizontal sedimentary bedding,,,,,265.0,2.0,T,3.0,2.0,,,251697.24,6773932.09,54,138.447716,-29.138892,138.447706,-29.138878
19851,262370,45525.0,SSA,Sediment Siliciclastic Arenite,SDST,Sandstone,Nya,47041,LTES,Fault slickensides,,,Delamerian Orogeny,,41.0,2.0,M,38.0,2.0,,10/01/1996,306892.0,6266181.14,54,138.915732,-33.72683,138.915722,-33.726816


In [21]:
sarig_fieldobs_struct_exp.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 72873 entries, 0 to 72872
Data columns (total 28 columns):
SITE_NO                     72873 non-null int64
LITHOLOGY_NO                40987 non-null float64
ROCK_GROUP_CODE             40987 non-null object
ROCK_GROUP                  40987 non-null object
LITHOLOGY_CODE              40987 non-null object
LITHOLOGY_NAME              40987 non-null object
MAP_SYMBOL                  30177 non-null object
STRUCTURE_NO                72873 non-null int64
STRUCTRE_CODE               72873 non-null object
STRUCTURE_NAME              72873 non-null object
STRUCTURE_CONF              2138 non-null object
LOCAL_GENERATION            38008 non-null float64
OROGENY                     36124 non-null object
REGIONAL_GENERATION         16032 non-null float64
AZIMUTH                     72832 non-null float64
AZIMUTH_ACCURACY            72872 non-null float64
AZIMUTH_MEASUREMENT_TYPE    72872 non-null object
INCLINATION                 72842 non-n

In [22]:
interest_fieldobs_struct_exp = sarig_fieldobs_struct_exp[['SITE_NO', 'LITHOLOGY_NO', 'STRUCTURE_NO', 'STRUCTRE_CODE', 
    'LOCAL_GENERATION', 'OROGENY', 'REGIONAL_GENERATION', 'AZIMUTH', 
    'AZIMUTH_ACCURACY', 'AZIMUTH_MEASUREMENT_TYPE', 'INCLINATION', 
    'INCLINATION_ACCURACY']]

### Merge Data Tables

In [23]:
merged_fieldobs_exp = interested_fieldobs_exp.merge(
    interested_fieldobs_litho_exp, how='inner', on='SITE_NO').merge(
    interest_fieldobs_struct_exp, how='inner', on=['SITE_NO','LITHOLOGY_NO'])

In [24]:
merged_fieldobs_exp.sample(10)

Unnamed: 0,SITE_NO,FIELD_ID,LANDFORM_CODE,MAP_250000,MAP_100000,MAP_50000,EASTING_GDA2020,NORTHING_GDA2020,ZONE_GDA2020,LONGITUDE_GDA2020,LATITUDE_GDA2020,LONGITUDE_GDA94,LATITUDE_GDA94,HORIZ_ACCRCY_M,ELEVATION_M,VERT_ACCRCY_M,SURVEY_METHOD_CODE,LITHOLOGY_NO,MAP_SYMBOL,GIS_CODE,STRAT_UNIT_NO,ROCK_GROUP_CODE,LITHO_CODE,LITHO_CONFIDENCE,LITHO_MODIFIER,STRUCTURE_NO,STRUCTRE_CODE,LOCAL_GENERATION,OROGENY,REGIONAL_GENERATION,AZIMUTH,AZIMUTH_ACCURACY,AZIMUTH_MEASUREMENT_TYPE,INCLINATION,INCLINATION_ACCURACY
11856,309800,2413B01281053,,SI5405 BURRA,6630 Clare,3,282943.49,6247410.76,54,138.652811,-33.891351,138.652801,-33.891336,,,,PHOTO,36933,Nli,N-wbli,3825.0,SSL,SLST,,,39966,SPSH,0.0,Delamerian Orogeny,,263.0,2.0,M,71.0,2.0
27968,272290,0355601321079,,SI5405 BURRA,6630 Clare,3,270678.02,6258744.56,54,138.523231,-33.786628,138.523221,-33.786613,,,,PHOTO,36823,Novs,N-wbovs,6226.0,MG,SCHT,,,39831,STSN,3.0,Delamerian Orogeny,,255.0,2.0,M,60.0,2.0
15772,225046,0241201971112,,SI5405 BURRA,6731 Caroona,4,320318.27,6326393.66,54,139.072622,-33.186402,139.072612,-33.186387,,,,,14457,,,,N,XXXX,,,9821,SPSH,0.0,Delamerian Orogeny,,303.0,2.0,M,75.0,2.0
28484,263558,0355600531243,,SI5405 BURRA,6631 Jamestown,2,296421.12,6291669.87,54,138.808611,-33.495145,138.808601,-33.495131,,,,PHOTO,50405,Nep,N-huep,4045.0,SSL,SLST,,"Pale khaki-grey weathered massive siltstone, c...",51869,STSC,1.0,Delamerian Orogeny,,268.0,2.0,M,70.0,2.0
16502,228650,0241201161056,,SI5405 BURRA,6731 Caroona,1,354168.6,6336504.37,54,139.437208,-33.100327,139.437198,-33.100313,,,,,18061,,,,N,XXXX,,,14918,SPSH,0.0,Delamerian Orogeny,,218.0,2.0,M,33.0,2.0
31363,1834253,W48,,SI5304 PORT AUGUSTA,6432 Cultana,1,781034.37,6396689.54,53,137.992132,-32.5316,137.992122,-32.531586,15.0,,,GPSSN,64819,Nee,N-huee,3546.0,SSA,SDST,,Top of next medium and coarse-grained blocky p...,76727,SPSH,,,,96.0,2.0,M,90.0,2.0
28085,266324,0355601161015,,SI5405 BURRA,6630 Clare,1,311362.41,6271939.49,54,138.96518,-33.675731,138.96517,-33.675717,,,,PHOTO,48647,Nds,N-wbds,4127.0,SSL,SLST,,Dark Grey thinly laminated,50024,STSC,1.0,Delamerian Orogeny,,288.0,2.0,M,67.0,2.0
24650,1116209,,,SI5402 OLARY,6933 Olary,1,452786.66,6450739.52,54,140.499727,-32.078628,140.499717,-32.078614,10.0,,,GPSAP,59393,,,,MG,MIGM,,,65538,STSI,3.0,Olarian Orogeny,3.0,169.0,2.0,M,90.0,2.0
11544,296027,0266200161002,,SI5311 LINCOLN,6128 Spilsby,4,591830.74,6180680.69,53,136.000418,-34.511433,136.000408,-34.511419,,,,PHOTO,32445,Ldw,L--d-w,4836.0,MG,GNSS,,,35557,STS,,,,56.0,2.0,M,80.0,2.0
30017,295968,0267200131019,,SI5311 LINCOLN,6128 Spilsby,3,592400.45,6138561.38,53,136.011234,-34.89115,136.011224,-34.891136,,,,PHOTO,32640,Ldw,L--d-w,4836.0,IFI,GRNT,,,35787,STSM,,Kimban Orogeny,3.0,339.0,2.0,M,70.0,2.0


In [25]:
merged_fieldobs_exp.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 40973 entries, 0 to 40972
Data columns (total 35 columns):
SITE_NO                     40973 non-null int64
FIELD_ID                    39408 non-null object
LANDFORM_CODE               1455 non-null object
MAP_250000                  40973 non-null object
MAP_100000                  40973 non-null object
MAP_50000                   40973 non-null int64
EASTING_GDA2020             40973 non-null float64
NORTHING_GDA2020            40973 non-null float64
ZONE_GDA2020                40973 non-null int64
LONGITUDE_GDA2020           40973 non-null float64
LATITUDE_GDA2020            40973 non-null float64
LONGITUDE_GDA94             40973 non-null float64
LATITUDE_GDA94              40973 non-null float64
HORIZ_ACCRCY_M              5863 non-null float64
ELEVATION_M                 4101 non-null float64
VERT_ACCRCY_M               3944 non-null float64
SURVEY_METHOD_CODE          28289 non-null object
LITHOLOGY_NO                40973 non-n

### Export Merged Dataset

In [26]:
merged_fieldobs_exp.to_csv('./data/merged_fieldobs_exp.csv', sep=',', header='infer')