In [1]:
# Steps to convert starkey to NumMobility read:
"""
    1. Convert the Easting and Northing to latitude and
       longitude respectively using the utm library which
       can be installed using pip.
    2. Then, create a DateTime column for the dataset.
    3. Rearrange the columns.
    4. Done!

    Warning: Please do not run this multiple times, run it
             once only if you want to see the results.
"""

import pandas as pd
import utm

starkey = pd.read_csv('./data/starkey.csv')
starkey.head()

Unnamed: 0,UTMGridEast,UTMGridNorth,Id,StarkeyTime,GMDate,GMTime,LocDate,LocTime,RadNum,Species,UTME,UTMN,Year,Grensunr,Grensuns,Obswt
0,374145,5014200,890424000000.0,168825628,02:08:28,19930507,19930506,18:08:28,59,E,374137,5014190,93,12:34:00,03:10:00,1.62
1,374265,5010180,921228000000000.0,168826022,07:02:02,19930507,19930506,23:02:02,57,E,374262,5010176,93,12:34:00,03:10:00,1.36
2,377475,5015730,8902220.0,168826135,08:55:55,19930507,19930507,00:55:55,46,E,377477,5015745,93,12:34:00,03:10:00,1.68
3,374805,5018490,9.10313e+24,168826274,01:11:14,19930507,19930506,17:11:14,54,E,374795,5018503,93,12:34:00,03:10:00,1.43
4,377055,5008470,9.10313e+42,168826332,01:21:12,19930507,19930506,17:21:12,67,E,377053,5008474,93,12:34:00,03:10:00,1.73


In [2]:
lat, lon = utm.to_latlon(easting=starkey['UTMGridEast'],
                         northing=starkey['UTMGridNorth'],
                         zone_number=11,
                         northern=True)
starkey['UTMGridEast'] = lat
starkey['UTMGridNorth'] = lon

In [3]:
starkey = starkey.rename(columns={'UTMGridEast': 'lat',
                                  'UTMGridNorth': 'lon'})
starkey.head()

Unnamed: 0,lat,lon,Id,StarkeyTime,GMDate,GMTime,LocDate,LocTime,RadNum,Species,UTME,UTMN,Year,Grensunr,Grensuns,Obswt
0,45.27003,-118.60439,890424000000.0,168825628,02:08:28,19930507,19930506,18:08:28,59,E,374137,5014190,93,12:34:00,03:10:00,1.62
1,45.233879,-118.601844,921228000000000.0,168826022,07:02:02,19930507,19930506,23:02:02,57,E,374262,5010176,93,12:34:00,03:10:00,1.36
2,45.284385,-118.562334,8902220.0,168826135,08:55:55,19930507,19930507,00:55:55,46,E,377477,5015745,93,12:34:00,03:10:00,1.68
3,45.308749,-118.597063,9.10313e+24,168826274,01:11:14,19930507,19930506,17:11:14,54,E,374795,5018503,93,12:34:00,03:10:00,1.43
4,45.218985,-118.56589,9.10313e+42,168826332,01:21:12,19930507,19930506,17:21:12,67,E,377053,5008474,93,12:34:00,03:10:00,1.73


In [4]:
import datetime

dates = pd.to_datetime(starkey['LocDate']).dt.date
times = pd.to_datetime(starkey['LocTime']).dt.time

a = [None] * len(starkey['LocTime'])
for i in range(len(starkey['LocTime'])):
    a[i] = datetime.datetime.combine(date=dates[i],
                                     time=times[i])

In [5]:
datetime= pd.to_datetime(a, format='%Y-%m-%d %H:%M:%S')
starkey.insert(0, 'DateTime', datetime)

In [6]:
starkey.head()

Unnamed: 0,DateTime,lat,lon,Id,StarkeyTime,GMDate,GMTime,LocDate,LocTime,RadNum,Species,UTME,UTMN,Year,Grensunr,Grensuns,Obswt
0,1970-01-01 18:08:28,45.27003,-118.60439,890424000000.0,168825628,02:08:28,19930507,19930506,18:08:28,59,E,374137,5014190,93,12:34:00,03:10:00,1.62
1,1970-01-01 23:02:02,45.233879,-118.601844,921228000000000.0,168826022,07:02:02,19930507,19930506,23:02:02,57,E,374262,5010176,93,12:34:00,03:10:00,1.36
2,1970-01-01 00:55:55,45.284385,-118.562334,8902220.0,168826135,08:55:55,19930507,19930507,00:55:55,46,E,377477,5015745,93,12:34:00,03:10:00,1.68
3,1970-01-01 17:11:14,45.308749,-118.597063,9.10313e+24,168826274,01:11:14,19930507,19930506,17:11:14,54,E,374795,5018503,93,12:34:00,03:10:00,1.43
4,1970-01-01 17:21:12,45.218985,-118.56589,9.10313e+42,168826332,01:21:12,19930507,19930506,17:21:12,67,E,377053,5008474,93,12:34:00,03:10:00,1.73


In [7]:
starkey.columns.to_list()

['DateTime',
 'lat',
 'lon',
 'Id',
 'StarkeyTime',
 'GMDate',
 'GMTime',
 'LocDate',
 'LocTime',
 'RadNum',
 'Species',
 'UTME',
 'UTMN',
 'Year',
 'Grensunr',
 'Grensuns',
 'Obswt']

In [8]:
cols = ['Id', 'DateTime', 'lat', 'lon', 'StarkeyTime', 'GMDate',
        'GMTime', 'LocDate', 'LocTime', 'RadNum', 'Species',
        'UTME', 'UTMN', 'Year', 'Grensunr', 'Grensuns', 'Obswt']

starkey = starkey[cols]

In [9]:
starkey.head()

Unnamed: 0,Id,DateTime,lat,lon,StarkeyTime,GMDate,GMTime,LocDate,LocTime,RadNum,Species,UTME,UTMN,Year,Grensunr,Grensuns,Obswt
0,890424000000.0,1970-01-01 18:08:28,45.27003,-118.60439,168825628,02:08:28,19930507,19930506,18:08:28,59,E,374137,5014190,93,12:34:00,03:10:00,1.62
1,921228000000000.0,1970-01-01 23:02:02,45.233879,-118.601844,168826022,07:02:02,19930507,19930506,23:02:02,57,E,374262,5010176,93,12:34:00,03:10:00,1.36
2,8902220.0,1970-01-01 00:55:55,45.284385,-118.562334,168826135,08:55:55,19930507,19930507,00:55:55,46,E,377477,5015745,93,12:34:00,03:10:00,1.68
3,9.10313e+24,1970-01-01 17:11:14,45.308749,-118.597063,168826274,01:11:14,19930507,19930506,17:11:14,54,E,374795,5018503,93,12:34:00,03:10:00,1.43
4,9.10313e+42,1970-01-01 17:21:12,45.218985,-118.56589,168826332,01:21:12,19930507,19930506,17:21:12,67,E,377053,5008474,93,12:34:00,03:10:00,1.73


In [11]:
starkey.to_csv('./data/starkey.csv', index=False, index_label=False)

(287136, 17)