In [1]:
%matplotlib notebook
import matplotlib as mpl
# Default size (width, height) applied to every figure created in this notebook.
mpl.rcParams['figure.figsize'] = [8, 8]

import os
import pickle
import numpy as np

import pandas as pd
import geopandas as gpd
import normalise_worker

from multiprocessing import Pool
from normalise_worker_helper import normalise_args_helper

# Input directory: the 'data_out' folder that sits beside the current working directory.
parent_dir = os.path.dirname(os.getcwd())
data_src = os.path.join(parent_dir, 'data_out')

  from .sqlite import head_to_sql, start_sql


In [2]:
# Load the eight pre-split sample pickles and pair each frame with its chunk
# number and the column list ['Au_ppm'] (presumably the columns to normalise).
def _load_chunk(chunk_id):
    """Return the work item ``(frame, chunk_id, ['Au_ppm'])`` for one chunk.

    Reads ``samples_buffered_<chunk_id>.pickle`` from ``data_src`` and removes
    the 'geometry', 'stroke' and 'index_right' columns from the loaded frame.
    """
    pickle_path = os.path.join(data_src, 'samples_buffered_%s.pickle' % chunk_id)
    # pickle.load can execute arbitrary code: only point this at trusted files.
    with open(pickle_path, 'rb') as pickle_file:
        frame = pickle.load(pickle_file)

    # Dropped in place so the unpickled object itself is mutated and keeps its type.
    frame.drop(['geometry', 'stroke', 'index_right'], axis = 1, inplace = True)
    return (frame, chunk_id, ['Au_ppm'])


chunks = [_load_chunk(chunk_id) for chunk_id in range(8)]

In [3]:
# Echo the loaded work items; each entry is a (frame, chunk number, ['Au_ppm']) tuple.
# NOTE(review): this prints every full frame — consider showing a small slice instead.
chunks

[(       index  As_ppm  Au_ppm  FILEID  FILE_ID      LAT94       LNG94  \
  0          0     NaN     NaN     NaN    109.0 -29.378209  150.282157   
  1          0     NaN     NaN     NaN    109.0 -29.363753  150.294260   
  2          0     NaN     NaN     NaN    109.0 -29.396065  150.313078   
  3          0     NaN     NaN     NaN    109.0 -29.388715  150.314466   
  4          0     2.8   0.011     NaN    252.0 -31.994859  141.710774   
  5          0     2.5   0.005     NaN    252.0 -31.993518  141.710919   
  6          1     6.0  -0.001     NaN    252.0 -31.965162  141.607901   
  7          1     3.6   0.012     NaN    252.0 -31.959100  141.615062   
  8          2     1.1   0.004     NaN    252.0 -32.090668  141.552975   
  9          2     1.8   0.006     NaN    252.0 -32.090115  141.553243   
  10         2     3.4   0.002     NaN    252.0 -32.089702  141.553549   
  11         2     2.8   0.005     NaN    252.0 -32.089300  141.553881   
  12         2     2.1   0.003     NaN

In [4]:
# Run normalise_args_helper over every work item in `chunks` using a pool of
# worker processes.
num_processors = 8

# Use the pool as a context manager so the worker processes are shut down as
# soon as map() has returned, instead of lingering in the kernel after the cell
# finishes. map() blocks until every item is processed, so no work is lost.
with Pool(processes = num_processors) as p:
    output = p.map(normalise_args_helper, chunks)

# One return value per work item. The helper returns None for each chunk;
# presumably it writes its results to disk instead — confirm in normalise_worker_helper.
print(output)

[None, None, None, None, None, None, None, None]


In [6]:
# Load the normalised pickle for chunk 0 from the output directory so it can be inspected.
output_parent = os.path.dirname(os.getcwd())
data_fout = os.path.join(output_parent, 'data_out')
example_path = os.path.join(data_fout, 'samples_buffered_normalised_0.pickle')

# pickle.load can execute arbitrary code: only read files produced by this pipeline.
with open(example_path, 'rb') as f:
    samples_example = pickle.load(f)

In [7]:
# Display the frame loaded from 'samples_buffered_normalised_0.pickle'.
samples_example

Unnamed: 0,index,As_ppm,Au_ppm,FILEID,FILE_ID,LAT94,LNG94,RIN,RPT_ID,RPT_TYPE,...,SAMPLEID,MR_AUTHOR,MR_CONFIDENTIALITY,MR_REPYEAR,EASTING,NORTHING,Au_ppm_nn,Au_ppm_fn,Au_ppm_log,Au_ppm_nml
0,0,,0.000,,109.0,-29.378209,150.282157,R00029158,29,A,...,6155380,Rio Tinto Exploration Pty Ltd,O,2003,1.558176e+06,-3.422245e+06,0.000,0.0005,-3.301030,
1,0,,0.000,,109.0,-29.363753,150.294260,R00029158,29,A,...,6155381,Rio Tinto Exploration Pty Ltd,O,2003,1.559533e+06,-3.420825e+06,0.000,0.0005,-3.301030,
2,0,,0.000,,109.0,-29.396065,150.313078,R00029158,29,A,...,6155554,Rio Tinto Exploration Pty Ltd,O,2003,1.560865e+06,-3.424569e+06,0.000,0.0005,-3.301030,
3,0,,0.000,,109.0,-29.388715,150.314466,R00029158,29,A,...,6155555,Rio Tinto Exploration Pty Ltd,O,2003,1.561102e+06,-3.423788e+06,0.000,0.0005,-3.301030,
4,0,2.8,0.011,,252.0,-31.994859,141.710774,R00029266,32,A,...,370028,Golden Cross Operations Pty Ltd\r\nSipa Explor...,O,2003,7.219072e+05,-3.630439e+06,0.011,0.0110,-1.958607,0.666667
5,0,2.5,0.005,,252.0,-31.993518,141.710919,R00029266,32,A,...,370027,Golden Cross Operations Pty Ltd\r\nSipa Explor...,O,2003,7.219298e+05,-3.630293e+06,0.005,0.0050,-2.301030,0.000000
6,1,6.0,-0.001,,252.0,-31.965162,141.607901,R00029266,32,A,...,370251,Golden Cross Operations Pty Ltd\r\nSipa Explor...,O,2003,7.124852e+05,-3.626594e+06,-0.001,0.0005,-3.301030,0.000000
7,1,3.6,0.012,,252.0,-31.959100,141.615062,R00029266,32,A,...,370026,Golden Cross Operations Pty Ltd\r\nSipa Explor...,O,2003,7.131954e+05,-3.625969e+06,0.012,0.0120,-1.920819,0.666667
8,2,1.1,0.004,,252.0,-32.090668,141.552975,R00029266,32,A,...,370003,Golden Cross Operations Pty Ltd\r\nSipa Explor...,O,2003,7.065188e+05,-3.640056e+06,0.004,0.0040,-2.397940,0.658961
9,2,1.8,0.006,,252.0,-32.090115,141.553243,R00029266,32,A,...,370004,Golden Cross Operations Pty Ltd\r\nSipa Explor...,O,2003,7.065475e+05,-3.639997e+06,0.006,0.0060,-2.221849,0.787450
