In [22]:
##### SALARY PREDICTION
# Uses Kaggle's Job Salary Prediction dataset
# Ninsth

##### CONSTANTS
# Run switches
QUICK_ROWS = 0 # quick test. 0: use all rows; >0: keep only the first QUICK_ROWS rows (should be above 3000). Also shrinks the grid-search tree counts.
USE_SAVED_FRAME = True  # True: import the previously exported vectorized frame instead of rebuilding it from DATA_FILE
USE_SAVED_W2V_MODEL = True  # passed to preprocess(): True loads the saved word2vec models, False retrains and saves them
USE_SAVED_MODEL = False  # not referenced by the code visible in this notebook section

# Input data
DATA_FILE = "/Users/Ninhsth/Downloads/Train_rev1.csv"
RESPONSE_NAME = "SalaryNormalized"  # response (target) column for every model
STOPPING_METRIC = "mae"  # early-stopping metric; also used as the y-axis label of the scoring-history plot

# Directory holding saved word2vec models, exported frames and model-parameter JSON files
INOUT_DIR = "/Users/Ninhsth/gd/ninhsh.work/github/navi-reco-py/inout"
RESTART_H2O = True # shut down an already-running H2O cluster before h2o.init() to release resources after heavy jobs
SHUTDOWN_H2O = False  # not referenced by the code visible in this notebook section

WORD_VEC_SIZE = 200  # vec_size of both word2vec models
EPOCHS = 5  # word2vec training epochs
GOOD_DISTANCE_PERCENTAGE = 30  # evaluate(): a prediction is "good" when its absolute error is at most this % of the true salary
SEED = 12345678901  # seed for the data split and the models
VERBAL = False  # True: print extra diagnostics (describe() output, intermediate timestamps)


# Model ids / file names used under INOUT_DIR
FULLDESC_W2V_MODEL_NAME = "fulldesc_w2v_model"
TITLE_W2V_MODEL_NAME = "title_w2v_model"
VEC_JOB_DF_NAME = "vec_job_df"
VECCAT_JOB_DF_NAME = "veccat_job_df"
BEST_SAL_MODEL_NAME = "best_sal_model"

# Tokens removed by tokenize(): common English words, job-advert boilerplate and Vietnamese function words.
# A few entries are repeated (e.g. "in", "a", "by", "not", "from", "so"); this is harmless for a membership test.
STOP_WORDS = ["ax","i","you","edu","s","t","m","subject","can","lines","re","what",
               "there","all","we","one","the","a","an","of","or","in","for","by","on",
               "but","is","in","a","not","with","as","was","if","they","are","this","and","it","have",
               "from","at","my","be","by","not","that","to","from","com","org","like","likes","so"
    , "our", "will", "looking", "both"        
    , "vacancies", "candidate", "up", "usd", "exp", "welcome", "urgent", "hot", "good", "new", "attractive", "___", "years", "year", "salary", "need", "needed", "very"
    , "bị", "bởi", "cả", "các", "cái", "cần", "càng", "chỉ", "chiếc", "cho", "chứ", "chưa", "chuyện", "có", "có_thể", "cứ", "của", "cùng", "cũng", "đã", "đang", "đây", "để", "đến_nỗi", "đều", "điều", "do", "đó", "được", "dưới", "gì", "khi", "không", "là", "lại", "lên", "lúc", "mà", "mỗi", "một_cách", "này", "nên", "nếu", "ngay", "nhiều", "như", "nhưng", "những", "nơi", "nữa", "phải", "qua", "ra", "rằng", "rằng", "rất", "rất", "rồi", "sau", "sẽ", "so", "sự", "tại", "theo", "thì", "trên", "trước", "từ", "từng", "và", "vẫn", "vào", "vậy", "vì", "việc", "với", "vừa"
  ]

In [23]:
%matplotlib inline
import time, datetime, sys
import json
import matplotlib
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import matplotlib.mlab as mlab

import h2o
from h2o.estimators.word2vec import H2OWord2vecEstimator
from h2o.estimators.gbm import H2OGradientBoostingEstimator
from h2o.estimators.random_forest import H2ORandomForestEstimator
from h2o.estimators.deeplearning import H2ODeepLearningEstimator
from h2o.grid import H2OGridSearch
from h2o.estimators import H2OXGBoostEstimator

In [24]:
##### FUNCTIONS
def niceTime():
    """Return the current local time as a 'YYYY-MM-DD HH:MM:SS' string."""
    local_now = time.localtime(time.time())
    return time.strftime('%Y-%m-%d %H:%M:%S', local_now)

def StartOfFunc(funcname=""):
    """Print a timestamped START marker for the function named ``funcname``."""
    stamp = niceTime()
    print(stamp, '- START ', funcname)
    
def EndOfFunc(funcname=""):
    """Print a timestamped END marker for the function named ``funcname``."""
    stamp = niceTime()
    print(stamp, '- END ', funcname)

In [25]:
def tokenize(sentences, stop_word = STOP_WORDS):
    """Break a text column into a single column of cleaned, lower-cased tokens.

    Steps: split on non-word characters, lower-case, drop tokens shorter than
    2 characters, drop tokens containing a digit, drop stop words.

    Args:
        sentences: single-column H2O string frame to tokenize.
        stop_word: collection of tokens to remove. Defaults to STOP_WORDS.
            (Previously this argument was accepted but ignored.)

    Returns:
        H2O frame with one token per row. NA rows are deliberately kept by the
        length and stop-word filters: H2O's tokenize() uses NA to separate the
        original input rows, and word2vec transform relies on those separators.
    """
    StartOfFunc(sys._getframe().f_code.co_name)
    tokenized = sentences.tokenize("\\W+")
    if VERBAL: print(niceTime(),"tokenized")

    tokenized_lower = tokenized.tolower()
    # Keep tokens of 2+ characters, plus the NA row separators.
    tokenized_filtered = tokenized_lower[(tokenized_lower.nchar() >= 2) | (tokenized_lower.isna()),:]
    if VERBAL: print(niceTime(),"filtered")

    # Drop every token that contains a digit.
    tokenized_words = tokenized_filtered[tokenized_filtered.grep("[0-9]",invert=True,output_logical=True),:]
    # Drop stop words (honouring the caller-supplied list), again keeping the NA separators.
    tokenized_words = tokenized_words[(tokenized_words.isna()) | (~ tokenized_words.isin(stop_word)),:]
    if VERBAL: print("tokenized_words:\n", tokenized_words.describe())

    EndOfFunc(sys._getframe().f_code.co_name)
    return tokenized_words

In [26]:
def load_data(data_file):
    """Import the job-salary CSV into H2O and return the frame used for modelling.

    The file is parsed with explicit column names and types, the Id, SalaryRaw
    and LocationRaw columns are dropped, and when QUICK_ROWS > 0 only the first
    QUICK_ROWS rows are kept.
    """
    func_name = sys._getframe().f_code.co_name
    StartOfFunc(func_name)

    # (column name, H2O column type) in file order
    column_spec = [
        ("Id", "int"),
        ("Title", "string"),
        ("FullDescription", "string"),
        ("LocationRaw", "enum"),
        ("LocationNormalized", "enum"),
        ("ContractType", "enum"),
        ("ContractTime", "enum"),
        ("Company", "enum"),
        ("Category", "enum"),
        ("SalaryRaw", "string"),
        ("SalaryNormalized", "int"),
        ("SourceName", "string"),
    ]
    column_names = [name for name, _ in column_spec]
    column_types = [h2o_type for _, h2o_type in column_spec]

    vjobs_df = h2o.import_file(
        data_file,
        destination_frame="vjob",
        col_names=column_names,
        col_types=column_types,
        header=1,
    )

    # Dropped after import because ignoring the columns at import time did not work.
    vjobs_df = vjobs_df.drop(['Id', 'SalaryRaw', 'LocationRaw'])
    if QUICK_ROWS > 0:
        vjobs_df = vjobs_df.head(QUICK_ROWS)

    print(niceTime(), "Data description")
    if VERBAL:
        vjobs_df.describe()

    # No category filtering is applied; the whole frame is returned.
    data_df = vjobs_df

    EndOfFunc(func_name)
    return data_df

In [27]:
def split(df):
    """Split ``df`` into train / validation / test frames (ratios 0.7, 0.15, rest).

    Each part's frame_id is set to the source frame_id plus a
    "_train" / "_valid" / "_test" suffix. Returns [train_df, valid_df, test_df].
    """
    func_name = sys._getframe().f_code.co_name
    StartOfFunc(func_name)

    train_df, valid_df, test_df = df.split_frame(ratios=[0.7, 0.15], seed=SEED)
    for part, suffix in ((train_df, "_train"), (valid_df, "_valid"), (test_df, "_test")):
        part.frame_id = df.frame_id + suffix

    EndOfFunc(func_name)
    return [train_df, valid_df, test_df]

In [28]:
def find_synonyms(word, w2v_model):
    """Print the 5 synonyms that ``w2v_model`` reports for ``word``."""
    synonyms = w2v_model.find_synonyms(word, count=5)
    print(synonyms)

In [29]:
def vectorize_title(job_df, use_saved_model=False):
    """Replace the Title column of ``job_df`` with averaged word2vec columns.

    Args:
        job_df: H2O frame containing a "Title" column.
        use_saved_model: True loads the title word2vec model from INOUT_DIR;
            False trains a new one and saves it there.

    Returns:
        New frame (frame_id "vec_job_df"): ``job_df`` with the title vectors
        appended and the Title column dropped.
    """
    func_name = sys._getframe().f_code.co_name
    StartOfFunc(func_name)

    print("Break Title into sequence of words")
    title_tokens = tokenize(job_df["Title"])

    if not use_saved_model:
        print("Build word2vec model")
        w2v_model = H2OWord2vecEstimator(
            sent_sample_rate=0.0,
            epochs=EPOCHS,
            vec_size=WORD_VEC_SIZE,
        )
        w2v_model.train(training_frame=title_tokens)
        w2v_model.model_id = TITLE_W2V_MODEL_NAME

        model_path = h2o.save_model(model=w2v_model, path=INOUT_DIR, force=True)
        print("w2v_model saved to: ", model_path)
    else:
        saved_model_path = INOUT_DIR + "/" + TITLE_W2V_MODEL_NAME
        print("Load w2v model from " + saved_model_path)
        w2v_model = h2o.load_model(saved_model_path)

    print("Calculate a vector for each job title")
    job_vecs = w2v_model.transform(title_tokens, aggregate_method="AVERAGE")
    if VERBAL:
        print("job_vecs.describe:\n", job_vecs.describe())

    combined_df = job_df.cbind(job_vecs)
    combined_df.frame_id = "vec_job_df"
    vec_job_df = combined_df.drop('Title')

    EndOfFunc(func_name)

    return vec_job_df

def preprocess(job_df, use_saved_model = False):
    '''Build the two modelling frames from the raw job frame.

    Returns [vec_job_df, veccat_job_df]:
        1. vec_job_df: Title and FullDescription both replaced by word2vec vectors.
        2. veccat_job_df: Title converted to a categorical column, FullDescription
           replaced by word2vec vectors.

    Rows whose FullDescription vector is missing (first vector column is NA) are
    removed from both frames.

    Note: veccat_job_df is built on the ``job_df`` object itself, so the Title
    column of the frame passed in is converted to categorical as well.
    '''
    func_name = sys._getframe().f_code.co_name
    StartOfFunc(func_name)

    # Title -> vectors (must run before Title is converted to a factor below).
    vec_job_df = vectorize_title(job_df, use_saved_model=use_saved_model)
    if VERBAL:
        print(vec_job_df.describe())

    print(niceTime(), "Convert Title to category data type")
    job_df['Title'] = job_df['Title'].asfactor()
    veccat_job_df = job_df

    print(niceTime(), "Tokenize")
    desc_tokens = tokenize(job_df["FullDescription"])
    if VERBAL:
        desc_tokens.describe()

    if not use_saved_model:
        print(niceTime(), "Train with H2OWord2vecEstimator")
        w2v_model = H2OWord2vecEstimator(
            sent_sample_rate=0.0001,
            epochs=EPOCHS,
            vec_size=WORD_VEC_SIZE,
        )
        w2v_model.train(training_frame=desc_tokens)
        w2v_model.model_id = FULLDESC_W2V_MODEL_NAME

        model_path = h2o.save_model(model=w2v_model, path=INOUT_DIR, force=True)
        print("w2v_model saved to: ", model_path)
    else:
        saved_model_path = INOUT_DIR + "/" + FULLDESC_W2V_MODEL_NAME
        print("Load w2v model from " + saved_model_path)
        w2v_model = h2o.load_model(saved_model_path)

    print(niceTime(), "Calculate a vector for each FullDescription")
    desc_vecs = w2v_model.transform(desc_tokens, aggregate_method="AVERAGE")
    print(niceTime(), "Prepare training&validation data (keep only FullDescription made of known words)")
    has_vector = ~ desc_vecs["C1"].isna()
    if VERBAL:
        has_vector.describe()

    print(niceTime(), "Combine vec column")
    kept_vecs = desc_vecs[has_vector, :]

    vec_job_df = vec_job_df[has_vector, :].cbind(kept_vecs)
    vec_job_df.frame_id = "vec_job_df"
    vec_job_df = vec_job_df.drop('FullDescription')

    veccat_job_df = veccat_job_df[has_vector, :].cbind(kept_vecs)
    veccat_job_df.frame_id = "veccat_job_df"
    veccat_job_df = veccat_job_df.drop('FullDescription')

    EndOfFunc(func_name)

    return [vec_job_df, veccat_job_df]

In [30]:
def trainGBM(train_df,valid_df, col_sample_rate = 1):
    """Train a single GBM on ``train_df`` and print its validation performance.

    Args:
        train_df: training frame; all of its columns are passed as predictors.
        valid_df: validation frame.
        col_sample_rate: GBM column sample rate.

    Returns:
        The trained H2OGradientBoostingEstimator.
    """
    func_name = sys._getframe().f_code.co_name
    StartOfFunc(func_name)

    print("Build a GBM model")
    gbm_settings = dict(
        nfolds=5,
        ignored_columns=['Id', 'SalaryRaw', 'LocationRaw'],
        ntrees=150,
        seed=SEED,
        learn_rate=0.5,
        stopping_tolerance=0.05,
        col_sample_rate=col_sample_rate,
    )
    gbm_model = H2OGradientBoostingEstimator(**gbm_settings)

    gbm_model.train(
        x=train_df.names,
        y=RESPONSE_NAME,
        training_frame=train_df,
        validation_frame=valid_df,
    )

    validation_perf = gbm_model.model_performance(valid=True)
    print(validation_perf)
    EndOfFunc(func_name)

    return gbm_model

In [31]:
def trainRF(train_df,valid_df, col_sample_rate = 1):
    """Train a single random-forest (DRF) model and print its validation performance.

    Fixes two copy-paste defects of the previous version: it built a GBM
    estimator, and it printed/returned the undefined name ``gbm_model``
    instead of the model trained here.

    Args:
        train_df: training frame; all of its columns are passed as predictors.
        valid_df: validation frame.
        col_sample_rate: fraction of columns sampled for each tree. DRF has no
            ``col_sample_rate`` option, so the value is passed as
            ``col_sample_rate_per_tree``. GBM's ``learn_rate`` does not apply
            to DRF and is not set.

    Returns:
        The trained H2ORandomForestEstimator.
    """
    StartOfFunc(sys._getframe().f_code.co_name)

    print("Build a RF model")
    model = H2ORandomForestEstimator(nfolds=5,
                                     ignored_columns=['Id', 'SalaryRaw', 'LocationRaw'],
                                     ntrees=150,
                                     seed=SEED,
                                     stopping_tolerance=0.05,
                                     col_sample_rate_per_tree=col_sample_rate)

    model.train(x = train_df.names,
                y=RESPONSE_NAME,
                training_frame = train_df,
                validation_frame = valid_df)

    print(model.model_performance(valid=True))
    EndOfFunc(sys._getframe().f_code.co_name)

    return model

In [32]:
def trainDL(train_df, valid_df):
    """Train a deep-learning model and print its validation performance.

    Now logs a START marker as well, so the START/END trace is balanced like
    in the other training functions.

    Args:
        train_df: training frame; all of its columns are passed as predictors.
        valid_df: validation frame.

    Returns:
        The trained H2ODeepLearningEstimator.
    """
    StartOfFunc(sys._getframe().f_code.co_name)

    print("Build a DL model")
    model = H2ODeepLearningEstimator(nfolds=5, seed = SEED, stopping_metric = STOPPING_METRIC
                                     , hidden = [200, 200]
                                     , epochs = 8
                                     # Learning rate (higher => less stable, lower => slower convergence). Default 0.005.
                                     # With 0.003 the MAE was observed to be unstable (large up/down swings).
                                     # NOTE(review): H2O documents `rate` as applying only when adaptive_rate is
                                     # disabled; adaptive_rate is not set here - confirm this value has an effect.
                                     , rate = 0.005
                                     , sparse = True # Sparse data handling (more efficient for data with lots of 0 values). Default False.
                                     , stopping_tolerance= 0.1 # Stop when the relative improvement of the stopping metric falls below this value.
                                     , activation= 'rectifier_with_dropout'
                                     , input_dropout_ratio = 0.25
                                     , hidden_dropout_ratios = [0.6, 0.6] # One value per hidden layer (can improve generalization); H2O default is 0.5.
                                     , missing_values_handling = 'mean_imputation' # "mean_imputation" (default) or "skip"
                                    )

    model.train(x = train_df.names,
                y=RESPONSE_NAME,
                training_frame = train_df,
                validation_frame = valid_df)

    print(model.model_performance(valid=True))
    EndOfFunc(sys._getframe().f_code.co_name)

    return model

In [33]:
def grid_init_GBM():
    """Create an untrained H2O grid search over GBM hyper-parameters.

    ``param`` holds the fixed estimator settings; ``hyper_parameters`` maps each
    tuned option to a LIST of candidate values, as H2OGridSearch expects.
    ``ntrees`` and ``histogram_type`` used to be passed as bare scalars, unlike
    the XGBoost grid; they are now one-element lists.

    With QUICK_ROWS > 0 only 3 trees are built so a smoke test finishes quickly.

    Returns:
        H2OGridSearch wrapping an H2OGradientBoostingEstimator.
    """
    l_ntrees = 3 if QUICK_ROWS > 0 else 1000

    param = {
         "ignored_columns": ['Id', 'SalaryRaw', 'LocationRaw']
        , "seed": SEED # a fixed seed can overfit the choice to one particular random sample
        , "nfolds": 4 # default 0; 5-10 is good but 10 takes more time
        }
    hyper_parameters = {
          'ntrees': [l_ntrees] # default 50
        , 'max_depth': [10] # default 5; higher values may overfit
        , 'col_sample_rate': [0.8]
        , "sample_rate": [0.85]
        , "histogram_type": ['quantiles_global']
        , 'learn_rate': [0.1]
        , 'min_rows': [60] # default 10; higher values help prevent overfitting
        , 'nbins_cats': [800] # default 1024; higher values can lead to more overfitting
        }

    print("hyper_parameters: ", hyper_parameters)

    grid_search = H2OGridSearch(H2OGradientBoostingEstimator(**param)
                        , hyper_params=hyper_parameters)

    return grid_search

In [34]:
def grid_init_RF():
    '''Create an untrained H2O grid search over random-forest hyper-parameters.

    ``hyper_parameters`` maps each tuned option to a LIST of candidate values,
    as H2OGridSearch expects. ``ntrees`` and ``max_depth`` used to be bare
    scalars, unlike the XGBoost grid; they are now one-element lists.

    Timing notes from earlier runs (kept from the original author):
      - trees [50,100], max depth [20,40]: H2O estimated 5 hours - too slow.
      - trees [50,100], max depth [15,30]: 4 hours.

    With QUICK_ROWS > 0 only 3 trees are built so a smoke test finishes quickly.

    Returns:
        H2OGridSearch wrapping an H2ORandomForestEstimator.
    '''
    l_ntrees = 3 if QUICK_ROWS > 0 else 500

    param = {
         "ignored_columns": ['Id', 'SalaryRaw', 'LocationRaw']
        , "seed": SEED # a fixed seed can overfit the choice to one particular random sample
        , "nfolds": 4 # default 0; 5-10 is good but 10 takes more time
        }
    hyper_parameters = {
        'ntrees': [l_ntrees]
        , 'max_depth': [10]
        }

    print("hyper_parameters: ", hyper_parameters)

    grid_search = H2OGridSearch(H2ORandomForestEstimator(**param)
                        , hyper_params=hyper_parameters)

    return grid_search

In [35]:
def grid_init_XGBoost():
    """Create an untrained H2O grid search over XGBoost hyper-parameters.

    Fixed estimator settings are in ``param``; the tuned options (each a list of
    candidate values) are in ``hyper_parameters``. Both are printed.
    With QUICK_ROWS > 0 only 2 and 3 trees are tried so a smoke test is fast.

    Tuning references:
      http://lightgbm.readthedocs.io/en/latest/Parameters-Tuning.html
      http://docs.h2o.ai/h2o/latest-stable/h2o-docs/data-science/xgboost.html

    Returns:
        H2OGridSearch wrapping an H2OXGBoostEstimator.
    """
    l_ntrees = [2, 3] if QUICK_ROWS > 0 else [1400]

    hyper_parameters = dict(
        ntrees=l_ntrees,
        col_sample_rate=[0.6],
        learn_rate=[0.03],   # default is 0.3
        max_leaves=[900],
        # default 256; smaller is faster with almost the same accuracy, see
        # http://lightgbm.readthedocs.io/en/latest/GPU-Performance.html
        max_bins=[63],
    )

    param = dict(
        seed=SEED,           # a fixed seed can overfit the choice to one particular random sample
        stopping_metric=STOPPING_METRIC,
        nfolds=3,            # default 0; 5-10 is good but 10 takes more time
        tree_method='hist',
        grow_policy='lossguide',
        max_depth=0,
        stopping_rounds=3,
        # "ignored_columns" is intentionally not set here: it did not work with this estimator.
    )

    print("hyper_parameters: ", hyper_parameters)
    print("parameters: ", param)

    xgb_estimator = H2OXGBoostEstimator(**param)
    grid_search = H2OGridSearch(xgb_estimator, hyper_params=hyper_parameters)

    return grid_search

In [36]:
def grid_train(train_df, valid_df, algorithm = ""):
    '''Run a grid search for the chosen algorithm and return the resulting grid.

    Args:
        train_df: training frame; all of its columns are passed as predictors.
        valid_df: validation frame.
        algorithm: estimator class name selecting the grid to run:
            "" or "H2OGradientBoostingEstimator" -> GBM,
            "H2OXGBoostEstimator" -> XGBoost,
            "H2ORandomForestEstimator" -> random forest.

    Returns:
        The grid fetched with h2o.get_grid() after training (also shown).

    Raises:
        ValueError: if ``algorithm`` is not one of the supported names
            (previously this surfaced as an UnboundLocalError).

    Note:
    + categorical_encoding='one_hot_explicit' with histogram_type='quantiles_global'
      was tried for GBM with only [20,50] trees and max depth 7: H2O estimated
      46 hours. With one_hot_explicit alone, even at col_sample_rate 0.3, H2O
      still estimated 6 hours, so one_hot_explicit is not used in this project.
    '''
    StartOfFunc(sys._getframe().f_code.co_name)

    if algorithm in ("", H2OGradientBoostingEstimator.__name__):
        grid_search = grid_init_GBM()
    elif algorithm == H2OXGBoostEstimator.__name__:
        grid_search = grid_init_XGBoost()
    elif algorithm == H2ORandomForestEstimator.__name__:
        grid_search = grid_init_RF()
    else:
        raise ValueError("Unsupported algorithm for grid_train: %r" % (algorithm,))

    grid_search.train(x = train_df.names,
                      y = RESPONSE_NAME,
                      training_frame = train_df,
                      validation_frame = valid_df)

    grid = h2o.get_grid(grid_search.grid_id)
    grid.show()

    EndOfFunc(sys._getframe().f_code.co_name)

    return grid

In [37]:
def show_score_his(model,interateType="Trees"):
    """Plot training and validation MAE from the model's scoring history.

    Args:
        model: trained H2O model providing scoring_history().
        interateType: x-axis label and selector: "Trees" plots against
            number_of_trees, "Epochs" against epochs; any other value leaves
            the x value at 0.
    """
    func_name = sys._getframe().f_code.co_name
    StartOfFunc(func_name)

    score_history = model.scoring_history()
    plt.title('Scoring history')
    plt.xlabel(interateType)
    plt.ylabel(STOPPING_METRIC)

    if interateType == "Trees":
        x = score_history.number_of_trees
    elif interateType == "Epochs":
        x = score_history.epochs
    else:
        x = 0

    # Train curve first (blue), then validation curve (red).
    train_mae = score_history.training_mae
    plt.plot(x, train_mae, '-b', label='Train')
    valid_mae = score_history.validation_mae
    plt.plot(x, valid_mae, '-r', label='Valid')

    plt.legend(loc='upper right')

    EndOfFunc(func_name)

In [38]:
def evaluate(model, test_df):
    """Score ``model`` on ``test_df`` and report MAE and the share of "good" predictions.

    A prediction is "good" when its absolute error is at most
    GOOD_DISTANCE_PERCENTAGE percent of the true response value. A histogram of
    the percentage errors is drawn.

    Fix: ``perf.mae`` is a method on H2O metrics objects; it is now called, so
    the numeric MAE is printed and returned rather than a bound method.

    Args:
        model: trained H2O model.
        test_df: H2O frame containing the RESPONSE_NAME column.

    Returns:
        [good_pred_rate, mae]: rounded percentage of good predictions, and the
        test-set MAE.
    """
    StartOfFunc(sys._getframe().f_code.co_name)

    pred_df = model.predict(test_df)
    perf = model.model_performance(test_data=test_df)
    mae = perf.mae()

    print("perf.mae:", mae)

    # Absolute prediction error per row.
    diff_df = test_df[RESPONSE_NAME] - pred_df
    diff_df = diff_df.abs()
    diff_df.set_name(0,'pred_distance')

    # Error as a percentage of the true value.
    diff_percentage_df = diff_df*100/test_df[RESPONSE_NAME]
    diff_percentage_df.set_name(0,'pred_distance_percentage')
    good_pred_count = len(diff_percentage_df[diff_percentage_df['pred_distance_percentage'] <= GOOD_DISTANCE_PERCENTAGE])
    total_count = len(diff_percentage_df)
    good_pred_rate = np.round(good_pred_count*100/total_count)
    print("Good pred %: ", good_pred_rate, " (", good_pred_count, "/", total_count, ")" )
    diff_percentage_df.hist()

    EndOfFunc(sys._getframe().f_code.co_name)
    return [good_pred_rate, mae]

In [39]:
def train_evaluate(data_df):
    '''Split the data, grid-train an XGBoost model, evaluate it and save its parameters.

    Steps: split ``data_df`` into train/valid/test, run the XGBoost grid search
    and take the first model of the returned grid, evaluate it on the test
    part, plot its scoring history and variable importance, and dump the model
    parameters to "<INOUT_DIR>/<model_id>_params.json".

    To try another algorithm, pass H2ORandomForestEstimator.__name__ or
    H2OGradientBoostingEstimator.__name__ to grid_train(), or call
    trainDL(train_df, valid_df) instead.

    Returns:
        [good_pred_rate, mae, model]
    '''
    StartOfFunc(sys._getframe().f_code.co_name)

    print(data_df.frame_id)
    [train_df, valid_df, test_df] = split(data_df)
    model = grid_train(train_df, valid_df, algorithm = H2OXGBoostEstimator.__name__ )[0]

    [good_pred_rate, mae] = evaluate(model, test_df)

    show_score_his(model)

    # The importance plot is best-effort: report why it failed, but keep going.
    try:
        model.varimp_plot()
    except Exception as exc:
        print("Error with model.varimp_plot()", repr(exc))

    model_param_file_name = INOUT_DIR + "/" + model.model_id + "_params.json"
    print(niceTime(), "Save model params to ", model_param_file_name)
    with open(model_param_file_name, 'w') as outfile:
        json.dump(model.get_params(), outfile)

    EndOfFunc(sys._getframe().f_code.co_name)
    return [good_pred_rate, mae, model]

In [40]:
############################### MAIN ####################################
start_time = niceTime()
if (RESTART_H2O and h2o.cluster()):
    h2o.cluster().shutdown()
    time.sleep(2)
    
h2o.init(max_mem_size="13G")
niceTime()

H2O session _sid_8afa closed.
Checking whether there is an H2O instance running at http://localhost:54321..... not found.
Attempting to start a local H2O server...
  Java Version: java version "1.8.0_66"; Java(TM) SE Runtime Environment (build 1.8.0_66-b17); Java HotSpot(TM) 64-Bit Server VM (build 25.66-b17, mixed mode)
  Starting server from /Library/Frameworks/Python.framework/Versions/3.6/lib/python3.6/site-packages/h2o/backend/bin/h2o.jar
  Ice root: /var/folders/13/thn2h7rd5915m6_40jwqlm9h0000gn/T/tmp0fe3tuja
  JVM stdout: /var/folders/13/thn2h7rd5915m6_40jwqlm9h0000gn/T/tmp0fe3tuja/h2o_Ninhsth_started_from_python.out
  JVM stderr: /var/folders/13/thn2h7rd5915m6_40jwqlm9h0000gn/T/tmp0fe3tuja/h2o_Ninhsth_started_from_python.err
  Server is running at http://127.0.0.1:54321
Connecting to H2O server at http://127.0.0.1:54321... successful.


0,1
H2O cluster uptime:,03 secs
H2O cluster version:,3.14.0.3
H2O cluster version age:,4 months and 16 days !!!
H2O cluster name:,H2O_from_python_Ninhsth_ol4xo1
H2O cluster total nodes:,1
H2O cluster free memory:,11.56 Gb
H2O cluster total cores:,8
H2O cluster allowed cores:,8
H2O cluster status:,"accepting new members, healthy"
H2O connection url:,http://127.0.0.1:54321


'2018-02-08 05:45:22'

In [None]:
# Load the vectorized job frame from disk, or rebuild it (and the categorical
# variant) from the raw CSV and export both for later runs.
if USE_SAVED_FRAME:
    print("USE SAVED FRAME IN ", INOUT_DIR)
    vec_job_df = h2o.import_file(path=INOUT_DIR + '/' + VEC_JOB_DF_NAME)
#     veccat_job_df = h2o.import_file(path=INOUT_DIR + '/' + VECCAT_JOB_DF_NAME)
    # H2OFrame.head() limits the number of columns by default (cols=200), and this
    # frame is wider than that, so ask for all columns explicitly.
    if (QUICK_ROWS>0): vec_job_df = vec_job_df.head(rows=QUICK_ROWS, cols=vec_job_df.ncols)

else:
    print("LOAD DATA FILE ", DATA_FILE)
    job_df = load_data(DATA_FILE)
    job_df.frame_id = "job_df"
    [vec_job_df, veccat_job_df] = preprocess(job_df, use_saved_model=USE_SAVED_W2V_MODEL)
    vec_job_df.frame_id = VEC_JOB_DF_NAME
    veccat_job_df.frame_id = VECCAT_JOB_DF_NAME

    h2o.export_file(frame=vec_job_df, path=INOUT_DIR + '/' + VEC_JOB_DF_NAME, force=True)
    h2o.export_file(frame=veccat_job_df, path=INOUT_DIR + '/' + VECCAT_JOB_DF_NAME, force=True)

# load_data() already removes 'Id' on the rebuild path, so only drop the column
# when the frame (e.g. one exported earlier) still carries it.
if 'Id' in vec_job_df.names:
    vec_job_df = vec_job_df.drop(['Id'])

vec_job_df.describe()
# veccat_job_df.describe()

USE SAVED FRAME IN  /Users/Ninhsth/gd/ninhsh.work/github/navi-reco-py/inout
Parse progress: |█████████████████████████████████████████████████████████| 100%
Rows:244768
Cols:407




Unnamed: 0,LocationNormalized,ContractType,ContractTime,Company,Category,SalaryNormalized,SourceName,C1,C2,C3,C4,C5,C6,C7,C8,C9,C10,C11,C12,C13,C14,C15,C16,C17,C18,C19,C20,C21,C22,C23,C24,C25,C26,C27,C28,C29,C30,C31,C32,C33,C34,C35,C36,C37,C38,C39,C40,C41,C42,C43,C44,C45,C46,C47,C48,C49,C50,C51,C52,C53,C54,C55,C56,C57,C58,C59,C60,C61,C62,C63,C64,C65,C66,C67,C68,C69,C70,C71,C72,C73,C74,C75,C76,C77,C78,C79,C80,C81,C82,C83,C84,C85,C86,C87,C88,C89,C90,C91,C92,C93,C94,C95,C96,C97,C98,C99,C100,C101,C102,C103,C104,C105,C106,C107,C108,C109,C110,C111,C112,C113,C114,C115,C116,C117,C118,C119,C120,C121,C122,C123,C124,C125,C126,C127,C128,C129,C130,C131,C132,C133,C134,C135,C136,C137,C138,C139,C140,C141,C142,C143,C144,C145,C146,C147,C148,C149,C150,C151,C152,C153,C154,C155,C156,C157,C158,C159,C160,C161,C162,C163,C164,C165,C166,C167,C168,C169,C170,C171,C172,C173,C174,C175,C176,C177,C178,C179,C180,C181,C182,C183,C184,C185,C186,C187,C188,C189,C190,C191,C192,C193,C194,C195,C196,C197,C198,C199,C200,C1100,C210,C310,C410,C510,C610,C710,C810,C910,C1010,C1110,C1210,C1310,C1410,C1510,C1610,C1710,C1810,C1910,C201,C2100,C220,C230,C240,C250,C260,C270,C280,C290,C300,C3100,C320,C330,C340,C350,C360,C370,C380,C390,C400,C4100,C420,C430,C440,C450,C460,C470,C480,C490,C500,C5100,C520,C530,C540,C550,C560,C570,C580,C590,C600,C6100,C620,C630,C640,C650,C660,C670,C680,C690,C700,C7100,C720,C730,C740,C750,C760,C770,C780,C790,C800,C8100,C820,C830,C840,C850,C860,C870,C880,C890,C900,C9100,C920,C930,C940,C950,C960,C970,C980,C990,C1000,C10100,C1020,C1030,C1040,C1050,C1060,C1070,C1080,C1090,C11000,C11100,C1120,C1130,C1140,C1150,C1160,C1170,C1180,C1190,C1200,C12100,C1220,C1230,C1240,C1250,C1260,C1270,C1280,C1290,C1300,C13100,C1320,C1330,C1340,C1350,C1360,C1370,C1380,C1390,C1400,C14100,C1420,C1430,C1440,C1450,C1460,C1470,C1480,C1490,C1500,C15100,C1520,C1530,C1540,C1550,C1560,C1570,C1580,C1590,C1600,C16100,C1620,C1630,C1640,C1650,C1660,C1670,C1680,C1690,C1700,C17100,C1720,C1730,C1740,C1750,C1760,C1770,C1780,C1790,C180
0,C18100,C1820,C1830,C1840,C1850,C1860,C1870,C1880,C1890,C1900,C19100,C1920,C1930,C1940,C1950,C1960,C1970,C1980,C1990,C2000
type,enum,enum,enum,enum,enum,int,enum,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,real,r
eal,real,real,real,real,real,real,real
mins,,,,,,5000.0,,-0.9463784694671632,-0.6578074097633362,-0.9980340003967284,-1.0955244302749634,-0.7607123851776123,-1.1576751470565796,-0.941730499267578,-0.8593214154243469,-0.7019164562225342,-1.0065102577209473,-0.716037392616272,-0.8071715235710144,-0.6532368659973145,-0.7466002106666565,-0.6600952744483948,-0.7139369249343872,-0.7012602686882019,-0.8588415384292603,-0.6852312684059143,-0.7092638611793518,-0.6420583724975586,-0.7261044383049011,-0.6048905253410339,-0.7057280540466309,-0.8466193079948425,-0.8857385516166687,-0.697553277015686,-0.691262423992157,-0.6193019151687622,-0.672021210193634,-0.8357515931129456,-0.6453160643577576,-0.6787700057029724,-0.6136549115180969,-0.9624992609024048,-0.836066722869873,-0.6118553280830383,-0.7832033038139343,-0.6883444786071777,-0.7469816207885742,-0.8575792908668518,-0.6741263270378113,-0.8259045481681824,-0.7078587412834167,-0.8205956816673279,-0.7841890454292297,-0.5117995142936707,-0.8017194867134094,-0.8800731301307678,-0.5222935080528259,-0.7986016273498535,-0.5984780788421631,-0.8158820271492004,-0.7363187074661255,-0.6063030362129211,-0.6420040130615234,-0.7975879311561584,-0.5968016386032104,-0.8889939785003662,-0.8199962377548218,-0.7604076266288757,-0.8833647966384888,-0.986600697040558,-0.6990700364112854,-0.46978217363357544,-0.8533071279525757,-0.6426979899406433,-0.7613176703453064,-0.9395978450775146,-0.8048778176307678,-0.6572688817977905,-0.7140015363693237,-0.7486850023269653,-0.9671096205711364,-0.8413068652153015,-0.48062166571617126,-0.9572044014930724,-0.7000556588172913,-0.7615777254104614,-0.8238855600357056,-0.8087213039398193,-0.7492712736129761,-0.7758000493049622,-0.7958840131759644,-0.8054603338241577,-0.8396526575088501,-0.9905079007148744,-0.6989990472793579,-0.7263836860656738,-0.7994406223297119,-0.7443052530288696,-0.6744222640991211,-0.7163347005844116,-0.7761269211769104,-0.7215966582298279,-0.746396005153656,-0.6105923056602478,-0.7646563053131104,-0.5747366547584534,-0.82308
5367679596,-0.6226297616958618,-0.6704060435295105,-0.8319686055183411,-0.8327645659446716,-0.830712080001831,-0.8800725936889648,-1.0967018604278564,-1.0863041877746582,-0.6947957873344421,-0.8815615177154541,-0.8237943649291992,-0.7094968557357788,-0.6161243319511414,-0.6806362271308899,-0.9839335680007936,-0.7496448159217834,-0.5918059945106506,-0.699417769908905,-0.647398829460144,-0.5747234225273132,-0.6975212097167969,-1.1478865146636963,-1.0792789459228516,-0.7976224422454834,-0.6366810202598572,-0.6896114945411682,-0.8722872138023376,-0.5125520825386047,-0.6164485216140747,-0.7044951319694519,-0.76902174949646,-0.7486499547958374,-0.8171011805534363,-0.5694268941879272,-0.7906401753425598,-0.8132392764091492,-0.5858163833618164,-0.8394167423248291,-0.7917510867118835,-0.7469233274459839,-0.8036750555038452,-0.7618985772132874,-0.7704983353614807,-0.7802705764770508,-1.0571123361587524,-0.8628325462341309,-0.7498624324798584,-0.7906282544136047,-0.6404368877410889,-0.6094255447387695,-0.5910106301307678,-0.663419783115387,-0.8135595917701721,-0.5945175290107727,-0.724541425704956,-0.8692842721939087,-0.6654308438301086,-0.7398374080657959,-0.84345543384552,-0.6671662330627441,-0.6480557322502136,-0.7233105897903442,-0.8635119795799255,-0.9270054697990416,-0.869159460067749,-0.8239593505859375,-0.8775002360343933,-0.7168903946876526,-0.8983103036880493,-0.870794951915741,-0.7859352231025696,-0.839514970779419,-1.096231460571289,-0.6506746411323547,-0.7130432724952698,-0.80573970079422,-0.9470983743667604,-0.798370897769928,-0.91135436296463,-0.8741509914398193,-0.743510901927948,-0.7117481827735901,-0.526384174823761,-0.7450082302093506,-0.8259453773498535,-1.019537329673767,-0.7072409987449646,-0.7239682674407959,-0.793149471282959,-0.5839640498161316,-0.6033416390419006,-0.8960497975349426,-0.776561975479126,-0.6616646647453308,-0.8322339057922363,-1.0352046489715576,-0.6827229857444763,-0.6610767245292664,-0.8079429268836975,-0.7636464834213257,-0.669442474
8420715,-0.2894195020198822,-0.22924114763736725,-0.49768516421318054,-0.3829143047332764,-0.25917503237724304,-0.5964729189872742,-0.31181129813194275,-0.28570467233657837,-0.40854477882385254,-0.5380060076713562,-0.4725681841373443,-0.28722482919692993,-0.5825866460800171,-0.30900877714157104,-0.29119089245796204,-0.6644089221954346,-0.32034510374069214,-0.3601588308811188,-0.2712865471839905,-0.3429938554763794,-0.435374915599823,-0.3246784508228302,-0.40917062759399414,-0.32830387353897095,-0.6340107917785645,-0.2562423348426819,-0.3087376058101654,-0.42177948355674744,-0.2989508807659149,-0.35508474707603455,-0.3717671930789947,-1.1896339654922483,-0.5340818166732788,-0.43197402358055115,-0.4819640815258026,-0.2727051377296448,-0.5532817244529724,-0.1629694402217865,-0.5116688013076782,-0.5059756636619568,-0.2992859482765198,-0.4032960832118988,-0.3157693147659302,-0.30865079164505005,-0.31684377789497375,-0.4166454076766968,-0.5083639621734619,-0.5522260069847107,-0.5373729467391968,-0.3714315891265869,-0.18207766115665436,-0.1750912368297577,-0.4815751016139984,-0.19414614140987396,-0.5240029692649841,-0.4939504265785218,-0.5249212384223938,-0.4632203280925751,-0.34516194462776184,-0.32103002071380615,-0.28918954730033875,-0.409803569316864,-0.296947717666626,-0.4864528179168701,-0.2815282940864563,-0.28250542283058167,-1.1780407428741455,-0.3676574230194092,-0.4173712730407715,-0.6416800022125244,-0.4282534718513489,-0.37861892580986023,-0.2863732576370239,-0.3751879036426544,-0.3950329720973969,-0.2626694142818451,-0.4102899134159088,-0.3416834771633148,-0.4321453273296356,-0.2880813181400299,-0.24395868182182312,-0.35450708866119385,-0.2282889038324356,-0.546844482421875,-0.3783062398433686,-0.4223742187023163,-0.5517711043357849,-0.2819614112377167,-0.5493075251579285,-0.25177255272865295,-0.2978346645832062,-0.5988892316818237,-0.45831358432769775,-0.22047288715839383,-0.4006907641887665,-0.28229209780693054,-0.3129664957523346,-0.3655702471733093,-0.340
19362926483154,-0.5729498863220215,-0.3651999533176422,-0.205418661236763,-0.37892910838127136,-0.35521480441093445,-0.34073153138160706,-0.6395924687385559,-0.33428955078125,-0.6052677631378174,-0.31689974665641785,-0.4524618089199066,-0.5347409248352051,-0.5190699100494385,-0.5328447222709656,-0.2427365630865097,-0.5599807500839233,-0.23068778216838837,-0.3227168619632721,-0.4171002507209778,-0.6031843423843384,-0.5147815942764282,-0.4550835192203522,-0.5524314045906067,-0.5409317016601562,-0.32200631499290466,-0.3110923171043396,-0.37337183952331543,-0.46600309014320374,-0.34937968850135803,-0.2724514603614807,-0.3306853473186493,-0.46966803073883057,-0.3783734142780304,-0.24733763933181763,-0.3717136681079865,-0.24586430191993713,-0.3476307690143585,-0.43373188376426697,-0.3352850675582886,-0.4494366943836212,-0.42554619908332825,-0.3542868196964264,-0.3841019570827484,-0.28641417622566223,-0.40905216336250305,-0.452884703874588,-0.8882268667221069,-0.7231705188751221,-0.4349699914455414,-0.5520904660224915,-0.4778934419155121,-0.480417400598526,-0.27647092938423157,-0.3765870034694672,-0.39796027541160583,-0.40998122096061707,-0.4618439972400666,-0.4988090991973877,-0.5087037682533264,-0.25096380710601807,-0.3505127429962158,-0.32072603702545166,-0.3575712740421295,-0.44664350152015686,-0.40746816992759705,-0.3533162772655487,-0.3557693660259247,-0.3693114519119262,-0.47740986943244934,-0.2782462537288666,-0.405070960521698,-0.3836310505867005,-0.6070588231086731,-0.35473397374153137,-0.26760542392730713,-0.36441731452941895,-0.1674632728099823,-0.28130459785461426,-0.4253048896789551,-0.5661355257034302,-0.3952219188213349,-0.3437306880950928,-0.3378947675228119,-0.358303040266037,-0.3443644940853119,-0.5302627682685852,-0.3079530894756317,-0.6371705532073975,-0.32826581597328186,-0.2871297001838684,-0.3304244875907898,-0.5554129481315613,-0.3045850992202759,-0.37254664301872253,-0.41068950295448303,-0.36229556798934937,-0.4702542722225189,-0.4515473544597626,
-0.2881740629673004,-0.4115650951862335
mean,,,,,,34122.57757550006,,-0.03185243540187526,0.12613929713082486,0.149396083226663,-0.06697647696401555,0.04138568244297317,0.02916948046313885,-0.05446172508747415,-0.07633956396896151,0.1069607910467612,0.02718397867982643,-0.03158651631179497,0.04172100368323083,0.0827328667601242,0.01728211474713894,-0.039992730574171784,0.07484555462017937,0.0738506343264518,0.07919705741352892,0.09596271719245025,-0.011770865830420583,0.12605502977593627,0.23562264251852008,0.0328089362723618,0.00932782116304803,0.0028999216148428023,0.05067600343029009,-0.07442508519152247,-0.000652129212584762,-0.004636210138722433,0.008428910355694093,0.08082458340110095,0.1362879593722403,-0.06580722859438297,0.13903848684184916,-0.02429651797197236,-0.10147679663843956,0.14245047163810162,-0.007728483163898169,0.05676399411085439,0.021135173346035752,-0.139881431344507,0.052410943145944404,0.002501560797554142,-0.02179375757124396,-0.0053433338384864795,-0.030530180546273215,0.14728328678518196,-0.0012164291091568296,-0.09314601917229999,-0.0024173796285434533,-0.030621288236517,0.07508739289004054,-0.0757010127551134,0.02605842604644587,-0.03797750052054426,-0.057616890195020566,-0.03599697384712792,0.07875361694477,0.0755796369646593,-0.005376010219509117,0.021050099910234925,-0.10709141786919685,-0.010881110031878508,-0.02162181735337889,0.13313629093436685,-0.004866342601066054,-0.03357065561133222,0.025929262175291366,-0.018779570947305816,0.0438459878662694,0.009151986369516665,0.04090502134935364,0.03032744964858719,0.002263019026002408,0.042335290572670645,0.09097657929076769,0.010043001364810776,0.08472191600537367,0.04513594063918525,0.04834042662631792,-0.08761513016691368,0.005812912808960492,0.11783329293239907,-0.03933074702504156,-0.07769027891438658,0.02905825652971993,-0.028021959090618075,-0.06696188982003336,0.06641149207794181,-0.05060485765121098,0.005006681959980454,0.050541264479415204,0.06149768832210831,-0.08155312876566691,0.003461581164847368,0.048991894361
0833,-0.0033664914696834654,-0.011547061562576354,0.13094367355477954,-0.020576106635545332,0.036243361420721175,0.013451908077195521,-0.06455393937141186,0.0003718763328975742,0.007748241051779563,-0.013746620198191705,-0.1064534440569414,-0.03116967519304087,0.04230254214918126,-0.041367312051751134,-0.020400772310881693,0.035357463839506,0.03506870752576492,0.03879668125005743,-0.012238627793982618,-0.02853441829129295,0.057673338800367235,-0.05301548074205623,-0.03419893653465509,0.010256931606718332,-0.09204789234227286,-0.051943017988254625,-0.18779898524291544,0.02348985380367047,-0.06915610846861141,0.06022091961829836,-0.03256227988132259,-0.012389822930954792,0.07511053195855946,0.03402979810251754,0.08838132498046163,-0.006767311883311379,0.047522665150042505,0.011203349300344629,-0.04219637290066296,0.0050600585112813646,0.07918246197289401,-0.134759383065995,-0.06450955728125185,-0.017799218787310486,-0.0063471798368559375,0.007667079419912927,-0.07302601036028943,0.10892199415169239,-0.17703931592333697,-0.04109131086860794,-0.03534851539178554,0.02457258154497834,-0.002517491035991438,-0.011435680094878114,0.025176621071467634,-0.025222735520453284,0.04042078123935561,0.1491820503354574,0.01657123224938435,-0.040973829129638976,0.03163286162929597,-0.03147535252639102,-0.008804357449521932,0.1148197461598039,-0.025131917917208518,-0.03267458731904232,0.006824775941337326,-0.07198987901974983,-0.09901102597899505,0.0785277691343435,-0.08037727549547567,0.09150733799253018,-0.03238148839964226,-0.018818409660118832,-0.017839736050652723,0.007435804014957786,0.03624344863331154,-0.011450995465488426,-0.06351330673249812,0.02962045461678357,-0.06870392791297067,-0.053406096607019005,-0.07496715582966049,-0.01283418839264179,0.01629546947974915,-0.1290407816498512,0.020395197784591687,-0.02701229496630922,-0.13224076857616138,-0.046305846320801425,0.020468102874449893,-0.0072803567603686985,-0.06548316792256424,0.04983447000447598,0.047839155754209245,0.00
9261943335848358,-0.06114248185137323,0.06771720318202941,0.03794297656328872,-0.1616665382235456,0.004815932959105681,-0.026403571188908934,-0.006980940602972659,-0.019295251420299964,-0.08956575432080797,0.0514281433924437,0.09880561751341371,0.02910446643862155,0.002336034136300063,0.07180507451138517,-0.00019538039548388996,-0.009516204163145216,-0.04951624203009218,-0.06319779160032125,-0.06404421271370792,-0.08106929053054027,-0.0010348136629001502,0.11108874665986297,-0.0012224561131810802,0.05105553682351769,0.04789536005135888,0.049052442558848816,-0.018213576703572758,0.05506195262400006,-0.032473802564422984,-0.0712282626605586,0.033494425622819464,0.015173590260581089,0.05412480562573508,-0.12874479343999412,0.01746623966518496,0.05707120440145437,0.01848163583134276,0.026392923026611455,0.013084970913459804,-0.02813764168589685,-0.04709148961698821,0.022005473972469998,-0.032218890539176405,-0.016182326228034494,0.06467391633486995,0.03317629934162685,0.10196751946844128,-0.06348696490390551,-0.09203822356131264,-0.014288047143054398,-0.12236661435275349,0.021845819786372695,0.04599987227340961,0.03471785472000956,0.007030676842827698,0.04703216749699752,-0.009992969610629395,0.025990298306653968,0.10911280070821863,0.08247868639827803,0.06783621506081915,0.020869720198058418,0.09252604372261307,-0.0009091934077736936,-0.03776269687505267,0.13020136106331479,-0.0009548686836225818,-0.026884714628118596,0.027843170879488007,0.1193489021562094,0.053961157432205364,0.019470426024248876,-0.035850787422829315,0.05398953748398479,0.0612085811901619,-0.04724812135895307,0.020220879676865432,0.020318708141885886,0.06886364761450742,0.0024347100909396222,0.06346147139712048,0.033562304840284204,-0.011516462982027607,-0.07340299193462561,0.052257969250478584,-0.04308099734497386,-0.003996918810513428,-0.15909330381236553,0.01686160418921837,-0.018100464538179296,-0.005535752881483099,0.08377331229284703,-0.058685952142892364,0.017511195165403986,0.083719724016496
13,0.02327664867369284,0.04478353052064988,-0.01608394497538072,0.08448596402779336,0.010624690349549352,-0.02300024092157199,0.021551119982253595,0.12512400244543184,-0.0493594890122619,0.044429442991099216,0.009107493222033962,-0.013241397008025622,0.10098710513145125,-0.019381090581728728,0.07111263937224664,0.154858528300317,-0.048604267144592365,0.02432132214845108,-0.07303272131734201,0.09570701666449448,-0.04884885799031647,0.18280813410958172,0.054339609171169145,0.06201111656247541,-0.017656387940893845,-0.13529550290048373,-0.0077112481416730105,0.04020778594924031,0.0077231247670592265,0.013299578699151842,-0.008043503249853786,-0.06530630981110933,-0.01559782577252939,-0.03630805573136545,-0.02328148384695911,4.902704986701373e-05,-0.04973055696114421,-0.021428170056162307,0.021416493762848154,-0.03448413500175898,-0.0061130465026914115,0.07892706413434032,0.07309629956131292,0.06882961624175116,-0.03295868223183606,-0.017147569726977046,-0.023333320355925315,-0.04650794851320311,0.033561546472608006,-0.08829523345279,-0.0560728404267063,0.01718627489372208,0.04580322324898478,0.0007186153042988638,0.05298129117983881,0.07750751678505483,0.04560080719725622,-0.0276358663119023,0.019102473273085768,-0.011327912160355844,-0.0592431733819468,0.034357263301863006,0.1211951437511755,0.02709675128399378,0.06269091367892608,-0.05965105875639179,-0.0688008841520604,0.00046267770901386475,0.0013797390930992328,-0.017958532312820148,0.11205528557673483,-0.10782457665943841,0.030622653527653962,-0.03160285826359221,0.022250885681598595,0.04000684884928574,-0.0030342063886421846,-0.006886147452783844,-0.08206599083992996,0.030682726505563408,0.002627485883712817,-0.01075218260195478,0.06638084980713282,-0.022815201898228454,0.0984815467516703,0.055285202178643626,0.06838227068810343,0.09703821619786296,0.04488775896700234,0.13589253660934542,0.021818222462387682,-0.06608800150981524,-0.06502227219049672,-0.015453860868082987,-0.06586987522671553,-0.00489681452246180
9,0.11731911067595906,-0.02852671908980542,0.003681159464143342,-0.019681472493769107,-0.07386914150407531,0.01231040506940486,0.003668219629897962,-0.060078596130504015,-0.15064262313163387,0.010864938237422912,0.013015515666364495,-0.08783534430448102,-0.009643787669595899,-0.013005547350525363,-0.12238661872046662,0.0628215600313674,-0.030094791863867296
maxs,,,,,,200000.0,,0.7838835120201111,0.9658159017562866,0.99415922164917,0.7858302593231201,0.744721531867981,0.90927654504776,0.9774462580680848,0.7426179051399231,0.9121795892715454,0.8288676738739014,0.8931897878646851,0.7186107039451599,0.7615653276443481,0.9383326172828674,0.7323707342147827,0.9117676615715028,1.0031723976135254,0.8028726577758789,0.8222602009773254,0.7561386227607727,0.7681148052215576,0.957702338695526,0.7209645509719849,0.9676665663719176,0.7713504433631897,0.7794222831726074,0.6203755736351013,0.8759716749191284,0.853806734085083,0.8323575258255005,0.8384278416633606,0.8968762159347534,0.8617352843284607,1.0828620195388794,0.9074376821517944,0.604708194732666,1.007105827331543,0.8762174844741821,0.7232491970062256,0.7772286534309387,1.002366542816162,0.8231921195983887,0.7832043170928955,0.9943260550498962,0.8316215872764587,0.6641772389411926,0.8707108497619629,1.0291248559951782,0.5598892569541931,0.7917807102203369,0.8400138020515442,0.9477730393409728,0.8326894044876099,0.9569554328918456,0.6002451181411743,0.7804785966873169,0.5766410231590271,0.7970069646835327,0.8085285425186157,0.720689594745636,0.6234437227249146,0.6018301844596863,0.7961388826370239,0.5571017265319824,1.0322259664535522,0.8247293829917908,0.8393174409866333,0.6989765763282776,0.7547362446784973,0.8420795202255249,0.7523319125175476,0.8204817175865173,0.7212601900100708,0.6828768253326416,1.108290433883667,0.7926638126373291,0.7497315406799316,0.8530077338218689,0.9554272890090942,0.7950878143310547,0.6216940879821777,0.6244098544120789,0.7785620093345642,0.6497989892959595,0.7750850319862366,0.625827431678772,0.7603907585144043,0.5800755023956299,0.8237897157669067,0.566344678401947,0.7391738295555115,0.901086688041687,0.7809653878211975,0.6392437219619751,0.943875789642334,0.8090247511863708,0.9159805178642272,0.7536612153053284,1.1475733518600464,0.6421412825584412,0.7928951978683472,0.6898069381713867,0.6092032194137573,0.7002634406089783,0.7638376951217651,0
.7999092936515808,0.7340769171714783,0.8044579029083252,0.724914014339447,0.7832838296890259,0.7701603770256042,0.7677690982818604,0.7642975449562073,0.7757401466369629,0.6619912981987,0.6049887537956238,0.8870335221290588,0.7462518215179443,0.5549255609512329,0.6811928749084473,0.6130487322807312,0.9227994084358216,0.7171779274940491,0.784858763217926,0.750138521194458,0.8718356490135193,0.6533656120300293,0.6877713799476624,0.9185087084770204,0.7422579526901245,0.8069667816162109,0.8885751366615295,0.8740458488464355,0.7965025305747986,0.7701408267021179,0.9051053524017334,0.7629337310791016,0.5911489725112915,0.7425107955932617,0.6271787881851196,0.685893714427948,0.8108677864074707,0.7808545827865601,1.0034106969833374,0.5350627303123474,0.5891025066375732,0.8137676119804382,0.7668129801750183,0.615416407585144,0.8270415663719177,0.7567592859268188,0.7205488681793213,0.8573544025421143,0.8317280411720276,0.6910017132759094,0.8473314046859741,0.8690299391746521,0.7232379913330078,0.6999030709266663,0.9738194942474364,0.6296302676200867,0.6865336298942566,0.8970840573310852,0.6584982872009277,0.6841845512390137,0.8286486864089966,0.7358378171920776,0.8453658819198608,0.7305091023445129,0.7223228216171265,0.713169276714325,0.640487551689148,0.7528532147407532,0.8245438933372498,0.8000266551971436,0.7208516001701355,0.9532710909843444,0.6994284987449646,0.532626748085022,0.7624373435974121,0.6456916928291321,0.4826488792896271,0.752426266670227,0.896308422088623,0.6181700825691223,1.182389736175537,0.9324429631233216,0.6527048349380493,0.858534574508667,0.6965744495391846,1.019741773605347,0.7057621479034424,0.7164446711540222,0.8403637409210205,0.8632380962371826,0.4656182527542114,0.8585965633392334,0.8510726690292358,0.7697959542274475,0.7997081279754639,0.4797663688659668,0.3796328008174896,0.7105731964111328,0.31525948643684387,0.3485127091407776,0.4555439054965973,0.2979239523410797,0.7574044466018677,0.30272719264030457,0.16461263597011566,0.20772792398929596
,0.371039479970932,0.35789206624031067,0.4727810025215149,0.3051356077194214,0.33422496914863586,0.35790714621543884,0.4638637900352478,0.4349627792835235,0.5479322671890259,0.4623495638370514,0.24426841735839844,0.25577348470687866,0.342516154050827,0.5167723298072815,0.20148594677448273,0.41167810559272766,0.808027446269989,0.45434337854385376,0.3010111451148987,0.4264887571334839,0.3754467070102692,0.35115760564804077,0.2917003333568573,0.6359328627586365,0.4215932786464691,0.4209640622138977,0.31919950246810913,0.4964008629322052,0.21055026352405548,0.3261941969394684,0.40039291977882385,0.15348051488399506,0.3812146484851837,0.25885090231895447,0.5125126838684082,0.32290804386138916,0.5398404598236084,0.22719340026378632,0.26107528805732727,0.3790741264820099,0.4373650848865509,0.5948060750961304,0.6076222658157349,0.34361377358436584,0.4097571969032288,0.23680271208286283,0.44080424308776855,0.4255772829055786,0.2492686957120895,0.3552403151988983,0.4469539821147918,0.3373435437679291,0.4799775779247284,0.28392645716667175,0.4712955951690674,0.33910465240478516,0.3710419535636902,0.29626524448394775,0.4823384881019592,0.426397442817688,0.3661542534828186,0.3725253939628601,0.3681816160678863,0.41396212577819824,0.22130447626113892,0.6104323863983154,0.32931026816368103,0.4053751826286316,0.5565184354782104,0.3411561846733093,0.4339668452739715,0.26888507604599,0.3942414522171021,0.22683969140052795,0.32729706168174744,0.5335249304771423,0.5278765559196472,0.3832237124443054,0.3029468059539795,0.4273779690265655,0.32849621772766113,0.3322904706001282,0.5019212365150452,0.566184937953949,0.3274598717689514,0.3751947581768036,0.47104862332344055,0.3352343440055847,0.4342237114906311,0.31476491689682007,0.7954272627830505,0.4411773383617401,0.23354017734527588,0.40315771102905273,0.2745130956172943,0.3571546673774719,0.3725556135177612,0.670515775680542,0.4758833348751068,0.4215180277824402,0.25023120641708374,0.27387985587120056,0.309433251619339,0.41900444030761
72,0.48567184805870056,0.3426206707954407,0.523045539855957,0.4651362895965576,0.3479788899421692,0.28061535954475403,0.7215830087661743,0.32566216588020325,0.5423727631568909,0.3371967673301697,0.3038288950920105,0.33381232619285583,0.396175354719162,0.3705845773220062,0.5225913524627686,0.5756824612617493,0.4496133625507355,0.2645949423313141,0.45053187012672424,0.36508074402809143,0.3744044899940491,0.5009629130363464,0.2575785219669342,0.30118340253829956,0.4736610949039459,0.30015429854393005,0.5142699480056763,0.46532830595970154,0.521162211894989,0.215251162648201,0.5026689171791077,0.24533408880233765,0.3897240161895752,0.4211050570011139,0.34529051184654236,0.30870434641838074,0.35021013021469116,0.5801025629043579,0.4270000457763672,0.31601032614707947,0.4651165306568146,0.19576525688171387,0.4933995902538299,0.13732792437076569,0.46320608258247375,0.9102864265441896,0.420058399438858,0.3993534743785858,0.24603042006492615,0.7888611555099487,0.8893266916275024,0.35429617762565613,0.4149449765682221,0.4375613033771515,0.3997484147548675,0.23020070791244507,0.4331489801406861,0.39352044463157654,0.365668386220932,0.3862150013446808,0.3126150071620941,0.6312161087989807,0.4348211884498596,0.6388893723487854,0.2012966424226761,0.3313227891921997,0.2640209496021271,0.5394213199615479,0.3958527147769928,0.5796822309494019,0.2656228244304657,0.7803516983985901,0.36608943343162537,0.312345951795578,0.37627705931663513,0.3665013611316681,0.3359624445438385,0.3334183692932129,0.44852104783058167,0.3725631833076477,0.4052349328994751,0.28743723034858704,0.31643760204315186,0.386033147573471,0.3465513586997986
sigma,,,,,,17640.5431239018,,0.1874117236911899,0.14412738035483272,0.17346012937146194,0.18733796748314088,0.13892712550538422,0.15318782786009777,0.17901599872190846,0.17471511353280303,0.14605162250089462,0.1775288072858925,0.14809702990494492,0.1383284348558982,0.14729287428848545,0.1536631216534299,0.1431205602558917,0.14275645743117638,0.1674504224856723,0.1387560350216349,0.15476643450505956,0.159437933571659,0.14888587147254495,0.16406173730499396,0.13673105080493314,0.17317687067746984,0.14520426464607175,0.1791671498291541,0.14121513153211215,0.15121636000989475,0.12273177972462672,0.12361714746511586,0.15192211987966603,0.1438688698214766,0.1490673711163039,0.1496454135100599,0.16785602703594507,0.15375316811880965,0.16755888116680837,0.1314817267465773,0.14346624557503634,0.147978983762685,0.17753535383429625,0.1472053585098916,0.16079389671603136,0.1670811215975361,0.13640496439635325,0.13779164159125357,0.13542141783207473,0.13218244962706407,0.1463223268976091,0.1420439380670639,0.16224998076385144,0.1508860240464912,0.15070011542900494,0.15445154961748253,0.12353290832145196,0.16435148238430103,0.15402647657775298,0.13645098472298603,0.1647282405057762,0.14491429613464973,0.12690759287253078,0.1411055372133866,0.16407444227313325,0.14000356503514186,0.13911740095662906,0.16735919058142257,0.14754509283078682,0.15132007182350518,0.15245964138385754,0.15437335194392224,0.1282808839403878,0.15008768974240602,0.14377814039251574,0.14892345149529926,0.156384088256997,0.12465211505800103,0.14081011124787726,0.16074273714317855,0.1560222384864195,0.15705107540336213,0.15469395568559346,0.1420778948602687,0.14523263954856122,0.13252596881349518,0.14918429314973003,0.14862097961093465,0.1534150043935969,0.1373837817973012,0.14583651414135823,0.13357890058774227,0.14668941869495203,0.1631299013055206,0.14534792427449975,0.14661490708117828,0.15109237627945285,0.13340487711416033,0.16571759009325823,0.15111355515641028,0.13287974939829572,0.1678764915089973,0.1
4969271809063023,0.15892111227557712,0.15790990931521695,0.1553995105208875,0.15545814681589257,0.13620966645359397,0.19052152999435323,0.169200932288784,0.1619395805504857,0.15500132196835417,0.1370406691335068,0.149590294556244,0.1396584444353021,0.15036025304040343,0.15000717778579653,0.13012944702132093,0.15154271745126172,0.15015586181974308,0.11907024393541192,0.14618474364231343,0.1349627125174101,0.18995702781535645,0.15249514444445333,0.15814904331799076,0.13364779729479234,0.14061759916904532,0.14019677326126065,0.1284997471126211,0.14126658661377467,0.1518359414223669,0.14324927056733877,0.14954523134794065,0.1458467582837554,0.11252441837587188,0.1696846432327183,0.14421302562088445,0.14402683492859,0.14612382815651945,0.13530254971331976,0.13874989400787446,0.13707239625725906,0.14725206336251637,0.17598161755036706,0.14556953663070624,0.17334204890704746,0.13874745701851124,0.15541402038160784,0.16024879811759718,0.13170407193812614,0.13801317585395853,0.15021735999691002,0.1517779577150206,0.15198565701332267,0.1332262614415919,0.14083382656705765,0.13789712595605363,0.14214662756645435,0.16360254419594947,0.16484246813139034,0.145896706839814,0.13121387196894155,0.14694222744584723,0.15780575366708513,0.13513363712598764,0.18641573314520504,0.15520482052179457,0.14030584478793345,0.1612453897352848,0.15425255402083088,0.13886814085956764,0.12583956192248644,0.14485179384587807,0.16259945675790197,0.136124035579832,0.16749560560324264,0.15246387809020512,0.14010067854403732,0.1503207143385556,0.13548516237205305,0.17198321896953955,0.13777612573413717,0.14170617600894347,0.13224243624064488,0.14480836190296126,0.1475218296607419,0.15183112844675906,0.171786585041408,0.15199986679781233,0.13788470195966476,0.14617630223653602,0.15712973634304053,0.1644266535076218,0.14218185879049536,0.1441468995407856,0.1378894735980035,0.153540096251698,0.14601925089411874,0.1440876592769817,0.1510827962581211,0.13937804140819965,0.04595094298016351,0.035821512879030
53,0.049352474146848575,0.04231473585393324,0.03954808373332609,0.04307572028304392,0.04596015309561677,0.04077008465609272,0.0372769268307922,0.04242894676301202,0.03455928224077118,0.047582975970790475,0.03609345653095778,0.04473540280293131,0.04318082430433264,0.0394431712093174,0.044250229858226464,0.04158164075863611,0.04789475102338239,0.0373924977777053,0.041125494892155785,0.03612263075498093,0.040397833542254305,0.05121135453532609,0.03936428565938437,0.04144402311663305,0.04221592939426608,0.039564853458053606,0.05166057724702012,0.04031302047805175,0.047518626492556504,0.037333385121092945,0.040199560401198105,0.04200744310623964,0.045010327348069756,0.03787888380868486,0.04539767624868788,0.0510898577094514,0.04204095500078194,0.0383594888836212,0.04243960802305399,0.04276507883091641,0.0426810515412746,0.03787453834508869,0.03781334214106162,0.038886379089896166,0.03917302469085092,0.042858058022147566,0.03587260620765985,0.04157789404454113,0.042626371255913766,0.041637819806819874,0.04559400656638157,0.04008959935014278,0.04188084552213044,0.043660897862245474,0.04030825964585654,0.03895485767667282,0.04129384560130326,0.036015870141909885,0.04709655317935839,0.04095133420863096,0.04899438433510629,0.04658890093911025,0.03515583530005518,0.042300503917351726,0.04765826405732126,0.04905484224710214,0.040565040711607915,0.0425420332441604,0.05219337181348552,0.03791051875255182,0.044269657803125,0.03583017601342295,0.03967608829377707,0.035801910732263485,0.033783772172658,0.04232469455472236,0.04110135662107566,0.04207561503436901,0.03874425721538138,0.05066516147300871,0.04370485407438124,0.04258726124714404,0.044985830615598674,0.03812914557471668,0.03971164410496559,0.049534299896072005,0.0452303496016614,0.04250347192439375,0.04212647960621765,0.03831167841414745,0.04116974248423273,0.044448041577193204,0.04043518365430604,0.038632332491677406,0.040517256339959756,0.03782265851862476,0.04182727749794418,0.05329533424565274,0.04635580734425508,0.040
14377993746861,0.04095885102773176,0.04193331549248297,0.05326783775476092,0.04187441658892107,0.04031417058675889,0.04492997622852007,0.054081353828977344,0.03819934196361202,0.042940829577691346,0.0451461117203853,0.05120172994534643,0.036692034167020826,0.040650753536286686,0.03896035445475333,0.039127564447357994,0.043608502607724337,0.03922731569711805,0.046747046031676044,0.03927816107104323,0.0448755758007968,0.042465323590312715,0.05491728159855028,0.037655696494763684,0.034025578879622265,0.04036524366235747,0.04617803903350416,0.040189407486878305,0.04112494319999446,0.03635659816263637,0.04751145307211441,0.0408512457411626,0.04489879975549235,0.038698630768760574,0.04233334370562882,0.038108412013843906,0.03402764790899552,0.051779484519244745,0.044095740103048196,0.0504339525519598,0.04899542383090815,0.038158762547782145,0.042768015815927846,0.03666655730211913,0.04442414456617715,0.04807872125128226,0.04150688902646838,0.04710486473931832,0.038227821248001684,0.038153944733756044,0.04373818064473208,0.03967824387775191,0.03775601102481082,0.04123269654543952,0.03963990602336131,0.03974613455502937,0.047241444225749905,0.05195698824812299,0.033342846487026484,0.0429932596130059,0.043740273812214465,0.04381380662474647,0.04533744431782714,0.05235772932624069,0.04365772121758745,0.03809022539883136,0.039791414410547024,0.0446006771728505,0.048191014619629456,0.03474091879834765,0.04037800476851913,0.040099965409012304,0.04903065173472114,0.04479911788224078,0.037410295099016694,0.03593566286848749,0.047605363738772215,0.050419601747478573,0.04227656694959415,0.03646452898095235,0.04156329285992036,0.03850672134725808,0.042955326549705734,0.04788418640069462,0.03828476569057825,0.04319276840344737,0.04197042703745034,0.04899848781188474,0.04455208071749204,0.03745743933904863,0.04836337400962889,0.038011595028034084,0.04270932994475653,0.04530918494904277,0.04255951875382604,0.051785996608417297,0.043419556024990584,0.04115169405729231,0.04717465960785655
zeros,,,,,,0,,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
missing,0,179326,63905,32430,0,0,1,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,303,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
0,Dorking,,permanent,Gregory Martin International,Engineering Jobs,25000.0,cv-library.co.uk,-0.037307772785425186,0.21470685303211212,0.14789867401123047,-0.04545272514224053,-0.004229322075843811,-0.0051243058405816555,-0.24588222801685333,0.035196710377931595,0.06273575872182846,0.1631913781166077,0.014879737980663776,0.04533211514353752,0.028592487797141075,0.1217154860496521,0.06283286213874817,-0.13888919353485107,0.05351996049284935,0.12606872618198395,0.24951715767383575,0.08640066534280777,0.1641083061695099,0.2780695855617523,0.028664054349064827,-0.016822434961795807,0.11210969090461732,0.23808807134628296,0.01859205402433872,-0.05984156206250191,-0.16916126012802124,0.09299034625291824,0.014917065389454365,0.06351589411497116,-0.16769464313983917,0.08935926109552383,0.05874762311577797,-0.30138012766838074,0.201632097363472,-0.2001121491193771,-0.001156698912382126,0.10889548808336258,0.2251565009355545,-0.23670470714569092,0.29790329933166504,-0.16474394500255585,-0.19712848961353305,0.02248814702033997,0.3769059479236603,-0.09384123235940932,-0.28197452425956726,0.016964519396424294,-0.19395428895950317,0.21486492455005649,-0.1105925440788269,0.24491740763187408,0.07137532532215118,-0.18358521163463593,-0.009118149988353252,0.17979691922664642,0.1714997440576553,0.025996141135692596,0.20515520870685575,-0.11143878847360612,0.166004940867424,0.14506864547729492,0.12434493750333786,-0.18816763162612915,-0.06286437809467316,0.124137781560421,0.06652951240539551,0.0032674185931682587,0.05701800808310509,0.14905844628810885,0.021258950233459473,-0.08226513117551804,0.08163415640592575,0.12115498632192612,-0.05372655391693115,0.03361989185214043,0.1859349012374878,0.23220519721508023,-0.19340498745441437,-0.022560423240065575,0.15162169933319092,-0.2130572348833084,-0.19249315559864044,-0.1639968752861023,0.06692159920930862,0.12646201252937317,0.19999873638153076,0.02151809073984623,0.03634803742170334,0.1595778912305832,-0.02176437526941299,-0.1438736915588
379,-0.09024739265441896,0.13121268153190613,0.004273203667253256,0.0979994535446167,0.22918915748596191,-0.003432345809414983,0.019250735640525814,-0.24179239571094513,0.02411111630499363,0.10359730571508408,-0.05751664936542511,0.013651170767843723,-0.07284239679574966,-0.26270151138305664,0.09206990152597427,-0.15836244821548462,-0.19869697093963623,-0.05533597245812416,-0.13052688539028168,0.2011962532997131,0.11716129630804062,0.1404026597738266,0.028860880061984066,-0.08239825814962387,-0.020825788378715515,-0.06438872963190079,-0.1833623498678207,-0.0064096227288246155,-0.11958108097314836,0.12392307072877884,-0.07408785820007324,0.08636359125375748,0.005075380206108093,-0.010317601263523102,0.127547487616539,-0.043636322021484375,0.08784952014684677,-0.010505837388336658,0.07083667069673538,0.02746068499982357,0.060329798609018326,-0.053550273180007935,-0.03668166324496269,-0.039615944027900696,-0.04423387348651886,-0.221054807305336,0.057755377143621445,-0.025984108448028564,0.014969393610954285,-0.02082482911646366,-0.34043586254119873,-0.1855049878358841,-0.16770310699939728,0.22956065833568573,-0.02447362989187241,-0.10409826040267944,-0.19219155609607697,-0.2237587720155716,-0.14620818197727203,0.08485107868909836,-0.024384772405028343,-0.020960168913006783,0.0391245000064373,-0.07071047276258469,0.07013171166181564,0.0613723061978817,-0.16218197345733645,-0.07415188103914261,-0.11921737343072893,-0.032936941832304,-0.25218191742897034,0.08832866698503494,-0.02700384519994259,0.27927282452583313,-0.04269447922706604,0.07103494554758072,-0.1744142770767212,-0.011756747961044312,0.2120777815580368,0.022664204239845276,-0.0902308151125908,0.013131044805049896,-0.2188568115234375,-0.005836003925651312,-0.1474500447511673,-0.07697711884975433,-0.15000642836093905,-0.0046496219001710415,-0.029227495193481445,0.06218134984374046,-0.013233065605163574,-0.06401551514863968,-0.2266465574502945,0.23627842962741852,-0.12947523593902588,0.12661318480968475,-0.019219
99640762806,0.17887385189533234,0.04857639595866203,-0.22202564775943756,0.03737121447920799,-0.0912272408604622,-0.09471374750137328,-0.2233097106218338,-0.04588403180241585,-0.2586986720561981,-0.14249832928180697,0.137290820479393,0.18778249621391296,0.04475943371653557,-0.001402290421538055,0.16450610756874084,0.06708430498838425,-0.09553978592157364,0.07771769165992737,-0.08810972422361374,-0.07605444639921188,-0.10027293115854265,-0.034518271684646606,0.11294539272785188,0.053609710186719894,-0.1779555231332779,0.03440067917108536,-0.010144268162548542,0.02631010301411152,-0.025839168578386307,0.015838366001844406,-0.07659474015235901,0.0395771786570549,-0.0397648923099041,0.06979958713054657,-0.06057088449597359,0.027071017771959305,0.06268265843391418,-0.09892742335796356,-0.03333573788404465,-0.06227317824959755,0.05701364949345589,-0.04502136632800102,0.05340447649359703,-0.03273118659853935,-0.035389598459005356,0.07324974983930588,0.1311115175485611,-0.043717142194509506,-0.12226630747318268,0.007582374848425388,-0.16005437076091766,-0.13372595608234406,0.0914720818400383,0.01100778765976429,0.04625564441084862,0.08310899883508682,0.041091158986091614,0.004681609105318785,-0.10974224656820296,0.08886794745922089,0.050150830298662186,0.16260777413845062,-0.02770231105387211,0.07721546292304993,-0.1194138154387474,-0.08532866090536118,0.17674726247787476,0.08094494044780731,-0.15239684283733368,-0.1217380166053772,0.03702588379383087,-0.038944028317928314,0.11378786712884904,0.021109892055392265,0.1103651598095894,0.0684317797422409,-0.13671238720417023,-0.07723120599985123,0.015902547165751457,0.13351686298847198,-0.09961563348770142,0.02659844048321247,0.038311444222927094,0.08072227239608765,-0.17743094265460968,0.03164831921458244,-0.003945966716855764,-0.08118455857038498,-0.06807296723127365,-0.0405106283724308,0.1350611448287964,-0.04558916017413139,0.20229190587997437,-0.026248792186379433,0.029116326943039898,-0.011792399920523168,0.08189003914594
65,0.13392458856105804,-0.035906124860048294,0.08601117879152298,0.12718842923641205,0.09298822283744812,0.10514495521783827,0.18564143776893616,0.0013792661484330893,0.14096905291080475,0.11275938153266908,0.09322883188724518,0.07254866510629654,-0.03757732734084129,0.10010485351085664,0.05957530438899994,-0.005149161908775568,0.17966194450855255,-0.015753118321299553,0.12174277752637865,-0.11896876245737076,0.013939755968749523,-0.037107888609170914,-0.001964043593034148,-0.08180896192789078,0.018748216331005096,0.029005512595176697,0.0015073911054059863,-0.04954689368605614,0.0035982185509055853,-0.02705983445048332,0.07585351169109344,-0.03965464234352112,0.07255994528532028,0.005310615990310907,0.0031454581767320633,-0.013862302526831629,-0.05214439705014229,0.0685029998421669,0.02253454364836216,-0.04884219169616699,0.02463824860751629,0.13697831332683563,0.15519170463085177,0.01087056752294302,-0.10691247880458832,-0.18844176828861237,-0.048842232674360275,0.07714594155550003,-0.1877894252538681,-0.08260011672973633,0.11248510330915452,0.08265361189842224,-0.07222041487693787,-0.019980791956186295,0.11841141432523727,0.07107789069414139,-0.1011236011981964,0.08091618865728378,0.08874267339706421,0.007262794300913811,-0.05427519604563713,0.04529177024960518,0.14053991436958313,0.03367249295115471,-0.05927182734012604,-0.16479624807834625,-0.07050519436597824,-0.0659620612859726,-0.05979112163186073,-0.05913292616605759,-0.13245543837547302,0.0805421695113182,0.04910287633538246,-0.08472613990306854,-0.028418008238077164,-0.09101292490959167,0.09357790648937224,-0.1267969012260437,-0.10929212719202042,-0.12769979238510132,-0.039791498333215714,0.03455161303281784,0.04619200527667999,-0.04885125532746315,0.08761400729417801,0.027508363127708435,0.23582907021045685,0.028417663648724556,0.15331590175628662,0.04304000735282898,-0.24093300104141235,-0.11640288680791856,0.012811992317438126,-0.03999921306967735,0.03327145799994469,0.1310880035161972,-0.07142448425292
969,-0.10297125577926636,0.002614916069433093,-0.10014687478542328,0.0881224051117897,0.0010622446425259111,-0.15179818868637085,-0.21387408673763275,-0.06341945379972458,-0.13326385617256165,-0.11235007643699646,0.029899895191192627,-0.082054503262043,-0.2176060825586319,0.13494740426540375,0.05042388290166855
1,Glasgow,,permanent,Gregory Martin International,Engineering Jobs,30000.0,cv-library.co.uk,-0.20831213891506195,0.30739811062812805,-0.015398328192532064,0.09251733869314194,-0.00015516082930844277,0.019120873883366585,-0.1254838854074478,0.009004670195281506,0.045682791620492935,-0.05469943583011627,-0.14925608038902283,-0.029095908626914024,-0.10229026526212692,0.09432726353406906,0.02142634056508541,0.13895544409751892,0.33366307616233826,0.09855931997299194,0.22131983935832977,0.17396603524684906,0.23863984644412992,0.23988103866577148,-0.14289681613445282,0.02908874489367008,-0.07099464535713196,0.1764293760061264,0.07465191185474396,0.029974982142448425,-0.12190791964530943,0.03821374848484993,0.040416836738586426,0.3674744665622711,-0.1031900718808174,0.004673907998949289,-0.05761555954813957,-0.3872840702533722,0.3212657570838928,-0.049343228340148926,0.14502792060375214,-0.05328018590807915,-0.05959709361195564,0.0004620403051376343,0.04033229872584343,-0.0557100772857666,0.08613315969705582,-0.1958431601524353,0.18548230826854703,-0.006563777569681406,-0.13105829060077667,-0.07437416166067123,-0.17234450578689575,0.2763906717300415,-0.2067916989326477,0.2179802805185318,-0.09784424304962158,-0.036832984536886215,0.051097571849823,0.2604559659957886,0.08605528622865677,-0.07252760976552963,0.04169933497905731,-0.12184248119592668,-0.03672633320093155,0.027192363515496257,0.051994439214468,-0.27259793877601624,-0.21880698204040527,0.170480415225029,0.08926976472139359,-0.1751282960176468,-0.10693225264549255,-0.060309115797281265,0.05478919669985771,-0.09619691222906113,-0.007832064293324947,-0.10180483013391496,0.03665618970990181,-0.27200451493263245,-0.06892171502113342,0.19244341552257535,-0.21661360561847687,-0.15340527892112732,-0.08169461041688919,-0.15294979512691498,-0.02267146110534668,0.044427718967199326,-0.009927288629114628,-0.021444804966449738,0.21013014018535617,-0.02565780282020569,-0.06425818800926208,0.1964539885520935,-0.174785658717155
46,0.05694720149040222,0.06970668584108353,0.2207631468772888,-0.34840521216392517,0.17389561235904694,0.1407704800367355,0.07154130190610886,-0.0999012291431427,-0.051054954528808594,-0.17868120968341827,-0.014827202074229716,-0.05747748538851738,0.31242039799690247,-0.08849535137414932,-0.20693475008010864,0.12046286463737488,-0.032908886671066284,-0.15482363104820251,-0.17778368294239044,-0.15650339424610138,0.07656239718198776,0.11057158559560776,-0.002738267183303833,-0.1772112399339676,0.08608611673116684,-0.005575895309448242,-0.05362334847450256,0.011870205402374268,0.04908973351120949,-0.08368274569511414,0.13167275488376615,-0.1051539182662964,0.005427380558103323,0.02479327656328678,-0.16477803885936737,0.13381974399089813,0.3144402801990509,0.22522199153900144,0.25559136271476746,-0.09694049507379532,0.007311729248613119,0.2477638274431229,0.08428170531988144,-0.05897650495171547,-0.11508647352457048,-0.2548622190952301,-0.12442958354949953,-0.16437721252441406,-0.26578107476234436,0.030128171667456627,0.04122023284435272,-0.1290932446718216,-0.10160516947507858,-0.183707132935524,0.04956434294581413,0.009836721234023573,-0.22275371849536896,-0.03813807666301727,0.011216044425964355,0.2688482999801636,0.014924357645213604,-0.03424594923853874,-0.16595466434955597,0.13873688876628876,-0.1302044689655304,-0.07994884252548218,0.15034642815589905,-0.1866821795701981,0.0941033735871315,-0.022391000762581825,-0.16759757697582245,-0.09478043764829636,0.04446648433804512,-0.17049209773540497,0.05665849521756172,0.03612388297915459,-0.015708109363913536,-0.14181941747665405,-0.12496381998062134,0.06077348068356514,-0.049943629652261734,0.02714517153799534,0.07464627176523209,-0.15316142141819,-0.23688852787017825,0.06267878413200378,0.16844235360622406,0.1295887976884842,-0.19319647550582889,0.015935147181153297,-0.11424795538187028,-0.038291990756988525,-0.03738086298108101,-0.24384455382823944,0.043525103479623795,0.011499200016260149,0.10169561952352524,0.2317
4746334552765,0.14236778020858765,-0.23874531686306,-0.05971090868115425,0.125291645526886,-0.12806183099746704,-0.07235003262758255,-0.010563182644546032,0.12816449999809265,-0.04937109351158142,-0.10883282870054244,0.11279986798763277,0.15541104972362518,-0.004724249243736267,-0.020139724016189575,0.15799136459827423,0.01237250491976738,-0.05873381718993187,-0.04182403162121773,-0.057274725288152695,-0.10481489449739456,-0.05719798058271408,-0.048832058906555176,0.14496222138404846,-0.007767544128000736,0.0006328944582492113,0.06547670811414719,0.007054830435663462,-0.08963806182146072,0.09033171832561492,-0.028616130352020264,-0.15453746914863586,0.08302132785320282,-0.046963006258010864,0.04371332004666328,-0.08435426652431488,0.020188014954328537,0.04689254239201546,-0.04491886869072914,0.01939619518816471,-0.0032179756090044975,0.02335638925433159,-0.0159912072122097,-0.0003830921195913106,-0.061986081302165985,-0.06300118565559387,0.06918767094612122,0.045003317296504974,0.11478254199028017,-0.1139615848660469,-0.048154499381780624,-0.017757276073098183,-0.11912985891103745,0.02719380334019661,0.06096942350268364,0.06062282249331474,-0.003088553436100483,0.017659161239862442,0.02302067168056965,-0.00890665128827095,0.057170044630765915,0.08984655886888504,0.10076462477445602,0.017857730388641357,0.045837074518203735,-0.00763406977057457,-0.03299817442893982,0.14918680489063263,0.009990976192057133,-0.015820764005184174,0.01300715934485197,0.14254245162010193,0.059875912964344025,-0.00807413924485445,-0.07565044611692429,0.02017945609986782,0.06181013584136963,-0.07589804381132126,-0.027005091309547424,-0.020621715113520626,0.10728873312473296,-0.019522113725543026,0.043428536504507065,-0.029098358005285263,0.02754100970923901,-0.152202308177948,0.034659236669540405,-0.004475307650864124,0.03323515132069588,-0.1145155429840088,-0.003943338990211487,0.049025505781173706,0.012686471454799175,0.11795631796121596,-0.06403374671936035,0.056339915841817856,0.0037561
682984232903,0.054777972400188446,0.05972881242632866,0.001645171782001853,0.050179678946733475,0.02424379251897335,-0.0375523678958416,0.00951043888926506,0.14100168645381927,-0.006870017386972904,0.08826040476560593,0.08795595914125443,-0.062290191650390625,0.1648702174425125,-0.04070449993014336,-0.03502330183982849,0.13270029425621033,-0.008869320154190063,0.0666288360953331,-0.034861695021390915,0.14135940372943878,-0.08241018652915955,0.14463399350643158,0.03434858098626137,0.050444066524505615,-0.02157437615096569,-0.09994328767061234,0.0913468673825264,0.0917196124792099,0.016866622492671013,0.039823707193136215,-0.027993423864245415,-0.07309001684188843,-0.05351489409804344,-0.03190822899341583,-0.010645640082657335,0.015825675800442696,-0.05698491632938385,-0.035101812332868576,-0.02734481543302536,-0.06831341236829758,-0.017228659242391586,0.05869394540786743,0.05487436801195145,0.1263997107744217,-0.027544325217604637,-0.02736288495361805,-0.07542997598648071,-0.037267059087753296,0.06813263893127441,-0.10187028348445892,-0.06810110807418823,0.07890390604734421,0.0648638904094696,0.05669310316443443,0.05408737435936928,0.09265446662902832,0.014223547652363775,-0.01511763036251068,0.020135559141635895,-0.002395345363765955,-0.05338238179683685,-0.07639706134796143,0.14262771606445312,0.0793553814291954,0.0522066093981266,-0.08689992129802704,-0.03259148448705673,0.011161516420543194,-0.03706139698624611,0.03168276697397232,0.1384318470954895,-0.11663922667503356,0.04898490384221077,-0.0264593418687582,-0.07439690083265305,-0.011477758176624777,-0.015427879989147186,0.00691946828737855,-0.09829768538475037,0.012015754356980324,0.004913074430078268,-0.018917124718427655,0.06339280307292938,0.028630699962377548,0.11455927789211272,0.03966859728097915,0.07407630980014801,0.06564504653215408,0.024718565866351128,0.11633312702178956,0.05509796366095543,-0.115314781665802,-0.017152000218629837,-0.0799180194735527,-0.07740911841392517,-0.03702102601528168,0.10312
78744339943,-0.053528156131505966,-0.06515828520059586,-0.012694436125457289,-0.11999019235372543,0.008711541071534157,-0.04881632328033447,-0.04470299929380417,-0.09537677466869354,0.037786465138196945,0.050381775945425034,-0.08175356686115265,0.010121691040694714,-0.004284191410988569,-0.1203434318304062,0.05232555419206619,-0.026546765118837357
2,Hampshire,,permanent,Gregory Martin International,Engineering Jobs,30000.0,cv-library.co.uk,-0.11297130584716795,0.039176832884550095,0.11244601756334303,0.09946677833795547,0.1533073931932449,-0.0967053547501564,-0.3014933168888092,0.016554972156882286,0.21248574554920197,0.04088292643427849,-0.054250676184892654,-0.3281697928905487,0.05195193365216255,-0.05699276924133301,-0.08796373009681702,0.16142505407333374,0.3640047609806061,-0.043398816138505936,0.30676066875457764,0.11549606174230576,0.1095072329044342,0.3821377754211426,-0.18668965995311737,0.08140291273593903,0.011301666498184204,0.2872464954853058,-0.10518795996904372,-0.2549920976161957,-0.014178365468978882,0.39799392223358154,0.17469175159931183,0.08079203963279724,-0.09471622109413148,-0.08726632595062256,-0.03828946128487587,-0.12079187482595444,0.08215870708227158,-0.23532898724079132,0.014276694506406784,0.21436311304569244,0.3313950300216675,-0.10583152621984482,0.34509846568107605,-0.04314581677317619,0.13462938368320465,-0.02154545485973358,0.39787033200263977,-0.08607987314462662,-0.4307339191436768,-0.09987690299749374,-0.045885439962148666,0.19067008793354032,-0.3608962595462799,0.02880135178565979,-0.040975216776132584,0.03280122950673103,-0.007731102406978607,0.33567869663238525,0.4156815111637115,0.06842220574617386,0.1350407600402832,-0.11037936806678772,0.1638239175081253,0.06574950367212296,-0.05826222896575928,0.13594277203083038,-0.05295972153544426,0.1660981923341751,-0.14588257670402527,-0.16277845203876495,0.031429607421159744,0.06293638795614243,-0.12744058668613434,-0.1986498236656189,-0.0037716131191700697,0.16948159039020538,0.040159888565540314,0.17519664764404297,0.2238418608903885,0.10955864191055298,-0.09750431776046752,-0.05188463255763054,0.19979803264141083,-0.3790929317474365,0.03534907102584839,0.04403242841362953,0.0556664764881134,-0.07798554748296738,0.31374144554138184,0.1735624074935913,0.076270192861557,0.370351642370224,0.03635098412632942,-0.150627657771110
5,-0.25183728337287903,0.09660636633634569,-0.3278876543045044,0.11955398321151732,0.12955710291862488,0.2926258444786072,-0.2048182338476181,-0.17155694961547852,0.0027185603976249695,-0.023080334067344666,0.08420295268297195,0.09849151968955994,0.10549067705869676,-0.33219385147094727,0.1027597114443779,-0.07881294935941696,-0.1686890572309494,-0.0692806988954544,-0.09594198316335678,-0.08236796408891678,0.2515641152858734,0.03620419278740883,-0.033635202795267105,-0.16085194051265717,-0.07841245830059052,0.1022488996386528,0.108492411673069,0.24526119232177737,-0.08063877373933792,-0.09310416132211684,-0.36645546555519104,-0.36793896555900574,0.21759510040283203,0.03416888788342476,0.1813894361257553,-0.05036567151546478,-0.20540426671504977,-0.2173348218202591,-0.04123873636126518,0.2108910083770752,0.05450158193707466,-0.31391388177871704,0.029444947838783264,-0.1022488698363304,0.09156133979558943,-0.15626873075962067,0.08654791861772537,-0.18514429032802585,0.0714016929268837,0.4693679809570313,-0.6023147106170654,-0.1095488667488098,0.06311160326004028,0.39307475090026855,-0.17120420932769775,-0.09560111910104752,-0.05323587730526924,-0.034043457359075546,-0.1280568540096283,0.21706803143024445,0.055105675011873245,-0.18471312522888184,0.268575519323349,-0.19412218034267423,0.18282704055309296,0.15982504189014435,-0.038343336433172226,0.10058456659317017,-0.19101671874523163,-0.16731198132038116,-0.3763647973537445,0.1153867244720459,-0.06266841292381287,0.23383291065692904,0.21318072080612183,-0.03785417973995209,-0.10789396613836288,0.08455284684896469,0.3480105400085449,-0.015811851248145103,-0.18229396641254425,0.1627659946680069,0.0005010167951695621,0.11814682930707932,-0.05666521191596985,0.18669335544109344,-0.13455985486507416,-0.05715718865394592,-0.09218119829893112,-0.11752120405435562,0.0031522412318736315,-0.26509156823158264,-0.2253725677728653,0.2838388979434967,-0.09201636165380478,-0.058311622589826584,0.10408595949411392,0.0197667162865400
3,0.014880615286529064,-0.09559793025255205,-0.008433218114078045,0.19865401089191437,0.1687171310186386,-0.2317097932100296,0.27554208040237427,0.007976353168487549,-0.15134693682193756,0.09044951945543288,0.13904863595962524,0.0028227122966200113,0.04933195933699608,0.14917941391468048,0.02888030745089054,-0.017227960750460625,-0.03520529344677925,-0.04238388687372208,-0.08839746564626694,-0.08069980144500732,-0.028813350945711136,0.18847188353538513,0.01746225543320179,0.0012772532645612955,0.07919760048389435,0.003982536494731903,-0.02961467206478119,0.03822473064064979,-0.013966696336865423,-0.12173737585544586,0.012717073783278464,-0.04212776944041252,0.0656624585390091,-0.10705294460058212,0.01876060478389263,0.05340208485722542,-0.03888285160064697,-0.02288002707064152,-0.030041273683309555,-0.030544374138116837,-0.052825599908828735,0.021584030240774155,-0.04663883149623871,-0.019401920959353447,0.1017967090010643,0.10556497424840929,0.0662640780210495,-0.06398842483758926,-0.0023124709259718657,-0.05202458053827286,-0.1210031881928444,0.023951755836606026,0.06714323163032532,0.009366052225232124,-0.0006796946981921792,0.012839756906032562,-0.000422309065470472,-0.03194575756788254,0.08183051645755768,0.18837882578372955,0.08666675537824631,-0.01593257114291191,0.09182249754667282,0.0059103211387991905,-0.024439428001642227,0.11639370024204254,0.020740685984492305,-0.0457327701151371,0.01205739937722683,0.06649935245513916,0.03771842643618584,0.0165807344019413,-0.027781939134001732,0.0775919035077095,0.08896338194608688,-0.044732607901096344,-0.03607107326388359,0.027266647666692737,0.15783068537712097,0.02092663384974003,0.04928392171859741,-0.018830252811312675,0.05238350108265877,-0.12868398427963257,0.032918624579906464,0.006302558816969395,-0.03221641480922699,-0.07260678708553314,0.06099719554185867,0.0183890201151371,0.0276491641998291,0.14308764040470123,-0.04984673112630844,0.06711699068546295,0.011282338760793207,0.006782153155654669,0.0734238177
5379181,-0.04106101393699646,0.0649852529168129,0.07483720034360886,0.025704074651002884,0.04314219206571579,0.14354336261749268,-0.0078340545296669,0.07686465978622437,0.04007645696401596,-1.1227699360460974e-05,0.16781970858573914,-0.04589765518903732,0.07183379679918289,0.18064436316490173,-0.05858542397618294,0.07305245101451874,-0.025276828557252884,0.13222551345825195,-0.09457240998744965,0.14457383751869202,0.03735799342393875,0.05807719752192497,-0.029363051056861877,-0.06703267991542816,0.03236981853842735,0.047799304127693176,0.011226766742765903,0.037446439266204834,-0.007993003353476524,-0.03360598534345627,0.0059405723586678505,-0.01870027743279934,-0.0008621690794825554,0.03904160484671593,-0.037467729300260544,-0.05336042493581772,0.029463235288858417,-0.014821882359683514,-0.035283688455820084,0.09980568289756776,0.0718383938074112,0.11050266027450562,-0.005468632094562054,-0.020774241536855698,-0.08262881636619568,-0.06963802874088287,0.025452619418501857,-0.06493310630321503,-0.06382638216018677,0.0678347498178482,0.07243905961513519,0.08985669165849686,0.05039115622639656,0.0827791839838028,0.06860718131065369,-0.029721658676862717,0.008465426973998547,0.04588589072227478,-0.018651627004146576,0.021278824657201767,0.1024651750922203,0.0874829813838005,0.03803953528404236,-0.08391447365283966,-0.036648910492658615,0.019188040867447853,-0.007024465594440699,-0.027109509333968163,0.09318692982196808,-0.09371419996023178,0.04201183468103409,-0.014547398313879968,0.01985301822423935,0.04259032756090164,-0.002447627717629075,0.01501855719834566,-0.08011873066425323,0.005231491290032864,-0.014538006857037544,0.0329689159989357,0.0408191904425621,0.007525160908699036,0.06600945442914963,0.07255782186985016,0.054273415356874466,0.12784165143966675,0.02195708267390728,0.12794223427772522,0.021472427994012833,-0.14212223887443542,-0.05061193183064461,-0.009365488775074482,-0.06984280049800873,0.0006921929307281971,0.13285768032073977,-0.06673003733158112,-0.
07210317999124527,-0.03847317770123482,-0.05824778601527214,0.04516402631998062,-0.037517376244068146,-0.10682997852563858,-0.11283589899539948,0.018252871930599213,-0.002010983880609274,-0.08691933006048203,-0.02349812351167202,-0.038349419832229614,-0.15535548329353333,0.07858540117740631,-0.02005631104111671


In [None]:
# Obtain the best salary model: either reload the one previously saved under
# INOUT_DIR, or train a fresh one, save it there and report its metrics.
if USE_SAVED_MODEL:
    print("USE SAVED MODEL IN ", INOUT_DIR)
    best_model = h2o.load_model(INOUT_DIR + '/' + BEST_SAL_MODEL_NAME)
    # NOTE: best_pred_rate / best_mae are NOT defined on this path.
    # Later ...     best_pred_rate = evaluate(best_model, veccat_job_df)
else:
    print("")
    # train_evaluate's result is unpacked as [good prediction rate, MAE, model].
    [vec_good_pred_rate, vec_mae, vec_model] = train_evaluate(vec_job_df)

    # The model trained on vec_job_df is the baseline "best" candidate.
    # It is assigned BEFORE the optional comparison below so that, when the
    # comparison is enabled, its choice is not overwritten afterwards.
    best_model = vec_model
    best_pred_rate = vec_good_pred_rate
    best_mae = vec_mae

    # Too SLOW, up to 80 hours (estimated) to run so not use it:
    if False:
        [veccat_good_pred_rate, veccat_mae, veccat_model] = train_evaluate(veccat_job_df)
        # Switch to the veccat model only when its good-prediction rate is strictly higher.
        if veccat_good_pred_rate > vec_good_pred_rate:
            best_model = veccat_model
            best_pred_rate = veccat_good_pred_rate
            best_mae = veccat_mae

    # Rename the winner to the fixed id so it is saved (and later looked up)
    # under BEST_SAL_MODEL_NAME.
    best_model.model_id = BEST_SAL_MODEL_NAME
    print("Save best model to ", INOUT_DIR)
    # force=True: overwrite a model previously saved at the same location.
    model_path = h2o.save_model(model=best_model, path=INOUT_DIR, force=True)

    print("\n\n**************** BEST PREDICTION RATE: ", best_pred_rate, " with MAE: ", best_mae, "***************")


2018-02-08 05:45:40 - START  train_evaluate
py_8_sid_b7a6
2018-02-08 05:45:40 - START  split
2018-02-08 05:45:43 - END  split
2018-02-08 05:45:43 - START  grid_train
hyper_parameters:  {'ntrees': [1400], 'col_sample_rate': [0.6], 'learn_rate': [0.03], 'max_leaves': [900], 'max_bins': [63]}
parameters:  {'seed': 12345678901, 'stopping_metric': 'mae', 'nfolds': 3, 'tree_method': 'hist', 'grow_policy': 'lossguide', 'max_depth': 0, 'stopping_rounds': 3}
xgboost Grid Build progress: |███████████████████████████████████████████

In [None]:
# Fetch the best model from the H2O cluster by id. Use the shared constant
# (the id assigned when the model was saved) instead of repeating the literal.
model = h2o.get_model(BEST_SAL_MODEL_NAME)

In [None]:
# Show the scoring history of the fetched model as this cell's output.
model.scoring_history()

In [None]:
# Display the model itself (its rich/summary representation) as the cell output.
model

In [None]:
# Re-split the vectorised job frame with the shared SEED. Two ratios yield
# three frames: roughly 96% train, 2% validation, and the remainder as test.
train2_df, valid2_df, test2_df = vec_job_df.split_frame(
    ratios=[0.96, 0.02],
    seed=SEED,
)
# Summarise the held-out test frame.
test2_df.describe()

In [None]:
# Score the held-out test frame with the fetched model.
pred = model.predict(test2_df)
# Put the predictions side by side with the test frame's own columns
# (column-bind) so predictions can be compared against each row.
cbined_df = pred.cbind(test2_df)
# Display the combined frame as the cell output.
cbined_df

In [None]:
# END of notebook.
# h2o.init() is called here only so that the cluster status gets printed.
h2o.init()

# Optionally stop the H2O cluster once all work is done.
if SHUTDOWN_H2O:
    h2o.cluster().shutdown()

EndOfFunc()
print(start_time, "- Started time")