In [1]:
import os
import json
import papermill as pm
import datetime

In [2]:
# ---------------------------------------------------------------------------
# Shared configuration consumed by the training cells below.
# ---------------------------------------------------------------------------

# Preprocessing / split switches forwarded to the training notebooks as
# CASE_SENSITIVE_VOCAB, USE_NUM2WORDS and TEST_SIZE.
test_size = 0.2
use_num2words = True
case_sensitive_vocab = False

# Input locations (absolute paths on the author's machine).
datainfo_path = 'G:/PythonProjects/WineRecognition2/data_info.json'
vocab_path = 'G:/PythonProjects/WineRecognition2/data/vocabs/Words_Halliday_Wine_AU_WORD_NUMS.json'
dataset_path = r'G:\PythonProjects\WineRecognition2\data\text\halliday_winesearcher_menu_gen_samplesv3\Halliday_WineSearcher_MenuGenSamples.txt'

# Presumably: uncomment to point the CRF cell at an already-trained BiLSTM-CRF
# checkpoint instead of running the BiLSTM-CRF training cell first.
#bilstm_model_path = 'G:/PythonProjects/WineRecognition2/artifacts/train/BiLSTM_CRF_17022022_185854/model/data/model.pth'

## Train BiLSTM-CRF

In [None]:
# Train the BiLSTM-CRF model by executing `train_bilstm_crf.ipynb` via papermill.
# The executed copy of the notebook is written into a fresh, timestamped
# output directory under `<artifacts_path>/train/`.

# Read the experiment settings; the context manager guarantees the file
# handle is closed even if JSON parsing fails.
# NOTE(review): the CRF cell further down reads experiment_settings.json from
# the project root rather than from `nn/` - confirm which location is intended.
with open(r"G:\PythonProjects\WineRecognition2\nn\experiment_settings.json") as settings_file:
    exp_settings = json.load(settings_file)

# Parameters injected into the training notebook. START_TIME and OUTPUT_DIR
# are placeholders here (keeps the key order stable) and are filled in below.
experiment = {
    'MODEL_NAME': 'BiLSTM_CRF',
    'RUN_NAME': 'train-H_WS_MenuSamples_Num2Words-64',
    'START_TIME': None,
    'OUTPUT_DIR': None,
    'DATASET_PATH': dataset_path,
    'VOCAB_PATH': vocab_path,
    'DATAINFO_PATH': datainfo_path,
    'DEVICE': 'cuda',
    'BATCH_SIZE': 2048,
    'EMBEDDING_DIM': 64,
    'HIDDEN_DIM': 64,
    'NUM_EPOCHS': 150,
    'LEARNING_RATE': 0.01,
    'SCHEDULER_FACTOR': 0.1,
    'SCHEDULER_PATIENCE': 10,
    'CASE_SENSITIVE_VOCAB': case_sensitive_vocab,
    'WEIGHT_DECAY': 1e-4,
    'TEST_SIZE': test_size,
    'USE_NUM2WORDS': use_num2words
}

# Timestamp (ddmmYYYY_HHMMSS) makes every run's output directory unique.
experiment['START_TIME'] = '{:%d%m%Y_%H%M%S}'.format(datetime.datetime.now())
experiment['OUTPUT_DIR'] = f"{exp_settings['artifacts_path']}/train/{experiment['MODEL_NAME'] + '_' + experiment['START_TIME']}"

# Path handed to the CRF cell as LSTM_MODEL_PATH.
# Assumes the training notebook saves its weights at this location under
# OUTPUT_DIR - TODO confirm against train_bilstm_crf.ipynb.
bilstm_model_path = experiment['OUTPUT_DIR'] + '/model/data/model.pth'

# makedirs also creates a missing `train/` parent (os.mkdir would raise
# FileNotFoundError) and exist_ok avoids the check-then-create race.
os.makedirs(experiment['OUTPUT_DIR'], exist_ok=True)

pm.execute_notebook(
    input_path='train_bilstm_crf.ipynb',
    output_path=os.path.join(experiment['OUTPUT_DIR'], 'train_bilstm_crf.ipynb'),
    parameters=experiment
)

Executing:   0%|          | 0/19 [00:00<?, ?cell/s]

## Train CRF with LSTM features

In [None]:
# Train the CRF model on LSTM-derived features by executing
# `train_crf_with_lstm_features.ipynb` via papermill. The executed copy of the
# notebook is written into a fresh, timestamped output directory under
# `<artifacts_path>/train/`.
#
# Requires `bilstm_model_path` to be defined already: it is set by the
# BiLSTM-CRF training cell (or by the commented-out assignment in the
# configuration cell), so this cell fails on a fresh kernel if run alone.

# Read the experiment settings; the context manager guarantees the file
# handle is closed even if JSON parsing fails.
# NOTE(review): the BiLSTM-CRF cell reads experiment_settings.json from the
# `nn/` sub-folder rather than the project root - confirm which is intended.
with open(r"G:\PythonProjects\WineRecognition2\experiment_settings.json") as settings_file:
    exp_settings = json.load(settings_file)

# Parameters injected into the training notebook. OUTPUT_DIR and START_TIME
# are placeholders here (keeps the key order stable) and are filled in below.
experiment = {
    'DATASET_PATH': dataset_path,
    'LSTM_MODEL_PATH': bilstm_model_path,
    'VOCAB_PATH': vocab_path,
    'DICTIONARY_PATH': r"G:\PythonProjects\WineRecognition2\data\dictionaries\Dict-byword_Halliday_Winesearcher_Wine_AU-only_completed_rows",
    'DATAINFO_PATH': datainfo_path,
    'DEVICE': 'cuda',
    'CASE_SENSITIVE_VOCAB': case_sensitive_vocab,
    'MODEL_NAME': "CRF_with_LSTM_and_Our_features",
    'ALGORITHM': 'lbfgs',
    'C1': 0.1,
    'C2': 0.1,
    'MAX_ITERATIONS': 150,
    'ALL_POSSIBLE_TRANSITIONS': True,
    'TEST_SIZE': test_size,
    'RUN_NAME': 'train-H_WS_MenuSamples-Num2Words',
    'OUTPUT_DIR': None,
    'START_TIME': None,
    'USE_NUM2WORDS': use_num2words
}

# Timestamp (ddmmYYYY_HHMMSS) makes every run's output directory unique.
experiment['START_TIME'] = '{:%d%m%Y_%H%M%S}'.format(datetime.datetime.now())
experiment['OUTPUT_DIR'] = f"{exp_settings['artifacts_path']}/train/{experiment['MODEL_NAME'] + '_' + experiment['START_TIME']}"

# makedirs also creates a missing `train/` parent (os.mkdir would raise
# FileNotFoundError) and exist_ok avoids the check-then-create race.
os.makedirs(experiment['OUTPUT_DIR'], exist_ok=True)

pm.execute_notebook(
    input_path='train_crf_with_lstm_features.ipynb',
    output_path=os.path.join(experiment['OUTPUT_DIR'], 'train_crf_with_lstm_features.ipynb'),
    parameters=experiment
)

Executing:   0%|          | 0/17 [00:00<?, ?cell/s]