## Prepare

In [None]:
from prepare import get_anki_dataset, get_target_dataset, load_dataset, show_tokens

# Resolve the two dataset archives by file name; the returned values are
# handed straight to load_dataset below.
# NOTE(review): presumably these helpers download/extract the archives and
# return local paths -- confirm in prepare.py.
path_to_file_anki = get_anki_dataset('ukr-eng.zip')
path_to_file_target = get_target_dataset('ua-target-201704.zip')

# load_dataset yields four values, unpacked here as the English and Ukrainian
# tensors followed by the tokenizer for each language.
en_tensors, ua_tensors, en_lang_tokenizer, ua_lang_tokenizer = load_dataset(path_to_file_anki, path_to_file_target)

# Sanity check: pass the last entry of each tensor collection, together with
# the matching tokenizer, to show_tokens under a heading per language.
print("English Language; index to word mapping")
show_tokens(en_lang_tokenizer, en_tensors[-1])
print()  # blank separator line between the two listings
print("Ukrainian Language; index to word mapping")
# Left as the trailing expression of the cell: the notebook echoes its return
# value when that value is not None.
show_tokens(ua_lang_tokenizer, ua_tensors[-1])

## Train seq2seq model

In [None]:
from prepare import get_anki_dataset, get_target_dataset
from train_seq2seq import train_seq2seq
import model_params

# Resolve both dataset archives inside this cell, so it does not rely on
# variables left behind by an earlier cell.
path_to_file_anki = get_anki_dataset('ukr-eng.zip')
path_to_file_target = get_target_dataset('ua-target-201704.zip')

# The trainer takes the two values positionally (anki first, target second)
# and the seq2seq configuration object from model_params as `config`.
seq2seq_config = model_params.SEQ2SEQ_MODEL_PARAMS
train_seq2seq(
    path_to_file_anki,
    path_to_file_target,
    config=seq2seq_config,
)

## Train transformer model

In [None]:
from prepare import get_anki_dataset, get_target_dataset
from train_transformer import train_transformer
import model_params

# Resolve both dataset archives inside this cell, so it does not rely on
# variables left behind by an earlier cell.
path_to_file_anki = get_anki_dataset('ukr-eng.zip')
path_to_file_target = get_target_dataset('ua-target-201704.zip')

# The trainer takes the two values positionally (anki first, target second)
# and the transformer configuration object from model_params as `config`.
transformer_config = model_params.TRANSFORMER_MODEL_PARAMS
train_transformer(
    path_to_file_anki,
    path_to_file_target,
    config=transformer_config,
)

## Predict with seq2seq model

In [None]:
from predict_seq2seq import translate_seq2seq
import model_params

def translate_(sent):
    """Translate ``sent`` by delegating to ``translate_seq2seq``.

    The configuration is read from ``model_params.SEQ2SEQ_MODEL_PARAMS`` on
    every call and passed as the ``config`` keyword argument.

    Args:
        sent: The value forwarded unchanged as the first positional argument.

    Returns:
        Whatever ``translate_seq2seq`` returns, unmodified.
    """
    seq2seq_config = model_params.SEQ2SEQ_MODEL_PARAMS
    return translate_seq2seq(sent, config=seq2seq_config)

# Sample input sentences, translated in the order listed.
sentences = (
    u'ти згоден',
    u'Том весь вечір дивиться телевізор.',
    u'Я щойно згадав, що мені треба щось зробити.',
)

# Every call except the last is made only for its side effects; the return
# values are discarded.
for sentence in sentences[:-1]:
    translate_(sentence)

# The final call stays a bare trailing expression so the notebook echoes its
# return value when that value is not None.
translate_(sentences[-1])

## Predict with transformer model

In [1]:
from predict_transformer import translate_transformer
import model_params

def translate_(sent):
    """Translate ``sent`` by delegating to ``translate_transformer``.

    The configuration is read from ``model_params.TRANSFORMER_MODEL_PARAMS``
    on every call and passed as the ``config`` keyword argument.

    Args:
        sent: The value forwarded unchanged as the first positional argument.

    Returns:
        Whatever ``translate_transformer`` returns, unmodified.
    """
    transformer_config = model_params.TRANSFORMER_MODEL_PARAMS
    return translate_transformer(sent, config=transformer_config)

# Sample input sentences, translated in the order listed.
sentences = (
    u'ти згоден',
    u'Том весь вечір дивиться телевізор.',
    u'Я щойно згадав, що мені треба щось зробити.',
)

# Every call except the last is made only for its side effects; the return
# values are discarded.
for sentence in sentences[:-1]:
    translate_(sentence)

# The final call stays a bare trailing expression so the notebook echoes its
# return value when that value is not None.
translate_(sentences[-1])