In [1]:
# Install gensim pinned to 3.8.1 so the FastText import used by the embedding cell resolves to a known version.
!pip install gensim==3.8.1



##### Colab Setup

In [2]:
from google.colab import drive
# Mount Google Drive at /content/drive; the project directory used by the rest of the notebook lives under it.
drive.mount('/content/drive')

Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).


In [3]:
import os
# Move into the project directory on the mounted Drive.
# The path is absolute (rooted at the /content/drive mount point) so the cell
# can be re-run: a relative 'drive/...' path only resolves while the working
# directory is still /content and stops resolving once it has been changed.
os.chdir(os.path.join('/content', 'drive', 'My Drive', 'ift6759', 'ift6759-t6-p2'))
os.getcwd()

'/content/drive/My Drive/ift6759/ift6759-t6-p2'

In [4]:
# Report the GPU visible to this runtime.
# NOTE(review): the saved output shows nvidia-smi could not reach the NVIDIA driver,
# so this session apparently had no usable GPU — confirm the runtime type before training.
!nvidia-smi

NVIDIA-SMI has failed because it couldn't communicate with the NVIDIA driver. Make sure that the latest NVIDIA driver is installed and running.



### Embedding Matrix Generation


In [0]:
from utils.gensim_embeddings import create_model
from gensim.models import FastText

def build_emb_matrix(task, emb_size, alignment):
    """Build an embedding model for a single task through ``create_model``.

    The corpus file name is ``<alignment>_<task without its last four
    characters>``; for example task ``unformated_en_w2w`` with alignment
    ``unaligned`` yields ``unaligned_unformated_en``. The corpus path is
    ``<cwd>/data/<file name>`` and the save path is
    ``<cwd>/embeddings/<task>/<emb_size>/<file name>``. The output directory
    is created when it does not exist yet.

    Args:
        task: Task identifier; its last four characters are dropped to form
            the corpus file name.
        emb_size: Embedding dimension, forwarded to ``create_model`` as ``size``.
        alignment: Prefix of the corpus file name.

    Returns:
        The value returned by ``create_model`` for the ``FastText`` class.
    """
    root = os.getcwd()
    corpus_name = '_'.join((alignment, task[:-4]))
    corpus_path = os.path.join(root, 'data', corpus_name)

    # Make sure the per-task / per-size output directory exists before saving into it.
    out_dir = os.path.join(root, 'embeddings', task, str(emb_size))
    os.makedirs(out_dir, exist_ok=True)
    model_path = os.path.join(out_dir, corpus_name)

    print(task, corpus_name, corpus_path, model_path)
    return create_model(FastText, corpus_path, save_path=model_path, size=emb_size)

def build_enc_dec_emb_matrices(enc_task, dec_task, emb_size=128, alignment='unaligned'):
    """Build the encoder and decoder embedding models, in that order.

    Each task is passed to ``build_emb_matrix`` with the shared ``emb_size``
    and ``alignment``; a progress line is printed after each model is built.

    Args:
        enc_task: Task identifier for the encoder side.
        dec_task: Task identifier for the decoder side.
        emb_size: Embedding dimension used for both models (default 128).
        alignment: Corpus file-name prefix used for both models
            (default ``'unaligned'``).

    Returns:
        Tuple ``(enc_emb, dec_emb)`` of the two ``build_emb_matrix`` results.
    """
    built = []
    for task, done_msg in ((enc_task, "enc_emb created"), (dec_task, "dec_emb created")):
        built.append(build_emb_matrix(task, emb_size, alignment))
        print(done_msg)
    enc_emb, dec_emb = built
    return enc_emb, dec_emb

In [6]:
# Build size-8 embeddings for the `unformated_en_w2w` encoder task and the
# `unformated_fr_w2w` decoder task; alignment keeps its default ('unaligned').
build_enc_dec_emb_matrices(
    enc_task='unformated_en_w2w',
    dec_task='unformated_fr_w2w',
    emb_size=8,
)

unformated_en_w2w unaligned_unformated_en /content/drive/My Drive/ift6759/ift6759-t6-p2/data/unaligned_unformated_en /content/drive/My Drive/ift6759/ift6759-t6-p2/embeddings/unformated_en_w2w/8/unaligned_unformated_en
enc_emb created
unformated_fr_w2w unaligned_unformated_fr /content/drive/My Drive/ift6759/ift6759-t6-p2/data/unaligned_unformated_fr /content/drive/My Drive/ift6759/ift6759-t6-p2/embeddings/unformated_fr_w2w/8/unaligned_unformated_fr
dec_emb created


(<gensim.models.fasttext.FastText at 0x7f5243350e48>,
 <gensim.models.fasttext.FastText at 0x7f51ba6853c8>)

### GRU Language Model Training

#### unformated_en_w2w

In [0]:
# Train the language model on the `unformated_en_w2w` task: 10 epochs, batch size 512.
# --embedding_warmer_epoch is set to 5; its exact meaning is defined in train_language_model.py (not shown here).
!python train_language_model.py --task unformated_en_w2w --epochs 10 --batch_size 512 --embedding_warmer_epoch 5

2020-04-13 19:12:24.093586: I tensorflow/stream_executor/platform/default/dso_loader.cc:44] Successfully opened dynamic library libcudart.so.10.1
Tensorflow version 2.2.0-rc2
2020-04-13 19:12:26.416485: I tensorflow/stream_executor/platform/default/dso_loader.cc:44] Successfully opened dynamic library libcuda.so.1
2020-04-13 19:12:26.418427: E tensorflow/stream_executor/cuda/cuda_driver.cc:313] failed call to cuInit: CUDA_ERROR_NO_DEVICE: no CUDA-capable device is detected
2020-04-13 19:12:26.418467: I tensorflow/stream_executor/cuda/cuda_diagnostics.cc:156] kernel driver does not appear to be running on this host (4df7907d14d6): /proc/driver/nvidia/version does not exist
2020-04-13 19:12:26.424709: I tensorflow/core/platform/profile_utils/cpu_utils.cc:102] CPU Frequency: 2300000000 Hz
2020-04-13 19:12:26.424920: I tensorflow/compiler/xla/service/service.cc:168] XLA service 0x23032c0 initialized for platform Host (this does not guarantee that XLA will be used). Devices:
2020-04-13 19:1

#### unformated_fr_w2w

In [0]:
# Train the language model on the `unformated_fr_w2w` task: 10 epochs, batch size 512.
# --embedding_warmer_epoch is set to 5; its exact meaning is defined in train_language_model.py (not shown here).
!python train_language_model.py --task unformated_fr_w2w --epochs 10 --batch_size 512 --embedding_warmer_epoch 5

2020-04-13 19:30:17.566636: I tensorflow/stream_executor/platform/default/dso_loader.cc:44] Successfully opened dynamic library libcudart.so.10.1
Tensorflow version 2.2.0-rc2
2020-04-13 19:30:20.108938: I tensorflow/stream_executor/platform/default/dso_loader.cc:44] Successfully opened dynamic library libcuda.so.1
2020-04-13 19:30:20.110990: E tensorflow/stream_executor/cuda/cuda_driver.cc:313] failed call to cuInit: CUDA_ERROR_NO_DEVICE: no CUDA-capable device is detected
2020-04-13 19:30:20.111038: I tensorflow/stream_executor/cuda/cuda_diagnostics.cc:156] kernel driver does not appear to be running on this host (4df7907d14d6): /proc/driver/nvidia/version does not exist
2020-04-13 19:30:20.117752: I tensorflow/core/platform/profile_utils/cpu_utils.cc:102] CPU Frequency: 2300000000 Hz
2020-04-13 19:30:20.117987: I tensorflow/compiler/xla/service/service.cc:168] XLA service 0x15cd2c0 initialized for platform Host (this does not guarantee that XLA will be used). Devices:
2020-04-13 19:3

#### unformated_fr_c2c

In [0]:
# Train the language model on the `unformated_fr_c2c` task: 10 epochs, batch size 512.
# No --embedding_warmer_epoch is passed for this task, so the script's own default applies.
!python train_language_model.py --task unformated_fr_c2c --epochs 10 --batch_size 512

2020-04-13 19:56:35.477014: I tensorflow/stream_executor/platform/default/dso_loader.cc:44] Successfully opened dynamic library libcudart.so.10.1
Tensorflow version 2.2.0-rc2
2020-04-13 19:56:37.875094: I tensorflow/stream_executor/platform/default/dso_loader.cc:44] Successfully opened dynamic library libcuda.so.1
2020-04-13 19:56:37.877069: E tensorflow/stream_executor/cuda/cuda_driver.cc:313] failed call to cuInit: CUDA_ERROR_NO_DEVICE: no CUDA-capable device is detected
2020-04-13 19:56:37.877110: I tensorflow/stream_executor/cuda/cuda_diagnostics.cc:156] kernel driver does not appear to be running on this host (4df7907d14d6): /proc/driver/nvidia/version does not exist
2020-04-13 19:56:37.883437: I tensorflow/core/platform/profile_utils/cpu_utils.cc:102] CPU Frequency: 2300000000 Hz
2020-04-13 19:56:37.883654: I tensorflow/compiler/xla/service/service.cc:168] XLA service 0x2ed72c0 initialized for platform Host (this does not guarantee that XLA will be used). Devices:
2020-04-13 19:5

#### formated_fr_c2c


In [0]:
# Train the language model on the `formated_fr_c2c` task: 10 epochs, batch size 512.
# No --embedding_warmer_epoch is passed for this task, so the script's own default applies.
!python train_language_model.py --task formated_fr_c2c --epochs 10 --batch_size 512 

2020-04-13 20:43:23.071321: I tensorflow/stream_executor/platform/default/dso_loader.cc:44] Successfully opened dynamic library libcudart.so.10.1
Tensorflow version 2.2.0-rc2
2020-04-13 20:43:25.500083: I tensorflow/stream_executor/platform/default/dso_loader.cc:44] Successfully opened dynamic library libcuda.so.1
2020-04-13 20:43:25.519453: E tensorflow/stream_executor/cuda/cuda_driver.cc:313] failed call to cuInit: CUDA_ERROR_NO_DEVICE: no CUDA-capable device is detected
2020-04-13 20:43:25.519547: I tensorflow/stream_executor/cuda/cuda_diagnostics.cc:156] kernel driver does not appear to be running on this host (4df7907d14d6): /proc/driver/nvidia/version does not exist
2020-04-13 20:43:25.533904: I tensorflow/core/platform/profile_utils/cpu_utils.cc:102] CPU Frequency: 2300000000 Hz
2020-04-13 20:43:25.534357: I tensorflow/compiler/xla/service/service.cc:168] XLA service 0x27492c0 initialized for platform Host (this does not guarantee that XLA will be used). Devices:
2020-04-13 20:4