In [1]:
#_Word_Utils.py
from six import text_type as unicode
from six import string_types

def word_to_unicode(w):
    """Return ``w`` as a unicode (text) string.

    Byte strings are decoded as UTF-8. Text strings and non-string objects
    are returned unchanged.

    Args:
        w: Word to convert.

    Returns:
        The decoded text for byte-string input, otherwise ``w`` itself.

    Raises:
        UnicodeDecodeError: If a byte string is not valid UTF-8.
    """
    # ``bytes`` is ``str`` on Python 2, so this single check covers both the
    # Python 2 byte-string case and Python 3 ``bytes`` input.
    if isinstance(w, bytes):
        return w.decode("utf-8")
    return w

def standarize_words(ws, unicode=False, lower=False):
    """Normalize a list of words in place and return that same list.

    Args:
        ws: Mutable sequence of words; its items are overwritten.
        unicode: If true, each word is passed through ``word_to_unicode``.
        lower: If true, each word is lower-cased (after the unicode step).

    Returns:
        The same ``ws`` object that was passed in.
    """
    # Collect the requested transformations once, then apply them per word.
    steps = []
    if unicode:
        steps.append(word_to_unicode)
    if lower:
        steps.append(lambda token: token.lower())

    for position in range(len(ws)):
        for step in steps:
            ws[position] = step(ws[position])
    return ws


In [2]:
#Vocabulary.py

from six import iteritems


class Vocabulary(object):
    """Two-way mapping between words and their integer positions.

    Attributes:
        word_id: dict mapping each word to its index.
        id_word: dict mapping each index back to its word.
    """

    def __init__(self, words=None, to_unicode=True, lower=False):
        """Build the vocabulary from a sequence of words.

        Args:
            words: Iterable of words; position ``i`` becomes the index of the
                word. ``None`` (the default) gives an empty vocabulary. If a
                word is repeated only its last position is kept, so
                ``len(vocabulary)`` is then smaller than the number of words.
            to_unicode: Convert the words to unicode strings.
            lower: Lower-case the words.
        """
        # standarize_words overwrites the list it receives, so it is handed a
        # private copy: neither the caller's list nor a shared default
        # argument is ever mutated.
        words = standarize_words(
            [] if words is None else list(words), to_unicode, lower)

        self.word_id = {w: i for i, w in enumerate(words)}
        self.id_word = {i: w for w, i in self.word_id.items()}

    def __len__(self):
        """Return the number of distinct words."""
        return len(self.word_id)

    @property
    def words(self):
        """List of the words ordered by their index.

        Sorting by index (instead of relying on dict iteration order) keeps
        ``words[i]`` in step with the index stored in ``word_id``.
        """
        return sorted(self.word_id, key=self.word_id.__getitem__)

    def index_to_word(self, word):
        """Return the word stored at an index.

        Args:
            word: The integer index to look up (the parameter keeps its
                historical name).

        Raises:
            KeyError: If no word has that index.
        """
        return self.id_word[word]

    def word_to_index(self, word, default=None):
        """Return the index of ``word``.

        Args:
            word: Word to look up.
            default: Accepted for compatibility; it is not used, a missing
                word always raises.

        Raises:
            KeyError: If the word is not in the vocabulary.
        """
        return self.word_id[word]
    
    
        

In [3]:
#Embedding.py

import logging
import sys
from tqdm import tqdm
import numpy as np
from sklearn.preprocessing import normalize

class Embedding(object):
    """A vocabulary together with one vector per word.

    Attributes:
        vocabulary: Vocabulary-like object holding the words.
        vectors: numpy array; row ``i`` is the vector of the word whose
            vocabulary index is ``i``.
    """

    def __init__(self, vocabulary=None, vectors=None):
        """Create the embedding.

        Args:
            vocabulary: Vocabulary object with the words of the embedding.
                ``None`` (the default) creates an empty ``Vocabulary``.
            vectors: Matrix of vectors, one row per word. ``None`` (the
                default) means no vectors.

        Raises:
            ValueError: If the number of words and of vectors differ.
        """
        # Defaults are built per call: an object created in the signature
        # would be shared by every instance.
        if vocabulary is None:
            vocabulary = Vocabulary()

        self.vocabulary = vocabulary
        self.vectors = np.array([] if vectors is None else vectors)

        # Check that we have the same number of words and vectors
        if len(self.vocabulary) != self.vectors.shape[0]:
            raise ValueError("We have a different number of words and vectors. We have {} words and {} vectors".format(len(self.vocabulary), self.vectors.shape[0]))

        # Warn (do not fail) when the vocabulary reports duplicated words
        if len(self.vocabulary) != len(set(self.vocabulary.words)):
            logging.warning("Vocabulary has duplicates")

    def __len__(self):
        """Return the number of words."""
        return len(self.vocabulary)

    @property
    def words(self):
        """Words of the embedding, as given by the vocabulary."""
        return self.vocabulary.words

    @property
    def dims(self):
        """Length of each vector (second dimension of ``vectors``)."""
        return self.vectors.shape[1]

    def word_to_vector(self, word, lower=False):
        """Return the vector of ``word``.

        Args:
            word: Word to look up.
            lower: Lower-case the word before the lookup.

        Raises:
            KeyError: If the word is not in the vocabulary.
        """
        if lower:
            word = word.lower()
        return self.vectors[self.vocabulary.word_to_index(word)]

    def _store_or_wrap(self, vectors, replace):
        """Keep ``vectors`` on this object, or return them in a new Embedding."""
        if replace:
            self.vectors = vectors
            return None
        return Embedding(vocabulary=self.vocabulary, vectors=vectors)

    @staticmethod
    def _nonzero(norms):
        """Replace zero norms by 1 so all-zero rows/columns stay unchanged."""
        norms[norms == 0] = 1
        return norms

    def length_normalize(self, replace=True):
        """L2-normalize every row (word vector).

        Args:
            replace: If true, overwrite ``self.vectors`` and return None;
                otherwise return a new Embedding sharing this vocabulary.
        """
        norms = self._nonzero(np.sqrt(np.sum(self.vectors**2, axis=1)))
        return self._store_or_wrap(self.vectors / norms[:, np.newaxis], replace)

    def length_normalize_dimensionwise(self, replace=True):
        """L2-normalize every column (dimension).

        Args:
            replace: If true, overwrite ``self.vectors`` and return None;
                otherwise return a new Embedding sharing this vocabulary.
        """
        norms = self._nonzero(np.sqrt(np.sum(self.vectors**2, axis=0)))
        return self._store_or_wrap(self.vectors / norms, replace)

    def L1_rowwise(self, replace=True):
        """L1-normalize every row so its absolute values sum to 1.

        Computed with numpy like the L2 methods, so the result is always
        assigned (or wrapped) instead of depending on an in-place update.

        Args:
            replace: If true, overwrite ``self.vectors`` and return None;
                otherwise return a new Embedding sharing this vocabulary.
        """
        norms = self._nonzero(np.abs(self.vectors).sum(axis=1))
        return self._store_or_wrap(self.vectors / norms[:, np.newaxis], replace)

    def L1_dimensionwwise(self, replace=True):
        """L1-normalize every column so its absolute values sum to 1.

        Args:
            replace: If true, overwrite ``self.vectors`` and return None;
                otherwise return a new Embedding sharing this vocabulary.
        """
        norms = self._nonzero(np.abs(self.vectors).sum(axis=0))
        return self._store_or_wrap(self.vectors / norms, replace)

    def mean_center(self, replace=True):
        """Subtract from every column the mean of that column.

        Args:
            replace: If true, overwrite ``self.vectors`` and return None;
                otherwise return a new Embedding sharing this vocabulary.
        """
        avg = np.mean(self.vectors, axis=0)
        return self._store_or_wrap(self.vectors - avg, replace)

    def mean_center_embeddingwise(self, replace=True):
        """Subtract from every row the mean of that row.

        Args:
            replace: If true, overwrite ``self.vectors`` and return None;
                otherwise return a new Embedding sharing this vocabulary.
        """
        avg = np.mean(self.vectors, axis=1)
        return self._store_or_wrap(self.vectors - avg[:, np.newaxis], replace)

    def export(self, path, printHeader=True):
        """Write the embedding to ``path`` as text.

        Each line has the form ``dog -0.190911 -0.0466989 ...``.

        Args:
            path: Destination file (overwritten).
            printHeader: If true, the first line holds the number of words
                and the vector length.
        """
        # Fetch once: the ``words`` property builds a new list on each access
        words = self.words
        vectors = self.vectors

        with open(path, 'w') as out:
            if printHeader:
                print('%d %d' % (len(self), self.dims), file=out)

            for i in tqdm(range(len(self))):
                print(words[i] + ' ' + ' '.join(['%.6g' % x for x in vectors[i]]), file=out)

    def save(self, file):
        """Placeholder: not implemented, does nothing and returns None."""
        # TODO: serialize with cPickle
        return
        

In [1]:
#Load_embeding.py
import pandas as pd
import numpy as np
import csv
from sys import stdout
from IPython.display import clear_output
import logging
from tqdm import tqdm
import io
from six import text_type   
import codecs

def load_embedding(path, format="text", vocabulary = None, length_normalize=True, normalize_dimensionwise = False, to_unicode=True, lower=False, path2='',dims_restriction=None, delete_duplicates=False, method_vgg = "delete"):
    """Load an embedding from disk and return it as an ``Embedding``.

    Args:
        path: File to read (required).
        format: ``"text"`` (text file, with or without header), ``"bin"``
            (word2vec binary file), ``"senna"``, ``"vgg"`` (image embeddings)
            or ``"DT_embeddings"``.
        vocabulary: ``None`` loads every word of the file. A collection of
            words restricts loading to those words; it is only applied by
            the ``"text"`` and ``"bin"`` readers.
        length_normalize: L2-normalize the rows of the loaded embedding.
        normalize_dimensionwise: L2-normalize the columns. When both
            normalizations are requested the column one is applied first.
        to_unicode: Convert the words to unicode.
        lower: Lower-case the words.
        path2: For ``"senna"`` and ``"DT_embeddings"``, ``path`` is the file
            with the words and ``path2`` the file with the vectors.
        dims_restriction: Integer ``i`` (vector length). For every line the
            last ``i`` fields are read as numbers and the preceding fields
            are concatenated into the word. Useful when words contain
            spaces or characters that are split like spaces.
        delete_duplicates: Keep only the first occurrence of every repeated
            word.
        method_vgg: Only for ``"vgg"``: ``"delete"`` keeps the first vector
            of a repeated word, ``"mean"`` averages the vectors of repeated
            words.

    Returns:
        The loaded ``Embedding``.

    Raises:
        ValueError: If ``format`` is not one of the supported values.
    """
    # A real exception instead of ``assert``: asserts are removed under -O
    if format not in ("text", "bin", "senna", "vgg", "DT_embeddings"):
        raise ValueError("Unrecognized format")

    if vocabulary is not None:
        unique_words = set(vocabulary)
        if len(unique_words) != len(vocabulary):
            logging.warning("Provided vocabulary has duplicates. IMPORTANT NOTE: The embedding that this function will return will not have duplicates.")
        # The readers test membership once per file line; a set keeps that
        # test constant-time even when the caller passed a list.
        vocabulary = unique_words

    if format == "text":
        vocab, matrix = from_TXT(path,vocabulary,dims_restriction)
    elif format == "bin":
        vocab, matrix = from_BIN(path,vocabulary)
    elif format == "senna":
        vocab, matrix = from_SENNA(path,path2)
    elif format == "vgg":
        vocab, matrix = from_vgg(path,method_vgg)
    else:
        vocab, matrix = from_DT_embeddings(path,path2)

    if delete_duplicates:
        # remove_duplicates deletes rows in place, which numpy arrays do not
        # support (from_BIN returns an array when no vocabulary is given).
        if isinstance(matrix, np.ndarray):
            matrix = list(matrix)
        remove_duplicates(vocab,matrix)

    vocabulary = Vocabulary(vocab,to_unicode,lower)
    e = Embedding(vocabulary=vocabulary,vectors = matrix)

    if normalize_dimensionwise:
        e.length_normalize_dimensionwise()

    if length_normalize:
        e.length_normalize()

    return e

def has_header(path, vocabulary=None):
    """Tell whether the first line of a text embedding looks like a header.

    The first line counts as a header when splitting it on single spaces
    gives exactly two fields.

    Args:
        path: File to inspect.
        vocabulary: Unused.

    Returns:
        1 if the first line has two fields, 0 otherwise.
    """
    with open(path) as handle:
        fields = handle.readline().split(' ')
    return 1 if len(fields) == 2 else 0

def remove_duplicates(words, vectors):
    """Drop repeated words, and their vectors, keeping the first occurrence.

    Both arguments are modified in place and must be lists of equal length.
    A warning is logged for every removed word.

    Args:
        words: List of words.
        vectors: List of vectors; ``vectors[i]`` belongs to ``words[i]``.

    Returns:
        None.
    """
    seen = set()
    keep = []
    dropped = []
    for idx, word in enumerate(words):
        if word in seen:
            dropped.append(idx)
        else:
            seen.add(word)
            keep.append(idx)

    if not dropped:
        return

    for idx in reversed(dropped):
        logging.warning("Word {} deleted".format((words[idx])))

    # Rebuild both lists in one pass instead of deleting item by item, which
    # shifts the tail of the list on every deletion.
    kept_words = [words[idx] for idx in keep]
    kept_vectors = [vectors[idx] for idx in keep]
    words[:] = kept_words
    vectors[:] = kept_vectors
    
    
    

def from_TXT(path, vocabulary=None, dims_restriction = None):
    """Read a text embedding (one ``word v1 v2 ...`` entry per line).

    Args:
        path: File to read.
        vocabulary: ``None`` to load every word, otherwise a container of
            the words to keep.
        dims_restriction: If given, the last ``dims_restriction`` fields of
            a line are the vector and all preceding fields are concatenated
            into the word; otherwise the first field is the word.

    Returns:
        ``(words, vectors)``: a list of words and a list of float32 arrays
        in the same order. Lines whose vector cannot be parsed are skipped
        with a warning.
    """
    words = []
    vectors = []

    # Call the helper: testing the bare function object is always true and
    # silently dropped the first word of header-less files.
    skip_header = has_header(path)

    with open(path) as f:
        if skip_header:
            next(f)
        for line_no, line in enumerate(f):
            l = line.split()
            if not l:
                # Blank line: nothing to read
                continue

            if not dims_restriction:
                word = l[0]
                values = l[1:]
            else:
                wi = len(l)-dims_restriction
                word = ''.join(l[0:wi])
                values = l[wi:]

            # Filter on the parsed word, i.e. the word that would be stored
            if vocabulary is not None and word not in vocabulary:
                continue

            # Parse before appending so that a bad line cannot leave a word
            # without its vector and misalign the two lists.
            try:
                vector = np.asarray(values).astype(np.float32)
            except ValueError:
                logging.warning("Line {}.Error reading the vector for the word {}... Word has been omitted".format(line_no,l[0:3]))
                continue

            words.append(word)
            vectors.append(vector)

    return words, vectors
            
    



def from_BIN(path,vocabulary = None):
    """Read a binary (word2vec style) embedding file.

    The first line holds the number of words and the vector length. Each
    entry is the word, a space, and the vector as raw float32 values.

    Args:
        path: File to read.
        vocabulary: ``None`` to load every word, otherwise a container of
            the words to keep.

    Returns:
        ``(words, vectors)``. ``vectors`` is a 2-D float32 array when
        ``vocabulary`` is None and a list of float32 arrays otherwise.

    Raises:
        ValueError: If the file ends in the middle of a word, or the number
            of words read does not match the expected count.
    """
    with io.open(path,'rb') as handle:
        words = []

        header = handle.readline()
        vocab_size, layer1_size = list(map(int, header.split()))
        vocab_size_aux = vocab_size

        if vocabulary is None:
            vectors = np.zeros((vocab_size, layer1_size), dtype=np.float32)
        else:
            vectors = []

        binary_len = np.dtype("float32").itemsize * layer1_size
        for row in tqdm(range(vocab_size)):
            chars = []
            while True:
                ch = handle.read(1)
                if not ch:
                    # End of file: without this check the loop never ends
                    raise ValueError("Unexpected end of file while reading word {} of {}".format(row + 1, vocab_size))
                if ch == b' ':
                    break
                if ch != b'\n':
                    chars.append(ch)

            w = b''.join(chars).decode("latin-1")

            if vocabulary is None:
                words.append(w)
                vectors[row, :] = np.frombuffer(handle.read(binary_len), dtype=np.float32)
            elif w in vocabulary:
                words.append(w)
                # frombuffer gives a read-only view of the bytes; copy it so
                # the stored vector is an ordinary writable array.
                vectors.append(np.frombuffer(handle.read(binary_len), dtype=np.float32).copy())
            else:
                vocab_size_aux-=1
                handle.read(binary_len)

        if len(words) != vocab_size_aux:
            raise ValueError("Header says that there are {} words, but {} were read".format(vocab_size_aux,len(words)))

        return words, vectors

    
    
def from_SENNA(path_words, path_vectors):
    """Read an embedding stored as two parallel text files.

    Args:
        path_words: File with one word per line (first field of each line).
        path_vectors: File with one vector per line.

    Returns:
        ``(words, vectors)``: a list of words and a list of float32 arrays.
    """
    with open(path_words) as word_file:
        words = [row.split()[0] for row in word_file]

    with open(path_vectors) as vector_file:
        vectors = [np.asarray(row.split()).astype(np.float32) for row in vector_file]

    return words, vectors

    
def from_vgg(path,method_vgg = "delete"):
    """Read a comma-separated embedding whose words may be repeated.

    The first column is the word and the remaining columns the vector.

    Args:
        path: CSV file without header.
        method_vgg: How to treat repeated words. ``"mean"`` (or its alias
            ``"average"``) returns the mean of all the vectors of the word;
            any other value keeps only the first vector.

    Returns:
        ``(words, vectors)``: the distinct words in order of first
        appearance and a list of float32 arrays.
    """
    data = pd.read_csv(path, sep=',', header=None)
    labels = data.iloc[:, 0].tolist()
    matrix = data.iloc[:, 1:].values.astype(np.float32)
    average = method_vgg in ("mean", "average")

    # word -> position in the output lists; replaces the linear list searches
    position = {}
    words = []
    totals = []
    counts = []
    for label, vector in zip(labels, matrix):
        slot = position.get(label)
        if slot is None:
            position[label] = len(words)
            words.append(label)
            # Sums are accumulated in float64 and cast back at the end
            totals.append(vector.astype(np.float64) if average else vector)
            counts.append(1)
        elif average:
            totals[slot] += vector
            counts[slot] += 1

    if average:
        # Sum / count is the true mean; halving a running value would weight
        # later duplicates more than earlier ones.
        vectors = [(total / count).astype(np.float32) for total, count in zip(totals, counts)]
    else:
        vectors = totals

    return words, vectors


def from_DT_embeddings(path_nodes, path_vectors):
    """Read an embedding split into a node file and a vector file.

    Each line of the node file has two fields: a tagged word (the text
    before the first ``/`` is the word) and a node id. The vector file
    starts with one line that is skipped; every other line is a node id
    followed by the vector.

    Args:
        path_nodes: File mapping tagged words to node ids.
        path_vectors: File with the vector of each node id.

    Returns:
        ``(words, vectors)``: a list of words and a list of float32 arrays.
    """
    id_to_word = {}
    with codecs.open(path_nodes, "r",encoding='utf-8', errors='ignore') as node_file:
        for row in node_file:
            tagged, node_id = row.split()
            id_to_word[node_id] = tagged.split('/')[0]

    words = []
    vectors = []
    with codecs.open(path_vectors, "r",encoding='utf-8', errors='ignore') as vector_file:
        next(vector_file)
        for row in vector_file:
            fields = row.split()
            vectors.append(np.asarray(fields[1:]).astype(np.float32))
            words.append(id_to_word[fields[0]])

    return words, vectors
            
            
        

In [5]:
#similarity.py
import scipy.stats
from tqdm import tqdm
import matplotlib.pyplot as plt

def calculate_cosine_simil(vector1, vector2):
    """Return the cosine similarity between two vectors.

    The dot product of the vectors is divided by the product of their
    Euclidean norms.
    """
    dot_product = np.dot(vector1, vector2)
    magnitude = np.linalg.norm(vector1) * np.linalg.norm(vector2)
    return dot_product / magnitude
    
    #if isNormalized:
    #    return np.dot(vector1,vector2)
    #else:
    #    return np.dot(vector1,vector2)/(np.linalg.norm(vector1)*np.linalg.norm(vector2))

def similarity_2_words(e, word1, word2, lower = False):
    """Return the cosine similarity between two words of an embedding.

    Args:
        e: Embedding used to look the words up.
        word1: First word.
        word2: Second word.
        lower: Passed to ``e.word_to_vector`` for both lookups.

    Returns:
        The cosine similarity, or None (after logging the missing word)
        when one of the words is not in the embedding.
    """
    found = []
    for token in (word1, word2):
        try:
            found.append(e.word_to_vector(token, lower))
        except KeyError:
            logging.critical("The word {} does not exits in the embeding".format(token))
            return None

    return calculate_cosine_simil(found[0], found[1])

    
    
def similarity_emd(embedding, X, gold, backoff_embs=None, lower = False):
    """Evaluate an embedding on a word-pair similarity dataset.

    Args:
        embedding: Embedding to evaluate.
        X: List of word pairs.
        gold: Reference similarity score of each pair.
        backoff_embs: List of embeddings. When a word of a pair is missing
            from ``embedding``, both words are taken from the first backoff
            embedding that contains them, tried in list order.
        lower: Passed to ``word_to_vector`` for every lookup.

    Returns:
        dict with ``coverage`` (fraction of pairs that could be scored),
        ``pearson`` and ``spearman`` (correlations between the gold scores
        and the computed similarities of the scored pairs).

    Raises:
        ZeroDivisionError: If ``gold`` is empty.
    """
    # The evaluated embedding is tried first, then the backoff ones in order
    candidates = [embedding]
    if backoff_embs is not None:
        candidates.extend(backoff_embs)

    results = []
    gold_scores = []
    oov = 0
    for pair_idx in tqdm(range(len(gold))):
        for emb in candidates:
            try:
                cos = calculate_cosine_simil(
                                         emb.word_to_vector(X[pair_idx][0],lower),
                                         emb.word_to_vector(X[pair_idx][1],lower))
            except KeyError:
                continue
            results.append(cos)
            gold_scores.append(gold[pair_idx])
            break
        else:
            # No embedding has both words. Counting here also covers an
            # empty backoff list, which used to leave the pair uncounted.
            oov+=1
            if backoff_embs is None:
                print(X[pair_idx])

    coverage = len(results)/(len(results) + oov)
    pearson = scipy.stats.pearsonr(gold_scores, results)[0]
    spearman = scipy.stats.spearmanr(gold_scores, results)[0]

    return{'coverage':coverage, 'pearson':pearson, 'spearman':spearman}

def average_similarity(embeddings, X, gold, weights = None, lower=False):
    """Evaluate the averaged similarity of several embeddings on a dataset.

    For every pair the cosine similarity is computed in each embedding that
    contains both words. Those values are combined with a plain mean, or
    with a weighted mean when ``weights`` is given.

    Args:
        embeddings: Embeddings to combine.
        X: List of word pairs.
        gold: Reference similarity score of each pair.
        weights: Optional weight per embedding.
        lower: Passed to ``word_to_vector`` for every lookup.

    Returns:
        dict with ``coverage``, ``pearson`` and ``spearman``.

    Raises:
        ValueError: If ``weights`` and ``embeddings`` differ in length.
    """
    weighted = weights is not None
    if weighted and len(embeddings)!=len(weights):
        raise ValueError("Embedding and weights must have the same length")

    results = []
    gold_scores = []
    oov = 0
    for pair_idx in tqdm(range(len(gold))):
        weighted_sum = 0
        weight_total = 0
        plain = []
        misses = 0
        for position, emb in enumerate(embeddings):
            try:
                cos = calculate_cosine_simil(
                                         emb.word_to_vector(X[pair_idx][0],lower),
                                         emb.word_to_vector(X[pair_idx][1],lower))
                if weighted:
                    weighted_sum += cos*weights[position]
                    weight_total += weights[position]
                else:
                    plain.append(cos)
            except KeyError:
                misses += 1

        # A pair is out of vocabulary only when every embedding lacks it
        if misses >= len(embeddings):
            oov += 1
            continue

        if weighted:
            results.append(weighted_sum/weight_total)
        else:
            results.append(np.mean(plain))
        gold_scores.append(gold[pair_idx])

    coverage = len(results)/(len(results) + oov)
    pearson = scipy.stats.pearsonr(gold_scores, results)[0]
    spearman = scipy.stats.spearmanr(gold_scores, results)[0]

    return{'coverage':coverage, 'pearson':pearson, 'spearman':spearman}



In [6]:
# Geometric mean of the absolute values. The builtin abs() does not accept a
# list (it raised "TypeError: bad operand type for abs(): 'list'"), so the
# element-wise np.abs is used instead.
scipy.stats.mstats.gmean(np.abs([-0.12312]))

In [7]:
# similarity datasets
from sklearn.datasets.base import Bunch
from six import iteritems
import pandas as pd
import csv
from pandas import Series, DataFrame

# Directory that holds every similarity dataset file (ends with a slash).
dataset_path = '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/SimilarityDataset/'


def _dataset_file(filename):
    """Return the full path of a file stored in ``dataset_path``."""
    return dataset_path + filename


# One path per dataset file.
Mturk287_path = _dataset_file('EN-MTurk-287.txt')
Mturk771_path = _dataset_file('EN-MTurk-771.txt')
mendev_path = _dataset_file('EN-MEN-LEM-DEV.txt')
mentest_path = _dataset_file('EN-MEN-LEM-TEST.txt')
men_path = _dataset_file('EN-MEN-LEM.txt')
WS353_all_path = _dataset_file('EN-WS353_all.txt')
WS353_relaredness_path = _dataset_file('EN-WSR353_relatedness.txt')
WS353_similarity_path = _dataset_file('EN-WSS353_similarity.txt')
WS353_set1_path = _dataset_file('EN-WS353-SET1.txt')
WS353_set2_path = _dataset_file('EN-WS353-SET2.txt')
RG65_path = _dataset_file('EN-RG-65.txt')
RW_path = _dataset_file('EN-RW.txt')
SIM999_path = _dataset_file('EN-SIM999.txt')
Verb143_path = _dataset_file('EN-VERB-143.txt')
MC30_path = _dataset_file('EN-MC-30.txt')
YP_130_path = _dataset_file('EN-YP-130.txt')
SimVerb3500_path = _dataset_file('EN-SimVerb-3500.txt')

def _read_similarity_rows(path, sep, header=None):
    """Read a delimited similarity file and return its rows as a 2-D array."""
    return pd.read_csv(path, sep=sep, header=header).values


def _read_men_rows(path):
    """Read a MEN file, cutting the last two characters off every non-float cell."""
    data = pd.read_csv(path, sep=" ", header=None)
    # presumably the two characters are a part-of-speech suffix on the
    # lemmas — verify against the dataset files
    data = data.apply(lambda x: [y if isinstance(y, float) else y[0:-2] for y in x])
    return data.values


def _split_rows(rows, score_column=2):
    """Return (word pairs as an object array, scores as a float array).

    The builtin ``float`` replaces ``np.float``, an alias of it that
    current NumPy releases no longer provide.
    """
    return rows[:, 0:2].astype("object"), rows[:, score_column].astype(float)


def get_MTurk287():
    """Load MTurk-287 (tab separated, no header); scores are multiplied by 2."""
    pairs, scores = _split_rows(_read_similarity_rows(Mturk287_path, "\t"))
    return Bunch(X=pairs, y=2 * scores)

def get_MTurk771():
    """Load MTurk-771 (space separated, no header); scores are multiplied by 2."""
    pairs, scores = _split_rows(_read_similarity_rows(Mturk771_path, " "))
    return Bunch(X=pairs, y=2 * scores)

def get_MENdev():
    """Load the MEN development split; scores are divided by 5."""
    pairs, scores = _split_rows(_read_men_rows(mendev_path))
    return Bunch(X=pairs, y= scores/ 5.0)

def get_MENtest():
    """Load the MEN test split; scores are divided by 5."""
    pairs, scores = _split_rows(_read_men_rows(mentest_path))
    return Bunch(X=pairs, y= scores/ 5.0)


def get_MENall():
    """Load the full MEN dataset; scores are divided by 5."""
    pairs, scores = _split_rows(_read_men_rows(men_path))
    return Bunch(X=pairs, y= scores/ 5.0)

def get_WS353_all():
    """Load WS353 (tab separated, first line is a header)."""
    pairs, scores = _split_rows(_read_similarity_rows(WS353_all_path, "\t", header=0))
    return Bunch(X=pairs, y= scores)

def get_WS353_relatedness():
    """Load the WS353 relatedness subset (tab separated, no header)."""
    pairs, scores = _split_rows(_read_similarity_rows(WS353_relaredness_path, "\t"))
    return Bunch(X=pairs, y= scores)

def get_WS353_similarity():
    """Load the WS353 similarity subset (tab separated, no header)."""
    pairs, scores = _split_rows(_read_similarity_rows(WS353_similarity_path, "\t"))
    return Bunch(X=pairs, y= scores)

def get_WS353_set1():
    """Load WS353 set 1 (tab separated, first line is a header)."""
    pairs, scores = _split_rows(_read_similarity_rows(WS353_set1_path, "\t", header=0))
    return Bunch(X=pairs, y= scores)

def get_WS353_set2():
    """Load WS353 set 2 (tab separated, first line is a header)."""
    pairs, scores = _split_rows(_read_similarity_rows(WS353_set2_path, "\t", header=0))
    return Bunch(X=pairs, y= scores)

def get_RG65():
    """Load RG-65 (tab separated, no header); scores are multiplied by 10/4."""
    pairs, scores = _split_rows(_read_similarity_rows(RG65_path, "\t"))
    return Bunch(X=pairs, y= scores * 10.0 / 4.0)

def get_RW():
    """Load RW (tab separated, no header)."""
    pairs, scores = _split_rows(_read_similarity_rows(RW_path, "\t"))
    return Bunch(X=pairs, y= scores)

def get_SimLex999():
    """Load SimLex-999 (tab separated, header line); the score is column 3."""
    pairs, scores = _split_rows(_read_similarity_rows(SIM999_path, "\t", header=0), score_column=3)
    return Bunch(X=pairs, y= scores)

def get_Verb143():
    """Load VERB-143 (tab separated, no header); scores are multiplied by 10."""
    pairs, scores = _split_rows(_read_similarity_rows(Verb143_path, "\t"))
    return Bunch(X=pairs, y= scores*10.0)

def get_MC30():
    """Load MC-30 (tab separated, no header); scores are multiplied by 10/4."""
    pairs, scores = _split_rows(_read_similarity_rows(MC30_path, "\t"))
    return Bunch(X=pairs, y= scores * 10.0 / 4.0)

def get_YP130():
    """Load YP-130 (space separated, no header); scores are multiplied by 10/4."""
    pairs, scores = _split_rows(_read_similarity_rows(YP_130_path, " "))
    return Bunch(X=pairs, y= scores * 10.0 / 4.0)

def get_SimVerb3500():
    """Load SimVerb-3500 (tab separated, no header)."""
    pairs, scores = _split_rows(_read_similarity_rows(SimVerb3500_path, "\t"))
    return Bunch(X=pairs, y= scores)



# Every dataset is loaded once, when this statement runs, in the order listed.
_dataset_loaders = (
    ("SimLex999", get_SimLex999),
    ("MTurk-287", get_MTurk287),
    ("MTurk-771", get_MTurk771),
    ("MEN_DEV", get_MENdev),
    ("MEN_TEST", get_MENtest),
    ("MEN_ALL", get_MENall),
    ("WS353_all", get_WS353_all),
    ("WS353_relatedness", get_WS353_relatedness),
    ("WS353_similarity", get_WS353_similarity),
    ("WS353_set1", get_WS353_set1),
    ("WS353_set2", get_WS353_set2),
    ("RG65", get_RG65),
    ("VERB-143", get_Verb143),
    ("MC-30", get_MC30),
    ("YP-130", get_YP130),
    ("SimVerb-3500", get_SimVerb3500),
    ("RW", get_RW),
)

# Dataset name -> loaded dataset (word pairs in ``X``, scores in ``y``).
datasets = {label: load() for label, load in _dataset_loaders}
    

def get_vocab_simil_all(lower=False):
    """Return the set of all words that appear in the loaded datasets.

    Args:
        lower: If true, every word is lower-cased.

    Returns:
        A set with the words of both columns of every dataset in
        ``datasets``.
    """
    collected = set()
    for bunch in datasets.values():
        collected.update(bunch.X[:, 0])
        collected.update(bunch.X[:, 1])

    if lower:
        collected = {token.lower() for token in collected}
    return collected

def get_dataset(dataset):
    """Load a similarity dataset by name.

    Args:
        dataset: Dataset name. Besides the original names, the keys used by
            the ``datasets`` dictionary for MEN (``MEN_ALL``, ``MEN_DEV``,
            ``MEN_TEST``) are accepted; ``MEN`` is the full MEN dataset.

    Returns:
        The object returned by the matching ``get_*`` loader.

    Raises:
        ValueError: If the name is not supported.
    """
    loaders = {
        'MTurk-287': get_MTurk287,
        'MTurk-771': get_MTurk771,
        'MEN': get_MENall,
        'MEN_ALL': get_MENall,
        'MEN_DEV': get_MENdev,
        'MEN_TEST': get_MENtest,
        'WS353_all': get_WS353_all,
        'WS353_relatedness': get_WS353_relatedness,
        'WS353_similarity': get_WS353_similarity,
        'WS353_set1': get_WS353_set1,
        'WS353_set2': get_WS353_set2,
        'RG65': get_RG65,
        'RW': get_RW,
        'VERB-143': get_Verb143,
        'MC-30': get_MC30,
        'YP-130': get_YP130,
        'SimVerb-3500': get_SimVerb3500,
        'SimLex999': get_SimLex999,
    }

    loader = loaders.get(dataset)
    if loader is None:
        raise ValueError("The dataset {} is not supported".format(dataset))
    return loader()
    
def evaluate_in_dataset(dataset,emb,backoff_embs=None,formatemb="text", normalize=True, to_unicode=True, lower=True, path2='', lowercase_dataset = False):
    """Evaluate an embedding on one similarity dataset.

    Args:
        dataset: Dataset name understood by ``get_dataset``.
        emb: An embedding object, or the path (str) of an embedding file,
            which is loaded restricted to the words of the dataset.
        backoff_embs: Backoff embeddings passed to ``similarity_emd``.
        formatemb: File format passed to ``load_embedding``.
        normalize: Length-normalize the loaded embedding.
        to_unicode: Passed to ``load_embedding``.
        lower: Passed to ``load_embedding``.
        path2: Passed to ``load_embedding``.
        lowercase_dataset: Lower-case the dataset words at lookup time.

    Returns:
        The result dict of ``similarity_emd``.
    """
    data = get_dataset(dataset)
    if isinstance(emb, str):
        dataset_words = set(np.append((data.X[:,0]),(data.X[:,1])))
        # load_embedding has no ``normalize`` parameter; its row
        # normalization switch is called ``length_normalize``.
        emb = load_embedding(emb, format=formatemb, vocabulary = dataset_words, length_normalize=normalize, to_unicode=to_unicode, lower=lower, path2=path2)

    return similarity_emd(emb, data.X, data.y, backoff_embs,lowercase_dataset)



def evaluate_in_dataset_avg(dataset, embs, weigths, lowercase_dataset=False):
    """Evaluate the averaged similarity of several embeddings on one dataset.

    Args:
        dataset: Dataset name understood by ``get_dataset``.
        embs: Embeddings to combine.
        weigths: Weight per embedding, or None for a plain mean (the
            parameter keeps its historical spelling).
        lowercase_dataset: Lower-case the dataset words at lookup time.

    Returns:
        The result dict of ``average_similarity``.
    """
    data = get_dataset(dataset)
    # Use the parameter as it is actually spelled; ``weights`` is undefined
    # in this function.
    return average_similarity(embs, data.X, data.y, weigths,lowercase_dataset)



    
def evaluate_on_all(emb,backoff_embs=None,formatemb="text", normalize=True, to_unicode=True, lower=True, path2='',lowercase_dataset=False):
    """Evaluate an embedding on every dataset of ``datasets``.

    Args:
        emb: An embedding object, or the path (str) of an embedding file,
            which is loaded restricted to the words of all the datasets.
        backoff_embs: Backoff embeddings passed to ``similarity_emd``.
        formatemb: File format passed to ``load_embedding``.
        normalize: Length-normalize the loaded embedding.
        to_unicode: Passed to ``load_embedding``.
        lower: Passed to ``load_embedding``.
        path2: Passed to ``load_embedding``.
        lowercase_dataset: Lower-case the dataset words at lookup time.

    Returns:
        One dict per dataset with the keys ``dataset``, ``coverage``,
        ``pearson`` and ``spearman``.
    """
    result = []

    if isinstance(emb, str):
        # The vocabulary helper is named get_vocab_simil_all, and
        # load_embedding's normalization switch is ``length_normalize``.
        emb = load_embedding(emb, format=formatemb, vocabulary = get_vocab_simil_all(), length_normalize=normalize, to_unicode=to_unicode, lower=lower, path2=path2)

    for name, data in iteritems(datasets):
        d = {'dataset':name}
        d.update(similarity_emd(emb, data.X, data.y, backoff_embs,lowercase_dataset))
        result = np.append(result, d)

    return result



def evaluate_on_all_avg(embs, weights=None,lowercase_dataset=False):
    """Evaluate the averaged similarity of several embeddings on every dataset.

    Args:
        embs: Embeddings to combine.
        weights: Optional weight per embedding.
        lowercase_dataset: Lower-case the dataset words at lookup time.

    Returns:
        One dict per dataset with the keys ``dataset``, ``coverage``,
        ``pearson`` and ``spearman``.
    """
    result = []
    for name, data in iteritems(datasets):
        row = {'dataset': name}
        scores = average_similarity(embs, data.X, data.y, weights, lowercase_dataset)
        row.update(scores)
        result = np.append(result, row)

    return result


def results_to_csv(res, correlation='spearman', printRes=True, returnRes=False):
    """Format evaluation results as two comma-terminated rows.

    Args:
        res: Iterable of result dicts (keys ``coverage`` and the chosen
            correlation).
        correlation: ``"spearman"`` or ``"pearson"``.
        printRes: Print the two rows.
        returnRes: Return the two rows.

    Returns:
        ``(correlation_row, coverage_row)`` when ``returnRes`` is true,
        otherwise None. Every value is followed by a comma.
    """
    assert correlation in ["spearman","pearson"], "Unrecognized Correlation method"

    score_cells = []
    coverage_cells = []
    for entry in res:
        score_cells.append(str(entry[correlation]) + ',')
        coverage_cells.append(str(entry['coverage']) + ',')
    txtRest = ''.join(score_cells)
    txtCov = ''.join(coverage_cells)

    if printRes:
        print(txtRest)
        print(txtCov)
    if returnRes:
        return txtRest,txtCov
    
def export_to_csv(txtResults,txtCov,name=None, filenameResults = 'Results.csv', filenameCoverage = 'Coverage.csv',delimiter=","):
    """Append one results row and one coverage row to their CSV files.

    Args:
        txtResults: Row of correlation values.
        txtCov: Row of coverage values.
        name: Optional label written, followed by a comma, before each row.
        filenameResults: File that receives ``txtResults``.
        filenameCoverage: File that receives ``txtCov``.
        delimiter: Unused.
    """
    if name:
        prefix = str(name) + ","
        txtResults = prefix + txtResults
        txtCov = prefix + txtCov

    for target, row in ((filenameResults, txtResults), (filenameCoverage, txtCov)):
        with open(target, 'a+') as handle:
            handle.write(str(row) + '\n')
    
        
    
        
    

In [7]:
from tqdm import tqdm
from annoy import AnnoyIndex
#import knn
#https://github.com/chrischoy/knn_cuda
#def k_nearest_GPU(emb,vector,k=10):
#    return knn.knn(emb.vectors, vector, k)

#https://github.com/spotify/annoy
def k_nearest_annoy(u, vector, k=10):
    """Return the ``k`` nearest items to ``vector`` reported by an index.

    Args:
        u: Index object exposing ``get_nns_by_vector``.
        vector: Query vector.
        k: Number of neighbours requested.

    Returns:
        Whatever ``u.get_nns_by_vector(vector, k)`` returns.
    """
    neighbour_ids = u.get_nns_by_vector(vector, k)
    return neighbour_ids

    
def generate_annoy(emb, n_trees=10, metric='angular'):
    """Build an Annoy index with one item per row of an embedding.

    Item ``i`` of the index is ``emb.vectors[i]``.

    Args:
        emb: Embedding to index.
        n_trees: Number of trees passed to ``build``.
        metric: Annoy distance metric. It is passed explicitly instead of
            relying on the library default.

    Returns:
        The built ``AnnoyIndex``.
    """
    t = AnnoyIndex(emb.dims, metric)
    for i in tqdm(range(len(emb))):
        t.add_item(i,emb.vectors[i])
    t.build(n_trees)

    return t

def nearest_cosine(emb,vector,k):
    """Return the first ``k`` words of ``emb`` ranked by ``calculate_cosine_simil``.

    All of ``emb.words`` is sorted in descending order of
    ``calculate_cosine_simil(vector, emb.word_to_vector(word))``.
    """
    def similarity_to_query(candidate):
        return calculate_cosine_simil(vector, emb.word_to_vector(candidate))

    ranked = sorted(emb.words, key=similarity_to_query, reverse=True)
    return ranked[:k]

    

        

In [None]:
# Fetch the vector N2 stores under the key '03629986-n' and show its first two components.
# N2 must already exist in the session (its loading line further down is commented out).
vec = N2.word_to_vector('03629986-n')
print(vec[0:2])

In [None]:
# Brute-force ranking: the 10 words of N1 that nearest_cosine places first for vec.
nearest_cosine(N1,vec,10)

In [None]:
# Build an Annoy index over all vectors of N1.
t = generate_annoy(N1)

In [None]:
# Query the index with the k_nearest_annoy(u, vector, k) form, which returns item indices,
# then print the N1 word stored at each index.
# NOTE(review): the later four-parameter k_nearest_annoy(u, emb, vector, k) would not accept this call.
i = k_nearest_annoy(t,vec)
for ind in i:
    print(N1.words[ind]+",")

In [None]:
# Load N1 from a machine-specific mounted path, with no length or dimension-wise normalization,
# delete_duplicates=True and dims_restriction=300.
N1 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/UKBrm.Synset-UKBr.Orto.TXT', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
# The matching load of N2 is disabled:
#N2 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/Synset.Synset-UKBr.Orto.TXT', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)


In [None]:
# Wall-clock timing of the sort-based lookup (get_top_cosine_sort) for the word 'cat'.
import time
start_time = time.time()
print(get_top_cosine_sort(N1.word_to_vector('cat'),N1,N1.words,10))
print("--- %s seconds ---" % (time.time() - start_time))


In [None]:
# Same timing for get_top_cosine (per-word cosine followed by nlargest).
start_time = time.time()
print(get_top_cosine(N1.word_to_vector('cat'),N1,10,N1.words))
print("--- %s seconds ---" % (time.time() - start_time))

In [None]:
# Rebuild the Annoy index over N1 before timing queries against it.
t = generate_annoy(N1)

In [None]:
# Timing of the Annoy lookup; this call uses the four-parameter
# k_nearest_annoy(u, emb, vector, k) form, which maps the indices back to words.
start_time = time.time()
print(k_nearest_annoy(t,N1,N1.word_to_vector('cat'),k=10))
print("--- %s seconds ---" % (time.time() - start_time))

In [None]:
def cos_cdist(matrix, vector):
    """
    Cosine similarity between ``vector`` and every row of ``matrix``.

    ``scipy``'s ``cdist(..., 'cosine')`` gives cosine distances; they are
    subtracted from 1, so larger values mean more similar. The result is
    flattened to one dimension with one entry per row of ``matrix``.
    """
    query_row = vector.reshape(1, -1)
    distances = scipy.spatial.distance.cdist(matrix, query_row, 'cosine')
    return 1 - distances.reshape(-1)

# Timing of the vectorised route: one cos_cdist call over all of N1.vectors,
# then the 10 best positions are translated to words through N1.words.
start_time = time.time()
cos = cos_cdist(N1.vectors,N1.word_to_vector('cat'))
index =  get_largest_index(cos,10)

top = []
for i in index:
    top.append(N1.words[i])

print(top)


print("--- %s seconds ---" % (time.time() - start_time))

In [None]:
# Words present in both N1 and N2, kept as a set.
u = set(generate_overlapping_vocab([N1,N2]))

In [None]:
# One Annoy index per embedding, restricted to the shared words: a[0] is for N1, a[1] for N2.
a = generate_annoy_embeddings([N1,N2], u)

In [None]:
# NOTE(review): annoy_array is not assigned at top level in the visible cells (the list built
# above is bound to `a`) — confirm this name exists in the session.
annoy_array[0].get_nns_by_vector(N2.word_to_vector('cat'),10)

In [None]:
# NOTE(review): a[0] was built from N1 (first element passed to generate_annoy_embeddings),
# but the returned indices are mapped through N2.words — confirm this mix is intended.
k_nearest_annoy(a[0],N2,N2.word_to_vector('door'),10)

In [None]:
# Raw item indices of the 10 neighbours of 'door' in the index built from N2.
index =  a[1].get_nns_by_vector(N2.word_to_vector('door'),10)

In [None]:


# Collect, per embedding, the vectors of the shared words in u.
# `vectors` is reset for each embedding and not used again inside this cell.
for emb in [N1,N2]:
    vectors = []
    for w in tqdm(u):
        vectors.append(emb.word_to_vector(w))
    
    

In [None]:
# Positions of the 10 largest entries of `cos` (same logic as get_largest_index).
from heapq import nlargest
n = nlargest(10, enumerate(cos), key=lambda x: x[1])
res_list = [x[0] for x in n]
res_list

In [None]:
# calculate_cosine_simil of 'cat' against every word of N1, as one array.
calculate_cosine_for_list(N1.word_to_vector('cat'),N1,N1.words)

In [None]:
# Single pairwise check: 'cat' against the vector stored at position 1 of N1.vectors.
calculate_cosine_simil(N1.word_to_vector('cat'),N1.vectors[1])

In [8]:
#New_emb_Combinations.py
from tqdm import tqdm
import numpy as np
from joblib import Parallel, delayed
import multiprocessing
from heapq import nlargest
from tqdm import tqdm
from sklearn.preprocessing import normalize
from annoy import AnnoyIndex

def normalize_vector(vector,norm='l2'):
    """Normalize one vector with the module-level ``normalize`` and the given ``norm``.

    The input is reshaped to rows of ``len(vector)`` columns before being
    passed to ``normalize``; the first row of the result is returned.
    """
    as_rows = np.asarray(vector).reshape(-1, len(vector))
    normalized = normalize(as_rows, norm=norm)
    return normalized[0]

def generate_overlapping_vocab(embs):
    """Return, as a list, the words found in every embedding of ``embs``.

    Starts from the word set of the first embedding and intersects it with
    the ``words`` of each following one. The order of the returned list is
    the iteration order of the final set.
    """
    common = set(embs[0].words)
    for other in embs[1:]:
        common = common.intersection(other.words)
    return list(common)
    #return set(embs[0].words).intersection(*embs.words)

    
def calculate_cosine_for_list(vector, emb, overlap_vocab):
    """Array of ``calculate_cosine_simil(vector, emb.word_to_vector(w))`` for each ``w``.

    The result has ``len(overlap_vocab)`` entries, in the order of
    ``overlap_vocab``, and uses the dtype of ``vector``.
    """
    similarities = (
        calculate_cosine_simil(vector, emb.word_to_vector(candidate))
        for candidate in overlap_vocab
    )
    return np.fromiter(similarities, vector.dtype, count=len(overlap_vocab))

    
    
def get_largest_index(list_cos,k):
    """Positions of the ``k`` largest values of ``list_cos``, best first.

    Fewer than ``k`` positions are returned when ``list_cos`` is shorter
    than ``k``.
    """
    def value_of(pair):
        return pair[1]

    best_pairs = nlargest(k, enumerate(list_cos), key=value_of)
    return [position for position, _ in best_pairs]


def get_top_cosine(vector,emb,k=10,overlap_vocab=None):
    """Return the ``k`` words of ``overlap_vocab`` that score highest against ``vector``.

    Scores come from ``calculate_cosine_for_list``. When ``overlap_vocab`` is
    None the whole vocabulary of ``emb`` is used and a warning is logged.
    """
    if overlap_vocab is None:
        overlap_vocab = emb.words
        logging.warning('No overlapping vocabulary, using the vocabulary of the embedding')

    best_positions = get_largest_index(
        calculate_cosine_for_list(vector, emb, overlap_vocab), k
    )
    return [overlap_vocab[position] for position in best_positions]
    

def get_top_cosine_sort(vector,emb,overlap_vocab,k=10):
    """Return up to ``k`` words of ``overlap_vocab`` ranked by similarity to ``vector``.

    Every word of ``emb`` is sorted in descending order of
    ``calculate_cosine_simil(vector, emb.word_to_vector(word))``; the ranking
    is then walked in order and words that belong to ``overlap_vocab`` are
    kept until ``k`` have been collected.

    Fix: the loop condition used to be ``len(top)<k & i<len(nearest)``. ``&``
    binds tighter than ``<``, so it was evaluated as the chained comparison
    ``len(top) < (k & i) < len(nearest)``, which is false on the first
    iteration (``k & 0 == 0``); the function therefore always returned ``[]``.
    """
    nearest = sorted(emb.words,key= lambda w: calculate_cosine_simil(vector,emb.word_to_vector(w)), reverse=True)

    # Membership is tested once per ranked word; use a set so each test is O(1).
    if isinstance(overlap_vocab, (set, frozenset)):
        allowed = overlap_vocab
    else:
        allowed = set(overlap_vocab)

    top = []
    for candidate in nearest:
        if len(top) >= k:
            break
        if candidate in allowed:
            top.append(candidate)
    return top


def cos_cdist(matrix, vector):
    """Cosine similarity between ``vector`` and each row of ``matrix``.

    Computed as 1 minus the cosine distance given by scipy's ``cdist``; the
    result is a flat array with one entry per row of ``matrix``.
    """
    query_row = vector.reshape(1, -1)
    distances = scipy.spatial.distance.cdist(matrix, query_row, 'cosine')
    return 1 - distances.reshape(-1)


def get_top_cosine_scipy(vector,emb,k=10,overlap_vocab=None, overlap_matrix = None):
    """Return the ``k`` words whose rows in ``overlap_matrix`` score highest against ``vector``.

    ``overlap_matrix[i]`` is expected to be the vector of ``overlap_vocab[i]``.
    When ``overlap_vocab`` is None, both the vocabulary and the matrix are
    taken from ``emb`` (any ``overlap_matrix`` passed in is replaced) and a
    warning is logged.
    """
    if overlap_vocab is None:
        overlap_vocab, overlap_matrix = emb.words, emb.vectors
        logging.warning('No overlapping vocabulary, using the vocabulary of the embedding')

    best_positions = get_largest_index(cos_cdist(overlap_matrix, vector), k)
    return [overlap_vocab[position] for position in best_positions]
    
    
    

def k_nearest_annoy(u,emb,vector,k=10):
    """Return the words of ``emb`` at the positions the index ``u`` reports for ``vector``.

    ``u.get_nns_by_vector(vector, k)`` supplies the positions; each one is
    looked up in ``emb.words``.
    """
    hits = u.get_nns_by_vector(vector, k)
    found = []
    for item in hits:
        found.append(emb.words[item])
    return found
    
def generate_annoy(emb):
    """Build an ``AnnoyIndex`` holding every vector of ``emb``.

    Item ``i`` of the index is ``emb.vectors[i]`` for ``i`` in
    ``range(len(emb.words))``; the index is built with 10 trees and returned.
    """
    index = AnnoyIndex(emb.dims)
    total = len(emb.words)
    for position in tqdm(range(total)):
        index.add_item(position, emb.vectors[position])
    index.build(10)

    return index

def generate_annoy_embeddings(embs, overlapping_vocab):
    """Build one ``AnnoyIndex`` per embedding, restricted to ``overlapping_vocab``.

    For every embedding, only the words that belong to ``overlapping_vocab``
    are added; each keeps its position in ``emb.words`` as item id, so ids
    returned by a query can be mapped back through ``emb.words``. Every index
    is built with 10 trees.

    Returns the indexes as a list, in the same order as ``embs``.
    """
    # overlapping_vocab is usually a list (see generate_overlapping_vocab);
    # testing membership against it for every word of every embedding is
    # quadratic, so convert it to a set once.
    if isinstance(overlapping_vocab, (set, frozenset)):
        allowed = overlapping_vocab
    else:
        allowed = set(overlapping_vocab)

    annoy_array = []

    for emb in embs:
        t = AnnoyIndex(emb.dims)
        for num, w in enumerate(emb.words):
            if w in allowed:
                t.add_item(num,emb.vectors[num])
        t.build(10)
        annoy_array.append(t)

    return annoy_array


def generate_overlapping_matrix(overlapping_vocab,emb):
    """List of ``emb.word_to_vector(w)`` for each ``w`` of ``overlapping_vocab``, in order."""
    return [emb.word_to_vector(shared_word) for shared_word in overlapping_vocab]

def generate_overlapping_matrix_embs(overlapping_vocab,embs):
    """One ``generate_overlapping_matrix`` result per embedding, in the order of ``embs``."""
    return [generate_overlapping_matrix(overlapping_vocab, emb) for emb in embs]

def generate_word(embedding,list_embs,word,overlapping_vocab=None,overlapping_matrix=None, annoy = None, number_of_words = 10, method = 'cosine'):
    """Approximate a vector for ``word`` in ``embedding`` from its neighbours elsewhere.

    The first embedding of ``list_embs`` that contains ``word`` supplies a
    query vector. The ``number_of_words`` nearest words to it, restricted to
    the vocabulary shared by all embeddings, are looked up in that same
    embedding; the result is the mean of the vectors those words have in
    ``embedding``.

    embedding: embedding for which the vector is produced.
    list_embs: embeddings searched for ``word``.
    overlapping_vocab: shared words; computed from ``list_embs`` when None.
    overlapping_matrix: per-embedding matrices of the shared words (only
        used by ``method='cosine'``); computed when None.
    annoy: per-embedding Annoy indexes (only used by ``method='knearest'``);
        computed when None.
    number_of_words: number of neighbours to average.
    method: ``'cosine'`` or ``'knearest'``.

    Returns the averaged vector, or None when ``word`` is in none of the
    embeddings or no neighbour is found.
    Raises ValueError when the embeddings share no word.

    Changes from the previous version:
    * the overlap matrix is built only for ``method='cosine'``. It used to be
      rebuilt on every call when ``method='knearest'``, because callers pass
      None in that mode.
    * an empty neighbour list now yields None instead of dividing by zero and
      returning a vector of NaN.
    """
    assert method in ["cosine","knearest"], "Concatenate: Unrecognized method"

    if overlapping_vocab is None:
        overlapping_vocab = generate_overlapping_vocab(list_embs)

    if len(overlapping_vocab) == 0:
        raise ValueError("There are no overlapping words between the embeddings")

    # Prepare only the structure the selected method actually reads.
    if method == 'cosine':
        if overlapping_matrix is None:
            overlapping_matrix = generate_overlapping_matrix_embs(overlapping_vocab,list_embs)
    elif annoy is None:
        annoy = generate_annoy_embeddings(list_embs,overlapping_vocab)

    # Search a vector for the word (the first embedding that contains it is used).
    vector = None
    emb_n = None
    emb_u = None

    for e_num, e in enumerate(list_embs):
        try:
            vector = e.word_to_vector(word)
        except KeyError:
            continue
        emb_n = e
        emb_u = e_num
        break

    if vector is None:
        logging.warning("Word {} not found in any embedding.".format(word))
        return None

    if method == 'cosine':
        top = get_top_cosine_scipy(vector,emb_n,number_of_words,overlapping_vocab,overlapping_matrix[emb_u])
    else:
        top = k_nearest_annoy(annoy[emb_u],emb_n,vector,number_of_words)

    if len(top)<number_of_words:
        logging.warning("Not enough words to generate a vector for the word {}, consider to modify the number_of_words parameter. Note: The vector will be generated with the available words".format(word))

    if len(top) == 0:
        # Nothing to average; callers already treat None as "word omitted".
        return None

    result = np.zeros(embedding.dims, dtype=np.float32)

    for w in top:
        result+=embedding.word_to_vector(w)

    return result/len(top)
        


    
def get_vector_concat(embs, word,weights=None, method="zeros",overlapping_vocab = None, overlapping_matrix = None, annoy=None,k=10, method_generate = 'cosine', normalize=False):
    """Concatenate the vectors ``word`` has in each embedding of ``embs``.

    Each piece is optionally passed through ``normalize_vector`` (when
    ``normalize`` is true) and then multiplied by ``weights[i]`` (when
    ``weights`` is given). When an embedding raises KeyError for ``word``:

    * ``method == "zeros"``: a float32 zero vector of that embedding's
      ``dims`` is used, without normalization or weighting;
    * ``method == "generate"``: ``generate_word`` supplies the piece, and
      None is returned if it cannot;
    * any other value: None is returned.

    Returns the concatenated vector, or None as described above.
    """
    def prepared(raw, position):
        # Shared post-processing for looked-up and generated pieces.
        piece = normalize_vector(raw) if normalize else raw
        if weights is not None:
            piece = piece * weights[position]
        return piece

    vector = []
    for position, emb in enumerate(embs):
        try:
            vector = np.append(vector, prepared(emb.word_to_vector(word), position), axis=0)
        except KeyError as err:
            if method == "zeros":
                vector = np.append(vector, np.zeros(shape=(emb.dims), dtype=np.float32))
                continue

            if method != "generate":
                return None

            vector_gen = generate_word(emb, embs, word, overlapping_vocab, overlapping_matrix, annoy, k, method_generate)
            if vector_gen is None:
                logging.warning("Word {} omitted.".format(word))
                return None

            vector = np.append(vector, prepared(vector_gen, position), axis=0)

    return vector

def get_vector_avg(embs,word,weights=None,method="ignore",overlapping_vocab = None, overlapping_matrix = None, annoy=None,k=10, method_generate = 'cosine', normalize=False, norm='l1'):
    """Average (optionally weighted) of the vectors ``word`` has across ``embs``.

    Each contribution is optionally passed through ``normalize_vector(...,
    norm)`` and multiplied by ``weights[i]``; the sum is divided by the number
    of contributions, or by the sum of their weights when ``weights`` is
    given. When an embedding raises KeyError for ``word``:

    * ``method == "skip"``: None is returned;
    * ``method == "generate"``: ``generate_word`` supplies the contribution,
      and None is returned if it cannot;
    * any other value: that embedding is left out of the average.

    Returns the averaged float32 vector, or None when the divisor is not
    positive (a warning is logged) or in the cases listed above.
    """
    def contribution(raw, position):
        # Returns (vector to add, amount to add to the divisor).
        piece = normalize_vector(raw, norm) if normalize else raw
        if weights is None:
            return piece, 1
        return piece * weights[position], weights[position]

    div = 0
    avg = np.zeros(embs[0].dims, dtype=np.float32)

    for position, emb in enumerate(embs):
        try:
            piece, amount = contribution(emb.word_to_vector(word), position)
            avg += piece
            div += amount
        except KeyError as err:
            if method == "skip":
                return None
            if method != "generate":
                continue

            vector_gen = generate_word(emb, embs, word, overlapping_vocab, overlapping_matrix, annoy, k, method_generate)
            if vector_gen is None:
                logging.warning("Word {} omitted.".format(word))
                return None

            piece, amount = contribution(vector_gen, position)
            avg += piece
            div += amount

    if not (div > 0):
        logging.warning("Word {} not found in any embedding.".format(word))
        return None

    return avg/div
    
                    
def concatenate_embeddings(embs, path='/home/concat.vec', vocabulary = None, weights=None, method="zeros",generate_method='cosine',k=10,normalize=False,where="file"):
    """Create an embedding whose vectors are the concatenation of those in ``embs``.

    embs: embeddings to combine.
    path: output file, used when ``where == "file"``.
    vocabulary: words to process; defaults to the union of all vocabularies.
        A warning is logged if a provided vocabulary has duplicates.
    weights, normalize: forwarded to ``get_vector_concat``.
    method: ``"zeros"``, ``"skip"`` or ``"generate"``; handling of words
        missing from an embedding (see ``get_vector_concat``).
    generate_method, k: neighbour search used by ``method="generate"``.
    where: ``"file"`` writes one ``word v1 v2 ...`` line per word to ``path``
        and returns True; any other accepted value returns an ``Embedding``.

    Words for which ``get_vector_concat`` returns None are skipped and
    counted. The root logger level is set to INFO before the summary is
    logged.
    """
    assert method in ["zeros","skip","generate"], "Concatenate: Unrecognized method"
    assert generate_method in ["cosine","knearest"], "Concatenate: Unrecognized generation method"
    assert where in ["file","return","generate"], "Concatenate: Unrecognized return method"

    if vocabulary is None:
        vocabulary = {w for e in embs for w in e.words}
    elif len(set(vocabulary)) != len(vocabulary):
        logging.warning("Provided vocabulary has duplicates. IMPORTANT NOTE: The new embedding WILL HAVE duplicates, you may want to check your vocabulary")

    # Only the structure needed by the chosen generation method is prepared.
    annoy = None
    overlapping_vocab = None
    overlapping_matrix = None
    if method == "generate":
        overlapping_vocab = generate_overlapping_vocab(embs)
        if generate_method == 'knearest':
            annoy = generate_annoy_embeddings(embs,overlapping_vocab)
        else:
            overlapping_matrix = generate_overlapping_matrix_embs(overlapping_vocab,embs)

    len_vectors = sum(e.dims for e in embs)
    num_words = 0
    word_ignored = 0
    to_file = where == "file"

    def build(w):
        return get_vector_concat(embs,w,weights,method,overlapping_vocab,overlapping_matrix,annoy,k,generate_method,normalize)

    if to_file:
        with open(path, 'w') as file:
            for w in tqdm(vocabulary):
                v = build(w)
                if v is None:
                    word_ignored+=1
                    logging.warning("Word {} ignored".format(w))
                    continue
                print(w + ' ' +' '.join(['%.6g' % x for x in v] ), file=file)
                num_words+=1
    else:
        vocab = []
        vectors = []
        for w in tqdm(vocabulary):
            v = build(w)
            if v is None:
                word_ignored+=1
                logging.warning("Word {} ignored".format(w))
                continue
            vocab.append(w)
            vectors.append(v)
            num_words+=1

    if word_ignored > 0:
        logging.warning("Ignored {} words of the combined vocabulary between the embeddings".format(word_ignored))

    logging.getLogger().setLevel(logging.INFO)
    logging.info("The new embedding has {} word and vectors have {} dimensions".format(num_words,len_vectors))

    if to_file:
        return True

    return Embedding(vocabulary=Vocabulary(words=vocab, lower = False), vectors=vectors)
    
def avg_embeddings(embs, path='/home/avg.vec', vocabulary = None, weights=None, method = "ignore",generate_method='cosine',k=10,normalize=False, normalize_norm='l2', where="file"):
    """Create an embedding whose vectors are the average of those in ``embs``.

    embs: embeddings to combine; all must have the same ``dims``.
    path: output file, used when ``where == "file"``.
    vocabulary: words to process; defaults to the union of all vocabularies.
        A warning is logged if a provided vocabulary has duplicates.
    weights, normalize, normalize_norm: forwarded to ``get_vector_avg``.
    method: ``"skip"``, ``"ignore"`` or ``"generate"``; handling of words
        missing from an embedding (see ``get_vector_avg``).
    generate_method, k: neighbour search used by ``method="generate"``.
    where: ``"file"`` writes one ``word v1 v2 ...`` line per word to ``path``
        and returns True; ``"return"`` returns an ``Embedding``.

    Raises ValueError when the embeddings differ in dimensionality.
    The root logger level is set to INFO before the summary is logged.

    Change from the previous version: the default vocabulary is built as a
    plain set of the embeddings' words, as ``concatenate_embeddings`` does.
    Repeated ``np.append`` recopied the whole array for each embedding and
    turned every word into a ``numpy.str_``.
    """
    assert method in ["skip","ignore","generate"], "Average: Unrecognized method"
    assert where in ["file","return"], "Average: Unrecognized return method"

    dims = embs[0].dims
    for e in embs:
        if e.dims!=dims:
            raise ValueError("All the embedding must have the same vector length. Found and embedding with {} dimensions and another one with {} dimensions".format(dims,e.dims))

    if vocabulary is None:
        vocabulary = {w for e in embs for w in e.words}
    elif len(set(vocabulary)) != len(vocabulary):
        logging.warning("Provided vocabulary has duplicates. IMPORTANT NOTE: The new embedding WILL HAVE duplicates, you may want to check your vocabulary")

    # Only the structure needed by the chosen generation method is prepared.
    annoy = None
    overlapping_vocab = None
    overlapping_matrix = None
    if method == "generate":
        overlapping_vocab = generate_overlapping_vocab(embs)
        if generate_method == 'knearest':
            annoy = generate_annoy_embeddings(embs,overlapping_vocab)
        else:
            overlapping_matrix = generate_overlapping_matrix_embs(overlapping_vocab,embs)

    num_words = 0
    word_ignored= 0

    if where == "file":
        with open(path, 'w') as file:
            for w in tqdm(vocabulary):
                r = get_vector_avg(embs,w,weights,method,overlapping_vocab,overlapping_matrix,annoy,k,generate_method,normalize,normalize_norm)
                if r is not None:
                    print(w + ' ' +' '.join(['%.6g' % x for x in r] ), file=file)
                    num_words+=1
                else:
                    word_ignored+=1
                    logging.warning("Word {} ignored".format(w))
    else:
        vocab = []
        vectors = []
        for w in tqdm(vocabulary):
            r = get_vector_avg(embs,w,weights,method,overlapping_vocab,overlapping_matrix,annoy,k,generate_method,normalize,normalize_norm)
            if r is not None:
                vocab.append(w)
                vectors.append(r)
                num_words+=1
            else:
                word_ignored+=1
                logging.warning("Word {} ignored".format(w))

    if word_ignored > 0:
        logging.warning("Ignored {} words of the combined vocabulary between the embeddings".format(word_ignored))

    logging.getLogger().setLevel(logging.INFO)
    logging.info("The new embedding has {} words and vectors have {} dimensions".format(num_words,dims))

    if where  == "file":
        return True

    return Embedding(vocabulary=Vocabulary(words=vocab, lower = False), vectors=vectors)


def generate_dictionary_for_vecmap(emb1, emb2, path, return_dict = False):
    """Write an identity dictionary (``word word`` per line) of the words shared by two embeddings.

    The shared words are the intersection of ``emb1.words`` and
    ``emb2.words``. Returns that set when ``return_dict`` is true, otherwise
    True.
    """
    first_vocab = emb1.words
    second_vocab = emb2.words
    shared = set(first_vocab).intersection(second_vocab)

    with open(path, 'w') as file:
        for entry in tqdm(shared):
            print(entry + ' ' + entry, file = file)

    return shared if return_dict else True
    
def generate_dictionary_vecmap_top_words(infile,outfile,frequency=False):
    """Write an identity dictionary (``word word`` per line) from a word list file.

    infile: text file to read.
    outfile: file to (over)write.
    frequency: when false, every line of ``infile`` is taken as one word;
        when true, only the first whitespace-separated field of each line is
        used (the remaining fields are discarded).

    Returns True.

    Fixes:
    * ``splitlines('\\t')`` passed a truthy ``keepends`` argument, so every
      word kept its trailing newline and each output entry was broken across
      two lines. ``splitlines()`` is now called without arguments.
    * in frequency mode a blank line raised IndexError; blank lines are now
      skipped.
    """
    with open(infile) as f:
        if not frequency:
            words = f.read().splitlines()
        else:
            words = []
            for line in f:
                fields = line.split()
                if fields:
                    words.append(fields[0])

    with open(outfile, 'w') as file:
        for w in tqdm(words):
            print(w + ' ' + w, file = file)

    return True


def generate_dictionary_emb_synset(infile,outfile):
    """Copy the two-field lines of ``infile`` to ``outfile``, trimming the second field.

    Only lines with exactly two whitespace-separated fields are kept. The
    first field is written unchanged; the second is written without its last
    two characters. Returns True.
    """
    pairs = []

    with open(infile) as f:
        for line in f:
            fields = line.split()
            if len(fields) != 2:
                continue
            pairs.append((fields[0], fields[1][0:-2]))

    with open(outfile, 'w+') as file:
        for position in tqdm(range(len(pairs))):
            word, synset = pairs[position]
            print(word + ' ' + synset, file = file)

    return True

In [9]:
import multiprocessing
import os

# Names shared between avg_embeddings_generate_multithread (which assigns them)
# and avg_batch_file (which reads them).
# NOTE: a `global` statement at module level binds nothing; these names only
# exist once something assigns them.
global list_embs
global overlapping_vocab
global list_vocabulary
global list_weights
global method_avg
global list_annoy
global k_avg
global generate_method_avg
global overlapping_matrix
import time
import datetime


def avg_batch_file(path,first,last):
    """Worker: write the averaged vectors of ``list_vocabulary[first:last]`` to ``path``.

    All settings are read from module-level globals (``list_embs``,
    ``list_weights``, ``method_avg``, ...). Words for which
    ``get_vector_avg`` returns None are left out. Whenever the word index is
    a multiple of 100, a progress line with an estimate of the remaining time
    is printed and the timer restarts.
    """
    global list_embs, overlapping_vocab, list_vocabulary, list_weights
    global method_avg, list_annoy, k_avg, generate_method_avg, overlapping_matrix

    with open(path, 'w') as file:
        start_time = time.time()
        for i in range(first,last):
            word = list_vocabulary[i]
            r = get_vector_avg(list_embs,word,list_weights,method_avg,overlapping_vocab,overlapping_matrix,list_annoy,k_avg,generate_method_avg)
            if r is not None:
                print(word + ' ' +' '.join(['%.6g' % x for x in r] ), file=file)

            if i%100 != 0:
                continue

            worker = str(multiprocessing.current_process())
            remaining = datetime.timedelta(seconds=(time.time() - start_time)/100*(last-i))
            print("Thread" + worker + ": " + str(i-first) + " of " + str(last-first) + " Time remaining: " + str(remaining))
            start_time = time.time()




def avg_embeddings_generate_multithread(embs, path='/home/avg', vocabulary = None, weights=None, method = "ignore",generate_method='cosine',k=10):
    """Average ``embs`` using several worker processes, one output file per worker.

    The vocabulary is split into consecutive batches; worker ``i`` runs
    ``avg_batch_file`` and writes its batch to ``path + str(i)``. Settings
    reach the workers through module-level globals assigned here.
    NOTE(review): this presumably relies on a fork-based start method so the
    children inherit those globals — confirm on the target platform.
    The function returns without waiting for the workers.

    embs: embeddings to combine; all must have the same ``dims``.
    path: prefix of the output files.
    vocabulary: words to process; defaults to the union of all vocabularies.
    weights, method, generate_method, k: as in ``avg_embeddings``.

    Raises ValueError when the embeddings differ in dimensionality.

    Fixes:
    * ``annoy`` was only assigned when ``method == "generate"``, so any other
      method raised UnboundLocalError; ``overlapping_matrix`` was likewise
      left stale or undefined.
    * the worker target was ``avg_batch``, a name that is not defined next to
      this function; the worker with the matching signature is
      ``avg_batch_file``.
    * ``cpu_count() - 1`` is 0 on a single-core machine, which caused a
      division by zero and no work being done; at least one worker is used.
    * the default vocabulary is built as a plain set instead of repeated
      ``np.append`` calls.
    """
    global list_embs
    global overlapping_vocab
    global list_vocabulary
    global list_weights
    global method_avg
    global list_annoy
    global k_avg
    global generate_method_avg
    global overlapping_matrix

    assert method in ["skip","ignore","generate"], "Average: Unrecognized method"

    dims = embs[0].dims
    for e in embs:
        if e.dims!=dims:
            raise ValueError("All the embedding must have the same vector length. Found and embedding with {} dimensions and another one with {} dimensions".format(dims,e.dims))

    if vocabulary is None:
        vocabulary = {w for e in embs for w in e.words}
    elif len(set(vocabulary)) != len(vocabulary):
        logging.warning("Provided vocabulary has duplicates. IMPORTANT NOTE: The new embedding WILL HAVE duplicates, you may want to check your vocabulary")

    # Defaults for every mode; only "generate" fills them in.
    annoy = None
    overlapping_vocab = None
    overlapping_matrix = None
    if method == "generate":
        overlapping_vocab = generate_overlapping_vocab(embs)
        if generate_method == 'knearest':
            annoy = generate_annoy_embeddings(embs,overlapping_vocab)
        else:
            overlapping_matrix = generate_overlapping_matrix_embs(overlapping_vocab,embs)

    list_vocabulary = list(vocabulary)
    list_embs = embs
    list_weights = weights
    method_avg = method
    list_annoy = annoy
    k_avg = k
    generate_method_avg = generate_method

    # Leave one core free, but always keep at least one worker.
    CPUs = max(1, multiprocessing.cpu_count()-1)

    batch = len(list_vocabulary) // CPUs
    batch_start = 0
    batch_end = batch_start + batch

    for process_idx in range(CPUs):
        if process_idx ==  CPUs-1:
            # The last worker also takes the remainder of the division.
            batch_end = len(list_vocabulary)

        name = path+str(process_idx)

        p = multiprocessing.Process(target=avg_batch_file, args=(name,batch_start,batch_end,))
        # Sets the CPU affinity of the current (parent) process right before
        # the child is started.
        os.system("taskset -p -c %d %d" % (process_idx % CPUs, os.getpid()))
        p.start()
        batch_start = batch_end
        batch_end = batch_end + batch
        

        
        
        
        

                          
    
    
    

In [10]:
# Names shared between merge_vocab_generator (which assigns them) and
# generate_batch (which reads them).
# NOTE: a `global` statement at module level binds nothing; these names only
# exist once something assigns them.
global embp
global list_embs
global overlapping_vocab
global list_vocabulary
global method_gen
global list_annoy
global k_gen
global overlapping_matrix



def generate_batch(path,first,last):
    """Worker: write a vector for each word of ``list_vocabulary[first:last]`` to ``path``.

    The vector comes from ``embp`` when it contains the word; on KeyError it
    is produced with ``generate_word``. Words for which no vector is obtained
    are logged and left out. All settings are read from module-level globals.
    Whenever the word index is a multiple of 100, a progress line with an
    estimate of the remaining time is printed and the timer restarts.
    """
    global embp, list_embs, overlapping_vocab, list_vocabulary
    global method_gen, list_annoy, k_gen, overlapping_matrix

    with open(path, 'w') as file:
        start_time = time.time()
        for i in range(first,last):
            word = list_vocabulary[i]
            try:
                vector = embp.word_to_vector(word)
            except KeyError as err:
                vector = generate_word(embp,list_embs,list_vocabulary[i],overlapping_vocab,overlapping_matrix,list_annoy,k_gen,method_gen)

            if vector is None:
                logging.warning("Word {} ignored".format(word))
            else:
                print(word + ' ' +' '.join(['%.6g' % x for x in vector] ), file=file)

            if i%100 != 0:
                continue

            worker = str(multiprocessing.current_process())
            remaining = datetime.timedelta(seconds=(time.time() - start_time)/100*(last-i))
            print("Thread" + worker + ": " + str(i-first) + " of " + str(last-first) + " Time remaining: " + str(remaining))
            start_time = time.time()
        
def merge_vocab_generator(emb,embs,path,vocab=None, method = 'cosine', k = 10):
    """Extend ``emb`` to a larger vocabulary using several worker processes.

    For every word of ``vocab``, a worker (``generate_batch``) writes the
    vector ``emb`` has for it, or one produced by ``generate_word`` from
    ``embs`` plus ``emb``. Worker ``i`` writes to ``path + str(i)``.
    Settings reach the workers through module-level globals assigned here.
    NOTE(review): this presumably relies on a fork-based start method so the
    children inherit those globals — confirm on the target platform.
    The function returns without waiting for the workers.

    emb: embedding to extend.
    embs: additional embeddings used to find neighbours.
    path: prefix of the output files.
    vocab: words to process; defaults to the union of all vocabularies.
    method: ``'cosine'`` or ``'knearest'``.
    k: number of neighbours averaged by ``generate_word``.

    Fixes:
    * the caller's ``embs`` list is no longer mutated (``emb`` used to be
      appended to it in place, so calling twice kept growing the list).
    * ``cpu_count() - 1`` is 0 on a single-core machine, which caused a
      division by zero; at least one worker is used.
    * the default vocabulary is built as a plain set instead of repeated
      ``np.append`` calls, and a no-op self-assignment was removed.
    """
    global embp
    global list_embs
    global overlapping_vocab
    global list_vocabulary
    global method_gen
    global list_annoy
    global k_gen
    global overlapping_matrix

    # Work on a copy so the argument passed by the caller stays untouched.
    embs = list(embs) + [emb]

    if vocab is None:
        vocab = {w for e in embs for w in e.words}

    overlapping_vocab = generate_overlapping_vocab(embs)

    if method == 'cosine':
        overlapping_matrix = generate_overlapping_matrix_embs(overlapping_vocab,embs)
    else:
        overlapping_matrix = None

    if method == 'knearest':
        annoy = generate_annoy_embeddings(embs,overlapping_vocab)
    else:
        annoy = None

    embp = emb
    list_embs = embs

    list_vocabulary = list(set(vocab))
    method_gen = method
    list_annoy = annoy
    k_gen = k

    # Leave one core free, but always keep at least one worker.
    CPUs = max(1, multiprocessing.cpu_count()-1)

    batch = len(list_vocabulary) // CPUs
    batch_start = 0
    batch_end = batch_start + batch

    for process_idx in range(CPUs):
        if process_idx ==  CPUs-1:
            # The last worker also takes the remainder of the division.
            batch_end = len(list_vocabulary)

        name = path+str(process_idx)

        p = multiprocessing.Process(target=generate_batch, args=(name,batch_start,batch_end,))
        # Sets the CPU affinity of the current (parent) process right before
        # the child is started.
        os.system("taskset -p -c %d %d" % (process_idx % CPUs, os.getpid()))
        p.start()
        batch_start = batch_end
        batch_end = batch_end + batch

                    
                        

In [11]:
# Run generate_dictionary_emb_synset on a local dictionary file; both paths are machine-specific.
generate_dictionary_emb_synset('/home/iker/Escritorio/wnet30_dict.txt','/home/iker/Escritorio/wnet30_dict_filtered.txt')

100%|██████████| 120433/120433 [00:00<00:00, 771821.71it/s]


True

In [12]:
#auto_eval_scrips.py
from copy import deepcopy
import itertools
import datetime
import psutil
import sys
import os

def test_normalization(path,embformat='txt', dims_restriction = None, delete_duplicates = False, lowercase_datasets=False):
    """Evaluate one embedding file under a series of normalization recipes.

    For every recipe a banner naming it is printed, followed by the rows
    printed by ``results_to_csv(evaluate_on_all(...))``.

    path, embformat, dims_restriction, delete_duplicates: forwarded to
        ``load_embedding``.
    lowercase_datasets: forwarded to ``evaluate_on_all`` as
        ``lowercase_dataset``.

    The embedding is reloaded from ``path`` several times with different
    ``length_normalize`` / ``normalize_dimensionwise`` flags; inside each
    group a deep copy of the freshly loaded matrix is kept so that every
    variant can start again from the same state.

    NOTE(review): the normalization methods called on ``E`` and ``PPA`` are
    defined elsewhere; the in-line comments assume the ``E`` methods modify
    ``E.vectors`` in place — confirm.

    Returns True.
    """
    # --- Group 1: no normalization at load time ---
    E = load_embedding(path, format=embformat, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, dims_restriction=dims_restriction, delete_duplicates = delete_duplicates)

    print('============ORIGINAL==========')
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))


    print('============Mean center EMB==========')
    E.mean_center_embeddingwise()
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    del E

    # Banner text is Spanish for "L1 by columns"; the embedding is reloaded first.
    print('============L1 por columnas==========')
    E = load_embedding(path, format=embformat, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, dims_restriction=dims_restriction, delete_duplicates = delete_duplicates)
    E.L1_dimensionwwise()
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))
    del E


    # --- Group 2: loaded with length_normalize=True; snapshot kept for resets ---
    E = load_embedding(path, format=embformat, vocabulary = None, length_normalize = True, normalize_dimensionwise=False, dims_restriction=dims_restriction, delete_duplicates = delete_duplicates)
    originalmatrix = deepcopy(E.vectors)

    print('============L2 rowwise + Mean Center==========')
    E.mean_center()
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    print('============L2 rowwise + PPA==========')
    # Restore the snapshot before applying the next variant.
    del E.vectors
    E.vectors = deepcopy(originalmatrix)
    E.vectors = PPA(E.vectors)
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    print('============L2 rowwise + L2 dimensionwise==========')
    del E.vectors
    E.vectors = deepcopy(originalmatrix)
    E.length_normalize_dimensionwise()
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    print('============L2 rowwise + L2 dimensionwise + PPA==========')
    del E.vectors
    E.vectors = deepcopy(originalmatrix)
    E.length_normalize_dimensionwise()
    E.vectors = PPA(E.vectors)
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    del originalmatrix
    del E

    # --- Group 3: loaded with normalize_dimensionwise=True ---
    E = load_embedding(path, format=embformat, vocabulary = None, length_normalize = False, normalize_dimensionwise=True, dims_restriction=dims_restriction, delete_duplicates = delete_duplicates)
    originalmatrix = deepcopy(E.vectors)

    print('============L2 dimensionwise==========')
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    print('============L2 dimensionwise + Mean Center==========')
    E.mean_center()
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    print('============L2 dimensionwise + PPA==========')
    del E.vectors
    E.vectors = deepcopy(originalmatrix)
    E.vectors = PPA(E.vectors)
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    del originalmatrix
    del E

    # --- Group 4: mean-centered right after loading; snapshot taken after centering ---
    E = load_embedding(path, format=embformat, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, dims_restriction=dims_restriction, delete_duplicates = delete_duplicates)
    E.mean_center()
    originalmatrix = deepcopy(E.vectors)

    print('============Mean center==========')
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    print('============ Mean Center + L2 dimensionwise ==========')
    E.length_normalize_dimensionwise()
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    print('============Mean Center + PPA==========')
    del E.vectors
    E.vectors = deepcopy(originalmatrix)
    E.vectors = PPA(E.vectors)
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    print('============ Mean Center + L2 rowwise + L2 dimensionwise ==========')
    del E.vectors
    E.vectors = deepcopy(originalmatrix)
    E.length_normalize()
    E.length_normalize_dimensionwise()
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    del originalmatrix
    del E

    # --- Group 5: PPA applied right after loading; snapshot taken after PPA ---
    E = load_embedding(path, format=embformat, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, dims_restriction=dims_restriction, delete_duplicates = delete_duplicates)
    E.vectors = PPA(E.vectors)
    originalmatrix = deepcopy(E.vectors)

    print('============ PPA  ==========')
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    print('============ PPA + L2 dimensionwise ==========')
    E.length_normalize_dimensionwise()
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    print('============ PPA + Mean Center ==========')
    del E.vectors
    E.vectors = deepcopy(originalmatrix)
    E.mean_center()
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    print('============ PPA + L2 rowwise + L2 dimensionwise ==========')
    del E.vectors
    E.vectors = deepcopy(originalmatrix)
    E.length_normalize()
    E.length_normalize_dimensionwise()
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    del originalmatrix
    del E
    # --- Group 6: both normalization flags enabled at load time, then mean-centered ---
    print('============ L2 rowwise + L2 dimensionwise + Mean center ==========')
    E = load_embedding(path, format=embformat, vocabulary = None, length_normalize = True, normalize_dimensionwise=True, dims_restriction=dims_restriction, delete_duplicates = delete_duplicates)
    E.mean_center()
    results_to_csv(evaluate_on_all(E,lowercase_dataset=lowercase_datasets))

    del E

    return True


def test_similarity_auto(embs,names,w):
    """Evaluate ``embs`` with ``evaluate_on_all_avg`` and export the scores.

    Args:
        embs: Embeddings handed to ``evaluate_on_all_avg``.
        names: Label parts. All entries but the last are joined with ``+``;
            the last entry is appended after a comma (callers in this file
            pass a quoted weight string in that position).
        w: Weights; converted with ``np.array`` before being passed on.
    """
    # "A+B+C,<last>"; a single entry gives ",<entry>", no entries give "".
    if len(names) == 0:
        label = ''
    else:
        label = '+'.join(str(part) for part in names[:-1]) + ',' + str(names[-1])

    scores = evaluate_on_all_avg(embs, lowercase_dataset=True, weights=np.array(w))
    txt_results, txt_coverage = results_to_csv(scores, printRes=False, returnRes=True)
    export_to_csv(txtResults=txt_results, txtCov=txt_coverage, name=str(label))

    
def test_concatenate_auto(embs,names,w,normalize=True):
    """Concatenate ``embs`` twice (``normalize=True``, then ``False``) and export both evaluations.

    Args:
        embs: Embeddings handed to ``concatenate_embeddings``.
        names: Label parts. All entries but the last are joined with ``+``;
            the last entry is appended after a comma.
        w: Weights; converted with ``np.array`` before being passed on.
        normalize: Not read by this function; both settings are always run.
    """
    # "A+B+C,<last>"; a single entry gives ",<entry>", no entries give "".
    if len(names) == 0:
        label = ''
    else:
        label = '+'.join(str(part) for part in names[:-1]) + ',' + str(names[-1])

    # (normalize flag, results file, coverage file) for each of the two runs.
    runs = (
        (True, 'L2Concat_REDO.csv', 'L2ConcatCoverage_REDO.csv'),
        (False, 'Concat_REDO.csv', 'ConcatCoverage_REDO.csv'),
    )
    for normalized, results_file, coverage_file in runs:
        # NOTE(review): ``dataset_min`` is not a parameter or local here, so it
        # must exist as a module-level name when this runs -- confirm.
        combined = concatenate_embeddings(
            embs,
            path='/home/concat.vec',
            vocabulary=dataset_min,
            weights=np.array(w),
            method="generate",
            generate_method='cosine',
            k=10,
            normalize=normalized,
            where="return",
        )
        txt_results, txt_coverage = results_to_csv(
            evaluate_on_all(combined, lowercase_dataset=True),
            printRes=False,
            returnRes=True,
        )
        export_to_csv(
            txtResults=txt_results,
            txtCov=txt_coverage,
            name=str(label),
            filenameResults=results_file,
            filenameCoverage=coverage_file,
        )
        # Drop the combined embedding before the next one is built.
        del combined

    
    
def test_average_auto(embs,names,w,normalize=True):
    """Average ``embs`` twice (``normalize=True``, then ``False``) and export both evaluations.

    Args:
        embs: Embeddings handed to ``avg_embeddings``.
        names: Label parts. All entries but the last are joined with ``+``;
            the last entry is appended after a comma.
        w: Weights; converted with ``np.array`` before being passed on.
        normalize: Not read by this function; both settings are always run.
    """
    # "A+B+C,<last>"; a single entry gives ",<entry>", no entries give "".
    if len(names) == 0:
        label = ''
    else:
        label = '+'.join(str(part) for part in names[:-1]) + ',' + str(names[-1])

    # (normalize flag, results file, coverage file) for each of the two runs.
    runs = (
        (True, 'L2AVG_REDO.csv', 'L2AVGCoverage_REDO.csv'),
        (False, 'AVG_REDO.csv', 'AVGCoverage_REDO.csv'),
    )
    for normalized, results_file, coverage_file in runs:
        # NOTE(review): ``dataset_min`` is not a parameter or local here, so it
        # must exist as a module-level name when this runs -- confirm.
        averaged = avg_embeddings(
            embs,
            path='/home/concat.vec',
            vocabulary=dataset_min,
            weights=np.array(w),
            method="generate",
            generate_method='cosine',
            k=10,
            normalize=normalized,
            where="return",
        )
        txt_results, txt_coverage = results_to_csv(
            evaluate_on_all(averaged, lowercase_dataset=True),
            printRes=False,
            returnRes=True,
        )
        export_to_csv(
            txtResults=txt_results,
            txtCov=txt_coverage,
            name=str(label),
            filenameResults=results_file,
            filenameCoverage=coverage_file,
        )
        # Drop the averaged embedding before the next one is built.
        del averaged

    
def _distinct_orderings(weights):
    """Return every distinct ordering of ``weights`` as a list of tuples.

    ``itertools.permutations`` treats equal values at different positions as
    different elements, so a weight list with repeated values (for example
    ``[2, 1, 1]``) produces the same tuple several times. Each tuple is kept
    once, in the order in which it is first produced.
    """
    seen = set()
    distinct = []
    for ordering in itertools.permutations(weights):
        if ordering not in seen:
            seen.add(ordering)
            distinct.append(ordering)
    return distinct


def test_similarity_avg():
    """Run ``test_similarity_auto`` over combinations of the eight embeddings.

    Eight embeddings are loaded, then every combination of 2 to 8 of them is
    passed to ``test_similarity_auto`` with a set of weight vectors:

    * pairs use the fixed weights ``[1,1]``, ``[2,1]`` and ``[1,2]``;
    * larger groups use uniform weights followed by every distinct ordering
      of the weight patterns listed in ``weight_patterns``.

    Orderings that are identical because a pattern repeats a value are run
    only once.
    """
    dataset_min = get_vocab_simil_all(True)

    GLOVE = load_embedding(GLOVE_CC_840_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=True, delete_duplicates=True, dims_restriction=300)
    W2V = load_embedding(W2V_path, vocabulary = dataset_min, format='bin', length_normalize = False, normalize_dimensionwise=False)
    FT = load_embedding(FastText_CC_path, vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    jointcHYB = load_embedding(jointcHYB_path, vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    UKB = load_embedding(UKB_path, vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    LEXVEC = load_embedding(lexvec, vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    SKE = load_embedding(SketchEngine_web_path, vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=100)
    PDC = load_embedding(PDC_path, vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)

    embs = [GLOVE,W2V,FT,jointcHYB,UKB,LEXVEC,SKE,PDC]
    names = ['GLOVE','W2V','FT','jointcHYB','UKB','LEXVEC','SKE','PDC']

    def run(indices, w, tag=None):
        # One experiment: the selected embeddings, their names plus a quoted
        # weight tag (used as the last label part), and the weights.
        if tag is None:
            tag = '"' + str(np.array(w)) + '"'
        test_similarity_auto([embs[i] for i in indices],
                             [names[i] for i in indices] + [tag],
                             w)

    positions = range(len(names))

    # Two at a time: fixed weights with hand-written tags.
    pair_weights = (('"[1,1]"', [1, 1]), ('"[2,1]"', [2, 1]), ('"[1,2]"', [1, 2]))
    for pair in itertools.combinations(positions, 2):
        for tag, w in pair_weights:
            run(pair, w, tag)

    # Group size -> weight patterns whose orderings are tried after the
    # uniform weights.
    weight_patterns = {
        3: [[1, 2, 3], [2, 1, 1], [3, 1, 1], [2, 2, 1]],
        4: [[1, 2, 3, 4], [3, 1, 1, 1], [2, 1, 1, 1], [2, 2, 1, 1]],
        5: [[1, 2, 3, 4, 5], [3, 1, 1, 1, 1], [2, 1, 1, 1, 1],
            [2, 2, 1, 1, 1], [3, 2, 2, 1, 1]],
        6: [[1, 2, 3, 4, 5, 6], [3, 1, 1, 1, 1, 1], [2, 1, 1, 1, 1, 1],
            [2, 2, 2, 2, 1, 1]],
        7: [[1, 2, 3, 4, 5, 6, 7], [3, 1, 1, 1, 1, 1, 1],
            [2, 1, 1, 1, 1, 1, 1], [2, 2, 2, 2, 1, 1, 1]],
        8: [[1, 2, 3, 4, 5, 6, 7, 8], [3, 1, 1, 1, 1, 1, 1, 1],
            [2, 1, 1, 1, 1, 1, 1, 1], [2, 2, 2, 2, 1, 1, 1, 1],
            [3, 2, 2, 1, 1, 1, 1, 1], [4, 4, 2, 2, 1, 1, 1, 1]],
    }

    # Three at a time up to all eight. Sizes are processed in increasing
    # order and combinations in lexicographic order of position.
    for size in sorted(weight_patterns):
        # The weight vectors depend only on the group size, so build them
        # once per size instead of once per combination.
        weight_vectors = [[1] * size]
        for pattern in weight_patterns[size]:
            weight_vectors.extend(_distinct_orderings(pattern))

        for combo in itertools.combinations(positions, size):
            for w in weight_vectors:
                run(combo, w)
 





def equal_dims(embs):
    """Return True when every item in ``embs`` has the same ``dims`` as the first.

    ``embs`` must be non-empty: the first item is read unconditionally.
    """
    reference = embs[0].dims
    return not any(emb.dims != reference for emb in embs)

def test_concat_avg():
    """Run the concatenation and averaging experiments over embedding combinations.

    Eight embeddings are loaded with ``vocabulary=None``. Then:

    * every pair is passed to ``test_concatenate_auto`` with five weight
      settings and, when both embeddings report the same ``dims``, to
      ``test_average_auto`` with three weight settings;
    * every combination of 3 to 7 embeddings is passed to
      ``test_concatenate_auto`` with uniform weights and, when
      ``equal_dims`` holds, to ``test_average_auto``;
    * all eight together are passed to ``test_concatenate_auto`` only.
    """
    # Local import: this function is the only user of ``combinations`` here.
    from itertools import combinations

    GLOVE = load_embedding(GLOVE_CC_840_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=True, delete_duplicates=True, dims_restriction=300)
    W2V = load_embedding(W2V_path, vocabulary = None, format='bin', length_normalize = False, normalize_dimensionwise=False)
    FT = load_embedding(FastText_CC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    jointcHYB = load_embedding(jointcHYB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    UKB = load_embedding(UKB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    LEXVEC = load_embedding(lexvec, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    SKE = load_embedding(SketchEngine_web_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=100)
    PDC = load_embedding(PDC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)

    embs = [GLOVE,W2V,FT,jointcHYB,UKB,LEXVEC,SKE,PDC]
    names = ['GLOVE','W2V','FT','jointcHYB','UKB','LEXVEC','SKE','PDC']

    positions = range(len(names))

    # Two at a time: fixed weights with hand-written tags.
    concat_pair_weights = (
        ('"[1,1]"', [1, 1]),
        ('"[2,1]"', [2, 1]),
        ('"[1,2]"', [1, 2]),
        ('"[8,1]"', [8, 1]),
        ('"[1,8]"', [1, 8]),
    )
    average_pair_weights = (
        ('"[1,1]"', [1, 1]),
        ('"[2,1]"', [2, 1]),
        ('"[1,2]"', [1, 2]),
    )
    for x, y in combinations(positions, 2):
        for tag, w in concat_pair_weights:
            test_concatenate_auto([embs[x], embs[y]], [names[x], names[y], tag], w)

        # Averaging is only attempted when both embeddings report equal dims.
        if embs[x].dims == embs[y].dims:
            for tag, w in average_pair_weights:
                test_average_auto([embs[x], embs[y]], [names[x], names[y], tag], w)

    # Three to seven at a time: uniform weights only. Combinations come in
    # lexicographic order of position.
    for size in range(3, 8):
        w = [1] * size
        tag = '"' + str(np.array(w)) + '"'
        for combo in combinations(positions, size):
            test_concatenate_auto([embs[i] for i in combo],
                                  [names[i] for i in combo] + [tag],
                                  w)
            if equal_dims([embs[i] for i in combo]):
                test_average_auto([embs[i] for i in combo],
                                  [names[i] for i in combo] + [tag],
                                  w)

    # All eight: concatenation only.
    w = [1,1,1,1,1,1,1,1]
    test_concatenate_auto(embs, list(names) + ['"' + str(np.array(w)) + '"'], w)

from copy import deepcopy
def test_reduction(embs, name):
    """Concatenate ``embs`` and export the result as ``<export dir><name>.vec``.

    The concatenation is requested with ``method="zeros"``,
    ``normalize=False`` and ``where="return"``; the returned object's
    ``export`` method writes the file. No evaluation is done here.

    Args:
        embs: Embeddings handed to ``concatenate_embeddings``.
        name: File name (without extension) appended to the export directory.

    Returns:
        True.
    """
    export_dir = '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/ConcatenatedNoL2/'
    destination = export_dir + name

    merged = concatenate_embeddings(
        embs,
        path='/home/concat.vec',
        vocabulary=None,
        weights=None,
        method="zeros",
        generate_method='cosine',
        k=10,
        normalize=False,
        where="return",
    )
    # Drop this function's reference to the inputs; the caller may still hold its own.
    del embs

    merged.export(destination + '.vec')
    del merged

    return True

def add__reduction():
    """Pair jointcHYB with GLOVE, FT, LEXVEC and W2V in turn and pass each pair to ``test_reduction``.

    Each partner embedding is loaded just before its pair is processed and
    deleted right after; jointcHYB is loaded once and kept until the end.

    Returns:
        True.
    """
    # GLOVE is a local of this function (it is deleted below), so it must be
    # bound here before the first test_reduction call reads it.
    GLOVE = load_embedding(GLOVE_CC_840_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=True, delete_duplicates=True, dims_restriction=300)
    jointcHYB = load_embedding(jointcHYB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)

    test_reduction([GLOVE,jointcHYB],'GLOVE + jointcHYB')
    del GLOVE

    FT = load_embedding(FastText_CC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    test_reduction([FT,jointcHYB],'FT + jointcHYB')
    del FT

    LEXVEC = load_embedding(lexvec, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    test_reduction([LEXVEC,jointcHYB],'LEXVEC + jointcHYB')
    del LEXVEC

    W2V = load_embedding(W2V_path, vocabulary = None, format='bin', length_normalize = False, normalize_dimensionwise=False)
    test_reduction([W2V,jointcHYB],'W2V + jointcHYB')
    del jointcHYB
    del W2V

    return True
    
    

def test_dim_reduction():
    """Pass six embedding combinations, one after another, to ``test_reduction``.

    For each combination the embeddings are loaded from disk, handed to
    ``test_reduction`` under a label made of their names joined with
    ``" + "``, and released before the next combination is loaded.

    Returns:
        True.
    """
    def load_text(path, dimensionwise=False):
        # Shared settings of every non-binary embedding used below.
        return load_embedding(path, vocabulary=None, length_normalize=False,
                              normalize_dimensionwise=dimensionwise,
                              delete_duplicates=True, dims_restriction=300)

    # Name -> zero-argument loader; nothing is read until a loader is called.
    loaders = {
        'GLOVE': lambda: load_text(GLOVE_CC_840_path, dimensionwise=True),
        'jointcHYB': lambda: load_text(jointcHYB_path),
        'FT': lambda: load_text(FastText_CC_path),
        'LEXVEC': lambda: load_text(lexvec),
        'UKB': lambda: load_text(UKB_path),
        'W2V': lambda: load_embedding(W2V_path, vocabulary=None, format='bin',
                                      length_normalize=False,
                                      normalize_dimensionwise=False),
    }

    # (order in which to load, order in which to concatenate and label).
    experiments = (
        (('GLOVE', 'jointcHYB'), ('GLOVE', 'jointcHYB')),
        (('FT', 'jointcHYB'), ('FT', 'jointcHYB')),
        (('W2V', 'jointcHYB'), ('W2V', 'jointcHYB')),
        (('LEXVEC', 'jointcHYB'), ('LEXVEC', 'jointcHYB')),
        (('FT', 'jointcHYB', 'LEXVEC'), ('LEXVEC', 'jointcHYB', 'FT')),
        (('FT', 'jointcHYB', 'LEXVEC', 'UKB'), ('LEXVEC', 'jointcHYB', 'FT', 'UKB')),
    )

    for load_order, combo in experiments:
        loaded = {}
        for key in load_order:
            loaded[key] = loaders[key]()

        test_reduction([loaded[key] for key in combo], ' + '.join(combo))

        # Release this combination's embeddings before loading the next one.
        del loaded

    return True





def sizeof_fmt(num, suffix='B'):
    """Format a size as a short human-readable string using binary prefixes.

    By Fred Cirera, after https://stackoverflow.com/a/1094933/1870254

    The value is divided by 1024 until its magnitude drops below 1024 or the
    prefixes up to 'Zi' are exhausted, in which case 'Yi' is used.

    Args:
        num: The size to format (e.g. a number of bytes).
        suffix: Unit appended after the prefix.

    Returns:
        A string such as "1.5KiB".
    """
    prefixes = ('', 'Ki', 'Mi', 'Gi', 'Ti', 'Pi', 'Ei', 'Zi')
    scaled = num
    step = 0
    # "not (x < limit)" rather than "x >= limit" so that NaN keeps scaling,
    # exactly as a failed "<" test would.
    while step < len(prefixes) and not (abs(scaled) < 1024.0):
        scaled = scaled / 1024.0
        step += 1
    if step < len(prefixes):
        return "%3.1f%s%s" % (scaled, prefixes[step], suffix)
    return "%.1f%s%s" % (scaled, 'Yi', suffix)



def print_memory_usage():
    """Print the used virtual and swap memory reported by psutil.

    Both figures are the `used` byte counts divided by 1024**3. Two spacer
    lines are printed afterwards.

    Returns:
        True, always.
    """
    bytes_per_unit = 1024.0 ** 3

    virtual_used = psutil.virtual_memory().used / bytes_per_unit
    print('>>> Virtual_memory (used): ' + str(virtual_used) + ' GB')

    swap_used = psutil.swap_memory().used / bytes_per_unit
    print('>>> Swap_memory (used): ' + str(swap_used) + ' GB')

    for _ in range(2):
        print(' ')
    return True

def _report_reduction_stage(message, nameE, namespace):
    """Print a timestamped stage line, the memory usage and the largest names.

    Args:
        message: Text placed between the timestamp and the embedding name.
        nameE: Name of the embedding being processed.
        namespace: Mapping of variable names to objects (typically the
            caller's ``locals()``); its ten largest entries are listed.
            Sizes come from ``sys.getsizeof`` and are therefore shallow.
    """
    print(str(datetime.datetime.now()) + message + str(nameE))
    print_memory_usage()
    largest = sorted(((name, sys.getsizeof(value)) for name, value in namespace.items()),
                     key=lambda item: -item[1])[:10]
    for name, size in largest:
        print("{:>30}: {:>8}".format(name, sizeof_fmt(size)))


def test_1_reduction(path, nameE, n_components=300):
    """Evaluate three dimensionality reductions of one embedding file.

    For each of `algo`, `PCA` and `T_SVD` the embedding is loaded afresh,
    its vectors are reduced to `n_components` dimensions, the result is
    evaluated with `evaluate_on_all` and a row is appended to
    'dim_red_noL2.csv' / 'dim_noL2_redCoverage.csv'. Rows are named
    ``<nameE>_PPA_`` (for `algo`), ``<nameE>_PCA_`` and ``<nameE>_tSVD_``.

    Args:
        path: Directory containing the embedding file (str or bytes).
        nameE: File name of the embedding inside `path` (str or bytes).
        n_components: Target dimensionality; defaults to 300.

    Returns:
        True, always.
    """
    # Callers may pass bytes (e.g. names from os.listdir on a bytes path).
    # Decode them so log lines and CSV row names do not contain a b'...' repr.
    nameE = os.fsdecode(nameE)
    abs_path = os.path.join(os.fsdecode(path), nameE)

    # The second space-separated field of the first line is used as the
    # number of dimensions to load (presumably a "count dim" header - confirm).
    with open(abs_path) as f:
        d = int(f.readline().split(' ')[1])

    # (log label, CSV row suffix, reduction function)
    methods = (
        ('algo', '_PPA_', algo),
        ('PCA', '_PCA_', PCA),
        ('tSVD', '_tSVD_', T_SVD),
    )

    for label, tag, reduce_fn in methods:
        _report_reduction_stage(" Starting test " + label + ", embedding: ", nameE, locals())
        e = load_embedding(abs_path, vocabulary=None, length_normalize=False,
                           normalize_dimensionwise=False, delete_duplicates=True,
                           dims_restriction=d)

        _report_reduction_stage(" Starting " + label + ", embedding: ", nameE, locals())
        e.vectors = reduce_fn(e.vectors, n_components)
        _report_reduction_stage(" " + label + " finished, embedding: ", nameE, locals())

        a, b = results_to_csv(evaluate_on_all(e, lowercase_dataset=True),
                              printRes=False, returnRes=True)
        export_to_csv(txtResults=a, txtCov=b, name=nameE + tag,
                      filenameResults='dim_red_noL2.csv',
                      filenameCoverage='dim_noL2_redCoverage.csv')

        # Release the embedding and results before the next load so two
        # copies are never held at once.
        del e, a, b

    print(str(datetime.datetime.now()) + " DONE, embedding: " + nameE)
    return True
    
   
    
    
def test_reduction2(path):
    """Run `test_1_reduction` on every entry of the directory `path`.

    Directory and file names are handled as text, so the embedding names
    used downstream for logging and CSV rows are plain file names rather
    than the repr of a bytes object.

    Args:
        path: Directory holding the embedding files (str or bytes).
    """
    directory = os.fsdecode(path)
    for filename in os.listdir(directory):
        test_1_reduction(directory, filename)
        
        

def test_retro(path):
    """Evaluate every embedding file found in the directory `path`.

    Each file is loaded restricted to the vocabulary returned by
    `get_vocab_simil_all(True)`, evaluated with `evaluate_on_all`, and a
    row named after the file is appended to 'retro.csv' /
    'retroCoverage.csv'.

    Args:
        path: Directory holding the embedding files (str or bytes).
    """
    dataset_min = get_vocab_simil_all(True)
    # Work with text paths so the file name can be used directly as the row
    # name; slicing the repr of a bytes name mangles non-ASCII and escaped
    # characters.
    directory = os.fsdecode(path)
    for filename in os.listdir(directory):
        e = load_embedding(os.path.join(directory, filename), vocabulary=dataset_min,
                           length_normalize=False, normalize_dimensionwise=False,
                           delete_duplicates=True)
        a, b = results_to_csv(evaluate_on_all(e, lowercase_dataset=True),
                              printRes=False, returnRes=True)
        export_to_csv(txtResults=a, txtCov=b, name=filename,
                      filenameResults='retro.csv', filenameCoverage='retroCoverage.csv')

        
        
def test_vecmap(embs, names, filename, normalize_embs):
    """Combine `embs` in three ways, evaluate each and export the results.

    The three runs are:
      * `avg_embeddings` with method="generate" -> ``<filename>.csv`` and
        ``<filename>_coverage.csv``
      * `avg_embeddings` with method="ignore" -> ``<filename>_zeros.csv`` and
        ``<filename>_zeros_coverage.csv``
      * `concatenate_embeddings` with method="generate" ->
        ``<filename>_concat.csv`` and ``<filename>_concat_coverage.csv``

    Args:
        embs: Embeddings to combine.
        names: Names of the embeddings, used to build the row label.
        filename: Prefix of the output CSV files.
        normalize_embs: Forwarded as `normalize` to the combination functions.

    Returns:
        True, always.
    """
    # Row label: every name but the last joined with '+', then ',' and the
    # last name (so a single name yields ",<name>").
    # NOTE(review): test_vecmap_avg joins all names with '+'; the ',' here may
    # be unintended, but it is kept because existing result files use it.
    labels = [str(n) for n in names]
    name = ('+'.join(labels[:-1]) + ',' + labels[-1]) if labels else ''

    # NOTE(review): `dataset_min` is neither a parameter nor a local, so it is
    # looked up in module scope at call time; a local of the same name in the
    # calling function is not visible here.
    # (combination function, method, results suffix, coverage suffix)
    runs = (
        (avg_embeddings, "generate", '.csv', '_coverage.csv'),
        (avg_embeddings, "ignore", '_zeros.csv', '_zeros_coverage.csv'),
        # Coverage gets its own file; writing it to '_concat.csv' would mix
        # it into the results file.
        (concatenate_embeddings, "generate", '_concat.csv', '_concat_coverage.csv'),
    )
    for combine, method, results_suffix, coverage_suffix in runs:
        c = combine(embs, path='/home/concat.vec', vocabulary=dataset_min, weights=None,
                    method=method, generate_method='cosine', k=10,
                    normalize=normalize_embs, where="return")
        a, b = results_to_csv(evaluate_on_all(c, lowercase_dataset=True),
                              printRes=False, returnRes=True)
        export_to_csv(txtResults=a, txtCov=b, name=name,
                      filenameResults=str(filename) + results_suffix,
                      filenameCoverage=str(filename) + coverage_suffix)

    return True

def test_vecmap_avg(embs, names, filename, normalize_embs):
    """Average `embs`, evaluate the result and export it.

    Results go to ``<filename>_AVG.csv`` and coverage to
    ``<filename>_AVG_coverage.csv``; the row is labelled with the names
    joined by '+'.

    Args:
        embs: Embeddings to average.
        names: Names of the embeddings, used to build the row label.
        filename: Prefix of the output CSV files.
        normalize_embs: Forwarded as `normalize` to `avg_embeddings`.

    Returns:
        True, always.
    """
    # A plain join also avoids a stray leading '+' when only one name is given.
    name = '+'.join(str(n) for n in names)

    # NOTE(review): `dataset_min` is neither a parameter nor a local, so it is
    # looked up in module scope at call time.
    c = avg_embeddings(embs, path='/home/concat.vec', vocabulary=dataset_min, weights=None,
                       method="generate", generate_method='cosine', k=10,
                       normalize=normalize_embs, where="return")
    a, b = results_to_csv(evaluate_on_all(c, lowercase_dataset=True),
                          printRes=False, returnRes=True)
    export_to_csv(txtResults=a, txtCov=b, name=name,
                  filenameResults=str(filename) + '_AVG.csv',
                  filenameCoverage=str(filename) + '_AVG_coverage.csv')

    return True

def test_vecmap_FT_Orto():
    """Run `test_vecmap` on every combination of the FT(Orto) embeddings.

    Six embeddings are loaded from the 'FT(Orto)' result folder. Every
    combination of 2, 3, 4, 5 and 6 of them is passed to `test_vecmap`
    twice: once writing to the 'toFT' files without normalisation and once
    writing to the 'toFT_norm' files with normalisation.

    Returns:
        True, always.
    """
    import itertools  # local import so this function does not depend on file-level imports

    path = '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/FT(Orto)/'

    # (name, file) in the order the files are loaded.
    files = (
        ('W2V', 'W2V.FT-W2V.Orto.TXT'),
        ('GLOVE', 'GLOVE.FT-GLOVEL2.Orto.TXT'),
        ('FT', 'FT.FT-UKB.Orto.TXT'),
        ('jointcHYB', 'Jointc.FT-Jointc.Orto.TXT'),
        ('LEXVEC', 'LEXVEC.FT-LEXVEC.Orto.TXT'),
        ('UKB', 'UKB.FT-UKB.Orto.TXT'),
    )
    loaded = {}
    for label, file_name in files:
        loaded[label] = load_embedding(path + file_name, vocabulary=None, length_normalize=False,
                                       normalize_dimensionwise=False, delete_duplicates=True,
                                       dims_restriction=300)

    # Order in which the embeddings appear inside each combination.
    names = ['GLOVE', 'W2V', 'FT', 'jointcHYB', 'UKB', 'LEXVEC']
    embs = [loaded[label] for label in names]

    # NOTE(review): test_vecmap takes no vocabulary argument and reads
    # `dataset_min` from module scope, so that global must exist before this
    # function is called.
    # Combinations are produced in lexicographic index order, size by size
    # (all pairs first, then triples, ... up to all six).
    for size in range(2, len(names) + 1):
        for picked in itertools.combinations(range(len(names)), size):
            test_vecmap([embs[i] for i in picked], [names[i] for i in picked], 'toFT', False)
            test_vecmap([embs[i] for i in picked], [names[i] for i in picked], 'toFT_norm', True)

    return True


def test_vecmap_jointcHYB_Orto():
    """Run `test_vecmap` on every combination of the joint(Orto) embeddings.

    Six embeddings are loaded from the 'joint(Orto)' result folder. Every
    combination of 2, 3, 4, 5 and 6 of them is passed to `test_vecmap`
    twice: once writing to the 'toJointc' files without normalisation and
    once writing to the 'toJointc_norm' files with normalisation.

    Returns:
        True, always.
    """
    import itertools  # local import so this function does not depend on file-level imports

    path = '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/joint(Orto)/'

    # (name, file) in the order the files are loaded.
    files = (
        ('W2V', 'W2V.Jointc-W2V.Orto.TXT'),
        ('GLOVE', 'GLOVE.Jointc-GLOVEL2.Orto.TXT'),
        ('FT', 'FT.Jointc-FT.Orto.TXT'),
        ('jointcHYB', 'Jointc.Jointc-UKB.Orto.TXT'),
        ('LEXVEC', 'LEXVEC.Jointc-LEXVEC.Orto.TXT'),
        ('UKB', 'UKB.Jointc-UKB.Orto.TXT'),
    )
    loaded = {}
    for label, file_name in files:
        loaded[label] = load_embedding(path + file_name, vocabulary=None, length_normalize=False,
                                       normalize_dimensionwise=False, delete_duplicates=True,
                                       dims_restriction=300)

    # Order in which the embeddings appear inside each combination.
    names = ['GLOVE', 'W2V', 'FT', 'jointcHYB', 'UKB', 'LEXVEC']
    embs = [loaded[label] for label in names]

    # NOTE(review): test_vecmap takes no vocabulary argument and reads
    # `dataset_min` from module scope, so that global must exist before this
    # function is called.
    # Combinations are produced in lexicographic index order, size by size
    # (all pairs first, then triples, ... up to all six).
    for size in range(2, len(names) + 1):
        for picked in itertools.combinations(range(len(names)), size):
            test_vecmap([embs[i] for i in picked], [names[i] for i in picked], 'toJointc', False)
            test_vecmap([embs[i] for i in picked], [names[i] for i in picked], 'toJointc_norm', True)

    return True



def test_avg_normalized():
    """Run `test_vecmap_avg` on every combination of the normalised embeddings.

    Six embeddings are loaded from the 'Normalized' result folder. Every
    combination of 2, 3, 4, 5 and 6 of them is passed to `test_vecmap_avg`
    with the output prefix 'toFT' and normalisation disabled.

    Returns:
        True, always.
    """
    import itertools  # local import so this function does not depend on file-level imports

    path = '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/Normalized/'

    # (name, file) in the order the files are loaded.
    files = (
        ('W2V', 'W2V.NORMALIZED.Vecmap.TXT'),
        ('GLOVE', 'GLOVE.NORMALIZED.Vecmap.TXT'),
        ('FT', 'FT.NORMALIZED.Vecmap.TXT'),
        ('jointcHYB', 'JOINTC-HYB-ENES.NORMALIZED.Vecmap.TXT'),
        ('LEXVEC', 'LEXVEC.NORMALIZED.Vecmap.TXT'),
        ('UKB', 'UKB.NORMALIZED.Vecmap.TXT'),
    )
    loaded = {}
    for label, file_name in files:
        loaded[label] = load_embedding(path + file_name, vocabulary=None, length_normalize=False,
                                       normalize_dimensionwise=False, delete_duplicates=True,
                                       dims_restriction=300)

    # Order in which the embeddings appear inside each combination.
    names = ['GLOVE', 'W2V', 'FT', 'jointcHYB', 'UKB', 'LEXVEC']
    embs = [loaded[label] for label in names]

    # NOTE(review): test_vecmap_avg takes no vocabulary argument and reads
    # `dataset_min` from module scope, so that global must exist before this
    # function is called.
    # Combinations are produced in lexicographic index order, size by size
    # (all pairs first, then triples, ... up to all six).
    for size in range(2, len(names) + 1):
        for picked in itertools.combinations(range(len(names)), size):
            test_vecmap_avg([embs[i] for i in picked], [names[i] for i in picked], 'toFT', False)

    return True


def test_vecmap_FT():
    """Evaluate five pairwise vecmap results stored in the 'FT' folder.

    For each pair both embedding files are loaded and handed to
    `test_vecmap` twice: once with the output prefix 'WtoFT' and
    normalisation off, once with 'WtoFT_norm' and normalisation on. The
    pair label is passed as a single-element name list.
    """
    path = '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/FT/'

    # (first file, second file, label)
    pairs = (
        ('1_FT.FT-Jointc.TXT', '1_Jointc.FT-Jointc.TXT', 'FT,JointcHYB'),
        ('2_FT.FT-LEXVEC.TXT', '2_LEXVEC.FT-LEXVEC.TXT', 'FT,LEXVEC'),
        ('3_FT.FT-UKB.TXT', '3_UKB.FT-UKB.TXT', 'FT,UKB'),
        ('4_FT.FT-W2V.TXT', '4_W2V.FT-W2V.TXT', 'FT,W2V'),
        # NOTE(review): the other first files follow "N_FT.FT-<other>.TXT";
        # '5_FT.W2V-GLOVEL2.TXT' breaks that pattern - confirm the file name.
        ('5_FT.W2V-GLOVEL2.TXT', '5_GLOVE.FT-GLOVEL2.TXT', 'FT,GLOVE'),
    )

    for first_file, second_file, label in pairs:
        first = load_embedding(path + first_file, vocabulary=None, length_normalize=False,
                               normalize_dimensionwise=False, delete_duplicates=True,
                               dims_restriction=300)
        second = load_embedding(path + second_file, vocabulary=None, length_normalize=False,
                                normalize_dimensionwise=False, delete_duplicates=True,
                                dims_restriction=300)
        test_vecmap([first, second], [label], 'WtoFT', False)
        test_vecmap([first, second], [label], 'WtoFT_norm', True)
    

def test_vecmap_jointcHYB():
    """Evaluate five pairwise vecmap results stored in the 'joint' folder.

    For each pair both embedding files are loaded and handed to
    `test_vecmap` twice: once with the pair's output prefix and
    normalisation off, once with ``<prefix>_norm`` and normalisation on.
    The pair label is passed as a single-element name list.
    """
    path = '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/joint/'

    # (first file, second file, label, output prefix)
    pairs = (
        ('1_FT.Jointc-FT.TXT', '1_Jointc.Jointc-FT.TXT', 'FT,JointcHYB', 'WtoJointc'),
        ('3_GLOVE.Jointc-GLOVEL2.TXT', '3_Jointc.Jointc-GLOVEL2.TXT', 'Jointc,GLOVE', 'WtoJointc'),
        # The second file must be the UKB side of the pair; loading the Jointc
        # file twice would evaluate Jointc combined with itself. The name
        # follows the "N_<other>.Jointc-<other>.TXT" pattern of the other
        # pairs - TODO confirm it matches the file on disk.
        ('4_Jointc.Jointc-UKB.TXT', '4_UKB.Jointc-UKB.TXT', 'Jointc,UKB', 'WtoJointc'),
        # NOTE(review): the last two pairs write to 'WJointc*' rather than
        # 'WtoJointc*'; possibly a typo, kept so output files stay unchanged.
        ('5_Jointc.Jointc-LEXVEC.TXT', '5_LEXVEC.Jointc-LEXVEC.TXT', 'Jointc,LEXVEC', 'WJointc'),
        ('6_Jointc.Jointc-W2V.TXT', '6_W2V.Jointc-W2V.TXT', 'Jointc,W2V', 'WJointc'),
    )

    for first_file, second_file, label, prefix in pairs:
        a = load_embedding(path + first_file, vocabulary=None, length_normalize=False,
                           normalize_dimensionwise=False, delete_duplicates=True,
                           dims_restriction=300)
        b = load_embedding(path + second_file, vocabulary=None, length_normalize=False,
                           normalize_dimensionwise=False, delete_duplicates=True,
                           dims_restriction=300)
        test_vecmap([a, b], [label], prefix, False)
        test_vecmap([a, b], [label], prefix + '_norm', True)

In [13]:
#DIM_REDUCTION.py
#https://arxiv.org/pdf/1708.03629.pdf
#https://github.com/vyraun/Half-Size/blob/master/pca_ppa.py
#from skcuda.linalg import PCA as cuPCA
import numpy as np
from sklearn import decomposition
#import pycuda.autoinit
#import pycuda.gpuarray as gpuarray
import numpy as np
#import skcuda.linalg as linalg
from sklearn.preprocessing import StandardScaler

def PPA(matrix, n_removed=7):
    """Remove the projections on the top principal components from `matrix`.

    The matrix is shifted by its overall mean, a full-rank PCA is fitted on
    the shifted data, and the projections of every row onto the first
    `n_removed` principal components are subtracted.

    Args:
        matrix: 2-D array with one vector per row.
        n_removed: Number of leading principal components to remove.
            Defaults to 7.

    Returns:
        A 2-D array with the same shape as `matrix`.
    """
    n = matrix.shape[1]
    pca = decomposition.PCA(n_components=n)
    # NOTE(review): np.mean without an axis is the scalar mean over all
    # entries, not the per-dimension mean vector. This matches the reference
    # script linked above this cell; confirm it is the intended centring.
    X_train = matrix - np.mean(matrix)
    # Only the components are needed, so fit without computing the transform.
    pca.fit(X_train)
    top = pca.components_[:n_removed]

    # The rows of components_ are orthonormal, so subtracting all projections
    # in one matrix product equals removing them one component at a time
    # (up to floating-point rounding), without a Python loop over every row.
    return X_train - np.dot(np.dot(X_train, top.T), top)

def PCA(matrix, n):
    """Project `matrix` onto its first `n` principal components.

    Args:
        matrix: 2-D array with one vector per row.
        n: Number of components to keep.

    Returns:
        The transformed data returned by scikit-learn's PCA.fit_transform.
    """
    # scikit-learn centres the data itself, so this shift is redundant.
    shifted = matrix - np.mean(matrix)
    reducer = decomposition.PCA(n_components=n)
    return reducer.fit_transform(shifted)


def algo(matrix, n_components):
    """Apply PPA, then PCA down to `n_components`, then PPA again.

    Args:
        matrix: 2-D array with one vector per row.
        n_components: Number of dimensions kept by the PCA step.

    Returns:
        The result of the final PPA step.
    """
    # One name is rebound at every step so no intermediate result is kept
    # alive longer than the call that consumes it.
    reduced = PPA(matrix)
    reduced = PCA(reduced, n_components)
    return PPA(reduced)

def T_SVD(matrix,n):
    """Reduce `matrix` to `n` dimensions with scikit-learn's TruncatedSVD.

    Args:
        matrix: 2-D array with one vector per row.
        n: Number of components to keep.

    Returns:
        The transformed data returned by TruncatedSVD.fit_transform.
    """
    return decomposition.TruncatedSVD(n_components=n).fit_transform(matrix)


def PPA_cuda(matrix):
    """Variant of PPA that builds its PCA object from `linalg.PCA`.

    Same steps as PPA: shift by the overall mean, fit a PCA with as many
    components as columns, then subtract from every row its projections on
    the first seven components.

    NOTE(review): the only `linalg` import visible in this cell
    (`skcuda.linalg`) is commented out, so unless `linalg` is defined
    elsewhere this function raises NameError when called. Also confirm that
    the `linalg.PCA` object exposes a `components_` attribute.
    """
    # PCA to get Top Components
    n = matrix.shape[1]
    pca =  linalg.PCA(n_components = n)
    # np.mean without an axis is the scalar mean over all entries.
    X_train = matrix - np.mean(matrix)
    # The transformed data is not used below; only the fitted components are.
    X_fit = pca.fit_transform(X_train)
    U1 = pca.components_
    
    z = []
    
    # Removing Projections on Top Components
    for i, x in enumerate(X_train):
        # Subtract the projection on each of the first seven components in turn.
        for u in U1[0:7]:        
            x = x - np.dot(u.transpose(),x) * u 
        z.append(x)

    return np.asarray(z)

def PCA_cuda(matrix, n):
    # Reduce `matrix` to `n` components through `cuPCA`, using a GPU array.
    # NOTE(review): `cuPCA` and `gpuarray` are only mentioned in commented-out
    # imports in this cell (skcuda / pycuda), so unless they are bound
    # elsewhere this function raises NameError.
    #matrix = StandardScaler().fit_transform(matrix)
    pca = cuPCA(n_components = n)
    # Allocate a GPU array with the shape of `matrix`, the element type of its
    # first entry, and order="F".
    X_gpu = gpuarray.GPUArray((matrix.shape[0],matrix.shape[1]), type(matrix[0][0]), order="F") 
    # NOTE(review): confirm set() accepts `matrix` as laid out on the host,
    # given the array above was created with order="F".
    X_gpu.set(matrix)
    # Presumably .get() copies the transformed data back to the host — confirm.
    return pca.fit_transform(X_gpu).get()





## Embeddings

In [14]:

# Locations of every embedding file used by the notebook.
# The network-mount prefix is written once; to relocate the data only _VOLUME
# needs to change. Two TFG prefixes exist because the original literals mixed
# ".../TFG/" and "...//TFG/"; both are kept so each resulting string is
# byte-identical to the previous hard-coded value.
_VOLUME = '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1'
_TFG = _VOLUME + '/TFG/'
_TFG2 = _VOLUME + '//TFG/'
_REMAP = _TFG2 + 'vecmap_results/VecmapRemap/'
_COMBINATIONS = _TFG2 + 'vecmap_results/VecmapCombinations/'
_NORMALIZED = _TFG2 + 'vecmap_results/Normalized/'

# Pre-trained embeddings.
W2V_path = _TFG + 'GoogleNews-vectors-negative300.bin'
GLOVE_CC_42_path = _TFG2 + 'Glove/glove.42B.300d.txt'
GLOVE_CC_840_path = _TFG + 'Glove/glove.840B.300d.txt'
GLOVE_WIKI_path = _TFG2 + 'Glove/glove.6B.300d.txt'
FastText_WIKI_path = _TFG2 + 'fastTextPretrained/2017/wiki-news-300d-1M.vec'
FastText_CC_path = _TFG + 'fastTextPretrained/2017/crawl-300d-2M.vec'
UKB_path = _TFG + 'UKB/RWSGwn.emb'
SketchEngine_BritishNational_path = _TFG2 + 'fastTextPretrained/bnc2_tt2.vec'
SketchEngine_web_path = _TFG2 + 'fastTextPretrained/ententen13_tt2_1.vec'
Numberbatch_path = _TFG2 + 'Conceptnet/numberbatch-en.txt'
NAACL_DeepWalk_path = _TFG2 + 'NAACL/DT_embeddings_DeepWalk'
NAACL_Line_path = _TFG2 + 'NAACL/DT_embeddings_LINE'
NAACL_Node2Vec_path = _TFG2 + 'NAACL/DT_embeddings_Node2vec'
NAACL_Nodes_path = _TFG2 + 'NAACL/DT_nodes'
Turian_100_path = _TFG2 + 'Turian/hlbl_reps_clean_1.rcv1.clean.tokenized-CoNLL03.case-intact.txt'

Senna_words_path = _TFG2 + 'Senna/words.lst'
Senna_vectors_path = _TFG2 + 'Senna/embeddings.txt'
Multilingual512_path = _TFG2 + 'FaruquiAndDyer multilingual 512/vec.txt'
SW2_cbow_wikipedia = _TFG2 + 'SW2V/sw2v_cbow_wikipedia_vectors.bin'
SW2_synsets_cbow_wikipedia = _TFG2 + 'SW2V/sw2v_synsets_cbow_wikipedia_vectors.bin'
mscc_path = _TFG2 + 'contex2vec/mscc.skipgram.w10.d600.neg10.iter5.words'
ukwac_path = _TFG2 + 'contex2vec/ukwac.skipgram.w10.d600.neg10.iter3.words'
jointcHYB_path = _TFG + 'jointcHYB/JOINTC-HYB-ENES.emb'
lexvec = _TFG + 'lexvec/lexvec.ngramsubwords.300d.W.pos.vectors/data'
PDC_path = _TFG2 + 'PDC && HDC/wikicorp.201004-pdc-iter-20-alpha-0.05-window-10-dim-300-neg-10-subsample-0.0001.txt'
HDC = _TFG2 + 'PDC && HDC/wikicorp.201004-hdc-iter-20-alpha-0.025-window-10-dim-300-neg-10-subsample-0.0001.txt'

# Vecmap remapping results (orthogonal variants).
# NOTE(review): FT_FT_UKB_ORTO_path / FT_UKB_FT_ORTO_path point at the same
# file, and so do UKB_FT_UKB_ORTO_path / UKB_UKB_FT_ORTO_path. Confirm this is
# intended and not a copy-paste slip in the file names.
FT_FT_UKB_ORTO_path = _REMAP + 'FT.FT-UKB.Orto.TXT'
UKB_FT_UKB_ORTO_path = _REMAP + 'UKB.FT-UKB.Orto.TXT'
FT_UKB_FT_ORTO_path = _REMAP + 'FT.FT-UKB.Orto.TXT'
UKB_UKB_FT_ORTO_path = _REMAP + 'UKB.FT-UKB.Orto.TXT'
W2V_FT_W2V_ORTO_path = _REMAP + 'W2V.FT-W2V.Orto.TXT'
GLOVE_FT_GLOVE_ORTO_path = _REMAP + 'GLOVE.FT-GLOVE.Orto.TXT'
W2V_GLOVE_W2V_ORTO_path = _REMAP + 'W2V.GLOVE-W2V.Orto.TXT'
GLOVE_GLOVE_W2V_ORTO_path = _REMAP + 'GLOVE.GLOVE-W2V.Orto.TXT'


# Vecmap remapping results (non-orthogonal variants).
# NOTE(review): same duplication as above — FT_UKB_FT_path == FT_FT_UKB_path
# and UKB_UKB_FT_path == UKB_FT_UKB_path.
FT_UKB_FT_path = _REMAP + 'FT.FT-UKB.TXT'
UKB_UKB_FT_path = _REMAP + 'UKB.FT-UKB.TXT'
FT_FT_UKB_path = _REMAP + 'FT.FT-UKB.TXT'
UKB_FT_UKB_path = _REMAP + 'UKB.FT-UKB.TXT'

MEAN_FT_UKB_path = _COMBINATIONS + 'FT.UKB.recommended.original'
MEAN_FT_UKB_ORTO_path = _COMBINATIONS + 'FT.UKB.recommended.Orto'

MEAN_FT_W2VGLOVE_path = _COMBINATIONS + 'FT_GLOVE.W2V.recommended.Orto'
MEAN_GLOVE_W2VGLOVE_path = _COMBINATIONS + 'GLOVE_GLOVE.W2V.recommended.Orto'

FT_Vecmap_Normalized_path = _NORMALIZED + 'FT.NORMALIZED.Vecmap.TXT'
UKB_Vecmap_Normalized_path = _NORMALIZED + 'UKB.NORMALIZED.Vecmap.TXT'





In [15]:
# Build the two vocabularies that later cells pass as `vocabulary=` to
# load_embedding.
# NOTE(review): the meaning of the positional True is defined by
# get_vocab_simil_all, which is not visible here — confirm what distinguishes
# dataset_min from dataset_vocab.
dataset_vocab = get_vocab_simil_all()
dataset_min = get_vocab_simil_all(True)

In [None]:
# Score FT, UKB, LEXVEC and jointcHYB jointly with evaluate_on_all_avg
# (lowercase_dataset=True) and hand the scores to results_to_csv.
results_to_csv(
    evaluate_on_all_avg(
        [FT, UKB, LEXVEC, jointcHYB],
        lowercase_dataset=True,
    )
)

In [None]:
# GLOVE from GLOVE_CC_840_path: no vocabulary passed, dimension-wise
# normalization on, length normalization off.
GLOVE = load_embedding(
    GLOVE_CC_840_path,
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=True,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# GLOVE from GLOVE_WIKI_path: no vocabulary passed, both length and
# dimension-wise normalization on.
GLOVE = load_embedding(
    GLOVE_WIKI_path,
    vocabulary=None,
    length_normalize=True,
    normalize_dimensionwise=True,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# GLOVE from GLOVE_CC_42_path: no vocabulary passed, dimension-wise
# normalization on, length normalization off.
GLOVE = load_embedding(
    GLOVE_CC_42_path,
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=True,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# W2V from W2V_path, read with format='bin'; no vocabulary passed and no
# normalization requested.
W2V = load_embedding(
    W2V_path,
    vocabulary=None,
    format='bin',
    length_normalize=False,
    normalize_dimensionwise=False,
)

In [None]:
# FT from FastText_WIKI_path, restricted to dataset_vocab, length-normalized.
# delete_duplicates is not passed here, so load_embedding's default applies.
FT = load_embedding(
    FastText_WIKI_path,
    vocabulary=dataset_vocab,
    length_normalize=True,
    normalize_dimensionwise=False,
    dims_restriction=300,
)

In [None]:
# FT from FastText_CC_path, restricted to dataset_min, no normalization.
FT = load_embedding(
    FastText_CC_path,
    vocabulary=dataset_min,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# jointcHYB from jointcHYB_path, restricted to dataset_min, no normalization.
jointcHYB = load_embedding(
    jointcHYB_path,
    vocabulary=dataset_min,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# UKB from UKB_path, restricted to dataset_min, no normalization.
UKB = load_embedding(
    UKB_path,
    vocabulary=dataset_min,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# Unbind UKB from the notebook namespace; raises NameError if UKB is not
# currently defined.
del UKB

In [None]:
# LEXVEC from the `lexvec` path constant, restricted to dataset_min,
# no normalization.
LEXVEC = load_embedding(
    lexvec,
    vocabulary=dataset_min,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# SKE from SketchEngine_BritishNational_path, restricted to dataset_vocab,
# length-normalized, duplicates kept; dims_restriction is not passed.
SKE = load_embedding(
    SketchEngine_BritishNational_path,
    vocabulary=dataset_vocab,
    length_normalize=True,
    normalize_dimensionwise=False,
    delete_duplicates=False,
)

In [None]:
# SKE from SketchEngine_web_path, restricted to dataset_vocab, no
# normalization; note dims_restriction is 100 here, not 300.
SKE = load_embedding(
    SketchEngine_web_path,
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=100,
)

In [None]:
# Numberbatch from Numberbatch_path, restricted to dataset_min, no
# normalization, duplicates kept; dims_restriction is not passed.
Numberbatch = load_embedding(
    Numberbatch_path,
    vocabulary=dataset_min,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=False,
)

In [None]:
# PDC restricted to dataset_vocab, no normalization.
# Fixed: the first argument used to be `PDC` itself (the name being assigned,
# so either undefined or a previously loaded embedding); the file location
# lives in the PDC_path constant.
PDC = load_embedding(
    PDC_path,
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# NAACL from NAACL_DeepWalk_path: no vocabulary passed, length-normalized;
# every other option is left at load_embedding's defaults.
NAACL = load_embedding(
    NAACL_DeepWalk_path,
    vocabulary=None,
    length_normalize=True,
)

In [None]:
# Turian from Turian_100_path with every load_embedding option left at its
# default.
Turian = load_embedding(Turian_100_path)

In [None]:
# senna is read from two files (Senna_words_path plus path2=Senna_vectors_path)
# using format="senna".
senna = load_embedding(
    Senna_words_path,
    path2=Senna_vectors_path,
    format="senna",
)

In [None]:
# FT_UKB_FT from FT_UKB_FT_path; no vocabulary argument, no normalization.
FT_UKB_FT = load_embedding(
    FT_UKB_FT_path,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# UKB_UKB_FT from UKB_UKB_FT_path; no vocabulary argument, both
# normalizations on.
UKB_UKB_FT = load_embedding(
    UKB_UKB_FT_path,
    length_normalize=True,
    normalize_dimensionwise=True,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# FT_FT_UKB from FT_FT_UKB_path, restricted to dataset_vocab, both
# normalizations on.
FT_FT_UKB = load_embedding(
    FT_FT_UKB_path,
    vocabulary=dataset_vocab,
    length_normalize=True,
    normalize_dimensionwise=True,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# The two "Orto" FT/UKB mappings, loaded with identical options
# (dataset_vocab, no normalization).
FT_FT_UKB_ORTO = load_embedding(
    FT_FT_UKB_ORTO_path,
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)
UKB_FT_UKB_ORTO = load_embedding(
    UKB_FT_UKB_ORTO_path,
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# The two "Normalized" vecmap outputs, loaded with identical options
# (dataset_vocab, no further normalization).
FT_Vecmap_Normalized = load_embedding(
    FT_Vecmap_Normalized_path,
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)
UKB_Vecmap_Normalized = load_embedding(
    UKB_Vecmap_Normalized_path,
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)


In [None]:
# UKB_FT_UKB from UKB_FT_UKB_path, restricted to dataset_vocab, both
# normalizations on.
UKB_FT_UKB = load_embedding(
    UKB_FT_UKB_path,
    vocabulary=dataset_vocab,
    length_normalize=True,
    normalize_dimensionwise=True,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# MEAN_FT_UKB from MEAN_FT_UKB_path: no vocabulary passed, no normalization.
MEAN_FT_UKB = load_embedding(
    MEAN_FT_UKB_path,
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# MEAN_FT_UKB_ORTO from MEAN_FT_UKB_ORTO_path, restricted to dataset_vocab,
# no normalization.
MEAN_FT_UKB_ORTO = load_embedding(
    MEAN_FT_UKB_ORTO_path,
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# W2V_FT_W2V_ORTO from W2V_FT_W2V_ORTO_path, restricted to dataset_vocab,
# no normalization.
W2V_FT_W2V_ORTO = load_embedding(
    W2V_FT_W2V_ORTO_path,
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# GLOVE_FT_GLOVE_ORTO from GLOVE_FT_GLOVE_ORTO_path, restricted to
# dataset_vocab, no normalization.
GLOVE_FT_GLOVE_ORTO = load_embedding(
    GLOVE_FT_GLOVE_ORTO_path,
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# W2V_GLOVE_W2V_ORTO from W2V_GLOVE_W2V_ORTO_path: no vocabulary passed,
# no normalization.
W2V_GLOVE_W2V_ORTO = load_embedding(
    W2V_GLOVE_W2V_ORTO_path,
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# GLOVE_GLOVE_W2V_ORTO from GLOVE_GLOVE_W2V_ORTO_path: no vocabulary passed,
# no normalization.
GLOVE_GLOVE_W2V_ORTO = load_embedding(
    GLOVE_GLOVE_W2V_ORTO_path,
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# MEAN_FT_W2VGLOVE restricted to dataset_vocab, no normalization.
# Fixed: this used to read MEAN_GLOVE_W2VGLOVE_path, so MEAN_FT_W2VGLOVE and
# MEAN_GLOVE_W2VGLOVE ended up holding the same file. The matching constant
# for this variable is MEAN_FT_W2VGLOVE_path.
MEAN_FT_W2VGLOVE = load_embedding(
    MEAN_FT_W2VGLOVE_path,
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# MEAN_GLOVE_W2VGLOVE from MEAN_GLOVE_W2VGLOVE_path, restricted to
# dataset_vocab, no normalization.
MEAN_GLOVE_W2VGLOVE = load_embedding(
    MEAN_GLOVE_W2VGLOVE_path,
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
#E = load_embedding(UKB_path, lower =False, vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False)
#E.length_normalize()
#(results_to_csv(evaluate_on_all(E,lowercase_dataset=True),printRes=True,returnRes=True),'UKB')
# Evaluate E on lower-cased datasets without printing, keep the two values
# returned by results_to_csv, and export them under the name 'UKB'.
# NOTE(review): the line that loads E just above is commented out, so E must
# already be bound by some other cell before this runs.
a, b = results_to_csv(
    evaluate_on_all(E, lowercase_dataset=True),
    printRes=False,
    returnRes=True,
)
export_to_csv(
    txtResults=a,
    txtCov=b,
    name='UKB',
)

In [None]:
# Set of N1's words after lower-casing (no unicode conversion).
# standarize_words rewrites the list it receives in place; whether that also
# alters N1 depends on what N1.words returns, which is not visible here.
v = set(
    standarize_words(
        N1.words,
        unicode=False,
        lower=True,
    )
)

In [None]:
# N1 / N2: the two vecmap "Orto" outputs, loaded with identical options
# (no vocabulary passed, no normalization).
N1 = load_embedding(
    '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/FTL1rm.Jointc-FTr.Orto.TXT',
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)
N2 = load_embedding(
    '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/UKBrm.Jointc-UKBr.Orto.TXT',
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)
#N3 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/Jointc.Jointc-LEXVEC.Orto.TXT', vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#N4 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/LEXVEC.Jointc-LEXVEC.Orto.TXT', vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#N5 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/NUMBERBATCH_N.Jointc-NUMBERBATCH.Orto.TXT', vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#N6 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/Normalized/JOINTC-HYB-ENES-retro.NORMALIZED.Vecmap.TXT', vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#N7 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/jointcHYB_retro_ppdb.txt', vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)

#N8 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/FTL1rm.Jointc-FTr.Orto.TXT', vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#N9 = 
#N10 =


#N1.mean_center()
#N2.mean_center()
#N3.mean_center()
#N4.mean_center()
#N5.mean_center()


#from sklearn.preprocessing import StandardScaler
#scaler = StandardScaler()
#scaler.fit(N1.vectors)
#scaler.fit(N1.vectors)
#scaler.fit(N1.vectors)
#scaler.fit(N1.vectors)
#N2.vectors = scaler.transform(N2.vectors)


In [None]:

# Combine N1 and N2 with avg_embeddings (method "ignore", generate_method
# 'cosine'); where="return" is requested and the result is kept in `a`.
a = avg_embeddings(
    [N1, N2],
    path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/FTrm+UKBrm_genC.vec',
    vocabulary=None,
    method="ignore",
    generate_method='cosine',
    where="return",
)

#N = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/FTrm+UKBrm_genC.vec', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)


#N.L1_dimensionwwise()
# Evaluate `a` on lower-cased datasets and pass the scores to results_to_csv.
results_to_csv(
    evaluate_on_all(
        a,
        lowercase_dataset=True,
    )
)

In [None]:
# Multithreaded variant of the N1/N2 combination: method "generate" with
# generate_method 'cosine' and k=10, no explicit weights.
a = avg_embeddings_generate_multithread(
    [N1, N2],
    path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/FTrm+UKBrm_genC',
    vocabulary=None,
    weights=None,
    method="generate",
    generate_method='cosine',
    k=10,
)


In [None]:
# Load the two retrofitted embeddings used by the following cells.
# Fixed: the first result used to be bound to `list_embsE1`, while every
# later use (evaluation and export) refers to `E1`.
E1 = load_embedding(
    '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/UKB_retro_ppdb.txt',
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)
#E1.L1_dimensionwwise()
E2 = load_embedding(
    '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/ft_retro_ppdb.txt',
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)
#E2.L1_dimensionwwise()

In [None]:
# Score E1 and E2 jointly with evaluate_on_all_avg on lower-cased datasets.
results_to_csv(
    evaluate_on_all_avg(
        [E1, E2],
        lowercase_dataset=True,
    )
)

In [None]:
# Write E1 and E2 back out. The targets are the same two files that the
# loading cell above reads (UKB_retro_ppdb.txt / ft_retro_ppdb.txt), so this
# overwrites the inputs.
E1.export('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/UKB_retro_ppdb.txt')
E2.export('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/ft_retro_ppdb.txt')

In [None]:
# Load all eight base embeddings. Everything except GLOVE is restricted to
# dataset_vocab; GLOVE passes no vocabulary and is the only one with
# dimension-wise normalization enabled. SKE keeps 100 dimensions.
GLOVE = load_embedding(
    GLOVE_CC_840_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=True, delete_duplicates=True, dims_restriction=300,
)
W2V = load_embedding(
    W2V_path, vocabulary=dataset_vocab, format='bin',
    length_normalize=False, normalize_dimensionwise=False,
)
FT = load_embedding(
    FastText_CC_path, vocabulary=dataset_vocab, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
# Fixed: the path argument used to be `jointcHYB` (the variable being
# assigned) instead of the jointcHYB_path constant.
jointcHYB = load_embedding(
    jointcHYB_path, vocabulary=dataset_vocab, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
UKB = load_embedding(
    UKB_path, vocabulary=dataset_vocab, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
LEXVEC = load_embedding(
    lexvec, vocabulary=dataset_vocab, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
SKE = load_embedding(
    SketchEngine_web_path, vocabulary=dataset_vocab, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=100,
)
# Fixed: same slip as above — `PDC` was passed where PDC_path is meant.
PDC = load_embedding(
    PDC_path, vocabulary=dataset_vocab, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)

In [None]:
# Score GLOVE alone through evaluate_on_all_avg; [1] is passed as the second
# positional argument.
results_to_csv(
    evaluate_on_all_avg(
        [GLOVE],
        [1],
    )
)

In [None]:
# Embeddings to combine, plus one weight per embedding. The weights are only
# consumed by the averaging call, which is currently disabled.
embs = [FT, jointcHYB, UKB, LEXVEC, GLOVE, W2V, SKE, PDC]
weights = list(range(8, 0, -1))  # [8, 7, 6, 5, 4, 3, 2, 1]

#A = avg_embeddings(embs, weights=weights, method = "ignore", where="return")
C = concatenate_embeddings(
    embs,
    method="zeros",
    where="return",
)
print("AVG")
#results_to_csv(evaluate_on_all(A))
print("CONCAT")
results_to_csv(
    evaluate_on_all(C)
)

In [None]:
# Unbind GLOVE from the notebook namespace; raises NameError if GLOVE is not
# currently defined.
del GLOVE

In [None]:
# GLOVE from the GLOVE.CC.L2Normalized.WHEADER.vec file, restricted to
# dataset_vocab; no further normalization is requested at load time.
GLOVE = load_embedding(
    '/media/iker/My Book/TFG/Glove/GLOVE.CC.L2Normalized.WHEADER.vec',
    vocabulary=dataset_vocab,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)

In [None]:
# Unbind the combined embeddings A and C, in that order.
# NOTE(review): in the cell that builds C, the assignment to A is commented
# out, so unless A is bound elsewhere this stops with NameError before C is
# removed.
del A, C

In [None]:
# Load each base embedding (no vocabulary passed), export it to the
# Emb_preprocesing folder, and unbind it before loading the next one so only
# one embedding is held at a time. The second argument of export() is False
# in every call.
GLOVE = load_embedding(
    GLOVE_CC_840_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=True, delete_duplicates=True, dims_restriction=300,
)
GLOVE.export('/media/iker/My Book/TFG/Emb_preprocesing/GLOVE.vec', False)
del GLOVE

W2V = load_embedding(
    W2V_path, vocabulary=None, format='bin',
    length_normalize=False, normalize_dimensionwise=False,
)
W2V.export('/media/iker/My Book/TFG/Emb_preprocesing/W2V.vec', False)
del W2V

FT = load_embedding(
    FastText_CC_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
FT.export('/media/iker/My Book/TFG/Emb_preprocesing/FT.vec', False)
del FT

# Fixed: the path argument used to be `jointcHYB` (the variable being
# assigned) instead of the jointcHYB_path constant.
jointcHYB = load_embedding(
    jointcHYB_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
jointcHYB.export('/media/iker/My Book/TFG/Emb_preprocesing/jointcHYB.vec', False)
del jointcHYB

UKB = load_embedding(
    UKB_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
UKB.export('/media/iker/My Book/TFG/Emb_preprocesing/UKB.vec', False)
del UKB

LEXVEC = load_embedding(
    lexvec, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
LEXVEC.export('/media/iker/My Book/TFG/Emb_preprocesing/LEXVEC.vec', False)
del LEXVEC

SKE = load_embedding(
    SketchEngine_web_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=100,
)
SKE.export('/media/iker/My Book/TFG/Emb_preprocesing/SKE.vec', False)
del SKE

# Fixed: same slip as above — `PDC` was passed where PDC_path is meant.
PDC = load_embedding(
    PDC_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
PDC.export('/media/iker/My Book/TFG/Emb_preprocesing/PDC.vec', False)
del PDC

In [None]:
# Concatenate `embs` (method "zeros") with where="file" and the target path
# /home/concat.vec.
# Fixed: the statement ended with a stray ':' which made the cell a SyntaxError.
concatenate_embeddings(
    embs,
    path='/home/concat.vec',
    vocabulary=None,
    method="zeros",
    where="file",
)

In [None]:
#FT = load_embedding(FastText_CC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#joint = load_embedding(jointcHYB, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#concatenate_embeddings([FT,joint], path='/media/iker/My Book/TFG/Concatenated/FT+joint.vec', vocabulary = None, method="zeros",where="file")
#del joint
#
#UKB = load_embedding(UKB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#concatenate_embeddings([FT,UKB], path='/media/iker/My Book/TFG/Concatenated/FT+UKB.vec', vocabulary = None, method="zeros",where="file")
#del UKB

#LEXVEC = load_embedding(lexvec, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#concatenate_embeddings([FT,LEXVEC], path='/media/iker/My Book/TFG/Concatenated/FT+LEXVEC.vec', vocabulary = None, method="zeros",where="file")
#del LEXVEC

#GLOVE = load_embedding(GLOVE_CC_840_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=True, delete_duplicates=True, dims_restriction=300)
#concatenate_embeddings([FT,GLOVE], path='/media/iker/My Book/TFG/Concatenated/FT+GLOVE.vec', vocabulary = None, method="zeros",where="file")

## Reduce dimensionality
def _reduce_concatenated(stem, reducer, tag):
    """Load Concatenated/<stem>.vec, reduce it to 300 dims, export the result.

    Args:
        stem: file name without extension, e.g. 'FT+UKB'.
        reducer: callable taking (vectors, 300) and returning the reduced
            matrix (algo, PCA or T_SVD).
        tag: suffix used in the output name '<stem>_<tag>.vec'.
    """
    base = '/media/iker/My Book/TFG/Concatenated/' + stem
    # The file is re-read for every reducer so each one starts from the
    # original 600-dimensional vectors.
    E = load_embedding(
        base + '.vec', vocabulary=None, length_normalize=False,
        normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=600,
    )
    E.vectors = reducer(E.vectors, 300)
    E.export(base + '_' + tag + '.vec')


# Replaces twelve copy-pasted load/reduce/export stanzas. Output file names
# are unchanged, including the upper-case "ALGO300" that only the FT+joint
# run uses.
for _stem, _algo_tag in (
    ('FT+joint', 'ALGO300'),
    ('FT+UKB', 'algo300'),
    ('FT+LEXVEC', 'algo300'),
    ('FT+GLOVE', 'algo300'),
):
    for _tag, _reducer in ((_algo_tag, algo), ('PCA300', PCA), ('SVD300', T_SVD)):
        _reduce_concatenated(_stem, _reducer, _tag)
###





In [None]:
# Step 1: build the W2V+joint concatenation on disk.
W2V = load_embedding(
    W2V_path, vocabulary=None, format='bin',
    length_normalize=False, normalize_dimensionwise=False,
)
# Fixed: the path argument used to be `jointcHYB` (an embedding variable in
# other cells, or undefined) instead of the jointcHYB_path constant.
joint = load_embedding(
    jointcHYB_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
concatenate_embeddings(
    [W2V, joint],
    path='/media/iker/My Book/TFG/Concatenated/W2V+joint.vec',
    vocabulary=None,
    method="zeros",
    where="file",
)
del W2V
del joint

# Step 2: reduce the concatenation to 300 dims with each reducer. The file is
# re-read every time so each reducer starts from the original vectors.
for _tag, _reducer in (('algo300', algo), ('PCA300', PCA), ('SVD300', T_SVD)):
    E = load_embedding(
        '/media/iker/My Book/TFG/Concatenated/W2V+joint.vec',
        vocabulary=None, length_normalize=False, normalize_dimensionwise=False,
        delete_duplicates=True, dims_restriction=600,
    )
    E.vectors = _reducer(E.vectors, 300)
    E.export('/media/iker/My Book/TFG/Concatenated/W2V+joint_' + _tag + '.vec')
    del E


In [None]:
# Write the vecmap dictionaries that pair FT with LEXVEC, PDC and jointcHYB.
# FT stays loaded for the whole cell; each partner is unbound after use.
FT = load_embedding(
    FastText_CC_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
LEXVEC = load_embedding(
    lexvec, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
generate_dictionary_for_vecmap(FT, LEXVEC, '/media/iker/My Book/TFG/vecmap_results/vocab/FT.LEXVEC.dic', return_dict=False)

del LEXVEC

# Fixed: `PDC` was passed as the path; the file location is PDC_path.
PDC = load_embedding(
    PDC_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
generate_dictionary_for_vecmap(FT, PDC, '/media/iker/My Book/TFG/vecmap_results/vocab/FT.PDC.dic', return_dict=False)
del PDC

# Fixed: `jointcHYB` was passed as the path; the file location is
# jointcHYB_path.
jointcHYB = load_embedding(
    jointcHYB_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
generate_dictionary_for_vecmap(FT, jointcHYB, '/media/iker/My Book/TFG/vecmap_results/vocab/FT.jointcHYB.dic', return_dict=False)
del jointcHYB


In [None]:
# Write the vecmap dictionaries that pair jointcHYB with FT, GLOVE, UKB, W2V
# and LEXVEC. jointcHYB stays loaded for the whole cell; each partner is
# unbound after use.
# Fixed: the path argument used to be `jointcHYB` (the variable being
# assigned) instead of the jointcHYB_path constant.
jointcHYB = load_embedding(
    jointcHYB_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
FT = load_embedding(
    FastText_CC_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
generate_dictionary_for_vecmap(jointcHYB, FT, '/media/iker/My Book/TFG/vecmap_results/vocab/jointcHYB.FT.dic', return_dict=False)
del FT

GLOVE = load_embedding(
    GLOVE_CC_840_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=True, delete_duplicates=True, dims_restriction=300,
)
generate_dictionary_for_vecmap(jointcHYB, GLOVE, '/media/iker/My Book/TFG/vecmap_results/vocab/jointcHYB.GLOVE.dic', return_dict=False)
del GLOVE

UKB = load_embedding(
    UKB_path, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
generate_dictionary_for_vecmap(jointcHYB, UKB, '/media/iker/My Book/TFG/vecmap_results/vocab/jointcHYB.UKB.dic', return_dict=False)
del UKB


W2V = load_embedding(
    W2V_path, vocabulary=None, format='bin',
    length_normalize=False, normalize_dimensionwise=False,
)
generate_dictionary_for_vecmap(jointcHYB, W2V, '/media/iker/My Book/TFG/vecmap_results/vocab/jointcHYB.W2V.dic', return_dict=False)
del W2V

LEXVEC = load_embedding(
    lexvec, vocabulary=None, length_normalize=False,
    normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300,
)
generate_dictionary_for_vecmap(jointcHYB, LEXVEC, '/media/iker/My Book/TFG/vecmap_results/vocab/jointcHYB.LEXVEC.dic', return_dict=False)
del LEXVEC


In [None]:
# N1 / N2: the two "Normalized" vecmap outputs (UKB first, FT second), loaded
# with identical options (no vocabulary passed, no normalization).
N1 = load_embedding(
    '/media/iker/My Book/TFG/vecmap_results/Normalized/UKB.NORMALIZED.Vecmap.TXT',
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)
N2 = load_embedding(
    '/media/iker/My Book/TFG/vecmap_results/Normalized/FT.NORMALIZED.Vecmap.TXT',
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)
#D1 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/Jointc.Jointc-FT.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#D2 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/FT.Jointc-FT.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#O1 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/Jointc.Jointc-FT.Orto.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#O2 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/FT.Jointc-FT.Orto.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)

In [None]:
print("Result from vecmap 1:")
results_to_csv(evaluate_on_all(D1))
print(" ")

In [None]:
    
print("Result from vecmap 2:")
results_to_csv(evaluate_on_all(D2))
print(" ")

In [None]:
print("Normalization vecmap 1:")
results_to_csv(evaluate_on_all(N1))
print(" ")
    

In [None]:
print("Normalization vecmap 2:")
results_to_csv(evaluate_on_all(N2))

In [None]:
print("Similarity AVG D:")
results_to_csv(evaluate_on_all_avg([D1,D2]))

In [None]:
print("Similarity AVG Orto:")
results_to_csv(evaluate_on_all_avg([N1,N2]))

In [None]:
print("Average")
avg = avg_embeddings([N1,N2], method = "ignore", where="return")
results_to_csv(evaluate_on_all(avg))

In [None]:
print("Concatenate")
concat = concatenate_embeddings([N1,N2], method = "skip", where="return")
results_to_csv(evaluate_on_all(concat))

In [None]:
print("D Mean")
avg = avg_embeddings([D1,D2], method = "ignore", where="return")
results_to_csv(evaluate_on_all(avg))

In [None]:
print("D Concat")
concat = concatenate_embeddings([D1,D2], method = "zeros", where="return")
results_to_csv(evaluate_on_all(concat))

In [None]:
print("Orto Mean")
avg = avg_embeddings([O1,O2], method = "ignore", where="return")
results_to_csv(evaluate_on_all(avg))

In [None]:
print("Orto Concat")

In [None]:
concat = concatenate_embeddings([O1,O2], method = "zeros", where="return")
results_to_csv(evaluate_on_all(concat))

In [None]:
#O1 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/Jointc.Jointc-FT.Orto.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
O2 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/FT.Jointc-FT.Orto.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#O3 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/LEXVEC.Jointc-LEXVEC.Orto.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
O4 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/UKB.Jointc-UKB.Orto.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
O5 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/Numberbatch.Jointc-Numberbatch.Orto.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
O6 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/NUMBERBATCH_N.Jointc-NUMBERBATCH.Orto.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)

In [None]:
O5 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/W2V.Jointc-W2V.Orto.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
O6 = load_embedding('/media/iker/My Book/TFG/vecmap_results/vecmap-master/GLOVE.Jointc-GLOVEL2.Orto.TXT', vocabulary = dataset_vocab, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)


In [None]:
avg = avg_embeddings([O2,O4,O6],weights=[1,1,2], method = "ignore", where="return")
#avg2 = avg_embeddings([O1,O2], method = "ignore", where="return")

#avg = avg_embeddings([avg,Numberbatch], method = "ignore", where="return")
#concat = concatenate_embeddings([avg,Numberbatch], method = "zeros", where="return")


results_to_csv(evaluate_on_all_avg([avg]))

In [None]:
concat = concatenate_embeddings([O2,O4,O5], method = "zeros", where="return")
results_to_csv(evaluate_on_all(concat))

In [None]:
concat = concatenate_embeddings([FT,UKB], method = "skip", where="return")
results_to_csv(evaluate_on_all(concat))

In [None]:
dataset_vocab = get_vocab_simil_all(True)

In [None]:

Retro = load_embedding('/media/iker/My Book/TFG/GoogleNews-vectors-negative300.txt', lower =True, vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=False, dims_restriction=300)
(evaluate_on_all(Retro,lowercase_dataset=True))

In [None]:
Retro.word_to_vector('cd',False)

In [None]:
len(dataset_vocab)

In [None]:
generate_dictionary_for_vecmap(FT, Numberbatch, '/media/iker/My Book/TFG/vecmap_results/vocab/FT.Numberbatch.dic', return_dict = False)


In [None]:
jointcHYB = load_embedding(jointcHYB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
generate_dictionary_for_vecmap(jointcHYB, Numberbatch, '/media/iker/My Book/TFG/vecmap_results/vocab/jointcHYB.Numberbatch.dic', return_dict = False)
del jointcHYB

In [None]:
test_normalization(W2V_path,embformat='bin', dims_restriction = 300, delete_duplicates = True, lowercase_datasets=False)

In [None]:
test_normalization(UKB_path,embformat='text', dims_restriction = 300, delete_duplicates = True, lowercase_datasets=True)

In [None]:
test_normalization(GLOVE_CC_840_path,embformat='text', dims_restriction = 300, delete_duplicates = True, lowercase_datasets=False)

In [None]:
test_normalization(FastText_CC_path,embformat='text', dims_restriction = 300, delete_duplicates = True, lowercase_datasets=False)

In [None]:
test_normalization(lexvec,embformat='text', dims_restriction = 300, delete_duplicates = True, lowercase_datasets=False)

In [None]:
test_normalization(jointcHYB_path,embformat='text', dims_restriction = 300, delete_duplicates = True, lowercase_datasets=True)

In [None]:
test_normalization(SketchEngine_web_path,embformat='text', dims_restriction = 100, delete_duplicates = True, lowercase_datasets=True)

In [None]:
# Stack the X rows and the y values of every entry in `datasets` into dX / dy.
i=1  # stays 1 until the first dataset has been handled, then becomes 2
#del dX
dy = []
for name, data in iteritems(datasets):
    if i == 1:
        # First dataset: dX starts out as its X.
        dX = data.X
        i=2
    else:
        # Every later dataset: append its X to dX along axis 0.
        dX=np.append(dX,data.X,axis=0)
    print(len(data.X))
    # np.append without an axis flattens its inputs, so dy is a flat array.
    dy=np.append(dy,data.y)
    

In [None]:
 for name, data in iteritems(datasets):
        d = {'dataset':name}
        d.update(similarity_emd(emb, data.X, data.y, backoff_embs,lowercase_dataset))
        

In [None]:
dX.shape

In [None]:
len(dy)

In [None]:
embs = [
    ['hola','routube','type',400,'data'],
    ['hola2','routube2','type2',402,'data2']
    
    
]

In [None]:
  embs = {
    'GLOVE' : [1,2],
    'PDC' : [2,3]
  }

In [None]:
names =['a','b','c']

for x in range(len(names)):
        for y in range(x+1,len(names)):
            print(y)

In [None]:
import itertools
list(itertools.permutations([1, 2, 3]))

In [None]:
import itertools

# `combinations` was never imported by name (only the itertools module is) and
# it requires a subset size r.
# NOTE(review): r=2 (all pairs) is an assumption — confirm the intended size.
list(itertools.combinations([1, 2, 3], 2))

In [None]:
stuff = [1, 2, 3,4]
for L in range(1, len(stuff)+1):
    for subset in itertools.combinations(stuff, L):
        print(np.asarray(subset))

In [None]:
import itertools

# Print every ascending index triple (i < j < l) over `stuff`, one array per line.
# itertools.combinations yields the triples in the same lexicographic order as
# three nested range loops would, without hard-coding the nesting depth.
for triple in itertools.combinations(range(len(stuff)), 3):
    print(np.asarray(triple))

In [None]:
test_similarity_avg()

In [None]:
'"'+str(np.array(subset))+'"'

In [None]:
a = ["a","b","c"]
b = ["w","asda","a"]
c = ["a","b","c"]

w = [a,b,c]

In [None]:
v = Vocabulary(["a","b","c","d","e","f","g","h","i","j","k","l","m","n","o","p","q"])
v2 = Vocabulary(["a","kase","c","d","e","f","g","h","i","j","k","l","m","n","o","p","q"])
#v3 = Vocabulary(["qsae","hola","q","ase"])

e1 = Embedding(v, [[1,2],[2,3],[3,4],[4,5],[5,6],[6,7],[7,8],[8,9],[9,10],[10,11],[11,12],[12,13],[13,14],[14,15],[15,16],[16,17],[17,18]])
e2 = Embedding(v2, [[1,2],[100,100],[3,4],[4,5],[5,6],[6,7],[7,8],[8,9],[9,10],[10,11],[11,12],[12,13],[13,14],[14,15],[15,16],[16,17],[17,18]])
#e3 = Embedding(v3, [1,2,3,4])


In [None]:
generate_overlapping_vocab([e1])

In [None]:
np.append([1,2,3],[3,4,5],axis=0)

In [None]:
2.241242/len([1,2,3])

In [None]:
generate_word(e1,[e1,e2],"kase",overlapping_vocab=None,number_of_words = 10)

In [None]:

UKB = load_embedding(UKB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
FT = load_embedding(FastText_CC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)

In [None]:
#concatenate_embeddings([FT,UKB], path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated/FT+UKB_generated', vocabulary = dataset_min, method="generate",where="file")
avg_embeddings([FT,UKB], path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Mean/FT+UKB_generated', vocabulary = dataset_min, weights=None, method = "generate", where="file")

In [None]:
del UKB
LEXVEC = load_embedding(lexvec, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)

In [None]:
concatenate_embeddings([FT,LEXVEC], path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated/FT+LEXVEC_generated', vocabulary = dataset_min, method="generate",where="file")
avg_embeddings([FT,LEXVEC], path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Mean/FT+LEXVEC_generated', vocabulary = dataset_min, weights=None, method = "generate", where="file")

In [None]:
del LEXVEC
jointcHYB = load_embedding(jointcHYB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=False, dims_restriction=300)



In [None]:
concatenate_embeddings([FT,jointcHYB], path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated/FT+jointcHYB_generated', vocabulary = dataset_min, method="generate",where="file")
avg_embeddings([FT,jointcHYB], path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Mean/FT+jointcHYB_generated', vocabulary = dataset_min, weights=None, method = "generate", where="file")

In [None]:
del jointcHYB
del FT

In [None]:
UKB = load_embedding(UKB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
W2V = load_embedding(W2V_path, vocabulary = None, format='bin', length_normalize = False, normalize_dimensionwise=False)

In [None]:
concatenate_embeddings([W2V,UKB], path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated/W2V+UKB_generated', vocabulary = dataset_min, method="generate",where="file")
avg_embeddings([W2V,UKB], path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Mean/W2V+UKB_generated', vocabulary = dataset_min, weights=None, method = "generate", where="file")

In [None]:
del UKB
del W2V

In [None]:
# Load each generated meta-embedding file, evaluate it on all datasets with
# lowercased dataset words, and export the results under the given CSV name.
# Files under Concatenated/ are loaded with dims_restriction=600, files under
# Mean/ with dims_restriction=300.
generated_root = '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/'
generated_runs = [
    # (path relative to generated_root, dims_restriction, CSV name)
    ('Concatenated/FT+UKB_generated', 600, 'FT+UKB generated'),
    # NOTE(review): the other Mean exports use a "u" separator; 'FTmUKB' is
    # kept exactly as it was — confirm whether the "m" is intentional.
    ('Mean/FT+UKB_generated', 300, 'FTmUKB generated'),
    ('Concatenated/FT+LEXVEC_generated', 600, 'FT+LEXVEC generated'),
    ('Mean/FT+LEXVEC_generated', 300, 'FTuLEXVEC generated'),
    ('Concatenated/FT+jointcHYB_generated', 600, 'FT+jointcHYB generated'),
    ('Mean/FT+jointcHYB_generated', 300, 'FTujointcHYB generated'),
    ('Concatenated/W2V+UKB_generated', 600, 'W2V+UKB generated'),
    ('Mean/W2V+UKB_generated', 300, 'W2VuUKB generated'),
]

for rel_path, dims, csv_name in generated_runs:
    # `e`, `a` and `b` stay bound to the last run after the loop, as before.
    e = load_embedding(generated_root + rel_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=False, dims_restriction=dims)
    a,b = results_to_csv(evaluate_on_all(e,lowercase_dataset=True),printRes=False,returnRes=True)
    export_to_csv(txtResults=a, txtCov = b, name=csv_name)

In [None]:
e.words

In [None]:
del e
UKB = load_embedding(UKB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
FT = load_embedding(FastText_CC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
LEXVEC = load_embedding(lexvec, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
jointcHYB = load_embedding(jointcHYB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=False, dims_restriction=300)


In [None]:
# Build the four-way concatenated and averaged embeddings restricted to the
# dataset_min vocabulary; both calls are asked to write to a file (where="file").
concatenate_embeddings([FT,UKB,LEXVEC,jointcHYB], path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated/FT+UKB+LEXVEC+jointcHYB_generated', vocabulary = dataset_min, method="generate",where="file")
# The embeddings must be passed as one list; the opening "[" was missing here.
avg_embeddings([FT,UKB,LEXVEC,jointcHYB], path='/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Mean/FT+UKB+LEXVEC+jointcHYB_generated', vocabulary = dataset_min, weights=None, method = "generate", where="file")

In [None]:
# Drop the four source embeddings before loading the generated files.
del UKB
del FT
del LEXVEC
del jointcHYB

# Evaluate the four-way concatenation and export its results.
# NOTE(review): the two-way concatenations in this notebook are loaded with
# dims_restriction=600; 300 looks low for a four-way concatenation — confirm.
e = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated/FT+UKB+LEXVEC+jointcHYB_generated', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=False, dims_restriction=300)
a,b = results_to_csv(evaluate_on_all(e,lowercase_dataset=True),printRes=False,returnRes=True)
export_to_csv(txtResults=a, txtCov = b, name='FT+UKB+LEXVEC+jointcHYB_generated')

# Evaluate the four-way average and export its results.
e = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Mean/FT+UKB+LEXVEC+jointcHYB_generated', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=False, dims_restriction=300)
a,b = results_to_csv(evaluate_on_all(e,lowercase_dataset=True),printRes=False,returnRes=True)
export_to_csv(txtResults=a, txtCov = b, name='FTuUKBuLEXVECujointcHYB_generated')

In [None]:
e = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated/FT+UKB+LEXVEC+jointcHYB_generated', vocabulary = None, length_normalize = False, normalize_dimensionwise=False)


In [None]:
a = set([1,2,3,4,45,6,1,2,3,3,3,3,3,3,3,3,88,1,2,11])

In [None]:
for w in a:
    print(w)

In [None]:
# Load the retrofitted jointcHYB embedding (duplicates removed, 300 dims) and
# hand it to Retro.export.
Retro = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/jointcHYB_retro_ppdb.txt', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
# NOTE(review): the path below ends in " -o JOINTC-HYB-ENES-retro.NORMALIZED.Vecmap.TXT",
# which looks like a pasted command-line fragment rather than part of a file
# name — confirm the intended output path.
Retro.export('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra-2.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/jointcHYB_retro_ppdb.txt -o JOINTC-HYB-ENES-retro.NORMALIZED.Vecmap.TXT')

In [None]:
FT = load_embedding(FastText_CC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
UKB = load_embedding(UKB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)

In [None]:
merge_vocab_generator(UKB,[FT],path='/home/iker/Escritorio/Meta/Res/UKBwFT',vocab=dataset_min, method = 'cosine', k = 10)
merge_vocab_generator(FT,[UKB],path='/home/iker/Escritorio/Meta/Res/FTwUKB',vocab=dataset_min, method = 'cosine', k = 10)


In [None]:
FT = load_embedding('/home/iker/Escritorio/Meta/Res/FTwUKB.vec', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
UKB = load_embedding('/home/iker/Escritorio/Meta/Res/UKBwFT.vec', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)

In [None]:
results_to_csv(evaluate_on_all_avg([FT,UKB], lowercase_dataset=True))

In [None]:
GLOVE = load_embedding(GLOVE_CC_840_path, vocabulary = None, length_normalize = True, normalize_dimensionwise=True, delete_duplicates=True, dims_restriction=300)
W2V = load_embedding(W2V_path, vocabulary = dataset_min, format='bin', length_normalize = True, normalize_dimensionwise=False)
FT = load_embedding(FastText_CC_path, vocabulary = dataset_min, length_normalize = True, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
jointcHYB = load_embedding(jointcHYB_path, vocabulary = dataset_min, length_normalize = True, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
UKB = load_embedding(UKB_path, vocabulary = dataset_min, length_normalize = True, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
LEXVEC = load_embedding(lexvec, vocabulary = dataset_min, length_normalize = True, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
SKE = load_embedding(SketchEngine_web_path, vocabulary = dataset_min, length_normalize = True, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=100)
PDC = load_embedding(PDC_path, vocabulary = dataset_min, length_normalize = True, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    

In [None]:
UKB = load_embedding(UKB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#FT = load_embedding(FastText_CC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)


In [None]:
c = concatenate_embeddings([UKB,UKB], path='/home/concat.vec', vocabulary = dataset_min, method="generate",generate_method='cosine',k=10,where="return",normalize=True)
    

In [None]:
results_to_csv(evaluate_on_all(c, lowercase_dataset=True))

In [None]:
test_concat_avg()

In [None]:
W2V.word_to_vector('Animalize')

In [None]:
def normalize_vector(vector, norm='l2'):
    """Return *vector* rescaled to unit norm.

    Args:
        vector: One-dimensional sequence of numbers.
        norm: Norm name forwarded to sklearn's ``normalize``. Defaults to
            ``'l2'``, which is what the one-argument form always used, so
            existing ``normalize_vector(v)`` calls behave as before while
            ``normalize_vector(v, 'l2')`` is now accepted too.

    Returns:
        The first row of the normalized matrix, i.e. the normalized vector.
    """
    # normalize() is applied to a matrix, so present the vector as a single
    # row of len(vector) columns and unwrap that row afterwards.
    vector = np.asarray(vector).reshape(-1,len(vector))
    return normalize(vector,norm=norm)[0]



In [None]:
a1 = normalize_vector([100,100])
b1 = normalize_vector([100,100])
a2 = normalize_vector([1,0])
b2 = normalize_vector([0,1])

c1 = np.append(a1,a2)
c2 = np.append(b1,b2)

In [None]:
a1 = [1,0.5]
b1 = [1*100,0.6*100]
a2 = [1,0.55]
b2 = [1,1]
a3 = [1.1, 0.55]
b3 = [0.9*100,0.6*100]

In [None]:
calculate_cosine_simil(np.append(a1,a2), np.append(b1,b2))

In [None]:
np.dot(np.append(a1,a2), np.append(b1,b2))

In [None]:
np.linalg.norm(c1)*np.linalg.norm(c2)

In [None]:
(pow(a1[0],2)+pow(a1[1],2))

In [None]:
print(calculate_cosine_simil([100,100],[100,100]))
print(calculate_cosine_simil([1,0],[0,1]))

In [None]:
calculate_cosine_simil(np.mean([a1,a2],axis=0), np.mean([b1,b2],axis=0))

In [None]:
calculate_cosine_simil(np.append(a1,np.append(a2,a3)), np.append(b1,np.append(b2,b3)))

In [None]:
cosine_2(np.append(a1,np.append(a2,a3)), np.append(b1,np.append(b2,b3)))

In [None]:
calculate_cosine_simil(a3,b3)

In [None]:
np.mean([a1,a2],axis=0)

In [None]:
np.mean([b1,b2],axis=0)

In [None]:
a1

In [None]:
np.append(b1,b2)

In [None]:
cosine_2([1,1,1],[1,9])

In [None]:

def cosine_2(vector1, vector2):
    """Return the dot product of the two vectors after dividing each by its norm."""
    unit1 = vector1 / np.linalg.norm(vector1)
    unit2 = vector2 / np.linalg.norm(vector2)
    return np.dot(unit1, unit2)
    

In [None]:
normalize_vector(np.append(b1,np.append(b2,b3)))

In [None]:
np.append(b1,np.append(b2,b3))

In [None]:
a1.reshape(3,)

In [None]:
normalize_vector(UKB.vectors[1]).shape

In [None]:
normalize_vector(UKB.vectors[1])[0]

In [None]:
m = avg_embeddings([UKB,FT], path='/home/avg.vec', vocabulary = dataset_min, weights=None, method = "ignore",generate_method='cosine',k=10, where="return")
    

In [None]:
results_to_csv(evaluate_on_all(m, lowercase_dataset=True))

In [None]:
test_dim_reduction()

In [None]:
#GLOVE = load_embedding(GLOVE_CC_840_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=True, delete_duplicates=True, dims_restriction=300)
#W2V = load_embedding(W2V_path, vocabulary = None, format='bin', length_normalize = False, normalize_dimensionwise=False)
#FT = load_embedding(FastText_CC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#jointcHYB = load_embedding(jointcHYB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#UKB = load_embedding(UKB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#LEXVEC = load_embedding(lexvec, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
SKE = load_embedding(SketchEngine_web_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=100)
PDC = load_embedding(PDC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)




In [None]:
def test_l(emb):
    l = 0
    i = 0 
    
    for w in emb.vectors:
        l+= np.linalg.norm(w)
        i+=1
    
    return l/i


print('GLOVE: ' + str(test_l(GLOVE)))
print('W2V: ' + str(test_l(W2V)))
print('FT: ' + str(test_l(FT)))
print('jointcHYB: ' + str(test_l(jointcHYB)))
print('UKB: ' + str(test_l(UKB)))
print('LEXVEC: ' + str(test_l(LEXVEC)))

In [None]:
print('SKE: ' + str(test_l(SKE)))
print('PDC: ' + str(test_l(PDC)))

In [None]:
test_concatenate_auto([GLOVE,jointcHYB],['GLOVE','jointcHYB','"[50,1]"'],[50,1])
test_concatenate_auto([GLOVE,jointcHYB],['GLOVE','jointcHYB','"[25,1]"'],[25,1])
test_concatenate_auto([GLOVE,jointcHYB],['GLOVE','jointcHYB','"[100,1]"'],[100,1])

test_concatenate_auto([GLOVE,UKB],['GLOVE','UKB','"[50,1]"'],[50,1])
test_concatenate_auto([GLOVE,UKB],['GLOVE','UKB','"[25,1]"'],[25,1])
test_concatenate_auto([GLOVE,UKB],['GLOVE','UKB','"[100,1]"'],[100,1])
   

In [None]:
test_concatenate_auto([GLOVE,jointcHYB],['GLOVE','jointcHYB','"[408.272727273,1]"'],[408.272727273,1])
test_concatenate_auto([W2V,UKB],['W2V','UKB','"[2.41470588235,1]"'],[2.41470588235,1])
test_concatenate_auto([LEXVEC,jointcHYB],['LEXVEC','jointcHYB','"[1.69343891403,1]"'],[1.69343891403,1])
test_concatenate_auto([LEXVEC,UKB],['LEXVEC','UKB','"[1.85746606335,1]"'],[1.85746606335,1])
test_concatenate_auto([LEXVEC,FT],['LEXVEC','FT','"[2.24660633484,1]"'],[2.24660633484,1])


In [None]:
test_concatenate_auto([LEXVEC,FT],['LEXVEC','FT','"[2.24660633484,1]"'],[2.24660633484,1])

In [None]:
test_retro('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/Results2/')

In [None]:
directory = os.fsencode('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/Results2/prueba.txt')
# os.fsdecode turns the bytes basename back into str. Slicing the bytes repr
# (str(b)[2:-1]) would print escape sequences for any non-ASCII file name.
print(os.fsdecode(os.path.basename(directory)))

In [None]:
print_variables()

In [None]:
# Print asizeof.asizeof(obj) / 1024 for every variable in the current namespace
# except `asizeof` itself.
# The namespace is snapshotted with list() first: the loop binds `name` and
# `obj` in that same namespace, and adding keys to a dict while iterating it
# raises "RuntimeError: dictionary changed size during iteration".
for name, obj in list(locals().items()):
    if name != 'asizeof':
        print(asizeof.asizeof(obj) / 1024)

In [None]:
test_reduction2('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated/')

In [None]:
 os.fsencode('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated')

In [None]:
with open('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated/W2V + jointcHYB.vec') as f:
        first_line = f.readline()
        first_line = first_line.split(' ')
        d = int(first_line[1])

In [None]:
normalize_vector([1,2,3,4],'l2')

In [None]:
test_concat_avg()

In [None]:
np.linalg.norm([0.0757194,-0.0995169,-0.0203361,0.0117365,0.0259609,-0.0307204,-0.123747,-0.0287734,0.0995169,0.113363,0.036778,-0.0969208,-0.046297,-0.0302878,-0.013954,-0.0179563,-0.0305041,0.0443499,0.0244465,-0.0385087,-0.00603051,-0.0878345,-0.0273672,-0.0305041,0.0091945,-0.0899979,-0.0597101,-0.0722579,-0.0233648,0.0324512,0.112497,0.0188217,-0.028557,0.0222831,-0.0346146,0.0683638,0.074854,-0.0517055,0.0657677,-0.0454316,0.00762602,0.109469,0.0614409,-0.0254201,0.0105466,-0.0521382,0.0465133,-0.0527872,0.0395904,0.0488931,-0.00827505,-0.0467297,0.0224995,-0.00973535,0.028557,0.0471624,-0.0739887,0.0644697,0.0164419,0.0298551,-0.0861038,0.0631716,-0.0134131,0.028557,-0.0294224,0.00773419,0.0174155,-0.0696618,-0.0395904,0.0826423,-0.0886999,0.0393741,-0.128074,0.0203361,-0.0491094,-0.0398068,-0.0460807,-0.0791808,-0.038076,-0.0636043,-0.083075,-0.0982189,-0.112497,-0.0791808,-0.0588448,-0.0835077,-0.0947574,0.0960554,-0.0908633,-0.0674984,0.109469,-0.0696618,-0.0170909,-0.0108171,-0.010168,-0.00627389,0.0369943,0.036129,0.0255283,0.0670657,0.074854,0.0562487,0.0385087,-0.100382,0.11769,0.0121151,-0.0679311,0.0137917,0.0636043,0.123747,0.0235812,-0.0213096,0.0191462,0.0657677,-0.0307204,-0.000358315,-0.0666331,-0.0415375,0.0744213,0.0137917,-0.0588448,-0.0227158,-0.0315858,-0.0350473,0.148843,-0.00908633,0.00320455,0.0488931,-0.0253119,-0.0497585,0.0162256,0.0454316,0.0271508,0.0229322,-0.0400231,-0.0141703,-0.0584121,-0.0382924,0.0131427,-0.0465133,-0.0443499,-0.0232567,-0.0311531,-0.0709599,0.0107089,-0.0149275,0.0662004,-0.0666331,0.0208769,-0.0713926,0.156631,0.0575467,-0.0605755,0.0201197,0.0201197,0.00930267,-0.0236894,0.0458643,0.0791808,0.110334,-0.027908,0.0692292,0.00838322,0.13067,0.0122233,-0.0636043,-0.0168746,-0.0207687,0.11769,0.0908633,0.0426192,0.00581417,-0.0018389,-0.0679311,-0.0348309,-0.105574,0.00212285,-0.036778,0.0189298,-0.108603,-0.0016834,0.0597101,-0.0171991,-0.0917286,-0.0218505,-0.0666331,0.0631716,0.0106548,0.0943247,0.0140622,-0.
0549506,0.022824,-0.0426192,-0.110767,0.00508402,-0.0157929,-0.0553833,-0.0391577,0.00757194,-0.0426192,0.0904306,-0.00109523,-0.00632798,0.0421865,0.0471624,-0.0506238,0.0783155,0.0255283,-0.019038,-0.0796135,-0.0904306,0.0493258,0.0623062,-0.0271508,0.0175236,0.0783155,-0.00800462,-0.0199034,-0.14192,0.0124937,-0.0501911,0.0402394,0.00224454,-0.0218505,-0.0212014,-0.0597101,-0.0136836,0.0333165,0.0904306,0.0181727,-0.0744213,-0.0307204,0.0326675,0.0311531,-0.0255283,-0.104709,-0.0426192,-0.0248792,0.101248,-0.140189,-0.006977,-0.0389414,-0.0605755,0.0627389,-0.137593,-0.0484604,-0.0106007,0.0200116,0.0395904,-0.0413212,0.0495421,0.00328568,-0.0113038,0.0744213,0.111632,-0.0700945,-0.064037,-0.0128182,-0.0181727,-0.0331002,0.0480277,-0.00822096,0.046297,-0.0601428,0.0426192,0.0215259,-0.0147112,-0.0791808,0.00762602,-0.029206,-0.0761521,0.0411048,-0.0389414,0.0107089,0.0454316,0.0432682,-0.00397527,0.0352636,0.127209,-0.0157929,-0.00951901,0.00402935,-0.0482441,-0.00160904,-0.101248,-0.0311531,0.0162256,0.0040564,0.00106818,-0.00092621,-0.0151439,-0.0243384,0.00578712,-0.0623062,0.0739887,0.0178481,0.0800462,-0.0391577,0.131535,-0.0250956])

In [None]:
#FTo = load_embedding(FastText_CC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)   
FTretroWN = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/Results/FT_retro_WN+.txt', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)   
FTretroWNs = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/Results/FT_retro_WN.txt', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)   

ftretroPPDB = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/Results/FT_retro_ppdb.txt', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)   


In [None]:
word1 = 'car'
word2 = 'mouse'

In [None]:
calculate_cosine_simil(FTo.word_to_vector(word1),FTo.word_to_vector(word2))

In [None]:
# Compare word1 and word2 inside the same embedding (FTretroWNs), as the
# sibling cells do for FTretroWN and ftretroPPDB; the second lookup previously
# read from FTretroWN.
calculate_cosine_simil(FTretroWNs.word_to_vector(word1),FTretroWNs.word_to_vector(word2))

In [None]:
calculate_cosine_simil(FTretroWN.word_to_vector(word1),FTretroWN.word_to_vector(word2))

In [None]:
calculate_cosine_simil(ftretroPPDB.word_to_vector(word1),ftretroPPDB.word_to_vector(word2))

In [None]:
np.mean(cos_cdist(FTo.vectors,FTo.word_to_vector(word1)))

In [None]:
np.mean(cos_cdist(FTretroWN.vectors,FTretroWN.word_to_vector(word1)))

In [None]:
np.mean(cos_cdist(FTretroWNs.vectors,FTretroWNs.word_to_vector(word1)))

In [None]:
np.mean(cos_cdist(ftretroPPDB.vectors,ftretroPPDB.word_to_vector(word1)))

In [None]:
results_to_csv(evaluate_on_all(ftretroPPDB,lowercase_dataset=True),printRes=True,returnRes=False)
    

In [None]:
results_to_csv(evaluate_on_all(FTretroWNs,lowercase_dataset=True),printRes=True,returnRes=False)
    

In [None]:
# Load the FT_retro_WN+2 embedding restricted to the dataset_min vocabulary,
# without normalisation; the WN+15 variant below is disabled.
FTretroWN2 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/FT_retro_WN+2.txt', vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)   
#FTretroWN15 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/FT_retro_WN+15.txt', vocabulary = dataset_min, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)   


In [None]:
# Evaluate FTretroWN2 with evaluate_on_all (lowercased datasets) and print
# the results through results_to_csv without returning them.
results_to_csv(evaluate_on_all(FTretroWN2,lowercase_dataset=True),printRes=True,returnRes=False)


In [None]:
# Driver cell for the long-running experiment steps. Only the "add reduction"
# step is active; the other steps are kept commented out so they can be
# re-enabled one at a time. `call` is only referenced by the disabled
# script-execution step.
from subprocess import call
#print(str(datetime.datetime.now()) + ' ====> Test test_concat_avg')
#test_concat_avg()
#print(str(datetime.datetime.now()) + ' ====> Run script')
#with open("/home/iker/Escritorio/retro+.script", 'rb') as file:
#    script = file.read()
#rc = call(script, shell=True)
#del rc

#print(str(datetime.datetime.now()) + ' ====> Run test retro')
#test_retro('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/retrofitting-master/Results2/')

# Print a timestamped progress line, then run the reduction step.
print(str(datetime.datetime.now()) + ' ====> Run add reduction')
add__reduction()

#print(str(datetime.datetime.now()) + ' ====> Run test reduction')
#test_reduction2('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated/')


In [None]:
# Run test_reduction2 on the Done/extra directory; the Concatenated run is
# disabled.
#test_reduction2('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/Concatenated/')
test_reduction2('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/Done/extra/')


In [None]:
# Run the reduction step and then test_reduction2 on the ConcatenatedNoL2
# directory, printing a timestamped progress line before each.
print(str(datetime.datetime.now()) + ' ====> Run add reduction')
add__reduction()
print(str(datetime.datetime.now()) + ' ====> Run test reduction')
test_reduction2('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/ConcatenatedNoL2/')


In [None]:
from subprocess import call

In [None]:
def test_l(emb):
    l = 0
    i = 0 
    
    for w in emb.vectors:
        l+= np.linalg.norm(w)
        i+=1
    
    return l/i

In [None]:
# Load the vecmap-mapped (Orto) embeddings. Only the Jointc embedding J is
# loaded here; the other loads are disabled.
#GLOVE = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/GLOVE.FT-GLOVEL2.Orto.TXT', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#FT = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/FT.FT-UKB.Orto.TXT', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#UKB = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/UKB.FT-UKB.Orto.TXT', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#LEXVEC = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/LEXVEC.FT-LEXVEC.Orto.TXT', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
J = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/Jointc.FT-Jointc.Orto.TXT', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)

#N1 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/FTL1rm.Jointc-FTr.Orto.TXT', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#N2 = load_embedding('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/UKBrm.Jointc-UKBr.Orto.TXT', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)


In [None]:
# Drop the previous snapshots and take fresh deep copies of GLOVE, FT and UKB.
# NOTE(review): each `del` raises NameError if the name does not exist yet,
# e.g. the first time this cell is run in a session.
del G
del F
del U


G = deepcopy(GLOVE)
F = deepcopy(FT)
U = deepcopy(UKB)

In [None]:
# Replace each embedding's vector matrix with the output of PPA (defined
# elsewhere in the notebook).
GLOVE.vectors = PPA(GLOVE.vectors)
FT.vectors = PPA(FT.vectors)
UKB.vectors = PPA(UKB.vectors)
J.vectors = PPA(J.vectors)

In [None]:
# Average vector norm (via test_l) of the G, F and U embeddings.
gn = test_l(G)
fn = test_l(F)
un = test_l(U)


In [None]:
# Combine UKB, FT, GLOVE and J with avg_embeddings over the dataset_min
# vocabulary (returned in memory via where="return"), then evaluate the
# result and print the scores.
c = avg_embeddings([UKB,FT,GLOVE,J], path='/home/concat.vec', vocabulary = dataset_min, weights=None, method="generate",generate_method='cosine',k=10,normalize=True, normalize_norm='l1', where="return")
results_to_csv(evaluate_on_all(c,lowercase_dataset=True),printRes=True,returnRes=False)
    

In [None]:
# Unbind the loaded embeddings so their memory can be reclaimed.
# NOTE(review): `del` raises NameError for any name that is not currently
# defined; the N1/N2 loads appear only as commented-out lines in this part of
# the notebook — confirm they exist before running this cell.
del GLOVE
del FT
del UKB
del N1
del N2

In [None]:
# Combine UKB, FT, J and GLOVE with concatenate_embeddings over the
# dataset_min vocabulary (returned in memory via where="return"), then
# evaluate the result and print the scores.
c = concatenate_embeddings([UKB,FT,J,GLOVE], path='/home/concat.vec', vocabulary = dataset_min, weights=None, method="generate",generate_method='cosine',k=10,normalize=True, where="return")
results_to_csv(evaluate_on_all(c,lowercase_dataset=True),printRes=True,returnRes=False)
    

In [None]:
 # Print every line of the `joint` file, decoding as UTF-8 and ignoring
 # undecodable bytes. line_no is bound by enumerate but not used.
 with codecs.open('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/joint', "r",encoding='utf-8', errors='ignore') as fnodes:
        for line_no, line in enumerate(fnodes):
            print(line)

In [None]:
# List the files in the joint(Orto) results directory and print every
# unordered pair of names (each file is also paired with itself).
directory = os.fsencode('/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/joint(Orto)')
files = os.listdir(directory)

# `directory` is bytes, so os.listdir() returns bytes names. Decode them before
# concatenating; str() on bytes would print their repr (b'...') instead of the
# file names.
for x, first in enumerate(files):
    for second in files[x:]:
        print(os.fsdecode(first)+os.fsdecode(second))
        
    

In [None]:
# Materialise every ordering of `files`.
# NOTE(review): without a length argument itertools.permutations yields all
# full-length orderings (len(files)! tuples); if only pairs are wanted, as in
# the pair-printing loop, pass r=2 — confirm intent.
l = list(itertools.permutations(files))

In [None]:
# Display the directory listing.
files

In [None]:
# Run the two vecmap test routines for the Orto variants (defined elsewhere).
test_vecmap_FT_Orto()
test_vecmap_jointcHYB_Orto()


In [None]:
# Run the two vecmap test routines for the non-Orto variants (defined elsewhere).
test_vecmap_FT()
test_vecmap_jointcHYB()

In [None]:
def print_n(normalize):
    """Write ``normalize`` to standard output; scratch helper, returns None."""
    print(normalize)

In [None]:
# Call the scratch helper. The original line had a stray identifier
# (`calculate_cosine_simil`) after the call, which is a SyntaxError.
print_n(False)

In [None]:
# Load the original (unmapped) embeddings from their configured paths. Only
# UKB is loaded here; the other loads are disabled.
#GLOVE = load_embedding(GLOVE_CC_840_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=True, delete_duplicates=True, dims_restriction=300)
#FT = load_embedding(FastText_CC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
   
#W2V = load_embedding(W2V_path, vocabulary = None, format='bin', length_normalize = False, normalize_dimensionwise=False)
#jointcHYB = load_embedding(jointcHYB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
UKB = load_embedding(UKB_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#LEXVEC = load_embedding(lexvec, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#SKE = load_embedding(SketchEngine_web_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=100)
#PDC = load_embedding(PDC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
    

In [None]:
# Signature of generate_word, kept for reference only. The original cell held
# the bare signature with a trailing colon and no `def`, which is a
# SyntaxError when executed.
# generate_word(embedding,list_embs,word,overlapping_vocab=None,overlapping_matrix=None, annoy = None, number_of_words = 10, method = 'cosine')

In [None]:
# Combine FT and UKB with avg_embeddings over the dataset_min vocabulary
# (returned in memory via where="return"), then evaluate the result.
c = avg_embeddings([FT,UKB], path='/home/concat.vec', vocabulary = dataset_min, weights=None, method="generate",generate_method='cosine',k=10,normalize=True, where="return")
results_to_csv(evaluate_on_all(c,lowercase_dataset=True))

In [None]:
# Original GLOVE vectors of three probe words, used as the reference side of
# the comparisons below.
dogo = GLOVE.word_to_vector('dog')
caro = GLOVE.word_to_vector('car')
loveo = GLOVE.word_to_vector('love')

In [None]:
# Remove the word 'car' from UKB while keeping the vector matrix and the
# vocabulary index maps aligned.
i  = UKB.vocabulary.word_to_index('car')
UKB.vectors = np.delete(UKB.vectors,i,0)
del UKB.vocabulary.word_id['car']
# np.delete shifts every row after position i up by one, so every stored
# index greater than i must be decremented; otherwise those words would
# resolve to their neighbour's vector (and the last one would be out of range).
UKB.vocabulary.word_id = {w: (idx - 1 if idx > i else idx) for w, idx in UKB.vocabulary.word_id.items()}
# Rebuild the reverse map from the corrected forward map; this also drops the
# removed word's entry.
UKB.vocabulary.id_word = {idx: w for w, idx in UKB.vocabulary.word_id.items()}

In [None]:
# Small scratch array for experiments.
a = np.asarray([1,2,3,4])

In [None]:
# NOTE(review): assuming GLOVE.vocabulary is a Vocabulary, `words` is a
# property that returns a new list(self.word_id) on each access, so this
# deletes an element from a temporary list and leaves the vocabulary unchanged.
del GLOVE.vocabulary.words[i]

In [None]:
# Display the GLOVE vector of 'love'.
GLOVE.word_to_vector('love')

In [None]:
# Vectors produced by generate_word for the three probe words, using GLOVE as
# the target embedding, [GLOVE, FT] as the embedding list, the 'cosine' method
# and number_of_words = 11.
doge = generate_word(GLOVE,[GLOVE,FT],'dog',overlapping_vocab=None,overlapping_matrix=None, annoy = None, number_of_words = 11, method = 'cosine')
care = generate_word(GLOVE,[GLOVE,FT],'car',overlapping_vocab=None,overlapping_matrix=None, annoy = None, number_of_words = 11, method = 'cosine')
lovee = generate_word(GLOVE,[GLOVE,FT],'love',overlapping_vocab=None,overlapping_matrix=None, annoy = None, number_of_words = 11, method = 'cosine')

In [None]:
def _mean_vector(emb, words):
    """Return the arithmetic mean of the vectors of `words` looked up in `emb`."""
    return sum(emb.word_to_vector(w) for w in words) / len(words)


# Hand-built estimates of 'dog', 'car' and 'love': the mean of the GLOVE
# vectors of ten hand-picked related words each.
doge = _mean_vector(GLOVE, ['dogs', 'puppy', 'Dog', 'pet', 'cat', 'canine', 'puppies', 'terrier', 'pup', 'Dogs'])
care = _mean_vector(GLOVE, ['cars', 'Car', 'vehicle', 'automobile', 'Cars', 'truck', 'vehicles', 'auto', 'driving', 'dealership'])
# The original stored this in `loveee`, so the comparison cell, which reads
# `lovee`, kept using the stale generate_word result for 'love' while 'dog'
# and 'car' used these averages.
lovee = _mean_vector(GLOVE, ['loved', 'loving', 'adore', 'LOVE', 'loves', 'Love', 'luv', 'hope', 'looove', 'loooove'])
# Keep the old (misspelled) name bound for any cell that still refers to it.
loveee = lovee


In [None]:

# Compare each estimated vector with the original GLOVE vector of the word.
print(calculate_cosine_simil(doge,dogo))
print(calculate_cosine_simil(care,caro))
print(calculate_cosine_simil(lovee,loveo))


In [None]:
# Display the UKB vector of 'dog'.
UKB.word_to_vector('dog')

In [None]:
overlapping_vocab[16161]

# Report the position of every row of overlapping_matrix that does not match
# the UKB vector of the word at the same position in overlapping_vocab.
# A single differing component is already a mismatch, so test with any();
# the original all() only fired when every component differed.
for w, word in enumerate(overlapping_vocab):
    if (overlapping_matrix[w]!=UKB.word_to_vector(word)).any():
        print(w)
    # Marker printed once per word.
    print('h')

In [None]:
# Display the UKB vector of 'thickheaded'.
UKB.word_to_vector('thickheaded')

In [None]:
# Display entry 16161 of overlapping_matrix.
overlapping_matrix[16161]

In [None]:
# Query get_top_cosine_scipy with the UKB vector of 'dog' against UKB, k=10.
get_top_cosine_scipy(UKB.word_to_vector('dog'),UKB,k=10)

In [None]:
# Build the overlapping vocabulary and matrix for GLOVE and FT twice: once
# with the list written inline and once through the `embs` variable.
ov = generate_overlapping_vocab([GLOVE,FT])
oe = generate_overlapping_matrix_embs(ov,[GLOVE,FT])

embs = ([GLOVE,FT])
ov2 = generate_overlapping_vocab(embs)
oe2 = generate_overlapping_matrix_embs(ov2,embs)

In [None]:
# Linear scan for the position of the first 'dog' in `a`; if it is absent,
# i ends up equal to the number of items iterated.
i = 0
for w in a:
    if w == 'dog':
        break
    else:
        i+=1

In [None]:
# Overlapping vocabulary computed from UKB alone.
v = generate_overlapping_vocab([UKB])

In [None]:
# Overlapping matrix for the vocabulary `v`, computed from UKB alone.
m = generate_overlapping_matrix_embs(v,[UKB])

In [None]:
# Display the item at position 400 when `v` is listed.
list(v)[400]

In [None]:
# Display `v` as a list.
list(v)

In [None]:
# Display the distinct items of `v` (set order is arbitrary).
list(set(v))

In [None]:
# Display the UKB vector of 'bitumen'.
UKB.word_to_vector('bitumen')

In [None]:
 
    # Collect up to k words of `emb` that belong to overlap_vocab, visiting
    # them in the order given by get_largest_index over the cos_cdist scores
    # against `vector`.
    cos = cos_cdist(emb.vectors,vector)
    index =  get_largest_index(cos)
    top = []
    
    i = 0
    num = 0
    # Use boolean `and`: `&` binds tighter than `<`, so the original condition
    # was evaluated as the chained comparison `i < (len(index) & num) < k`.
    while i < len(index) and num<k:
        # index[i] is the word position for rank i; the original looked up
        # emb.words[i] and always appended emb.words[0].
        if emb.words[index[i]] in overlap_vocab:
            top.append(emb.words[index[i]])
            num+=1
        i+=1
    

In [None]:
# Score every GLOVE vector against the GLOVE vector of 'dog' and get the
# index ordering from get_largest_index.
cos = cos_cdist(GLOVE.vectors,GLOVE.word_to_vector('dog'))
index =  get_largest_index(cos)

In [None]:
# Set of all GLOVE words, for membership tests.
overlap_vocab = set(GLOVE.words)

In [None]:
# Walk the ranked positions in `index` and collect up to 10 GLOVE words that
# are members of overlap_vocab.
i = 0
num = 0
top=[]
while i < len(index) and num<10:
    if GLOVE.words[index[i]] in overlap_vocab:
        top.append(GLOVE.words[index[i]])
        num+=1
    i+=1

In [None]:
# Display the current value of the loop condition used above.
i < len(index) and num<10

In [None]:
# Call get_top_cosine_scipy with the precomputed overlapping vocabulary and
# matrix; all arguments are expected to be defined by earlier cells.
top = get_top_cosine_scipy(vector,emb_n,numer_of_word,overlapping_vocab,overlapping_matrix)

In [None]:
# Collect the vector of every word in overlapping_vocab into one array, one
# entry per word (a 2-D array if word_to_vector returns equal-length 1-D
# vectors — TODO confirm).
# The original was a pasted function body: the indented loop and the bare
# `return` cannot run at top level, and np.append on an empty 1-D list
# concatenated all vectors into a single flat array instead of stacking rows.
matrix = np.array([emb.word_to_vector(w) for w in overlapping_vocab])
matrix

In [None]:
# Experiment: append a list to an empty list with np.append along axis 1.
# NOTE(review): both inputs are 1-D here, so axis=1 is presumably rejected by
# NumPy as out of bounds — confirm.
matrix=[]
matrix = np.append(matrix,[1,2,3,4],axis=1)

In [None]:
# Experiment: building a set from a set; the outer set() call is redundant.
set(set(['hola','que','ase']))

In [None]:
# Experiment: list-style append of one row; requires `matrix` to be a list.
matrix.append([1,2,3,4])

In [None]:
# Display the current value of `matrix`.
matrix

In [22]:

# Directory holding the vecmap-mapped embeddings (FT(Orto) results).
path = '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/FT(Orto)/'

# The mapped GLOVEV/FTV loads are disabled in this cell; the original FT and
# GLOVE embeddings are loaded instead. GLOVE is loaded with
# normalize_dimensionwise=True, FT with it set to False.
#GLOVEV = load_embedding(path+'GLOVE.FT-GLOVEL2.Orto.TXT', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
#FTV = load_embedding(path+'FT.FT-UKB.Orto.TXT', vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
FT = load_embedding(FastText_CC_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=False, delete_duplicates=True, dims_restriction=300)
GLOVE = load_embedding(GLOVE_CC_840_path, vocabulary = None, length_normalize = False, normalize_dimensionwise=True, delete_duplicates=True, dims_restriction=300)




In [38]:
# Probe word for the cross-embedding comparisons below.
word = 'love'

In [39]:
# Score every FT vector against the GLOVE vector of `word` (original,
# unmapped embeddings) and list the FT words at the 10 positions returned by
# get_largest_index.
cos = cos_cdist(FT.vectors,GLOVE.word_to_vector(word))
index =  get_largest_index(cos,10)

top = []
for i in index:
    top.append(FT.words[i])
top

['Clappison',
 '26yo',
 'Lazarowicz',
 'Koosh',
 'Westmacott',
 'Lightbown',
 'Stipetic',
 'Noff',
 'encouaged',
 'Saska']

In [40]:
# Same query using the FTV and GLOVEV embeddings: score every FTV vector
# against the GLOVEV vector of `word` and list the FTV words at the 10
# positions returned by get_largest_index.
cos = cos_cdist(FTV.vectors,GLOVEV.word_to_vector(word))
index =  get_largest_index(cos,10)

top = []
for i in index:
    top.append(FTV.words[i])
top

['love',
 'loving',
 'LOVE',
 'adore',
 'Love',
 'loved',
 'loves',
 'hate',
 'lovers',
 'lover']

In [41]:
# Compare the GLOVE and FT vectors of `word` (original embeddings).
calculate_cosine_simil(GLOVE.word_to_vector(word),FT.word_to_vector(word))

0.00443694

In [42]:
# Compare the GLOVEV and FTV vectors of `word`.
calculate_cosine_simil(GLOVEV.word_to_vector(word),FTV.word_to_vector(word))

0.6899997

In [15]:
# Run test_concat_avg (defined elsewhere in the notebook); its progress bars
# and log lines are the output that follows.
test_concat_avg()

100%|██████████| 3000000/3000000 [00:45<00:00, 66369.10it/s]




100%|██████████| 5846/5846 [06:19<00:00, 15.39it/s]
INFO:root:The new embedding has 5814 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 47563.54it/s]
100%|██████████| 287/287 [00:00<00:00, 61690.42it/s]
100%|██████████| 771/771 [00:00<00:00, 59255.48it/s]
100%|██████████| 2000/2000 [00:00<00:00, 67959.72it/s]
100%|██████████| 1000/1000 [00:00<00:00, 61272.76it/s]
100%|██████████| 3000/3000 [00:00<00:00, 66031.58it/s]
100%|██████████| 353/353 [00:00<00:00, 63095.09it/s]
100%|██████████| 252/252 [00:00<00:00, 60671.87it/s]
100%|██████████| 203/203 [00:00<00:00, 66701.43it/s]
100%|██████████| 153/153 [00:00<00:00, 69639.56it/s]
100%|██████████| 200/200 [00:00<00:00, 55719.75it/s]
100%|██████████| 65/65 [00:00<00:00, 45797.04it/s]
100%|██████████| 144/144 [00:00<00:00, 52841.63it/s]
100%|██████████| 30/30 [00:00<00:00, 22429.43it/s]
100%|██████████| 130/130 [00:00<00:00, 57311.28it/s]
100%|██████████| 3500/3500 [00:00<00:00, 69553.98it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.31it/s]
INFO:root:The new embedding has 5814 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76229.55it/s]
100%|██████████| 287/287 [00:00<00:00, 73409.27it/s]
100%|██████████| 771/771 [00:00<00:00, 72281.64it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75044.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75380.18it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92325.90it/s]
100%|██████████| 353/353 [00:00<00:00, 71467.36it/s]
100%|██████████| 252/252 [00:00<00:00, 74324.21it/s]
100%|██████████| 203/203 [00:00<00:00, 66451.55it/s]
100%|██████████| 153/153 [00:00<00:00, 66902.47it/s]
100%|██████████| 200/200 [00:00<00:00, 72503.09it/s]
100%|██████████| 65/65 [00:00<00:00, 65473.05it/s]
100%|██████████| 144/144 [00:00<00:00, 64321.59it/s]
100%|██████████| 30/30 [00:00<00:00, 49364.11it/s]
100%|██████████| 130/130 [00:00<00:00, 66592.52it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72404.40it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.35it/s]
INFO:root:The new embedding has 5814 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 95431.47it/s]
100%|██████████| 287/287 [00:00<00:00, 73832.51it/s]
100%|██████████| 771/771 [00:00<00:00, 76880.12it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75226.06it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87953.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77291.09it/s]
100%|██████████| 353/353 [00:00<00:00, 91152.45it/s]
100%|██████████| 252/252 [00:00<00:00, 70856.38it/s]
100%|██████████| 203/203 [00:00<00:00, 76335.28it/s]
100%|██████████| 153/153 [00:00<00:00, 74205.42it/s]
100%|██████████| 200/200 [00:00<00:00, 75423.56it/s]
100%|██████████| 65/65 [00:00<00:00, 62948.46it/s]
100%|██████████| 144/144 [00:00<00:00, 74954.06it/s]
100%|██████████| 30/30 [00:00<00:00, 67722.88it/s]
100%|██████████| 130/130 [00:00<00:00, 67191.56it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87270.69it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.38it/s]
INFO:root:The new embedding has 5814 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75723.96it/s]
100%|██████████| 287/287 [00:00<00:00, 67362.35it/s]
100%|██████████| 771/771 [00:00<00:00, 74913.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75086.67it/s]
100%|██████████| 1000/1000 [00:00<00:00, 71880.58it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87729.20it/s]
100%|██████████| 353/353 [00:00<00:00, 75908.19it/s]
100%|██████████| 252/252 [00:00<00:00, 77348.31it/s]
100%|██████████| 203/203 [00:00<00:00, 69206.19it/s]
100%|██████████| 153/153 [00:00<00:00, 56770.04it/s]
100%|██████████| 200/200 [00:00<00:00, 66203.20it/s]
100%|██████████| 65/65 [00:00<00:00, 58680.53it/s]
100%|██████████| 144/144 [00:00<00:00, 79817.60it/s]
100%|██████████| 30/30 [00:00<00:00, 44588.63it/s]
100%|██████████| 130/130 [00:00<00:00, 58762.75it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75980.62it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:42<00:00, 35.95it/s]
INFO:root:The new embedding has 5814 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 81825.29it/s]
100%|██████████| 287/287 [00:00<00:00, 99336.96it/s]
100%|██████████| 771/771 [00:00<00:00, 78842.61it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94822.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84896.35it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84210.57it/s]
100%|██████████| 353/353 [00:00<00:00, 52613.24it/s]
100%|██████████| 252/252 [00:00<00:00, 54228.34it/s]
100%|██████████| 203/203 [00:00<00:00, 54135.54it/s]
100%|██████████| 153/153 [00:00<00:00, 43051.69it/s]
100%|██████████| 200/200 [00:00<00:00, 45095.19it/s]
100%|██████████| 65/65 [00:00<00:00, 47167.78it/s]
100%|██████████| 144/144 [00:00<00:00, 50487.32it/s]
100%|██████████| 30/30 [00:00<00:00, 45722.79it/s]
100%|██████████| 130/130 [00:00<00:00, 54668.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81383.65it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.43it/s]
INFO:root:The new embedding has 5814 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76719.45it/s]
100%|██████████| 287/287 [00:00<00:00, 70709.89it/s]
100%|██████████| 771/771 [00:00<00:00, 83679.87it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95010.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89062.39it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79550.57it/s]
100%|██████████| 353/353 [00:00<00:00, 70855.15it/s]
100%|██████████| 252/252 [00:00<00:00, 76702.80it/s]
100%|██████████| 203/203 [00:00<00:00, 75697.34it/s]
100%|██████████| 153/153 [00:00<00:00, 76350.80it/s]
100%|██████████| 200/200 [00:00<00:00, 82402.83it/s]
100%|██████████| 65/65 [00:00<00:00, 62630.31it/s]
100%|██████████| 144/144 [00:00<00:00, 76686.11it/s]
100%|██████████| 30/30 [00:00<00:00, 55725.92it/s]
100%|██████████| 130/130 [00:00<00:00, 75762.06it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84638.64it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.47it/s]
INFO:root:The new embedding has 5814 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77416.85it/s]
100%|██████████| 287/287 [00:00<00:00, 75024.32it/s]
100%|██████████| 771/771 [00:00<00:00, 76351.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76488.15it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91247.97it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90838.89it/s]
100%|██████████| 353/353 [00:00<00:00, 58814.23it/s]
100%|██████████| 252/252 [00:00<00:00, 73126.10it/s]
100%|██████████| 203/203 [00:00<00:00, 71453.82it/s]
100%|██████████| 153/153 [00:00<00:00, 53132.02it/s]
100%|██████████| 200/200 [00:00<00:00, 71875.66it/s]
100%|██████████| 65/65 [00:00<00:00, 68741.74it/s]
100%|██████████| 144/144 [00:00<00:00, 72332.91it/s]
100%|██████████| 30/30 [00:00<00:00, 53227.21it/s]
100%|██████████| 130/130 [00:00<00:00, 65167.86it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81244.47it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.50it/s]
INFO:root:The new embedding has 5814 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 87233.98it/s]
100%|██████████| 287/287 [00:00<00:00, 77313.12it/s]
100%|██████████| 771/771 [00:00<00:00, 77966.30it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77904.57it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84438.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73820.42it/s]
100%|██████████| 353/353 [00:00<00:00, 76627.13it/s]
100%|██████████| 252/252 [00:00<00:00, 75405.91it/s]
100%|██████████| 203/203 [00:00<00:00, 75209.23it/s]
100%|██████████| 153/153 [00:00<00:00, 72783.09it/s]
100%|██████████| 200/200 [00:00<00:00, 76685.33it/s]
100%|██████████| 65/65 [00:00<00:00, 64148.18it/s]
100%|██████████| 144/144 [00:00<00:00, 74253.72it/s]
100%|██████████| 30/30 [00:00<00:00, 61320.23it/s]
100%|██████████| 130/130 [00:00<00:00, 73903.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81734.36it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:41<00:00, 36.19it/s]
INFO:root:The new embedding has 5814 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 72564.81it/s]
100%|██████████| 287/287 [00:00<00:00, 73266.30it/s]
100%|██████████| 771/771 [00:00<00:00, 92094.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82706.68it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84261.89it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93231.62it/s]
100%|██████████| 353/353 [00:00<00:00, 76052.46it/s]
100%|██████████| 252/252 [00:00<00:00, 69377.39it/s]
100%|██████████| 203/203 [00:00<00:00, 72997.57it/s]
100%|██████████| 153/153 [00:00<00:00, 73449.53it/s]
100%|██████████| 200/200 [00:00<00:00, 72590.93it/s]
100%|██████████| 65/65 [00:00<00:00, 64973.73it/s]
100%|██████████| 144/144 [00:00<00:00, 72489.17it/s]
100%|██████████| 30/30 [00:00<00:00, 52167.96it/s]
100%|██████████| 130/130 [00:00<00:00, 71192.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78325.84it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:41<00:00, 36.28it/s]
INFO:root:The new embedding has 5814 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 81110.93it/s]
100%|██████████| 287/287 [00:00<00:00, 80675.91it/s]
100%|██████████| 771/771 [00:00<00:00, 86984.11it/s]
100%|██████████| 2000/2000 [00:00<00:00, 99296.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77665.11it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86469.80it/s]
100%|██████████| 353/353 [00:00<00:00, 77558.37it/s]
100%|██████████| 252/252 [00:00<00:00, 74366.05it/s]
100%|██████████| 203/203 [00:00<00:00, 70653.37it/s]
100%|██████████| 153/153 [00:00<00:00, 72226.06it/s]
100%|██████████| 200/200 [00:00<00:00, 70480.66it/s]
100%|██████████| 65/65 [00:00<00:00, 68950.37it/s]
100%|██████████| 144/144 [00:00<00:00, 49405.30it/s]
100%|██████████| 30/30 [00:00<00:00, 59074.70it/s]
100%|██████████| 130/130 [00:00<00:00, 63817.83it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81608.96it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.32it/s]
INFO:root:The new embedding has 5814 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 56200.08it/s]
100%|██████████| 287/287 [00:00<00:00, 70031.14it/s]
100%|██████████| 771/771 [00:00<00:00, 59966.41it/s]
100%|██████████| 2000/2000 [00:00<00:00, 59453.19it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74927.72it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80026.66it/s]
100%|██████████| 353/353 [00:00<00:00, 60260.05it/s]
100%|██████████| 252/252 [00:00<00:00, 59200.44it/s]
100%|██████████| 203/203 [00:00<00:00, 57941.05it/s]
100%|██████████| 153/153 [00:00<00:00, 58599.99it/s]
100%|██████████| 200/200 [00:00<00:00, 55293.71it/s]
100%|██████████| 65/65 [00:00<00:00, 54910.32it/s]
100%|██████████| 144/144 [00:00<00:00, 59540.59it/s]
100%|██████████| 30/30 [00:00<00:00, 46794.02it/s]
100%|██████████| 130/130 [00:00<00:00, 46060.10it/s]
100%|██████████| 3500/3500 [00:00<00:00, 57994.86it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.41it/s]
INFO:root:The new embedding has 5814 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79816.17it/s]
100%|██████████| 287/287 [00:00<00:00, 70108.63it/s]
100%|██████████| 771/771 [00:00<00:00, 80098.29it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80463.18it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77174.95it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90087.07it/s]
100%|██████████| 353/353 [00:00<00:00, 80205.27it/s]
100%|██████████| 252/252 [00:00<00:00, 62185.36it/s]
100%|██████████| 203/203 [00:00<00:00, 77137.50it/s]
100%|██████████| 153/153 [00:00<00:00, 76269.14it/s]
100%|██████████| 200/200 [00:00<00:00, 79929.57it/s]
100%|██████████| 65/65 [00:00<00:00, 76905.43it/s]
100%|██████████| 144/144 [00:00<00:00, 78714.95it/s]
100%|██████████| 30/30 [00:00<00:00, 61771.78it/s]
100%|██████████| 130/130 [00:00<00:00, 80743.30it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80057.50it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.33it/s]
INFO:root:The new embedding has 5814 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80305.68it/s]
100%|██████████| 287/287 [00:00<00:00, 79189.87it/s]
100%|██████████| 771/771 [00:00<00:00, 69237.54it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80576.79it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74534.93it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98666.29it/s]
100%|██████████| 353/353 [00:00<00:00, 79226.74it/s]
100%|██████████| 252/252 [00:00<00:00, 68862.12it/s]
100%|██████████| 203/203 [00:00<00:00, 75056.74it/s]
100%|██████████| 153/153 [00:00<00:00, 71685.49it/s]
100%|██████████| 200/200 [00:00<00:00, 75342.27it/s]
100%|██████████| 65/65 [00:00<00:00, 64481.97it/s]
100%|██████████| 144/144 [00:00<00:00, 73989.93it/s]
100%|██████████| 30/30 [00:00<00:00, 64198.53it/s]
100%|██████████| 130/130 [00:00<00:00, 76089.80it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76135.09it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.44it/s]
INFO:root:The new embedding has 5814 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82110.71it/s]
100%|██████████| 287/287 [00:00<00:00, 78308.95it/s]
100%|██████████| 771/771 [00:00<00:00, 80141.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77209.75it/s]
100%|██████████| 1000/1000 [00:00<00:00, 97906.26it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80147.47it/s]
100%|██████████| 353/353 [00:00<00:00, 82612.95it/s]
100%|██████████| 252/252 [00:00<00:00, 77010.17it/s]
100%|██████████| 203/203 [00:00<00:00, 76970.14it/s]
100%|██████████| 153/153 [00:00<00:00, 78412.57it/s]
100%|██████████| 200/200 [00:00<00:00, 78603.90it/s]
100%|██████████| 65/65 [00:00<00:00, 76388.28it/s]
100%|██████████| 144/144 [00:00<00:00, 79096.36it/s]
100%|██████████| 30/30 [00:00<00:00, 59437.47it/s]
100%|██████████| 130/130 [00:00<00:00, 71145.55it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93865.90it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.38it/s]
INFO:root:The new embedding has 5814 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80762.30it/s]
100%|██████████| 287/287 [00:00<00:00, 78795.92it/s]
100%|██████████| 771/771 [00:00<00:00, 80579.30it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82422.26it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80659.69it/s]
100%|██████████| 3000/3000 [00:00<00:00, 101249.73it/s]
100%|██████████| 353/353 [00:00<00:00, 80292.26it/s]
100%|██████████| 252/252 [00:00<00:00, 79339.78it/s]
100%|██████████| 203/203 [00:00<00:00, 77039.79it/s]
100%|██████████| 153/153 [00:00<00:00, 70752.87it/s]
100%|██████████| 200/200 [00:00<00:00, 70321.13it/s]
100%|██████████| 65/65 [00:00<00:00, 76473.99it/s]
100%|██████████| 144/144 [00:00<00:00, 69018.37it/s]
100%|██████████| 30/30 [00:00<00:00, 55578.23it/s]
100%|██████████| 130/130 [00:00<00:00, 79252.84it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81083.38it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:40<00:00, 36.53it/s]
INFO:root:The new embedding has 5814 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 57420.79it/s]
100%|██████████| 287/287 [00:00<00:00, 58057.55it/s]
100%|██████████| 771/771 [00:00<00:00, 92776.23it/s]
100%|██████████| 2000/2000 [00:00<00:00, 57827.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84635.95it/s]
100%|██████████| 3000/3000 [00:00<00:00, 66854.99it/s]
100%|██████████| 353/353 [00:00<00:00, 58256.51it/s]
100%|██████████| 252/252 [00:00<00:00, 58851.04it/s]
100%|██████████| 203/203 [00:00<00:00, 58016.06it/s]
100%|██████████| 153/153 [00:00<00:00, 58653.55it/s]
100%|██████████| 200/200 [00:00<00:00, 57924.38it/s]
100%|██████████| 65/65 [00:00<00:00, 54211.53it/s]
100%|██████████| 144/144 [00:00<00:00, 54639.02it/s]
100%|██████████| 30/30 [00:00<00:00, 39199.10it/s]
100%|██████████| 130/130 [00:00<00:00, 55889.66it/s]
100%|██████████| 3500/3500 [00:00<00:00, 56029.07it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:14<00:00, 43.62it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 62347.26it/s]
100%|██████████| 287/287 [00:00<00:00, 72708.70it/s]
100%|██████████| 771/771 [00:00<00:00, 76283.46it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84513.17it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80120.42it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78258.27it/s]
100%|██████████| 353/353 [00:00<00:00, 76857.83it/s]
100%|██████████| 252/252 [00:00<00:00, 74988.62it/s]
100%|██████████| 203/203 [00:00<00:00, 70314.95it/s]
100%|██████████| 153/153 [00:00<00:00, 67126.41it/s]
100%|██████████| 200/200 [00:00<00:00, 74078.13it/s]
100%|██████████| 65/65 [00:00<00:00, 60289.64it/s]
100%|██████████| 144/144 [00:00<00:00, 67680.39it/s]
100%|██████████| 30/30 [00:00<00:00, 63678.70it/s]
100%|██████████| 130/130 [00:00<00:00, 67541.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 55802.03it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 234.07it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 54852.98it/s]
100%|██████████| 287/287 [00:00<00:00, 73395.84it/s]
100%|██████████| 771/771 [00:00<00:00, 73795.86it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75014.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75215.26it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95061.51it/s]
100%|██████████| 353/353 [00:00<00:00, 69635.47it/s]
100%|██████████| 252/252 [00:00<00:00, 74481.33it/s]
100%|██████████| 203/203 [00:00<00:00, 74622.59it/s]
100%|██████████| 153/153 [00:00<00:00, 73156.47it/s]
100%|██████████| 200/200 [00:00<00:00, 73778.43it/s]
100%|██████████| 65/65 [00:00<00:00, 66821.02it/s]
100%|██████████| 144/144 [00:00<00:00, 72039.57it/s]
100%|██████████| 30/30 [00:00<00:00, 55067.45it/s]
100%|██████████| 130/130 [00:00<00:00, 71867.61it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83828.60it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 232.35it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77065.16it/s]
100%|██████████| 287/287 [00:00<00:00, 72572.81it/s]
100%|██████████| 771/771 [00:00<00:00, 75476.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76096.81it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87361.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93077.14it/s]
100%|██████████| 353/353 [00:00<00:00, 75183.53it/s]
100%|██████████| 252/252 [00:00<00:00, 74946.08it/s]
100%|██████████| 203/203 [00:00<00:00, 73546.14it/s]
100%|██████████| 153/153 [00:00<00:00, 72536.28it/s]
100%|██████████| 200/200 [00:00<00:00, 74618.47it/s]
100%|██████████| 65/65 [00:00<00:00, 71612.76it/s]
100%|██████████| 144/144 [00:00<00:00, 75290.42it/s]
100%|██████████| 30/30 [00:00<00:00, 63743.22it/s]
100%|██████████| 130/130 [00:00<00:00, 72029.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80900.17it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 233.10it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75791.08it/s]
100%|██████████| 287/287 [00:00<00:00, 74315.67it/s]
100%|██████████| 771/771 [00:00<00:00, 74062.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75199.76it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93337.43it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89619.97it/s]
100%|██████████| 353/353 [00:00<00:00, 78222.17it/s]
100%|██████████| 252/252 [00:00<00:00, 76210.59it/s]
100%|██████████| 203/203 [00:00<00:00, 72785.41it/s]
100%|██████████| 153/153 [00:00<00:00, 73315.26it/s]
100%|██████████| 200/200 [00:00<00:00, 73927.98it/s]
100%|██████████| 65/65 [00:00<00:00, 59177.29it/s]
100%|██████████| 144/144 [00:00<00:00, 72759.88it/s]
100%|██████████| 30/30 [00:00<00:00, 58936.36it/s]
100%|██████████| 130/130 [00:00<00:00, 73743.51it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80437.83it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 231.33it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 78476.76it/s]
100%|██████████| 287/287 [00:00<00:00, 76736.49it/s]
100%|██████████| 771/771 [00:00<00:00, 78998.62it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80183.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89406.01it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74944.68it/s]
100%|██████████| 353/353 [00:00<00:00, 78956.34it/s]
100%|██████████| 252/252 [00:00<00:00, 75057.85it/s]
100%|██████████| 203/203 [00:00<00:00, 74812.73it/s]
100%|██████████| 153/153 [00:00<00:00, 76341.72it/s]
100%|██████████| 200/200 [00:00<00:00, 75355.80it/s]
100%|██████████| 65/65 [00:00<00:00, 71406.43it/s]
100%|██████████| 144/144 [00:00<00:00, 63818.66it/s]
100%|██████████| 30/30 [00:00<00:00, 53957.60it/s]
100%|██████████| 130/130 [00:00<00:00, 73396.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91170.33it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 235.44it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77685.26it/s]
100%|██████████| 287/287 [00:00<00:00, 78930.25it/s]
100%|██████████| 771/771 [00:00<00:00, 83840.41it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78333.05it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77068.59it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91413.03it/s]
100%|██████████| 353/353 [00:00<00:00, 74664.11it/s]
100%|██████████| 252/252 [00:00<00:00, 70804.17it/s]
100%|██████████| 203/203 [00:00<00:00, 72229.70it/s]
100%|██████████| 153/153 [00:00<00:00, 81686.42it/s]
100%|██████████| 200/200 [00:00<00:00, 72830.42it/s]
100%|██████████| 65/65 [00:00<00:00, 64711.55it/s]
100%|██████████| 144/144 [00:00<00:00, 70599.62it/s]
100%|██████████| 30/30 [00:00<00:00, 57693.31it/s]
100%|██████████| 130/130 [00:00<00:00, 62365.27it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85753.05it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 230.75it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75369.82it/s]
100%|██████████| 287/287 [00:00<00:00, 72546.57it/s]
100%|██████████| 771/771 [00:00<00:00, 74747.67it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75153.27it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72348.02it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90264.79it/s]
100%|██████████| 353/353 [00:00<00:00, 74125.83it/s]
100%|██████████| 252/252 [00:00<00:00, 74829.35it/s]
100%|██████████| 203/203 [00:00<00:00, 76280.57it/s]
100%|██████████| 153/153 [00:00<00:00, 73702.60it/s]
100%|██████████| 200/200 [00:00<00:00, 76973.83it/s]
100%|██████████| 65/65 [00:00<00:00, 62301.13it/s]
100%|██████████| 144/144 [00:00<00:00, 70931.27it/s]
100%|██████████| 30/30 [00:00<00:00, 67144.67it/s]
100%|██████████| 130/130 [00:00<00:00, 74013.78it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85919.17it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 232.44it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 90356.67it/s]
100%|██████████| 287/287 [00:00<00:00, 75603.90it/s]
100%|██████████| 771/771 [00:00<00:00, 75786.46it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78487.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87596.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78750.50it/s]
100%|██████████| 353/353 [00:00<00:00, 68207.92it/s]
100%|██████████| 252/252 [00:00<00:00, 74967.35it/s]
100%|██████████| 203/203 [00:00<00:00, 74661.85it/s]
100%|██████████| 153/153 [00:00<00:00, 72758.33it/s]
100%|██████████| 200/200 [00:00<00:00, 73648.88it/s]
100%|██████████| 65/65 [00:00<00:00, 65175.65it/s]
100%|██████████| 144/144 [00:00<00:00, 72672.33it/s]
100%|██████████| 30/30 [00:00<00:00, 44987.17it/s]
100%|██████████| 130/130 [00:00<00:00, 63758.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86200.69it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 230.83it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76754.59it/s]
100%|██████████| 287/287 [00:00<00:00, 74508.87it/s]
100%|██████████| 771/771 [00:00<00:00, 76260.07it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77362.84it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84521.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73966.22it/s]
100%|██████████| 353/353 [00:00<00:00, 78454.29it/s]
100%|██████████| 252/252 [00:00<00:00, 75153.91it/s]
100%|██████████| 203/203 [00:00<00:00, 74904.87it/s]
100%|██████████| 153/153 [00:00<00:00, 74317.14it/s]
100%|██████████| 200/200 [00:00<00:00, 77478.60it/s]
100%|██████████| 65/65 [00:00<00:00, 64466.72it/s]
100%|██████████| 144/144 [00:00<00:00, 75440.89it/s]
100%|██████████| 30/30 [00:00<00:00, 67613.71it/s]
100%|██████████| 130/130 [00:00<00:00, 65575.41it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87799.43it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 236.91it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75549.20it/s]
100%|██████████| 287/287 [00:00<00:00, 75414.44it/s]
100%|██████████| 771/771 [00:00<00:00, 74251.66it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77969.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77328.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91604.69it/s]
100%|██████████| 353/353 [00:00<00:00, 73911.21it/s]
100%|██████████| 252/252 [00:00<00:00, 78200.99it/s]
100%|██████████| 203/203 [00:00<00:00, 76362.66it/s]
100%|██████████| 153/153 [00:00<00:00, 77738.16it/s]
100%|██████████| 200/200 [00:00<00:00, 70109.55it/s]
100%|██████████| 65/65 [00:00<00:00, 72915.15it/s]
100%|██████████| 144/144 [00:00<00:00, 73674.04it/s]
100%|██████████| 30/30 [00:00<00:00, 67288.30it/s]
100%|██████████| 130/130 [00:00<00:00, 73091.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88444.24it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 231.64it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 56740.42it/s]
100%|██████████| 287/287 [00:00<00:00, 77602.19it/s]
100%|██████████| 771/771 [00:00<00:00, 81121.02it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86658.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 99579.87it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78511.20it/s]
100%|██████████| 353/353 [00:00<00:00, 79859.19it/s]
100%|██████████| 252/252 [00:00<00:00, 78050.85it/s]
100%|██████████| 203/203 [00:00<00:00, 78121.27it/s]
100%|██████████| 153/153 [00:00<00:00, 75854.43it/s]
100%|██████████| 200/200 [00:00<00:00, 77342.87it/s]
100%|██████████| 65/65 [00:00<00:00, 68362.53it/s]
100%|██████████| 144/144 [00:00<00:00, 74703.74it/s]
100%|██████████| 30/30 [00:00<00:00, 55627.37it/s]
100%|██████████| 130/130 [00:00<00:00, 63021.21it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77658.74it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 236.38it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81842.88it/s]
100%|██████████| 287/287 [00:00<00:00, 79514.19it/s]
100%|██████████| 771/771 [00:00<00:00, 79394.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81295.20it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74917.01it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98290.95it/s]
100%|██████████| 353/353 [00:00<00:00, 58762.87it/s]
100%|██████████| 252/252 [00:00<00:00, 66014.90it/s]
100%|██████████| 203/203 [00:00<00:00, 76150.94it/s]
100%|██████████| 153/153 [00:00<00:00, 78710.72it/s]
100%|██████████| 200/200 [00:00<00:00, 77874.19it/s]
100%|██████████| 65/65 [00:00<00:00, 75395.40it/s]
100%|██████████| 144/144 [00:00<00:00, 80007.92it/s]
100%|██████████| 30/30 [00:00<00:00, 57143.11it/s]
100%|██████████| 130/130 [00:00<00:00, 77838.62it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87536.61it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 231.77it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80999.61it/s]
100%|██████████| 287/287 [00:00<00:00, 76775.64it/s]
100%|██████████| 771/771 [00:00<00:00, 80924.11it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81478.39it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79782.09it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98660.87it/s]
100%|██████████| 353/353 [00:00<00:00, 77279.05it/s]
100%|██████████| 252/252 [00:00<00:00, 79321.92it/s]
100%|██████████| 203/203 [00:00<00:00, 59267.97it/s]
100%|██████████| 153/153 [00:00<00:00, 75854.43it/s]
100%|██████████| 200/200 [00:00<00:00, 74479.34it/s]
100%|██████████| 65/65 [00:00<00:00, 66317.14it/s]
100%|██████████| 144/144 [00:00<00:00, 75715.15it/s]
100%|██████████| 30/30 [00:00<00:00, 57273.15it/s]
100%|██████████| 130/130 [00:00<00:00, 79275.88it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81430.15it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 236.40it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 57638.79it/s]
100%|██████████| 287/287 [00:00<00:00, 80996.18it/s]
100%|██████████| 771/771 [00:00<00:00, 96379.11it/s]
100%|██████████| 2000/2000 [00:00<00:00, 98038.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88682.00it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91210.93it/s]
100%|██████████| 353/353 [00:00<00:00, 79053.30it/s]
100%|██████████| 252/252 [00:00<00:00, 78901.51it/s]
100%|██████████| 203/203 [00:00<00:00, 78560.96it/s]
100%|██████████| 153/153 [00:00<00:00, 66301.12it/s]
100%|██████████| 200/200 [00:00<00:00, 76066.45it/s]
100%|██████████| 65/65 [00:00<00:00, 68863.29it/s]
100%|██████████| 144/144 [00:00<00:00, 75648.77it/s]
100%|██████████| 30/30 [00:00<00:00, 62726.38it/s]
100%|██████████| 130/130 [00:00<00:00, 75478.89it/s]
100%|██████████| 3500/3500 [00:00<00:00, 101385.16it/s]
100%|██████████| 20

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 232.50it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 59422.38it/s]
100%|██████████| 287/287 [00:00<00:00, 38530.35it/s]
100%|██████████| 771/771 [00:00<00:00, 58937.97it/s]
100%|██████████| 2000/2000 [00:00<00:00, 57757.27it/s]
100%|██████████| 1000/1000 [00:00<00:00, 99285.22it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79157.23it/s]
100%|██████████| 353/353 [00:00<00:00, 80057.82it/s]
100%|██████████| 252/252 [00:00<00:00, 80832.41it/s]
100%|██████████| 203/203 [00:00<00:00, 77011.91it/s]
100%|██████████| 153/153 [00:00<00:00, 76936.64it/s]
100%|██████████| 200/200 [00:00<00:00, 81214.13it/s]
100%|██████████| 65/65 [00:00<00:00, 76970.57it/s]
100%|██████████| 144/144 [00:00<00:00, 80821.59it/s]
100%|██████████| 30/30 [00:00<00:00, 33323.39it/s]
100%|██████████| 130/130 [00:00<00:00, 49034.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74031.81it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 235.71it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81918.08it/s]
100%|██████████| 287/287 [00:00<00:00, 71931.00it/s]
100%|██████████| 771/771 [00:00<00:00, 74407.13it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96173.16it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80372.21it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95916.58it/s]
100%|██████████| 353/353 [00:00<00:00, 77404.29it/s]
100%|██████████| 252/252 [00:00<00:00, 79066.77it/s]
100%|██████████| 203/203 [00:00<00:00, 75402.38it/s]
100%|██████████| 153/153 [00:00<00:00, 74437.83it/s]
100%|██████████| 200/200 [00:00<00:00, 65387.86it/s]
100%|██████████| 65/65 [00:00<00:00, 70538.10it/s]
100%|██████████| 144/144 [00:00<00:00, 74889.00it/s]
100%|██████████| 30/30 [00:00<00:00, 69060.99it/s]
100%|██████████| 130/130 [00:00<00:00, 62180.35it/s]
100%|██████████| 3500/3500 [00:00<00:00, 101658.27it/s]
100%|██████████| 20

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [01:26<00:00, 67.59it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 71559.75it/s]
100%|██████████| 287/287 [00:00<00:00, 70959.99it/s]
100%|██████████| 771/771 [00:00<00:00, 75280.13it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75168.76it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89345.06it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78907.05it/s]
100%|██████████| 353/353 [00:00<00:00, 72048.14it/s]
100%|██████████| 252/252 [00:00<00:00, 75702.95it/s]
100%|██████████| 203/203 [00:00<00:00, 76042.13it/s]
100%|██████████| 153/153 [00:00<00:00, 73736.47it/s]
100%|██████████| 200/200 [00:00<00:00, 77129.53it/s]
100%|██████████| 65/65 [00:00<00:00, 73564.43it/s]
100%|██████████| 144/144 [00:00<00:00, 70533.67it/s]
100%|██████████| 30/30 [00:00<00:00, 43965.45it/s]
100%|██████████| 130/130 [00:00<00:00, 61306.44it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93242.87it/s]
100%|██████████| 2034/

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 114.46it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 73958.34it/s]
100%|██████████| 287/287 [00:00<00:00, 71262.45it/s]
100%|██████████| 771/771 [00:00<00:00, 73619.46it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90441.26it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94515.27it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89921.62it/s]
100%|██████████| 353/353 [00:00<00:00, 66624.19it/s]
100%|██████████| 252/252 [00:00<00:00, 74502.33it/s]
100%|██████████| 203/203 [00:00<00:00, 72426.31it/s]
100%|██████████| 153/153 [00:00<00:00, 64925.99it/s]
100%|██████████| 200/200 [00:00<00:00, 77932.07it/s]
100%|██████████| 65/65 [00:00<00:00, 67902.80it/s]
100%|██████████| 144/144 [00:00<00:00, 67946.88it/s]
100%|██████████| 30/30 [00:00<00:00, 53980.75it/s]
100%|██████████| 130/130 [00:00<00:00, 70895.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74550.64it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 114.08it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 85950.97it/s]
100%|██████████| 287/287 [00:00<00:00, 61404.06it/s]
100%|██████████| 771/771 [00:00<00:00, 77450.92it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76543.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77888.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80312.70it/s]
100%|██████████| 353/353 [00:00<00:00, 77905.25it/s]
100%|██████████| 252/252 [00:00<00:00, 78760.40it/s]
100%|██████████| 203/203 [00:00<00:00, 73616.09it/s]
100%|██████████| 153/153 [00:00<00:00, 74741.27it/s]
100%|██████████| 200/200 [00:00<00:00, 74071.59it/s]
100%|██████████| 65/65 [00:00<00:00, 65082.30it/s]
100%|██████████| 144/144 [00:00<00:00, 65800.17it/s]
100%|██████████| 30/30 [00:00<00:00, 51108.50it/s]
100%|██████████| 130/130 [00:00<00:00, 73524.75it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91130.15it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:50<00:00, 114.88it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 90047.92it/s]
100%|██████████| 287/287 [00:00<00:00, 88414.63it/s]
100%|██████████| 771/771 [00:00<00:00, 76927.67it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79297.90it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78430.46it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81141.86it/s]
100%|██████████| 353/353 [00:00<00:00, 76516.24it/s]
100%|██████████| 252/252 [00:00<00:00, 76708.37it/s]
100%|██████████| 203/203 [00:00<00:00, 76548.03it/s]
100%|██████████| 153/153 [00:00<00:00, 73315.26it/s]
100%|██████████| 200/200 [00:00<00:00, 74718.16it/s]
100%|██████████| 65/65 [00:00<00:00, 70356.07it/s]
100%|██████████| 144/144 [00:00<00:00, 79481.48it/s]
100%|██████████| 30/30 [00:00<00:00, 61320.23it/s]
100%|██████████| 130/130 [00:00<00:00, 70666.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86478.97it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 113.61it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 74635.47it/s]
100%|██████████| 287/287 [00:00<00:00, 66712.77it/s]
100%|██████████| 771/771 [00:00<00:00, 95336.33it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95127.27it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77345.73it/s]
100%|██████████| 3000/3000 [00:00<00:00, 94968.96it/s]
100%|██████████| 353/353 [00:00<00:00, 72389.84it/s]
100%|██████████| 252/252 [00:00<00:00, 83521.50it/s]
100%|██████████| 203/203 [00:00<00:00, 74806.16it/s]
100%|██████████| 153/153 [00:00<00:00, 68458.34it/s]
100%|██████████| 200/200 [00:00<00:00, 77859.74it/s]
100%|██████████| 65/65 [00:00<00:00, 72681.89it/s]
100%|██████████| 144/144 [00:00<00:00, 72567.56it/s]
100%|██████████| 30/30 [00:00<00:00, 59269.49it/s]
100%|██████████| 130/130 [00:00<00:00, 68174.48it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80723.56it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 114.46it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 79942.57it/s]
100%|██████████| 287/287 [00:00<00:00, 72590.32it/s]
100%|██████████| 771/771 [00:00<00:00, 76270.86it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74714.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88034.25it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82152.66it/s]
100%|██████████| 353/353 [00:00<00:00, 77656.00it/s]
100%|██████████| 252/252 [00:00<00:00, 73476.86it/s]
100%|██████████| 203/203 [00:00<00:00, 74122.37it/s]
100%|██████████| 153/153 [00:00<00:00, 74351.58it/s]
100%|██████████| 200/200 [00:00<00:00, 72716.78it/s]
100%|██████████| 65/65 [00:00<00:00, 64405.80it/s]
100%|██████████| 144/144 [00:00<00:00, 70132.35it/s]
100%|██████████| 30/30 [00:00<00:00, 56400.32it/s]
100%|██████████| 130/130 [00:00<00:00, 71219.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93942.19it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 113.81it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 87319.42it/s]
100%|██████████| 287/287 [00:00<00:00, 64472.46it/s]
100%|██████████| 771/771 [00:00<00:00, 77642.46it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80459.32it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80190.88it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87157.99it/s]
100%|██████████| 353/353 [00:00<00:00, 76877.79it/s]
100%|██████████| 252/252 [00:00<00:00, 76641.62it/s]
100%|██████████| 203/203 [00:00<00:00, 72284.89it/s]
100%|██████████| 153/153 [00:00<00:00, 72413.51it/s]
100%|██████████| 200/200 [00:00<00:00, 71734.29it/s]
100%|██████████| 65/65 [00:00<00:00, 59774.12it/s]
100%|██████████| 144/144 [00:00<00:00, 73245.18it/s]
100%|██████████| 30/30 [00:00<00:00, 42111.49it/s]
100%|██████████| 130/130 [00:00<00:00, 61926.12it/s]
100%|██████████| 3500/3500 [00:00<00:00, 70437.71it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 114.50it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 72657.92it/s]
100%|██████████| 287/287 [00:00<00:00, 60363.32it/s]
100%|██████████| 771/771 [00:00<00:00, 77081.70it/s]
100%|██████████| 2000/2000 [00:00<00:00, 73364.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78596.53it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80595.11it/s]
100%|██████████| 353/353 [00:00<00:00, 67290.34it/s]
100%|██████████| 252/252 [00:00<00:00, 73738.29it/s]
100%|██████████| 203/203 [00:00<00:00, 75089.84it/s]
100%|██████████| 153/153 [00:00<00:00, 73223.24it/s]
100%|██████████| 200/200 [00:00<00:00, 76825.79it/s]
100%|██████████| 65/65 [00:00<00:00, 66349.42it/s]
100%|██████████| 144/144 [00:00<00:00, 74107.95it/s]
100%|██████████| 30/30 [00:00<00:00, 67722.88it/s]
100%|██████████| 130/130 [00:00<00:00, 71867.61it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87143.25it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 113.55it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75008.23it/s]
100%|██████████| 287/287 [00:00<00:00, 73895.96it/s]
100%|██████████| 771/771 [00:00<00:00, 75381.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82895.48it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89758.05it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81659.50it/s]
100%|██████████| 353/353 [00:00<00:00, 75210.27it/s]
100%|██████████| 252/252 [00:00<00:00, 72989.75it/s]
100%|██████████| 203/203 [00:00<00:00, 73387.67it/s]
100%|██████████| 153/153 [00:00<00:00, 72234.19it/s]
100%|██████████| 200/200 [00:00<00:00, 74235.47it/s]
100%|██████████| 65/65 [00:00<00:00, 70960.37it/s]
100%|██████████| 144/144 [00:00<00:00, 69590.94it/s]
100%|██████████| 30/30 [00:00<00:00, 35982.02it/s]
100%|██████████| 130/130 [00:00<00:00, 72788.62it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83231.17it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 114.39it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76652.09it/s]
100%|██████████| 287/287 [00:00<00:00, 74366.17it/s]
100%|██████████| 771/771 [00:00<00:00, 77536.35it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83888.60it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78920.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83788.33it/s]
100%|██████████| 353/353 [00:00<00:00, 75023.53it/s]
100%|██████████| 252/252 [00:00<00:00, 75180.64it/s]
100%|██████████| 203/203 [00:00<00:00, 73609.73it/s]
100%|██████████| 153/153 [00:00<00:00, 59298.51it/s]
100%|██████████| 200/200 [00:00<00:00, 61329.20it/s]
100%|██████████| 65/65 [00:00<00:00, 66092.06it/s]
100%|██████████| 144/144 [00:00<00:00, 65077.01it/s]
100%|██████████| 30/30 [00:00<00:00, 47572.45it/s]
100%|██████████| 130/130 [00:00<00:00, 72459.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73534.89it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 113.30it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76761.62it/s]
100%|██████████| 287/287 [00:00<00:00, 79963.15it/s]
100%|██████████| 771/771 [00:00<00:00, 82051.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80035.57it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72599.73it/s]
100%|██████████| 3000/3000 [00:00<00:00, 99175.66it/s]
100%|██████████| 353/353 [00:00<00:00, 72989.37it/s]
100%|██████████| 252/252 [00:00<00:00, 71013.48it/s]
100%|██████████| 203/203 [00:00<00:00, 60032.69it/s]
100%|██████████| 153/153 [00:00<00:00, 72593.72it/s]
100%|██████████| 200/200 [00:00<00:00, 68383.53it/s]
100%|██████████| 65/65 [00:00<00:00, 64696.19it/s]
100%|██████████| 144/144 [00:00<00:00, 73405.42it/s]
100%|██████████| 30/30 [00:00<00:00, 39053.11it/s]
100%|██████████| 130/130 [00:00<00:00, 66641.35it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77807.33it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:50<00:00, 114.87it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77120.48it/s]
100%|██████████| 287/287 [00:00<00:00, 78070.25it/s]
100%|██████████| 771/771 [00:00<00:00, 86234.89it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81138.72it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78941.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 99832.69it/s]
100%|██████████| 353/353 [00:00<00:00, 73833.81it/s]
100%|██████████| 252/252 [00:00<00:00, 78684.18it/s]
100%|██████████| 203/203 [00:00<00:00, 70806.13it/s]
100%|██████████| 153/153 [00:00<00:00, 56046.16it/s]
100%|██████████| 200/200 [00:00<00:00, 69916.72it/s]
100%|██████████| 65/65 [00:00<00:00, 68004.43it/s]
100%|██████████| 144/144 [00:00<00:00, 75103.18it/s]
100%|██████████| 30/30 [00:00<00:00, 46091.25it/s]
100%|██████████| 130/130 [00:00<00:00, 65144.51it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85360.62it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 113.58it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 62980.76it/s]
100%|██████████| 287/287 [00:00<00:00, 77597.19it/s]
100%|██████████| 771/771 [00:00<00:00, 79163.00it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86985.37it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81710.93it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84167.76it/s]
100%|██████████| 353/353 [00:00<00:00, 79175.90it/s]
100%|██████████| 252/252 [00:00<00:00, 78363.33it/s]
100%|██████████| 203/203 [00:00<00:00, 81720.29it/s]
100%|██████████| 153/153 [00:00<00:00, 80518.01it/s]
100%|██████████| 200/200 [00:00<00:00, 78914.47it/s]
100%|██████████| 65/65 [00:00<00:00, 53113.14it/s]
100%|██████████| 144/144 [00:00<00:00, 76337.18it/s]
100%|██████████| 30/30 [00:00<00:00, 65570.15it/s]
100%|██████████| 130/130 [00:00<00:00, 71612.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84923.60it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 113.77it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78363.75it/s]
100%|██████████| 287/287 [00:00<00:00, 77218.89it/s]
100%|██████████| 771/771 [00:00<00:00, 80756.38it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75642.55it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81537.79it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79434.57it/s]
100%|██████████| 353/353 [00:00<00:00, 76857.83it/s]
100%|██████████| 252/252 [00:00<00:00, 77672.30it/s]
100%|██████████| 203/203 [00:00<00:00, 77263.49it/s]
100%|██████████| 153/153 [00:00<00:00, 71765.66it/s]
100%|██████████| 200/200 [00:00<00:00, 73603.65it/s]
100%|██████████| 65/65 [00:00<00:00, 66236.58it/s]
100%|██████████| 144/144 [00:00<00:00, 78337.20it/s]
100%|██████████| 30/30 [00:00<00:00, 53957.60it/s]
100%|██████████| 130/130 [00:00<00:00, 57766.66it/s]
100%|██████████| 3500/3500 [00:00<00:00, 96482.89it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 112.89it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76035.89it/s]
100%|██████████| 287/287 [00:00<00:00, 77392.65it/s]
100%|██████████| 771/771 [00:00<00:00, 80253.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76532.11it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94304.88it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77230.37it/s]
100%|██████████| 353/353 [00:00<00:00, 78338.06it/s]
100%|██████████| 252/252 [00:00<00:00, 79927.75it/s]
100%|██████████| 203/203 [00:00<00:00, 75906.54it/s]
100%|██████████| 153/153 [00:00<00:00, 74325.75it/s]
100%|██████████| 200/200 [00:00<00:00, 79264.93it/s]
100%|██████████| 65/65 [00:00<00:00, 66397.90it/s]
100%|██████████| 144/144 [00:00<00:00, 65224.60it/s]
100%|██████████| 30/30 [00:00<00:00, 53453.32it/s]
100%|██████████| 130/130 [00:00<00:00, 66673.94it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76151.68it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:51<00:00, 113.89it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 75936.67it/s]
100%|██████████| 287/287 [00:00<00:00, 59518.68it/s]
100%|██████████| 771/771 [00:00<00:00, 80377.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78385.02it/s]
100%|██████████| 1000/1000 [00:00<00:00, 58228.34it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75456.57it/s]
100%|██████████| 353/353 [00:00<00:00, 57950.97it/s]
100%|██████████| 252/252 [00:00<00:00, 56786.36it/s]
100%|██████████| 203/203 [00:00<00:00, 53109.01it/s]
100%|██████████| 153/153 [00:00<00:00, 55269.01it/s]
100%|██████████| 200/200 [00:00<00:00, 55557.37it/s]
100%|██████████| 65/65 [00:00<00:00, 53414.92it/s]
100%|██████████| 144/144 [00:00<00:00, 45449.60it/s]
100%|██████████| 30/30 [00:00<00:00, 49675.93it/s]
100%|██████████| 130/130 [00:00<00:00, 55182.63it/s]
100%|██████████| 3500/3500 [00:00<00:00, 65183.60it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 136.42it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75721.22it/s]
100%|██████████| 287/287 [00:00<00:00, 73485.46it/s]
100%|██████████| 771/771 [00:00<00:00, 72529.68it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93948.95it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76947.00it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89066.80it/s]
100%|██████████| 353/353 [00:00<00:00, 76366.27it/s]
100%|██████████| 252/252 [00:00<00:00, 73686.88it/s]
100%|██████████| 203/203 [00:00<00:00, 68066.49it/s]
100%|██████████| 153/153 [00:00<00:00, 68751.72it/s]
100%|██████████| 200/200 [00:00<00:00, 72603.50it/s]
100%|██████████| 65/65 [00:00<00:00, 65820.80it/s]
100%|██████████| 144/144 [00:00<00:00, 69136.88it/s]
100%|██████████| 30/30 [00:00<00:00, 53114.87it/s]
100%|██████████| 130/130 [00:00<00:00, 67953.58it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80394.65it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.33it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76360.14it/s]
100%|██████████| 287/287 [00:00<00:00, 75442.80it/s]
100%|██████████| 771/771 [00:00<00:00, 73592.65it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96133.49it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76737.24it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88224.37it/s]
100%|██████████| 353/353 [00:00<00:00, 77097.96it/s]
100%|██████████| 252/252 [00:00<00:00, 77387.95it/s]
100%|██████████| 203/203 [00:00<00:00, 72593.04it/s]
100%|██████████| 153/153 [00:00<00:00, 70411.29it/s]
100%|██████████| 200/200 [00:00<00:00, 72315.59it/s]
100%|██████████| 65/65 [00:00<00:00, 63639.07it/s]
100%|██████████| 144/144 [00:00<00:00, 67071.60it/s]
100%|██████████| 30/30 [00:00<00:00, 66435.65it/s]
100%|██████████| 130/130 [00:00<00:00, 69646.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74533.60it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 167.89it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77938.13it/s]
100%|██████████| 287/287 [00:00<00:00, 75052.39it/s]
100%|██████████| 771/771 [00:00<00:00, 74841.08it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87487.05it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78941.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88554.06it/s]
100%|██████████| 353/353 [00:00<00:00, 76307.24it/s]
100%|██████████| 252/252 [00:00<00:00, 76486.33it/s]
100%|██████████| 203/203 [00:00<00:00, 76069.30it/s]
100%|██████████| 153/153 [00:00<00:00, 51145.97it/s]
100%|██████████| 200/200 [00:00<00:00, 63845.10it/s]
100%|██████████| 65/65 [00:00<00:00, 66204.41it/s]
100%|██████████| 144/144 [00:00<00:00, 72203.20it/s]
100%|██████████| 30/30 [00:00<00:00, 66930.38it/s]
100%|██████████| 130/130 [00:00<00:00, 69735.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79536.57it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.92it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77301.17it/s]
100%|██████████| 287/287 [00:00<00:00, 77817.91it/s]
100%|██████████| 771/771 [00:00<00:00, 75584.53it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93151.90it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79660.87it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89435.24it/s]
100%|██████████| 353/353 [00:00<00:00, 76295.44it/s]
100%|██████████| 252/252 [00:00<00:00, 74549.63it/s]
100%|██████████| 203/203 [00:00<00:00, 65667.42it/s]
100%|██████████| 153/153 [00:00<00:00, 68788.56it/s]
100%|██████████| 200/200 [00:00<00:00, 73135.20it/s]
100%|██████████| 65/65 [00:00<00:00, 45438.29it/s]
100%|██████████| 144/144 [00:00<00:00, 76530.64it/s]
100%|██████████| 30/30 [00:00<00:00, 31758.99it/s]
100%|██████████| 130/130 [00:00<00:00, 76164.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80448.85it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 167.86it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76901.09it/s]
100%|██████████| 287/287 [00:00<00:00, 74768.03it/s]
100%|██████████| 771/771 [00:00<00:00, 69592.16it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95970.71it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77218.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88562.16it/s]
100%|██████████| 353/353 [00:00<00:00, 78826.03it/s]
100%|██████████| 252/252 [00:00<00:00, 74157.34it/s]
100%|██████████| 203/203 [00:00<00:00, 71012.82it/s]
100%|██████████| 153/153 [00:00<00:00, 69003.07it/s]
100%|██████████| 200/200 [00:00<00:00, 75791.54it/s]
100%|██████████| 65/65 [00:00<00:00, 60490.30it/s]
100%|██████████| 144/144 [00:00<00:00, 64493.30it/s]
100%|██████████| 30/30 [00:00<00:00, 51421.79it/s]
100%|██████████| 130/130 [00:00<00:00, 71971.95it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89460.76it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 170.08it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77286.91it/s]
100%|██████████| 287/287 [00:00<00:00, 74652.11it/s]
100%|██████████| 771/771 [00:00<00:00, 77454.63it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78096.77it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78096.04it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82678.97it/s]
100%|██████████| 353/353 [00:00<00:00, 76921.72it/s]
100%|██████████| 252/252 [00:00<00:00, 75551.44it/s]
100%|██████████| 203/203 [00:00<00:00, 75295.69it/s]
100%|██████████| 153/153 [00:00<00:00, 66369.69it/s]
100%|██████████| 200/200 [00:00<00:00, 73648.88it/s]
100%|██████████| 65/65 [00:00<00:00, 68482.73it/s]
100%|██████████| 144/144 [00:00<00:00, 56499.51it/s]
100%|██████████| 30/30 [00:00<00:00, 53092.46it/s]
100%|██████████| 130/130 [00:00<00:00, 45126.17it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73441.08it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 166.93it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77259.83it/s]
100%|██████████| 287/287 [00:00<00:00, 74954.25it/s]
100%|██████████| 771/771 [00:00<00:00, 74135.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84683.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78291.38it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86662.75it/s]
100%|██████████| 353/353 [00:00<00:00, 75927.66it/s]
100%|██████████| 252/252 [00:00<00:00, 75887.75it/s]
100%|██████████| 203/203 [00:00<00:00, 68219.19it/s]
100%|██████████| 153/153 [00:00<00:00, 74008.59it/s]
100%|██████████| 200/200 [00:00<00:00, 66772.33it/s]
100%|██████████| 65/65 [00:00<00:00, 61196.35it/s]
100%|██████████| 144/144 [00:00<00:00, 73050.29it/s]
100%|██████████| 30/30 [00:00<00:00, 62107.17it/s]
100%|██████████| 130/130 [00:00<00:00, 74184.97it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78295.76it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.79it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76723.67it/s]
100%|██████████| 287/287 [00:00<00:00, 75136.71it/s]
100%|██████████| 771/771 [00:00<00:00, 74601.10it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92766.63it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78505.33it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89577.86it/s]
100%|██████████| 353/353 [00:00<00:00, 75776.10it/s]
100%|██████████| 252/252 [00:00<00:00, 74502.33it/s]
100%|██████████| 203/203 [00:00<00:00, 66193.25it/s]
100%|██████████| 153/153 [00:00<00:00, 74663.00it/s]
100%|██████████| 200/200 [00:00<00:00, 73436.12it/s]
100%|██████████| 65/65 [00:00<00:00, 43516.32it/s]
100%|██████████| 144/144 [00:00<00:00, 63310.25it/s]
100%|██████████| 30/30 [00:00<00:00, 64693.63it/s]
100%|██████████| 130/130 [00:00<00:00, 68140.40it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71060.30it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 166.92it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76639.47it/s]
100%|██████████| 287/287 [00:00<00:00, 73778.21it/s]
100%|██████████| 771/771 [00:00<00:00, 74694.15it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93317.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77447.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86268.82it/s]
100%|██████████| 353/353 [00:00<00:00, 73329.17it/s]
100%|██████████| 252/252 [00:00<00:00, 71946.40it/s]
100%|██████████| 203/203 [00:00<00:00, 67990.39it/s]
100%|██████████| 153/153 [00:00<00:00, 75426.48it/s]
100%|██████████| 200/200 [00:00<00:00, 73687.70it/s]
100%|██████████| 65/65 [00:00<00:00, 49300.14it/s]
100%|██████████| 144/144 [00:00<00:00, 71367.10it/s]
100%|██████████| 30/30 [00:00<00:00, 61380.06it/s]
100%|██████████| 130/130 [00:00<00:00, 75930.86it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76699.95it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 170.11it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77708.31it/s]
100%|██████████| 287/287 [00:00<00:00, 75471.18it/s]
100%|██████████| 771/771 [00:00<00:00, 81982.72it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93016.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77865.52it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90112.23it/s]
100%|██████████| 353/353 [00:00<00:00, 77118.04it/s]
100%|██████████| 252/252 [00:00<00:00, 73650.94it/s]
100%|██████████| 203/203 [00:00<00:00, 65855.34it/s]
100%|██████████| 153/153 [00:00<00:00, 76478.19it/s]
100%|██████████| 200/200 [00:00<00:00, 73410.41it/s]
100%|██████████| 65/65 [00:00<00:00, 56786.04it/s]
100%|██████████| 144/144 [00:00<00:00, 68431.88it/s]
100%|██████████| 30/30 [00:00<00:00, 65604.34it/s]
100%|██████████| 130/130 [00:00<00:00, 61500.06it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74234.72it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 167.45it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 57753.19it/s]
100%|██████████| 287/287 [00:00<00:00, 56650.44it/s]
100%|██████████| 771/771 [00:00<00:00, 57011.54it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96707.57it/s]
100%|██████████| 1000/1000 [00:00<00:00, 56441.05it/s]
100%|██████████| 3000/3000 [00:00<00:00, 61579.82it/s]
100%|██████████| 353/353 [00:00<00:00, 57910.17it/s]
100%|██████████| 252/252 [00:00<00:00, 57722.93it/s]
100%|██████████| 203/203 [00:00<00:00, 57105.55it/s]
100%|██████████| 153/153 [00:00<00:00, 52747.70it/s]
100%|██████████| 200/200 [00:00<00:00, 47286.40it/s]
100%|██████████| 65/65 [00:00<00:00, 49923.05it/s]
100%|██████████| 144/144 [00:00<00:00, 56557.71it/s]
100%|██████████| 30/30 [00:00<00:00, 47428.99it/s]
100%|██████████| 130/130 [00:00<00:00, 56062.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 55536.25it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.96it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77986.00it/s]
100%|██████████| 287/287 [00:00<00:00, 72682.36it/s]
100%|██████████| 771/771 [00:00<00:00, 79006.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76910.31it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86980.86it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93351.97it/s]
100%|██████████| 353/353 [00:00<00:00, 87232.03it/s]
100%|██████████| 252/252 [00:00<00:00, 72643.62it/s]
100%|██████████| 203/203 [00:00<00:00, 75650.26it/s]
100%|██████████| 153/153 [00:00<00:00, 76606.01it/s]
100%|██████████| 200/200 [00:00<00:00, 74844.83it/s]
100%|██████████| 65/65 [00:00<00:00, 52408.64it/s]
100%|██████████| 144/144 [00:00<00:00, 69049.93it/s]
100%|██████████| 30/30 [00:00<00:00, 40304.01it/s]
100%|██████████| 130/130 [00:00<00:00, 73753.49it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74401.39it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 167.33it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80416.65it/s]
100%|██████████| 287/287 [00:00<00:00, 78151.35it/s]
100%|██████████| 771/771 [00:00<00:00, 78198.20it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88018.55it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81294.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95511.77it/s]
100%|██████████| 353/353 [00:00<00:00, 79383.91it/s]
100%|██████████| 252/252 [00:00<00:00, 77855.38it/s]
100%|██████████| 203/203 [00:00<00:00, 72162.36it/s]
100%|██████████| 153/153 [00:00<00:00, 76487.31it/s]
100%|██████████| 200/200 [00:00<00:00, 66592.11it/s]
100%|██████████| 65/65 [00:00<00:00, 66044.03it/s]
100%|██████████| 144/144 [00:00<00:00, 77492.91it/s]
100%|██████████| 30/30 [00:00<00:00, 63167.23it/s]
100%|██████████| 130/130 [00:00<00:00, 78443.32it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78253.19it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.21it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80107.63it/s]
100%|██████████| 287/287 [00:00<00:00, 76434.39it/s]
100%|██████████| 771/771 [00:00<00:00, 78132.07it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91028.15it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79659.35it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77338.12it/s]
100%|██████████| 353/353 [00:00<00:00, 78309.06it/s]
100%|██████████| 252/252 [00:00<00:00, 77325.67it/s]
100%|██████████| 203/203 [00:00<00:00, 73750.00it/s]
100%|██████████| 153/153 [00:00<00:00, 78012.22it/s]
100%|██████████| 200/200 [00:00<00:00, 76336.41it/s]
100%|██████████| 65/65 [00:00<00:00, 61848.86it/s]
100%|██████████| 144/144 [00:00<00:00, 69399.03it/s]
100%|██████████| 30/30 [00:00<00:00, 54377.32it/s]
100%|██████████| 130/130 [00:00<00:00, 79160.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76218.89it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 167.87it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81007.44it/s]
100%|██████████| 287/287 [00:00<00:00, 78595.28it/s]
100%|██████████| 771/771 [00:00<00:00, 79987.35it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87281.32it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82724.63it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83667.99it/s]
100%|██████████| 353/353 [00:00<00:00, 81088.19it/s]
100%|██████████| 252/252 [00:00<00:00, 80334.77it/s]
100%|██████████| 203/203 [00:00<00:00, 79499.88it/s]
100%|██████████| 153/153 [00:00<00:00, 77974.30it/s]
100%|██████████| 200/200 [00:00<00:00, 77968.29it/s]
100%|██████████| 65/65 [00:00<00:00, 68637.91it/s]
100%|██████████| 144/144 [00:00<00:00, 73935.58it/s]
100%|██████████| 30/30 [00:00<00:00, 67686.46it/s]
100%|██████████| 130/130 [00:00<00:00, 75468.45it/s]
100%|██████████| 3500/3500 [00:00<00:00, 97285.33it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.59it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82513.34it/s]
100%|██████████| 287/287 [00:00<00:00, 77687.33it/s]
100%|██████████| 771/771 [00:00<00:00, 82178.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78152.06it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82630.10it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78751.98it/s]
100%|██████████| 353/353 [00:00<00:00, 79188.60it/s]
100%|██████████| 252/252 [00:00<00:00, 78091.22it/s]
100%|██████████| 203/203 [00:00<00:00, 66095.61it/s]
100%|██████████| 153/153 [00:00<00:00, 75899.29it/s]
100%|██████████| 200/200 [00:00<00:00, 71295.33it/s]
100%|██████████| 65/65 [00:00<00:00, 72143.36it/s]
100%|██████████| 144/144 [00:00<00:00, 77116.93it/s]
100%|██████████| 30/30 [00:00<00:00, 55899.21it/s]
100%|██████████| 130/130 [00:00<00:00, 75846.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77742.63it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [02:28<00:00, 39.37it/s]
INFO:root:The new embedding has 5824 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 50556.95it/s]
100%|██████████| 287/287 [00:00<00:00, 74726.26it/s]
100%|██████████| 771/771 [00:00<00:00, 77806.85it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87110.02it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79362.42it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83631.84it/s]
100%|██████████| 353/353 [00:00<00:00, 85135.38it/s]
100%|██████████| 252/252 [00:00<00:00, 77331.33it/s]
100%|██████████| 203/203 [00:00<00:00, 71785.15it/s]
100%|██████████| 153/153 [00:00<00:00, 75675.53it/s]
100%|██████████| 200/200 [00:00<00:00, 74406.67it/s]
100%|██████████| 65/65 [00:00<00:00, 66657.64it/s]
100%|██████████| 144/144 [00:00<00:00, 77662.31it/s]
100%|██████████| 30/30 [00:00<00:00, 60032.98it/s]
100%|██████████| 130/130 [00:00<00:00, 68114.87it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90304.96it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:56<00:00, 102.84it/s]
INFO:root:The new embedding has 5824 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 69364.64it/s]
100%|██████████| 287/287 [00:00<00:00, 72411.29it/s]
100%|██████████| 771/771 [00:00<00:00, 76454.79it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91077.56it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78847.71it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83063.20it/s]
100%|██████████| 353/353 [00:00<00:00, 76433.29it/s]
100%|██████████| 252/252 [00:00<00:00, 74723.55it/s]
100%|██████████| 203/203 [00:00<00:00, 73469.99it/s]
100%|██████████| 153/153 [00:00<00:00, 74051.29it/s]
100%|██████████| 200/200 [00:00<00:00, 73914.95it/s]
100%|██████████| 65/65 [00:00<00:00, 60814.13it/s]
100%|██████████| 144/144 [00:00<00:00, 67265.82it/s]
100%|██████████| 30/30 [00:00<00:00, 53819.13it/s]
100%|██████████| 130/130 [00:00<00:00, 61045.62it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93206.16it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 102.25it/s]
INFO:root:The new embedding has 5824 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 78179.52it/s]
100%|██████████| 287/287 [00:00<00:00, 74642.85it/s]
100%|██████████| 771/771 [00:00<00:00, 76267.27it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75959.69it/s]
100%|██████████| 1000/1000 [00:00<00:00, 95212.57it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90025.84it/s]
100%|██████████| 353/353 [00:00<00:00, 75497.90it/s]
100%|██████████| 252/252 [00:00<00:00, 77501.44it/s]
100%|██████████| 203/203 [00:00<00:00, 71730.73it/s]
100%|██████████| 153/153 [00:00<00:00, 50307.97it/s]
100%|██████████| 200/200 [00:00<00:00, 46053.30it/s]
100%|██████████| 65/65 [00:00<00:00, 42320.67it/s]
100%|██████████| 144/144 [00:00<00:00, 43520.66it/s]
100%|██████████| 30/30 [00:00<00:00, 36802.90it/s]
100%|██████████| 130/130 [00:00<00:00, 55553.70it/s]
100%|██████████| 3500/3500 [00:00<00:00, 67077.59it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:56<00:00, 103.10it/s]
INFO:root:The new embedding has 5824 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 94537.92it/s]
100%|██████████| 287/287 [00:00<00:00, 75570.67it/s]
100%|██████████| 771/771 [00:00<00:00, 76469.26it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78377.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88695.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76968.18it/s]
100%|██████████| 353/353 [00:00<00:00, 74886.92it/s]
100%|██████████| 252/252 [00:00<00:00, 74639.12it/s]
100%|██████████| 203/203 [00:00<00:00, 75017.07it/s]
100%|██████████| 153/153 [00:00<00:00, 73812.80it/s]
100%|██████████| 200/200 [00:00<00:00, 71673.00it/s]
100%|██████████| 65/65 [00:00<00:00, 65567.52it/s]
100%|██████████| 144/144 [00:00<00:00, 68884.55it/s]
100%|██████████| 30/30 [00:00<00:00, 55480.21it/s]
100%|██████████| 130/130 [00:00<00:00, 71313.04it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88015.25it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 101.64it/s]
INFO:root:The new embedding has 5824 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76923.68it/s]
100%|██████████| 287/287 [00:00<00:00, 74041.41it/s]
100%|██████████| 771/771 [00:00<00:00, 75802.45it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76594.30it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89119.16it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89900.42it/s]
100%|██████████| 353/353 [00:00<00:00, 76181.60it/s]
100%|██████████| 252/252 [00:00<00:00, 79149.66it/s]
100%|██████████| 203/203 [00:00<00:00, 71706.56it/s]
100%|██████████| 153/153 [00:00<00:00, 75890.32it/s]
100%|██████████| 200/200 [00:00<00:00, 72988.85it/s]
100%|██████████| 65/65 [00:00<00:00, 72296.41it/s]
100%|██████████| 144/144 [00:00<00:00, 74666.80it/s]
100%|██████████| 30/30 [00:00<00:00, 66611.50it/s]
100%|██████████| 130/130 [00:00<00:00, 66985.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81767.60it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:56<00:00, 102.79it/s]
INFO:root:The new embedding has 5824 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76185.20it/s]
100%|██████████| 287/287 [00:00<00:00, 72367.76it/s]
100%|██████████| 771/771 [00:00<00:00, 75173.38it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75008.12it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72465.51it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91904.44it/s]
100%|██████████| 353/353 [00:00<00:00, 74483.82it/s]
100%|██████████| 252/252 [00:00<00:00, 74277.20it/s]
100%|██████████| 203/203 [00:00<00:00, 74051.46it/s]
100%|██████████| 153/153 [00:00<00:00, 76789.34it/s]
100%|██████████| 200/200 [00:00<00:00, 73192.64it/s]
100%|██████████| 65/65 [00:00<00:00, 65599.08it/s]
100%|██████████| 144/144 [00:00<00:00, 75224.78it/s]
100%|██████████| 30/30 [00:00<00:00, 52802.82it/s]
100%|██████████| 130/130 [00:00<00:00, 70174.97it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86764.17it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 102.06it/s]
INFO:root:The new embedding has 5824 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76369.88it/s]
100%|██████████| 287/287 [00:00<00:00, 75622.90it/s]
100%|██████████| 771/771 [00:00<00:00, 74118.92it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75683.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87794.70it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87228.08it/s]
100%|██████████| 353/353 [00:00<00:00, 77656.00it/s]
100%|██████████| 252/252 [00:00<00:00, 73497.30it/s]
100%|██████████| 203/203 [00:00<00:00, 74990.64it/s]
100%|██████████| 153/153 [00:00<00:00, 55894.83it/s]
100%|██████████| 200/200 [00:00<00:00, 69957.53it/s]
100%|██████████| 65/65 [00:00<00:00, 71612.76it/s]
100%|██████████| 144/144 [00:00<00:00, 74629.90it/s]
100%|██████████| 30/30 [00:00<00:00, 66611.50it/s]
100%|██████████| 130/130 [00:00<00:00, 61827.82it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82134.96it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 102.50it/s]
INFO:root:The new embedding has 5824 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77234.20it/s]
100%|██████████| 287/287 [00:00<00:00, 74274.40it/s]
100%|██████████| 771/771 [00:00<00:00, 76734.18it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75550.58it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90264.14it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79217.03it/s]
100%|██████████| 353/353 [00:00<00:00, 69167.02it/s]
100%|██████████| 252/252 [00:00<00:00, 77223.98it/s]
100%|██████████| 203/203 [00:00<00:00, 74557.24it/s]
100%|██████████| 153/153 [00:00<00:00, 75038.41it/s]
100%|██████████| 200/200 [00:00<00:00, 72868.38it/s]
100%|██████████| 65/65 [00:00<00:00, 64133.09it/s]
100%|██████████| 144/144 [00:00<00:00, 74345.12it/s]
100%|██████████| 30/30 [00:00<00:00, 52494.42it/s]
100%|██████████| 130/130 [00:00<00:00, 71584.55it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86469.29it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:56<00:00, 102.67it/s]
INFO:root:The new embedding has 5824 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 79121.37it/s]
100%|██████████| 287/287 [00:00<00:00, 73886.89it/s]
100%|██████████| 771/771 [00:00<00:00, 75813.11it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76487.45it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77017.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75577.58it/s]
100%|██████████| 353/353 [00:00<00:00, 74932.40it/s]
100%|██████████| 252/252 [00:00<00:00, 74644.39it/s]
100%|██████████| 203/203 [00:00<00:00, 73311.84it/s]
100%|██████████| 153/153 [00:00<00:00, 75444.22it/s]
100%|██████████| 200/200 [00:00<00:00, 74764.78it/s]
100%|██████████| 65/65 [00:00<00:00, 63877.64it/s]
100%|██████████| 144/144 [00:00<00:00, 71791.25it/s]
100%|██████████| 30/30 [00:00<00:00, 55019.29it/s]
100%|██████████| 130/130 [00:00<00:00, 71990.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86469.29it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:56<00:00, 103.02it/s]
INFO:root:The new embedding has 5824 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77487.00it/s]
100%|██████████| 287/287 [00:00<00:00, 74991.61it/s]
100%|██████████| 771/771 [00:00<00:00, 75012.95it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76590.11it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86114.73it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73121.60it/s]
100%|██████████| 353/353 [00:00<00:00, 74003.56it/s]
100%|██████████| 252/252 [00:00<00:00, 73080.59it/s]
100%|██████████| 203/203 [00:00<00:00, 73508.05it/s]
100%|██████████| 153/153 [00:00<00:00, 72717.11it/s]
100%|██████████| 200/200 [00:00<00:00, 73914.95it/s]
100%|██████████| 65/65 [00:00<00:00, 64481.97it/s]
100%|██████████| 144/144 [00:00<00:00, 75715.15it/s]
100%|██████████| 30/30 [00:00<00:00, 50984.25it/s]
100%|██████████| 130/130 [00:00<00:00, 71801.36it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86997.10it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 102.34it/s]
INFO:root:The new embedding has 5824 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77673.74it/s]
100%|██████████| 287/287 [00:00<00:00, 79169.04it/s]
100%|██████████| 771/771 [00:00<00:00, 80451.00it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79956.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77600.44it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87550.35it/s]
100%|██████████| 353/353 [00:00<00:00, 75290.58it/s]
100%|██████████| 252/252 [00:00<00:00, 79506.89it/s]
100%|██████████| 203/203 [00:00<00:00, 78669.84it/s]
100%|██████████| 153/153 [00:00<00:00, 73164.81it/s]
100%|██████████| 200/200 [00:00<00:00, 75207.17it/s]
100%|██████████| 65/65 [00:00<00:00, 75208.21it/s]
100%|██████████| 144/144 [00:00<00:00, 78104.20it/s]
100%|██████████| 30/30 [00:00<00:00, 66859.26it/s]
100%|██████████| 130/130 [00:00<00:00, 67432.54it/s]
100%|██████████| 3500/3500 [00:00<00:00, 55515.67it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:56<00:00, 103.04it/s]
INFO:root:The new embedding has 5824 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82544.22it/s]
100%|██████████| 287/287 [00:00<00:00, 79262.87it/s]
100%|██████████| 771/771 [00:00<00:00, 80601.39it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81744.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76158.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80210.82it/s]
100%|██████████| 353/353 [00:00<00:00, 75088.21it/s]
100%|██████████| 252/252 [00:00<00:00, 78725.21it/s]
100%|██████████| 203/203 [00:00<00:00, 77906.83it/s]
100%|██████████| 153/153 [00:00<00:00, 75399.90it/s]
100%|██████████| 200/200 [00:00<00:00, 77729.87it/s]
100%|██████████| 65/65 [00:00<00:00, 66478.85it/s]
100%|██████████| 144/144 [00:00<00:00, 76115.91it/s]
100%|██████████| 30/30 [00:00<00:00, 59493.67it/s]
100%|██████████| 130/130 [00:00<00:00, 79068.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78065.52it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 102.46it/s]
INFO:root:The new embedding has 5824 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80596.08it/s]
100%|██████████| 287/287 [00:00<00:00, 77552.20it/s]
100%|██████████| 771/771 [00:00<00:00, 80149.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81571.09it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79418.02it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79526.44it/s]
100%|██████████| 353/353 [00:00<00:00, 78462.60it/s]
100%|██████████| 252/252 [00:00<00:00, 75610.89it/s]
100%|██████████| 203/203 [00:00<00:00, 71821.49it/s]
100%|██████████| 153/153 [00:00<00:00, 96674.98it/s]
100%|██████████| 200/200 [00:00<00:00, 77122.44it/s]
100%|██████████| 65/65 [00:00<00:00, 65160.08it/s]
100%|██████████| 144/144 [00:00<00:00, 72962.04it/s]
100%|██████████| 30/30 [00:00<00:00, 46260.71it/s]
100%|██████████| 130/130 [00:00<00:00, 76473.99it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77333.09it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:56<00:00, 102.64it/s]
INFO:root:The new embedding has 5824 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81159.64it/s]
100%|██████████| 287/287 [00:00<00:00, 78754.68it/s]
100%|██████████| 771/771 [00:00<00:00, 79581.85it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81556.02it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78161.53it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78099.92it/s]
100%|██████████| 353/353 [00:00<00:00, 79218.26it/s]
100%|██████████| 252/252 [00:00<00:00, 69854.25it/s]
100%|██████████| 203/203 [00:00<00:00, 77277.52it/s]
100%|██████████| 153/153 [00:00<00:00, 76835.31it/s]
100%|██████████| 200/200 [00:00<00:00, 77722.67it/s]
100%|██████████| 65/65 [00:00<00:00, 63817.83it/s]
100%|██████████| 144/144 [00:00<00:00, 77255.02it/s]
100%|██████████| 30/30 [00:00<00:00, 69866.25it/s]
100%|██████████| 130/130 [00:00<00:00, 75709.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76553.56it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 101.97it/s]
INFO:root:The new embedding has 5824 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79988.35it/s]
100%|██████████| 287/287 [00:00<00:00, 77238.71it/s]
100%|██████████| 771/771 [00:00<00:00, 79904.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80285.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91562.70it/s]
100%|██████████| 3000/3000 [00:00<00:00, 57798.26it/s]
100%|██████████| 353/353 [00:00<00:00, 78625.10it/s]
100%|██████████| 252/252 [00:00<00:00, 80067.01it/s]
100%|██████████| 203/203 [00:00<00:00, 74688.04it/s]
100%|██████████| 153/153 [00:00<00:00, 80175.98it/s]
100%|██████████| 200/200 [00:00<00:00, 80729.55it/s]
100%|██████████| 65/65 [00:00<00:00, 75458.00it/s]
100%|██████████| 144/144 [00:00<00:00, 73926.53it/s]
100%|██████████| 30/30 [00:00<00:00, 57640.46it/s]
100%|██████████| 130/130 [00:00<00:00, 72219.80it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78749.37it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:56<00:00, 103.09it/s]
INFO:root:The new embedding has 5824 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 51171.29it/s]
100%|██████████| 287/287 [00:00<00:00, 47147.32it/s]
100%|██████████| 771/771 [00:00<00:00, 76975.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78996.21it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76514.66it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78489.65it/s]
100%|██████████| 353/353 [00:00<00:00, 75958.82it/s]
100%|██████████| 252/252 [00:00<00:00, 78224.14it/s]
100%|██████████| 203/203 [00:00<00:00, 74206.35it/s]
100%|██████████| 153/153 [00:00<00:00, 80609.03it/s]
100%|██████████| 200/200 [00:00<00:00, 80281.44it/s]
100%|██████████| 65/65 [00:00<00:00, 68793.78it/s]
100%|██████████| 144/144 [00:00<00:00, 72646.11it/s]
100%|██████████| 30/30 [00:00<00:00, 56425.61it/s]
100%|██████████| 130/130 [00:00<00:00, 71981.45it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88499.16it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [01:01<00:00, 95.02it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 101308.26it/s]
100%|██████████| 287/287 [00:00<00:00, 75556.44it/s]
100%|██████████| 771/771 [00:00<00:00, 79000.55it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74675.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77689.56it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78373.79it/s]
100%|██████████| 353/353 [00:00<00:00, 78529.19it/s]
100%|██████████| 252/252 [00:00<00:00, 77924.26it/s]
100%|██████████| 203/203 [00:00<00:00, 75805.17it/s]
100%|██████████| 153/153 [00:00<00:00, 73829.79it/s]
100%|██████████| 200/200 [00:00<00:00, 72011.40it/s]
100%|██████████| 65/65 [00:00<00:00, 64421.02it/s]
100%|██████████| 144/144 [00:00<00:00, 75876.86it/s]
100%|██████████| 30/30 [00:00<00:00, 65638.56it/s]
100%|██████████| 130/130 [00:00<00:00, 53435.86it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77724.11it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 475.49it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 90751.98it/s]
100%|██████████| 287/287 [00:00<00:00, 76163.57it/s]
100%|██████████| 771/771 [00:00<00:00, 77037.62it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75460.87it/s]
100%|██████████| 1000/1000 [00:00<00:00, 66354.02it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73127.13it/s]
100%|██████████| 353/353 [00:00<00:00, 76111.10it/s]
100%|██████████| 252/252 [00:00<00:00, 80353.09it/s]
100%|██████████| 203/203 [00:00<00:00, 76376.36it/s]
100%|██████████| 153/153 [00:00<00:00, 78192.82it/s]
100%|██████████| 200/200 [00:00<00:00, 75539.02it/s]
100%|██████████| 65/65 [00:00<00:00, 70265.40it/s]
100%|██████████| 144/144 [00:00<00:00, 73289.62it/s]
100%|██████████| 30/30 [00:00<00:00, 54732.11it/s]
100%|██████████| 130/130 [00:00<00:00, 70721.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92040.33it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 461.88it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 74414.11it/s]
100%|██████████| 287/287 [00:00<00:00, 75244.73it/s]
100%|██████████| 771/771 [00:00<00:00, 98393.73it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76602.00it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73469.57it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77806.30it/s]
100%|██████████| 353/353 [00:00<00:00, 76825.93it/s]
100%|██████████| 252/252 [00:00<00:00, 75492.08it/s]
100%|██████████| 203/203 [00:00<00:00, 74485.50it/s]
100%|██████████| 153/153 [00:00<00:00, 71342.80it/s]
100%|██████████| 200/200 [00:00<00:00, 74585.29it/s]
100%|██████████| 65/65 [00:00<00:00, 74104.31it/s]
100%|██████████| 144/144 [00:00<00:00, 77393.62it/s]
100%|██████████| 30/30 [00:00<00:00, 47180.02it/s]
100%|██████████| 130/130 [00:00<00:00, 69672.82it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92608.77it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 474.53it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 79130.34it/s]
100%|██████████| 287/287 [00:00<00:00, 76192.50it/s]
100%|██████████| 771/771 [00:00<00:00, 78073.60it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77032.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82625.22it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76674.58it/s]
100%|██████████| 353/353 [00:00<00:00, 70017.46it/s]
100%|██████████| 252/252 [00:00<00:00, 76475.26it/s]
100%|██████████| 203/203 [00:00<00:00, 79299.96it/s]
100%|██████████| 153/153 [00:00<00:00, 64860.37it/s]
100%|██████████| 200/200 [00:00<00:00, 76524.43it/s]
100%|██████████| 65/65 [00:00<00:00, 64148.18it/s]
100%|██████████| 144/144 [00:00<00:00, 75131.21it/s]
100%|██████████| 30/30 [00:00<00:00, 57221.06it/s]
100%|██████████| 130/130 [00:00<00:00, 67158.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 94150.05it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:13<00:00, 444.61it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 73428.25it/s]
100%|██████████| 287/287 [00:00<00:00, 75842.06it/s]
100%|██████████| 771/771 [00:00<00:00, 78744.69it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80510.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77315.78it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80023.61it/s]
100%|██████████| 353/353 [00:00<00:00, 78591.71it/s]
100%|██████████| 252/252 [00:00<00:00, 78789.76it/s]
100%|██████████| 203/203 [00:00<00:00, 74589.90it/s]
100%|██████████| 153/153 [00:00<00:00, 78450.92it/s]
100%|██████████| 200/200 [00:00<00:00, 65275.92it/s]
100%|██████████| 65/65 [00:00<00:00, 66124.12it/s]
100%|██████████| 144/144 [00:00<00:00, 72445.70it/s]
100%|██████████| 30/30 [00:00<00:00, 52648.17it/s]
100%|██████████| 130/130 [00:00<00:00, 72392.40it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93636.59it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 477.60it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 76915.21it/s]
100%|██████████| 287/287 [00:00<00:00, 72055.86it/s]
100%|██████████| 771/771 [00:00<00:00, 76623.27it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75626.19it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84594.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75220.66it/s]
100%|██████████| 353/353 [00:00<00:00, 73050.59it/s]
100%|██████████| 252/252 [00:00<00:00, 77071.94it/s]
100%|██████████| 203/203 [00:00<00:00, 76082.90it/s]
100%|██████████| 153/153 [00:00<00:00, 73407.52it/s]
100%|██████████| 200/200 [00:00<00:00, 75935.62it/s]
100%|██████████| 65/65 [00:00<00:00, 74003.74it/s]
100%|██████████| 144/144 [00:00<00:00, 66576.25it/s]
100%|██████████| 30/30 [00:00<00:00, 58281.20it/s]
100%|██████████| 130/130 [00:00<00:00, 71219.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92947.68it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 458.05it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 75517.88it/s]
100%|██████████| 287/287 [00:00<00:00, 76551.05it/s]
100%|██████████| 771/771 [00:00<00:00, 78160.40it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77030.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88528.52it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75336.85it/s]
100%|██████████| 353/353 [00:00<00:00, 76091.55it/s]
100%|██████████| 252/252 [00:00<00:00, 76177.63it/s]
100%|██████████| 203/203 [00:00<00:00, 74970.83it/s]
100%|██████████| 153/153 [00:00<00:00, 72601.94it/s]
100%|██████████| 200/200 [00:00<00:00, 75641.19it/s]
100%|██████████| 65/65 [00:00<00:00, 73663.81it/s]
100%|██████████| 144/144 [00:00<00:00, 71224.03it/s]
100%|██████████| 30/30 [00:00<00:00, 53003.00it/s]
100%|██████████| 130/130 [00:00<00:00, 68568.85it/s]
100%|██████████| 3500/3500 [00:00<00:00, 70331.41it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 472.06it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 90121.51it/s]
100%|██████████| 287/287 [00:00<00:00, 76052.90it/s]
100%|██████████| 771/771 [00:00<00:00, 76854.54it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76729.52it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88195.30it/s]
100%|██████████| 3000/3000 [00:00<00:00, 94443.62it/s]
100%|██████████| 353/353 [00:00<00:00, 78127.24it/s]
100%|██████████| 252/252 [00:00<00:00, 73527.97it/s]
100%|██████████| 203/203 [00:00<00:00, 60726.32it/s]
100%|██████████| 153/153 [00:00<00:00, 70334.12it/s]
100%|██████████| 200/200 [00:00<00:00, 70279.89it/s]
100%|██████████| 65/65 [00:00<00:00, 65175.65it/s]
100%|██████████| 144/144 [00:00<00:00, 67288.30it/s]
100%|██████████| 30/30 [00:00<00:00, 60611.33it/s]
100%|██████████| 130/130 [00:00<00:00, 74509.36it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72967.26it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 464.16it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 79492.13it/s]
100%|██████████| 287/287 [00:00<00:00, 74661.37it/s]
100%|██████████| 771/771 [00:00<00:00, 76825.32it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76131.34it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76340.58it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89813.79it/s]
100%|██████████| 353/353 [00:00<00:00, 74796.13it/s]
100%|██████████| 252/252 [00:00<00:00, 77348.31it/s]
100%|██████████| 203/203 [00:00<00:00, 72997.57it/s]
100%|██████████| 153/153 [00:00<00:00, 75187.87it/s]
100%|██████████| 200/200 [00:00<00:00, 94893.76it/s]
100%|██████████| 65/65 [00:00<00:00, 65884.43it/s]
100%|██████████| 144/144 [00:00<00:00, 73827.13it/s]
100%|██████████| 30/30 [00:00<00:00, 56654.26it/s]
100%|██████████| 130/130 [00:00<00:00, 71735.23it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74110.67it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 476.35it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 78065.91it/s]
100%|██████████| 287/287 [00:00<00:00, 75622.90it/s]
100%|██████████| 771/771 [00:00<00:00, 77786.26it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78759.62it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85599.79it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76825.79it/s]
100%|██████████| 353/353 [00:00<00:00, 74641.53it/s]
100%|██████████| 252/252 [00:00<00:00, 80036.70it/s]
100%|██████████| 203/203 [00:00<00:00, 85641.09it/s]
100%|██████████| 153/153 [00:00<00:00, 76314.49it/s]
100%|██████████| 200/200 [00:00<00:00, 78589.17it/s]
100%|██████████| 65/65 [00:00<00:00, 66903.01it/s]
100%|██████████| 144/144 [00:00<00:00, 75000.59it/s]
100%|██████████| 30/30 [00:00<00:00, 59890.11it/s]
100%|██████████| 130/130 [00:00<00:00, 101274.06it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84056.59it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:42<00:00, 138.33it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76120.15it/s]
100%|██████████| 287/287 [00:00<00:00, 61922.08it/s]
100%|██████████| 771/771 [00:00<00:00, 89783.12it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76009.24it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79838.28it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74237.22it/s]
100%|██████████| 353/353 [00:00<00:00, 80109.80it/s]
100%|██████████| 252/252 [00:00<00:00, 75621.71it/s]
100%|██████████| 203/203 [00:00<00:00, 72377.06it/s]
100%|██████████| 153/153 [00:00<00:00, 76305.41it/s]
100%|██████████| 200/200 [00:00<00:00, 76692.34it/s]
100%|██████████| 65/65 [00:00<00:00, 70410.58it/s]
100%|██████████| 144/144 [00:00<00:00, 72005.22it/s]
100%|██████████| 30/30 [00:00<00:00, 51909.70it/s]
100%|██████████| 130/130 [00:00<00:00, 65222.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84225.87it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 225.55it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76467.44it/s]
100%|██████████| 287/287 [00:00<00:00, 64980.58it/s]
100%|██████████| 771/771 [00:00<00:00, 89186.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 97100.49it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78126.59it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73102.49it/s]
100%|██████████| 353/353 [00:00<00:00, 70544.56it/s]
100%|██████████| 252/252 [00:00<00:00, 72603.70it/s]
100%|██████████| 203/203 [00:00<00:00, 73110.40it/s]
100%|██████████| 153/153 [00:00<00:00, 76368.98it/s]
100%|██████████| 200/200 [00:00<00:00, 65316.58it/s]
100%|██████████| 65/65 [00:00<00:00, 62215.83it/s]
100%|██████████| 144/144 [00:00<00:00, 71714.53it/s]
100%|██████████| 30/30 [00:00<00:00, 66191.02it/s]
100%|██████████| 130/130 [00:00<00:00, 67658.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84591.33it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:26<00:00, 223.13it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 80327.24it/s]
100%|██████████| 287/287 [00:00<00:00, 70473.93it/s]
100%|██████████| 771/771 [00:00<00:00, 79423.53it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74696.87it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83675.22it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95038.54it/s]
100%|██████████| 353/353 [00:00<00:00, 71733.98it/s]
100%|██████████| 252/252 [00:00<00:00, 63584.47it/s]
100%|██████████| 203/203 [00:00<00:00, 65304.78it/s]
100%|██████████| 153/153 [00:00<00:00, 68524.13it/s]
100%|██████████| 200/200 [00:00<00:00, 75552.63it/s]
100%|██████████| 65/65 [00:00<00:00, 65900.35it/s]
100%|██████████| 144/144 [00:00<00:00, 76366.14it/s]
100%|██████████| 30/30 [00:00<00:00, 65095.25it/s]
100%|██████████| 130/130 [00:00<00:00, 73893.42it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84929.50it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 226.11it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76203.21it/s]
100%|██████████| 287/287 [00:00<00:00, 72233.14it/s]
100%|██████████| 771/771 [00:00<00:00, 77878.06it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76156.22it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75723.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91997.84it/s]
100%|██████████| 353/353 [00:00<00:00, 75413.30it/s]
100%|██████████| 252/252 [00:00<00:00, 73262.95it/s]
100%|██████████| 203/203 [00:00<00:00, 62436.29it/s]
100%|██████████| 153/153 [00:00<00:00, 64437.04it/s]
100%|██████████| 200/200 [00:00<00:00, 71581.26it/s]
100%|██████████| 65/65 [00:00<00:00, 68396.83it/s]
100%|██████████| 144/144 [00:00<00:00, 72220.47it/s]
100%|██████████| 30/30 [00:00<00:00, 58661.59it/s]
100%|██████████| 130/130 [00:00<00:00, 71359.71it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73994.12it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:26<00:00, 223.31it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76991.52it/s]
100%|██████████| 287/287 [00:00<00:00, 82761.45it/s]
100%|██████████| 771/771 [00:00<00:00, 88097.87it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76293.36it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79175.16it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74114.35it/s]
100%|██████████| 353/353 [00:00<00:00, 73507.56it/s]
100%|██████████| 252/252 [00:00<00:00, 69988.39it/s]
100%|██████████| 203/203 [00:00<00:00, 72235.83it/s]
100%|██████████| 153/153 [00:00<00:00, 72956.86it/s]
100%|██████████| 200/200 [00:00<00:00, 76440.75it/s]
100%|██████████| 65/65 [00:00<00:00, 70030.76it/s]
100%|██████████| 144/144 [00:00<00:00, 74244.59it/s]
100%|██████████| 30/30 [00:00<00:00, 66894.80it/s]
100%|██████████| 130/130 [00:00<00:00, 74164.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79272.00it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 227.96it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77508.50it/s]
100%|██████████| 287/287 [00:00<00:00, 75296.51it/s]
100%|██████████| 771/771 [00:00<00:00, 91319.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94325.03it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75844.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92193.99it/s]
100%|██████████| 353/353 [00:00<00:00, 77668.22it/s]
100%|██████████| 252/252 [00:00<00:00, 73232.50it/s]
100%|██████████| 203/203 [00:00<00:00, 73343.42it/s]
100%|██████████| 153/153 [00:00<00:00, 70752.87it/s]
100%|██████████| 200/200 [00:00<00:00, 82136.57it/s]
100%|██████████| 65/65 [00:00<00:00, 70066.76it/s]
100%|██████████| 144/144 [00:00<00:00, 75705.66it/s]
100%|██████████| 30/30 [00:00<00:00, 64133.09it/s]
100%|██████████| 130/130 [00:00<00:00, 72614.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76813.53it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:26<00:00, 224.42it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76271.18it/s]
100%|██████████| 287/287 [00:00<00:00, 73588.78it/s]
100%|██████████| 771/771 [00:00<00:00, 73792.49it/s]
100%|██████████| 2000/2000 [00:00<00:00, 73372.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87658.92it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74963.43it/s]
100%|██████████| 353/353 [00:00<00:00, 73653.83it/s]
100%|██████████| 252/252 [00:00<00:00, 72658.60it/s]
100%|██████████| 203/203 [00:00<00:00, 72518.84it/s]
100%|██████████| 153/153 [00:00<00:00, 73567.41it/s]
100%|██████████| 200/200 [00:00<00:00, 73403.99it/s]
100%|██████████| 65/65 [00:00<00:00, 62948.46it/s]
100%|██████████| 144/144 [00:00<00:00, 75772.15it/s]
100%|██████████| 30/30 [00:00<00:00, 67759.35it/s]
100%|██████████| 130/130 [00:00<00:00, 61416.93it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83799.89it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 226.97it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75060.63it/s]
100%|██████████| 287/287 [00:00<00:00, 69925.37it/s]
100%|██████████| 771/771 [00:00<00:00, 83028.87it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75278.71it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74327.56it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93241.29it/s]
100%|██████████| 353/353 [00:00<00:00, 68148.27it/s]
100%|██████████| 252/252 [00:00<00:00, 72994.79it/s]
100%|██████████| 203/203 [00:00<00:00, 67350.40it/s]
100%|██████████| 153/153 [00:00<00:00, 75613.12it/s]
100%|██████████| 200/200 [00:00<00:00, 74958.52it/s]
100%|██████████| 65/65 [00:00<00:00, 63490.86it/s]
100%|██████████| 144/144 [00:00<00:00, 76279.34it/s]
100%|██████████| 30/30 [00:00<00:00, 65672.82it/s]
100%|██████████| 130/130 [00:00<00:00, 70868.15it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77758.28it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:26<00:00, 224.46it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 62961.83it/s]
100%|██████████| 287/287 [00:00<00:00, 65883.93it/s]
100%|██████████| 771/771 [00:00<00:00, 91968.84it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76109.24it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74226.27it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75975.51it/s]
100%|██████████| 353/353 [00:00<00:00, 73108.30it/s]
100%|██████████| 252/252 [00:00<00:00, 72868.98it/s]
100%|██████████| 203/203 [00:00<00:00, 76679.01it/s]
100%|██████████| 153/153 [00:00<00:00, 72882.28it/s]
100%|██████████| 200/200 [00:00<00:00, 72434.23it/s]
100%|██████████| 65/65 [00:00<00:00, 62372.40it/s]
100%|██████████| 144/144 [00:00<00:00, 70418.54it/s]
100%|██████████| 30/30 [00:00<00:00, 61680.94it/s]
100%|██████████| 130/130 [00:00<00:00, 57693.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88372.37it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 227.39it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77861.37it/s]
100%|██████████| 287/287 [00:00<00:00, 75808.63it/s]
100%|██████████| 771/771 [00:00<00:00, 76489.15it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74977.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85284.75it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74189.51it/s]
100%|██████████| 353/353 [00:00<00:00, 74151.82it/s]
100%|██████████| 252/252 [00:00<00:00, 69569.18it/s]
100%|██████████| 203/203 [00:00<00:00, 75342.33it/s]
100%|██████████| 153/153 [00:00<00:00, 78393.42it/s]
100%|██████████| 200/200 [00:00<00:00, 76594.30it/s]
100%|██████████| 65/65 [00:00<00:00, 66739.23it/s]
100%|██████████| 144/144 [00:00<00:00, 73085.65it/s]
100%|██████████| 30/30 [00:00<00:00, 63743.22it/s]
100%|██████████| 130/130 [00:00<00:00, 75104.62it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86726.24it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 225.40it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80234.95it/s]
100%|██████████| 287/287 [00:00<00:00, 76922.82it/s]
100%|██████████| 771/771 [00:00<00:00, 71166.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79995.88it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80076.06it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98927.71it/s]
100%|██████████| 353/353 [00:00<00:00, 78918.46it/s]
100%|██████████| 252/252 [00:00<00:00, 76067.98it/s]
100%|██████████| 203/203 [00:00<00:00, 54928.31it/s]
100%|██████████| 153/153 [00:00<00:00, 52304.88it/s]
100%|██████████| 200/200 [00:00<00:00, 56178.73it/s]
100%|██████████| 65/65 [00:00<00:00, 53582.89it/s]
100%|██████████| 144/144 [00:00<00:00, 51595.74it/s]
100%|██████████| 30/30 [00:00<00:00, 40906.74it/s]
100%|██████████| 130/130 [00:00<00:00, 56685.68it/s]
100%|██████████| 3500/3500 [00:00<00:00, 56917.34it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 228.13it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80199.63it/s]
100%|██████████| 287/287 [00:00<00:00, 76590.01it/s]
100%|██████████| 771/771 [00:00<00:00, 90514.41it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79738.10it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80077.59it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78049.05it/s]
100%|██████████| 353/353 [00:00<00:00, 77307.29it/s]
100%|██████████| 252/252 [00:00<00:00, 77620.96it/s]
100%|██████████| 203/203 [00:00<00:00, 56234.31it/s]
100%|██████████| 153/153 [00:00<00:00, 59380.82it/s]
100%|██████████| 200/200 [00:00<00:00, 59149.68it/s]
100%|██████████| 65/65 [00:00<00:00, 48057.42it/s]
100%|██████████| 144/144 [00:00<00:00, 58953.61it/s]
100%|██████████| 30/30 [00:00<00:00, 42139.69it/s]
100%|██████████| 130/130 [00:00<00:00, 57323.33it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76379.11it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:26<00:00, 223.71it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76713.84it/s]
100%|██████████| 287/287 [00:00<00:00, 75698.98it/s]
100%|██████████| 771/771 [00:00<00:00, 78775.39it/s]
100%|██████████| 2000/2000 [00:00<00:00, 58517.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76147.93it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77613.85it/s]
100%|██████████| 353/353 [00:00<00:00, 71964.10it/s]
100%|██████████| 252/252 [00:00<00:00, 76530.64it/s]
100%|██████████| 203/203 [00:00<00:00, 80575.73it/s]
100%|██████████| 153/153 [00:00<00:00, 73516.84it/s]
100%|██████████| 200/200 [00:00<00:00, 75942.50it/s]
100%|██████████| 65/65 [00:00<00:00, 66706.57it/s]
100%|██████████| 144/144 [00:00<00:00, 73935.58it/s]
100%|██████████| 30/30 [00:00<00:00, 66859.26it/s]
100%|██████████| 130/130 [00:00<00:00, 66771.92it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76918.17it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 225.42it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80476.89it/s]
100%|██████████| 287/287 [00:00<00:00, 74949.58it/s]
100%|██████████| 771/771 [00:00<00:00, 72122.05it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79549.06it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78049.54it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77825.06it/s]
100%|██████████| 353/353 [00:00<00:00, 77085.92it/s]
100%|██████████| 252/252 [00:00<00:00, 75953.19it/s]
100%|██████████| 203/203 [00:00<00:00, 70309.14it/s]
100%|██████████| 153/153 [00:00<00:00, 76780.15it/s]
100%|██████████| 200/200 [00:00<00:00, 75491.43it/s]
100%|██████████| 65/65 [00:00<00:00, 66968.74it/s]
100%|██████████| 144/144 [00:00<00:00, 71876.68it/s]
100%|██████████| 30/30 [00:00<00:00, 47698.68it/s]
100%|██████████| 130/130 [00:00<00:00, 66911.22it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84242.30it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:26<00:00, 224.05it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78779.23it/s]
100%|██████████| 287/287 [00:00<00:00, 74009.54it/s]
100%|██████████| 771/771 [00:00<00:00, 77057.82it/s]
100%|██████████| 2000/2000 [00:00<00:00, 102253.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79818.53it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79265.93it/s]
100%|██████████| 353/353 [00:00<00:00, 79734.47it/s]
100%|██████████| 252/252 [00:00<00:00, 77071.94it/s]
100%|██████████| 203/203 [00:00<00:00, 71262.45it/s]
100%|██████████| 153/153 [00:00<00:00, 75818.59it/s]
100%|██████████| 200/200 [00:00<00:00, 70819.82it/s]
100%|██████████| 65/65 [00:00<00:00, 64148.18it/s]
100%|██████████| 144/144 [00:00<00:00, 73863.25it/s]
100%|██████████| 30/30 [00:00<00:00, 68052.53it/s]
100%|██████████| 130/130 [00:00<00:00, 74580.70it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77315.58it/s]
100%|██████████| 20

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 228.10it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80227.27it/s]
100%|██████████| 287/287 [00:00<00:00, 43723.99it/s]
100%|██████████| 771/771 [00:00<00:00, 79880.65it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79834.48it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80737.32it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76128.12it/s]
100%|██████████| 353/353 [00:00<00:00, 80144.49it/s]
100%|██████████| 252/252 [00:00<00:00, 63283.72it/s]
100%|██████████| 203/203 [00:00<00:00, 71640.19it/s]
100%|██████████| 153/153 [00:00<00:00, 66260.04it/s]
100%|██████████| 200/200 [00:00<00:00, 75274.66it/s]
100%|██████████| 65/65 [00:00<00:00, 73366.46it/s]
100%|██████████| 144/144 [00:00<00:00, 79137.81it/s]
100%|██████████| 30/30 [00:00<00:00, 69174.89it/s]
100%|██████████| 130/130 [00:00<00:00, 74468.66it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81078.00it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [04:03<00:00, 24.04it/s]
INFO:root:The new embedding has 5812 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 51151.30it/s]
100%|██████████| 287/287 [00:00<00:00, 57759.48it/s]
100%|██████████| 771/771 [00:00<00:00, 80790.68it/s]
100%|██████████| 2000/2000 [00:00<00:00, 65486.88it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80554.35it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78713.06it/s]
100%|██████████| 353/353 [00:00<00:00, 67854.69it/s]
100%|██████████| 252/252 [00:00<00:00, 69250.12it/s]
100%|██████████| 203/203 [00:00<00:00, 70343.99it/s]
100%|██████████| 153/153 [00:00<00:00, 69144.33it/s]
100%|██████████| 200/200 [00:00<00:00, 65917.08it/s]
100%|██████████| 65/65 [00:00<00:00, 60854.86it/s]
100%|██████████| 144/144 [00:00<00:00, 73387.58it/s]
100%|██████████| 30/30 [00:00<00:00, 34332.64it/s]
100%|██████████| 130/130 [00:00<00:00, 65781.10it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79305.40it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:34<00:00, 37.88it/s]
INFO:root:The new embedding has 5812 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 67161.03it/s]
100%|██████████| 287/287 [00:00<00:00, 78070.25it/s]
100%|██████████| 771/771 [00:00<00:00, 90636.18it/s]
100%|██████████| 2000/2000 [00:00<00:00, 73957.31it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90632.78it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76095.43it/s]
100%|██████████| 353/353 [00:00<00:00, 75679.27it/s]
100%|██████████| 252/252 [00:00<00:00, 72788.69it/s]
100%|██████████| 203/203 [00:00<00:00, 74103.02it/s]
100%|██████████| 153/153 [00:00<00:00, 74663.00it/s]
100%|██████████| 200/200 [00:00<00:00, 76357.25it/s]
100%|██████████| 65/65 [00:00<00:00, 65536.00it/s]
100%|██████████| 144/144 [00:00<00:00, 72759.88it/s]
100%|██████████| 30/30 [00:00<00:00, 64067.78it/s]
100%|██████████| 130/130 [00:00<00:00, 70129.84it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89380.69it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:34<00:00, 37.83it/s]
INFO:root:The new embedding has 5812 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75556.01it/s]
100%|██████████| 287/287 [00:00<00:00, 74155.44it/s]
100%|██████████| 771/771 [00:00<00:00, 83274.75it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75872.43it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73262.95it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74480.22it/s]
100%|██████████| 353/353 [00:00<00:00, 70256.68it/s]
100%|██████████| 252/252 [00:00<00:00, 77100.05it/s]
100%|██████████| 203/203 [00:00<00:00, 71712.60it/s]
100%|██████████| 153/153 [00:00<00:00, 71430.15it/s]
100%|██████████| 200/200 [00:00<00:00, 67007.01it/s]
100%|██████████| 65/65 [00:00<00:00, 65836.70it/s]
100%|██████████| 144/144 [00:00<00:00, 73836.16it/s]
100%|██████████| 30/30 [00:00<00:00, 61923.78it/s]
100%|██████████| 130/130 [00:00<00:00, 75458.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85098.37it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:35<00:00, 37.69it/s]
INFO:root:The new embedding has 5812 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 69288.93it/s]
100%|██████████| 287/287 [00:00<00:00, 61744.22it/s]
100%|██████████| 771/771 [00:00<00:00, 56887.18it/s]
100%|██████████| 2000/2000 [00:00<00:00, 58597.67it/s]
100%|██████████| 1000/1000 [00:00<00:00, 57110.43it/s]
100%|██████████| 3000/3000 [00:00<00:00, 72679.40it/s]
100%|██████████| 353/353 [00:00<00:00, 77566.50it/s]
100%|██████████| 252/252 [00:00<00:00, 76586.09it/s]
100%|██████████| 203/203 [00:00<00:00, 73807.53it/s]
100%|██████████| 153/153 [00:00<00:00, 75003.33it/s]
100%|██████████| 200/200 [00:00<00:00, 77002.09it/s]
100%|██████████| 65/65 [00:00<00:00, 64726.91it/s]
100%|██████████| 144/144 [00:00<00:00, 64548.44it/s]
100%|██████████| 30/30 [00:00<00:00, 65433.76it/s]
100%|██████████| 130/130 [00:00<00:00, 55655.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 96379.00it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:33<00:00, 37.97it/s]
INFO:root:The new embedding has 5812 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 73903.55it/s]
100%|██████████| 287/287 [00:00<00:00, 83322.85it/s]
100%|██████████| 771/771 [00:00<00:00, 78030.27it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77087.71it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77590.40it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91324.79it/s]
100%|██████████| 353/353 [00:00<00:00, 74581.37it/s]
100%|██████████| 252/252 [00:00<00:00, 76419.97it/s]
100%|██████████| 203/203 [00:00<00:00, 75442.47it/s]
100%|██████████| 153/153 [00:00<00:00, 68531.45it/s]
100%|██████████| 200/200 [00:00<00:00, 68804.20it/s]
100%|██████████| 65/65 [00:00<00:00, 65504.51it/s]
100%|██████████| 144/144 [00:00<00:00, 74620.68it/s]
100%|██████████| 30/30 [00:00<00:00, 65331.84it/s]
100%|██████████| 130/130 [00:00<00:00, 73853.38it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83392.40it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:36<00:00, 37.41it/s]
INFO:root:The new embedding has 5812 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77021.24it/s]
100%|██████████| 287/287 [00:00<00:00, 80941.72it/s]
100%|██████████| 771/771 [00:00<00:00, 74976.43it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76487.45it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77238.90it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74689.33it/s]
100%|██████████| 353/353 [00:00<00:00, 75263.79it/s]
100%|██████████| 252/252 [00:00<00:00, 73733.14it/s]
100%|██████████| 203/203 [00:00<00:00, 73654.30it/s]
100%|██████████| 153/153 [00:00<00:00, 74907.03it/s]
100%|██████████| 200/200 [00:00<00:00, 74222.33it/s]
100%|██████████| 65/65 [00:00<00:00, 73883.40it/s]
100%|██████████| 144/144 [00:00<00:00, 76569.44it/s]
100%|██████████| 30/30 [00:00<00:00, 66717.45it/s]
100%|██████████| 130/130 [00:00<00:00, 65996.07it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83202.39it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:38<00:00, 36.91it/s]
INFO:root:The new embedding has 5812 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76750.37it/s]
100%|██████████| 287/287 [00:00<00:00, 69497.45it/s]
100%|██████████| 771/771 [00:00<00:00, 75309.93it/s]
100%|██████████| 2000/2000 [00:00<00:00, 65997.47it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88171.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96022.71it/s]
100%|██████████| 353/353 [00:00<00:00, 69628.92it/s]
100%|██████████| 252/252 [00:00<00:00, 78056.61it/s]
100%|██████████| 203/203 [00:00<00:00, 76997.98it/s]
100%|██████████| 153/153 [00:00<00:00, 72981.75it/s]
100%|██████████| 200/200 [00:00<00:00, 75573.05it/s]
100%|██████████| 65/65 [00:00<00:00, 73169.55it/s]
100%|██████████| 144/144 [00:00<00:00, 76871.55it/s]
100%|██████████| 30/30 [00:00<00:00, 66505.88it/s]
100%|██████████| 130/130 [00:00<00:00, 72594.80it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82181.40it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:35<00:00, 37.67it/s]
INFO:root:The new embedding has 5812 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75778.74it/s]
100%|██████████| 287/287 [00:00<00:00, 72634.12it/s]
100%|██████████| 771/771 [00:00<00:00, 87961.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74441.67it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75505.02it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93306.97it/s]
100%|██████████| 353/353 [00:00<00:00, 74304.39it/s]
100%|██████████| 252/252 [00:00<00:00, 71648.90it/s]
100%|██████████| 203/203 [00:00<00:00, 68764.64it/s]
100%|██████████| 153/153 [00:00<00:00, 69248.79it/s]
100%|██████████| 200/200 [00:00<00:00, 70891.64it/s]
100%|██████████| 65/65 [00:00<00:00, 64497.22it/s]
100%|██████████| 144/144 [00:00<00:00, 69121.05it/s]
100%|██████████| 30/30 [00:00<00:00, 45507.82it/s]
100%|██████████| 130/130 [00:00<00:00, 75156.38it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77424.46it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:33<00:00, 37.97it/s]
INFO:root:The new embedding has 5812 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76279.51it/s]
100%|██████████| 287/287 [00:00<00:00, 74786.61it/s]
100%|██████████| 771/771 [00:00<00:00, 72580.15it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86409.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76538.39it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89139.36it/s]
100%|██████████| 353/353 [00:00<00:00, 75811.02it/s]
100%|██████████| 252/252 [00:00<00:00, 74523.35it/s]
100%|██████████| 203/203 [00:00<00:00, 74642.21it/s]
100%|██████████| 153/153 [00:00<00:00, 64716.47it/s]
100%|██████████| 200/200 [00:00<00:00, 71912.63it/s]
100%|██████████| 65/65 [00:00<00:00, 67987.47it/s]
100%|██████████| 144/144 [00:00<00:00, 74685.27it/s]
100%|██████████| 30/30 [00:00<00:00, 64264.11it/s]
100%|██████████| 130/130 [00:00<00:00, 60530.59it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84939.82it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:34<00:00, 37.75it/s]
INFO:root:The new embedding has 5812 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75647.40it/s]
100%|██████████| 287/287 [00:00<00:00, 69642.19it/s]
100%|██████████| 771/771 [00:00<00:00, 74176.72it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76908.90it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78003.09it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74774.55it/s]
100%|██████████| 353/353 [00:00<00:00, 74506.31it/s]
100%|██████████| 252/252 [00:00<00:00, 72118.22it/s]
100%|██████████| 203/203 [00:00<00:00, 73890.80it/s]
100%|██████████| 153/153 [00:00<00:00, 76378.07it/s]
100%|██████████| 200/200 [00:00<00:00, 73810.89it/s]
100%|██████████| 65/65 [00:00<00:00, 65980.10it/s]
100%|██████████| 144/144 [00:00<00:00, 73103.34it/s]
100%|██████████| 30/30 [00:00<00:00, 54166.65it/s]
100%|██████████| 130/130 [00:00<00:00, 72210.24it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85332.34it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:35<00:00, 37.67it/s]
INFO:root:The new embedding has 5812 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 60694.56it/s]
100%|██████████| 287/287 [00:00<00:00, 76849.16it/s]
100%|██████████| 771/771 [00:00<00:00, 87899.11it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80191.65it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75384.24it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78452.95it/s]
100%|██████████| 353/353 [00:00<00:00, 77347.68it/s]
100%|██████████| 252/252 [00:00<00:00, 66782.37it/s]
100%|██████████| 203/203 [00:00<00:00, 74012.84it/s]
100%|██████████| 153/153 [00:00<00:00, 80085.92it/s]
100%|██████████| 200/200 [00:00<00:00, 75702.63it/s]
100%|██████████| 65/65 [00:00<00:00, 73643.91it/s]
100%|██████████| 144/144 [00:00<00:00, 80616.63it/s]
100%|██████████| 30/30 [00:00<00:00, 71009.66it/s]
100%|██████████| 130/130 [00:00<00:00, 74641.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86794.44it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:34<00:00, 37.93it/s]
INFO:root:The new embedding has 5812 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79057.18it/s]
100%|██████████| 287/287 [00:00<00:00, 75528.00it/s]
100%|██████████| 771/771 [00:00<00:00, 79075.89it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80822.11it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79905.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78550.90it/s]
100%|██████████| 353/353 [00:00<00:00, 76460.92it/s]
100%|██████████| 252/252 [00:00<00:00, 75697.53it/s]
100%|██████████| 203/203 [00:00<00:00, 75469.22it/s]
100%|██████████| 153/153 [00:00<00:00, 70535.12it/s]
100%|██████████| 200/200 [00:00<00:00, 77030.38it/s]
100%|██████████| 65/65 [00:00<00:00, 74590.91it/s]
100%|██████████| 144/144 [00:00<00:00, 75224.78it/s]
100%|██████████| 30/30 [00:00<00:00, 55188.21it/s]
100%|██████████| 130/130 [00:00<00:00, 73405.97it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77234.63it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:34<00:00, 37.83it/s]
INFO:root:The new embedding has 5812 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80619.34it/s]
100%|██████████| 287/287 [00:00<00:00, 76976.93it/s]
100%|██████████| 771/771 [00:00<00:00, 76258.27it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79561.89it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79689.62it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78862.54it/s]
100%|██████████| 353/353 [00:00<00:00, 76393.86it/s]
100%|██████████| 252/252 [00:00<00:00, 44580.73it/s]
100%|██████████| 203/203 [00:00<00:00, 79211.43it/s]
100%|██████████| 153/153 [00:00<00:00, 79579.43it/s]
100%|██████████| 200/200 [00:00<00:00, 79070.68it/s]
100%|██████████| 65/65 [00:00<00:00, 67001.66it/s]
100%|██████████| 144/144 [00:00<00:00, 72454.39it/s]
100%|██████████| 30/30 [00:00<00:00, 56425.61it/s]
100%|██████████| 130/130 [00:00<00:00, 77199.42it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79191.60it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:33<00:00, 38.02it/s]
INFO:root:The new embedding has 5812 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79380.69it/s]
100%|██████████| 287/287 [00:00<00:00, 68232.92it/s]
100%|██████████| 771/771 [00:00<00:00, 87739.33it/s]
100%|██████████| 2000/2000 [00:00<00:00, 100422.68it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76737.24it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96974.39it/s]
100%|██████████| 353/353 [00:00<00:00, 74033.17it/s]
100%|██████████| 252/252 [00:00<00:00, 72738.60it/s]
100%|██████████| 203/203 [00:00<00:00, 71773.05it/s]
100%|██████████| 153/153 [00:00<00:00, 68254.47it/s]
100%|██████████| 200/200 [00:00<00:00, 71722.02it/s]
100%|██████████| 65/65 [00:00<00:00, 57601.89it/s]
100%|██████████| 144/144 [00:00<00:00, 63383.33it/s]
100%|██████████| 30/30 [00:00<00:00, 35504.83it/s]
100%|██████████| 130/130 [00:00<00:00, 51993.85it/s]
100%|██████████| 3500/3500 [00:00<00:00, 101919.41it/s]
100%|██████████| 20

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:33<00:00, 37.99it/s]
INFO:root:The new embedding has 5812 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82202.53it/s]
100%|██████████| 287/287 [00:00<00:00, 78605.54it/s]
100%|██████████| 771/771 [00:00<00:00, 80471.02it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80928.94it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77587.52it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79446.60it/s]
100%|██████████| 353/353 [00:00<00:00, 57821.97it/s]
100%|██████████| 252/252 [00:00<00:00, 57801.85it/s]
100%|██████████| 203/203 [00:00<00:00, 57870.16it/s]
100%|██████████| 153/153 [00:00<00:00, 58933.65it/s]
100%|██████████| 200/200 [00:00<00:00, 57295.32it/s]
100%|██████████| 65/65 [00:00<00:00, 55065.59it/s]
100%|██████████| 144/144 [00:00<00:00, 55944.77it/s]
100%|██████████| 30/30 [00:00<00:00, 49872.82it/s]
100%|██████████| 130/130 [00:00<00:00, 57528.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 57571.59it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [02:34<00:00, 37.95it/s]
INFO:root:The new embedding has 5812 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80149.00it/s]
100%|██████████| 287/287 [00:00<00:00, 70964.17it/s]
100%|██████████| 771/771 [00:00<00:00, 80461.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78865.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78253.40it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79485.75it/s]
100%|██████████| 353/353 [00:00<00:00, 77295.19it/s]
100%|██████████| 252/252 [00:00<00:00, 73908.44it/s]
100%|██████████| 203/203 [00:00<00:00, 76699.73it/s]
100%|██████████| 153/153 [00:00<00:00, 71983.01it/s]
100%|██████████| 200/200 [00:00<00:00, 76818.75it/s]
100%|██████████| 65/65 [00:00<00:00, 75083.93it/s]
100%|██████████| 144/144 [00:00<00:00, 77245.14it/s]
100%|██████████| 30/30 [00:00<00:00, 63710.95it/s]
100%|██████████| 130/130 [00:00<00:00, 71238.51it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76855.35it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist

100%|██████████| 5846/5846 [00:37<00:00, 155.21it/s]
INFO:root:The new embedding has 5827 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 54974.61it/s]
100%|██████████| 287/287 [00:00<00:00, 53927.30it/s]
100%|██████████| 771/771 [00:00<00:00, 63367.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 63656.15it/s]
100%|██████████| 1000/1000 [00:00<00:00, 63122.55it/s]
100%|██████████| 3000/3000 [00:00<00:00, 65059.91it/s]
100%|██████████| 353/353 [00:00<00:00, 55736.69it/s]
100%|██████████| 252/252 [00:00<00:00, 82062.47it/s]
100%|██████████| 203/203 [00:00<00:00, 73242.47it/s]
100%|██████████| 153/153 [00:00<00:00, 72274.86it/s]
100%|██████████| 200/200 [00:00<00:00, 70813.84it/s]
100%|██████████| 65/65 [00:00<00:00, 67549.49it/s]
100%|██████████| 144/144 [00:00<00:00, 69687.29it/s]
100%|██████████| 30/30 [00:00<00:00, 59975.75it/s]
100%|██████████| 130/130 [00:00<00:00, 66373.65it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77267.15it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:27<00:00, 209.19it/s]
INFO:root:The new embedding has 5827 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75714.38it/s]
100%|██████████| 287/287 [00:00<00:00, 72656.04it/s]
100%|██████████| 771/771 [00:00<00:00, 84251.06it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88872.73it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74691.55it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92177.10it/s]
100%|██████████| 353/353 [00:00<00:00, 75436.35it/s]
100%|██████████| 252/252 [00:00<00:00, 74292.87it/s]
100%|██████████| 203/203 [00:00<00:00, 85529.25it/s]
100%|██████████| 153/153 [00:00<00:00, 76982.79it/s]
100%|██████████| 200/200 [00:00<00:00, 70849.73it/s]
100%|██████████| 65/65 [00:00<00:00, 71331.70it/s]
100%|██████████| 144/144 [00:00<00:00, 72900.40it/s]
100%|██████████| 30/30 [00:00<00:00, 58146.54it/s]
100%|██████████| 130/130 [00:00<00:00, 73199.02it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89769.85it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:28<00:00, 205.42it/s]
INFO:root:The new embedding has 5827 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 74391.65it/s]
100%|██████████| 287/287 [00:00<00:00, 68559.36it/s]
100%|██████████| 771/771 [00:00<00:00, 77467.62it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86397.66it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76424.04it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80936.22it/s]
100%|██████████| 353/353 [00:00<00:00, 76029.03it/s]
100%|██████████| 252/252 [00:00<00:00, 73197.00it/s]
100%|██████████| 203/203 [00:00<00:00, 73141.80it/s]
100%|██████████| 153/153 [00:00<00:00, 71757.63it/s]
100%|██████████| 200/200 [00:00<00:00, 59884.41it/s]
100%|██████████| 65/65 [00:00<00:00, 56703.36it/s]
100%|██████████| 144/144 [00:00<00:00, 67574.38it/s]
100%|██████████| 30/30 [00:00<00:00, 53317.42it/s]
100%|██████████| 130/130 [00:00<00:00, 65678.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85378.50it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:28<00:00, 207.73it/s]
INFO:root:The new embedding has 5827 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75289.92it/s]
100%|██████████| 287/287 [00:00<00:00, 72726.27it/s]
100%|██████████| 771/771 [00:00<00:00, 77155.26it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83590.17it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74139.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88543.47it/s]
100%|██████████| 353/353 [00:00<00:00, 75993.91it/s]
100%|██████████| 252/252 [00:00<00:00, 71571.28it/s]
100%|██████████| 203/203 [00:00<00:00, 69647.75it/s]
100%|██████████| 153/153 [00:00<00:00, 75800.67it/s]
100%|██████████| 200/200 [00:00<00:00, 75207.17it/s]
100%|██████████| 65/65 [00:00<00:00, 71858.13it/s]
100%|██████████| 144/144 [00:00<00:00, 70377.51it/s]
100%|██████████| 30/30 [00:00<00:00, 64893.82it/s]
100%|██████████| 130/130 [00:00<00:00, 71669.23it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90817.25it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:28<00:00, 206.23it/s]
INFO:root:The new embedding has 5827 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77933.78it/s]
100%|██████████| 287/287 [00:00<00:00, 74916.93it/s]
100%|██████████| 771/771 [00:00<00:00, 93608.76it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85870.55it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93045.48it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80671.07it/s]
100%|██████████| 353/353 [00:00<00:00, 90495.04it/s]
100%|██████████| 252/252 [00:00<00:00, 75169.95it/s]
100%|██████████| 203/203 [00:00<00:00, 73129.24it/s]
100%|██████████| 153/153 [00:00<00:00, 77494.08it/s]
100%|██████████| 200/200 [00:00<00:00, 77961.04it/s]
100%|██████████| 65/65 [00:00<00:00, 73445.52it/s]
100%|██████████| 144/144 [00:00<00:00, 72229.10it/s]
100%|██████████| 30/30 [00:00<00:00, 53773.13it/s]
100%|██████████| 130/130 [00:00<00:00, 72181.56it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93495.85it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:27<00:00, 209.06it/s]
INFO:root:The new embedding has 5827 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76176.89it/s]
100%|██████████| 287/287 [00:00<00:00, 74018.65it/s]
100%|██████████| 771/771 [00:00<00:00, 73280.80it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89567.34it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76523.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82220.30it/s]
100%|██████████| 353/353 [00:00<00:00, 76029.03it/s]
100%|██████████| 252/252 [00:00<00:00, 78807.38it/s]
100%|██████████| 203/203 [00:00<00:00, 73935.72it/s]
100%|██████████| 153/153 [00:00<00:00, 73812.80it/s]
100%|██████████| 200/200 [00:00<00:00, 74731.47it/s]
100%|██████████| 65/65 [00:00<00:00, 58391.47it/s]
100%|██████████| 144/144 [00:00<00:00, 71156.90it/s]
100%|██████████| 30/30 [00:00<00:00, 44938.97it/s]
100%|██████████| 130/130 [00:00<00:00, 69063.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74448.18it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:28<00:00, 206.51it/s]
INFO:root:The new embedding has 5827 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75066.01it/s]
100%|██████████| 287/287 [00:00<00:00, 74366.17it/s]
100%|██████████| 771/771 [00:00<00:00, 73450.57it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94770.47it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78215.46it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85270.30it/s]
100%|██████████| 353/353 [00:00<00:00, 75532.56it/s]
100%|██████████| 252/252 [00:00<00:00, 74287.64it/s]
100%|██████████| 203/203 [00:00<00:00, 69149.98it/s]
100%|██████████| 153/153 [00:00<00:00, 71958.79it/s]
100%|██████████| 200/200 [00:00<00:00, 74169.83it/s]
100%|██████████| 65/65 [00:00<00:00, 71650.40it/s]
100%|██████████| 144/144 [00:00<00:00, 45258.88it/s]
100%|██████████| 30/30 [00:00<00:00, 59493.67it/s]
100%|██████████| 130/130 [00:00<00:00, 69512.94it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84840.66it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:27<00:00, 209.62it/s]
INFO:root:The new embedding has 5827 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76956.17it/s]
100%|██████████| 287/287 [00:00<00:00, 75164.86it/s]
100%|██████████| 771/771 [00:00<00:00, 79933.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90262.20it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93337.43it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80622.48it/s]
100%|██████████| 353/353 [00:00<00:00, 74909.65it/s]
100%|██████████| 252/252 [00:00<00:00, 73441.12it/s]
100%|██████████| 203/203 [00:00<00:00, 72978.80it/s]
100%|██████████| 153/153 [00:00<00:00, 64925.99it/s]
100%|██████████| 200/200 [00:00<00:00, 67863.51it/s]
100%|██████████| 65/65 [00:00<00:00, 62031.80it/s]
100%|██████████| 144/144 [00:00<00:00, 72576.28it/s]
100%|██████████| 30/30 [00:00<00:00, 54120.05it/s]
100%|██████████| 130/130 [00:00<00:00, 73723.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 94450.50it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:28<00:00, 206.97it/s]
INFO:root:The new embedding has 5827 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77369.68it/s]
100%|██████████| 287/287 [00:00<00:00, 75727.56it/s]
100%|██████████| 771/771 [00:00<00:00, 83807.82it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87218.71it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77647.85it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91106.58it/s]
100%|██████████| 353/353 [00:00<00:00, 75993.91it/s]
100%|██████████| 252/252 [00:00<00:00, 75481.30it/s]
100%|██████████| 203/203 [00:00<00:00, 73267.68it/s]
100%|██████████| 153/153 [00:00<00:00, 69609.34it/s]
100%|██████████| 200/200 [00:00<00:00, 69361.73it/s]
100%|██████████| 65/65 [00:00<00:00, 62230.03it/s]
100%|██████████| 144/144 [00:00<00:00, 71527.69it/s]
100%|██████████| 30/30 [00:00<00:00, 66576.25it/s]
100%|██████████| 130/130 [00:00<00:00, 75698.95it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90010.39it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:27<00:00, 209.91it/s]
INFO:root:The new embedding has 5827 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 73610.13it/s]
100%|██████████| 287/287 [00:00<00:00, 74000.45it/s]
100%|██████████| 771/771 [00:00<00:00, 82301.95it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89455.58it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75937.00it/s]
100%|██████████| 3000/3000 [00:00<00:00, 72597.21it/s]
100%|██████████| 353/353 [00:00<00:00, 74237.33it/s]
100%|██████████| 252/252 [00:00<00:00, 75143.23it/s]
100%|██████████| 203/203 [00:00<00:00, 74733.93it/s]
100%|██████████| 153/153 [00:00<00:00, 71999.16it/s]
100%|██████████| 200/200 [00:00<00:00, 74314.39it/s]
100%|██████████| 65/65 [00:00<00:00, 69212.94it/s]
100%|██████████| 144/144 [00:00<00:00, 75403.22it/s]
100%|██████████| 30/30 [00:00<00:00, 59833.15it/s]
100%|██████████| 130/130 [00:00<00:00, 68655.19it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91157.31it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:28<00:00, 206.03it/s]
INFO:root:The new embedding has 5827 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80069.36it/s]
100%|██████████| 287/287 [00:00<00:00, 76903.17it/s]
100%|██████████| 771/771 [00:00<00:00, 79025.64it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77924.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80484.79it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77450.46it/s]
100%|██████████| 353/353 [00:00<00:00, 79967.02it/s]
100%|██████████| 252/252 [00:00<00:00, 77240.91it/s]
100%|██████████| 203/203 [00:00<00:00, 73362.37it/s]
100%|██████████| 153/153 [00:00<00:00, 76734.25it/s]
100%|██████████| 200/200 [00:00<00:00, 73481.15it/s]
100%|██████████| 65/65 [00:00<00:00, 65900.35it/s]
100%|██████████| 144/144 [00:00<00:00, 73908.44it/s]
100%|██████████| 30/30 [00:00<00:00, 67432.54it/s]
100%|██████████| 130/130 [00:00<00:00, 78229.49it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76762.92it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:28<00:00, 207.79it/s]
INFO:root:The new embedding has 5827 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79950.19it/s]
100%|██████████| 287/287 [00:00<00:00, 78492.78it/s]
100%|██████████| 771/771 [00:00<00:00, 77006.44it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77363.56it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80071.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95211.85it/s]
100%|██████████| 353/353 [00:00<00:00, 78172.61it/s]
100%|██████████| 252/252 [00:00<00:00, 75898.65it/s]
100%|██████████| 203/203 [00:00<00:00, 79012.97it/s]
100%|██████████| 153/153 [00:00<00:00, 58836.39it/s]
100%|██████████| 200/200 [00:00<00:00, 76239.28it/s]
100%|██████████| 65/65 [00:00<00:00, 61694.90it/s]
100%|██████████| 144/144 [00:00<00:00, 77862.55it/s]
100%|██████████| 30/30 [00:00<00:00, 67905.62it/s]
100%|██████████| 130/130 [00:00<00:00, 77495.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77013.40it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:28<00:00, 204.48it/s]
INFO:root:The new embedding has 5827 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81331.35it/s]
100%|██████████| 287/287 [00:00<00:00, 78508.14it/s]
100%|██████████| 771/771 [00:00<00:00, 78439.09it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94134.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80498.69it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77714.99it/s]
100%|██████████| 353/353 [00:00<00:00, 80458.06it/s]
100%|██████████| 252/252 [00:00<00:00, 67002.51it/s]
100%|██████████| 203/203 [00:00<00:00, 74064.35it/s]
100%|██████████| 153/153 [00:00<00:00, 64340.14it/s]
100%|██████████| 200/200 [00:00<00:00, 79497.80it/s]
100%|██████████| 65/65 [00:00<00:00, 65269.27it/s]
100%|██████████| 144/144 [00:00<00:00, 74889.00it/s]
100%|██████████| 30/30 [00:00<00:00, 39618.74it/s]
100%|██████████| 130/130 [00:00<00:00, 42815.82it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77317.21it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:27<00:00, 209.69it/s]
INFO:root:The new embedding has 5827 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81751.86it/s]
100%|██████████| 287/287 [00:00<00:00, 78365.03it/s]
100%|██████████| 771/771 [00:00<00:00, 78625.99it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82517.12it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82165.53it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92138.63it/s]
100%|██████████| 353/353 [00:00<00:00, 79175.90it/s]
100%|██████████| 252/252 [00:00<00:00, 78819.14it/s]
100%|██████████| 203/203 [00:00<00:00, 81066.72it/s]
100%|██████████| 153/153 [00:00<00:00, 67161.54it/s]
100%|██████████| 200/200 [00:00<00:00, 77765.90it/s]
100%|██████████| 65/65 [00:00<00:00, 67432.54it/s]
100%|██████████| 144/144 [00:00<00:00, 65972.67it/s]
100%|██████████| 30/30 [00:00<00:00, 54096.78it/s]
100%|██████████| 130/130 [00:00<00:00, 72527.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83287.84it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:28<00:00, 206.16it/s]
INFO:root:The new embedding has 5827 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79239.58it/s]
100%|██████████| 287/287 [00:00<00:00, 76942.49it/s]
100%|██████████| 771/771 [00:00<00:00, 77819.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76598.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80353.73it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76596.17it/s]
100%|██████████| 353/353 [00:00<00:00, 73628.19it/s]
100%|██████████| 252/252 [00:00<00:00, 73369.75it/s]
100%|██████████| 203/203 [00:00<00:00, 76610.02it/s]
100%|██████████| 153/153 [00:00<00:00, 68612.05it/s]
100%|██████████| 200/200 [00:00<00:00, 75764.16it/s]
100%|██████████| 65/65 [00:00<00:00, 68465.53it/s]
100%|██████████| 144/144 [00:00<00:00, 74593.03it/s]
100%|██████████| 30/30 [00:00<00:00, 69365.56it/s]
100%|██████████| 130/130 [00:00<00:00, 65012.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75916.97it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:28<00:00, 208.20it/s]
INFO:root:The new embedding has 5827 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80617.79it/s]
100%|██████████| 287/287 [00:00<00:00, 77442.44it/s]
100%|██████████| 771/771 [00:00<00:00, 76675.95it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78090.95it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80244.58it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77135.68it/s]
100%|██████████| 353/353 [00:00<00:00, 76111.10it/s]
100%|██████████| 252/252 [00:00<00:00, 75686.69it/s]
100%|██████████| 203/203 [00:00<00:00, 77235.46it/s]
100%|██████████| 153/153 [00:00<00:00, 72692.40it/s]
100%|██████████| 200/200 [00:00<00:00, 71398.48it/s]
100%|██████████| 65/65 [00:00<00:00, 73307.28it/s]
100%|██████████| 144/144 [00:00<00:00, 78941.29it/s]
100%|██████████| 30/30 [00:00<00:00, 69289.16it/s]
100%|██████████| 130/130 [00:00<00:00, 64896.40it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75272.34it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 164.90it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 97671.55it/s]
100%|██████████| 287/287 [00:00<00:00, 68543.74it/s]
100%|██████████| 771/771 [00:00<00:00, 77131.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87478.84it/s]
100%|██████████| 1000/1000 [00:00<00:00, 97000.56it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79105.97it/s]
100%|██████████| 353/353 [00:00<00:00, 74762.13it/s]
100%|██████████| 252/252 [00:00<00:00, 74491.83it/s]
100%|██████████| 203/203 [00:00<00:00, 70618.21it/s]
100%|██████████| 153/153 [00:00<00:00, 68095.13it/s]
100%|██████████| 200/200 [00:00<00:00, 74618.47it/s]
100%|██████████| 65/65 [00:00<00:00, 63787.96it/s]
100%|██████████| 144/144 [00:00<00:00, 67703.15it/s]
100%|██████████| 30/30 [00:00<00:00, 55973.81it/s]
100%|██████████| 130/130 [00:00<00:00, 70465.17it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84775.50it/s]
  0%|          | 0/20

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 2034/2034 [00:00<00:00, 51125.83it/s]


['discoverys' 'disclosure']
['discoverys' 'self-discovery']
['nondescripts' 'person']
['subjoined' 'append']
['londoners' 'person']
['concurrencies' 'agreement']
['concurrencies' 'cooperation']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['subspaces' 'mathematical']


100%|██████████| 5846/5846 [00:33<00:00, 175.37it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 74612.87it/s]
100%|██████████| 287/287 [00:00<00:00, 72594.70it/s]
100%|██████████| 771/771 [00:00<00:00, 80555.21it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81046.22it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74493.89it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79878.32it/s]
100%|██████████| 353/353 [00:00<00:00, 78952.13it/s]
100%|██████████| 252/252 [00:00<00:00, 73415.61it/s]
100%|██████████| 203/203 [00:00<00:00, 81368.86it/s]
100%|██████████| 153/153 [00:00<00:00, 75827.54it/s]
100%|██████████| 200/200 [00:00<00:00, 75832.65it/s]
100%|██████████| 65/65 [00:00<00:00, 71275.75it/s]
100%|██████████| 144/144 [00:00<00:00, 63764.76it/s]
100%|██████████| 30/30 [00:00<00:00, 52560.20it/s]
100%|██████████| 130/130 [00:00<00:00, 56892.69it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85019.02it/s]
  0%|          | 0/20

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 2034/2034 [00:00<00:00, 62499.74it/s]



['discoverys' 'self-discovery']
['nondescripts' 'person']
['subjoined' 'append']
['londoners' 'person']
['concurrencies' 'agreement']
['concurrencies' 'cooperation']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['subspaces' 'mathematical']


100%|██████████| 5846/5846 [00:33<00:00, 172.71it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75523.33it/s]
100%|██████████| 287/287 [00:00<00:00, 73266.30it/s]
100%|██████████| 771/771 [00:00<00:00, 76276.26it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92468.04it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78010.34it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80722.30it/s]
100%|██████████| 353/353 [00:00<00:00, 75912.09it/s]
100%|██████████| 252/252 [00:00<00:00, 74861.15it/s]
100%|██████████| 203/203 [00:00<00:00, 72872.62it/s]
100%|██████████| 153/153 [00:00<00:00, 72323.74it/s]
100%|██████████| 200/200 [00:00<00:00, 74751.45it/s]
100%|██████████| 65/65 [00:00<00:00, 66804.65it/s]
100%|██████████| 144/144 [00:00<00:00, 66767.61it/s]
100%|██████████| 30/30 [00:00<00:00, 36813.67it/s]
100%|██████████| 130/130 [00:00<00:00, 68413.99it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93156.48it/s]
100%|██████████| 2034

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['


100%|██████████| 5846/5846 [00:33<00:00, 174.03it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 74200.63it/s]
100%|██████████| 287/287 [00:00<00:00, 67562.73it/s]
100%|██████████| 771/771 [00:00<00:00, 74640.70it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83282.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73607.53it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84622.86it/s]
100%|██████████| 353/353 [00:00<00:00, 77477.20it/s]
100%|██████████| 252/252 [00:00<00:00, 72029.75it/s]
100%|██████████| 203/203 [00:00<00:00, 74648.76it/s]
100%|██████████| 153/153 [00:00<00:00, 73031.58it/s]
100%|██████████| 200/200 [00:00<00:00, 72215.98it/s]
100%|██████████| 65/65 [00:00<00:00, 70030.76it/s]
100%|██████████| 144/144 [00:00<00:00, 62214.65it/s]
100%|██████████| 30/30 [00:00<00:00, 62168.54it/s]
100%|██████████| 130/130 [00:00<00:00, 65765.23it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87606.08it/s]
  0%|          | 0/2

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 2034/2034 [00:00<00:00, 62285.73it/s]
100%|██████████| 5846/5846 [00:33<00:00, 173.06it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76474.42it/s]
100%|██████████| 287/287 [00:00<00:00, 70465.68it/s]
100%|██████████| 771/771 [00:00<00:00, 75649.95it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83289.73it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74827.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81887.48it/s]
100%|██████████| 353/353 [00:00<00:00, 75290.58it/s]
100%|██████████| 252/252 [00:00<00:00, 75865.96it/s]
100%|██████████| 203/203 [00:00<00:00, 73686.17it/s]
100%|██████████| 153/153 [00:00<00:00, 74793.53it/s]
100%|██████████| 200/200 [00:00<00:00, 68517.59it/s]
100%|██████████| 65/65 [00:00<00:00, 65583.30it/s]
100%|██████████| 144/144 [00:00<00:00, 64253.17it/s]
100%|██████████| 30/30 [00:00<00:00, 40893.44it/s]
100%|██████████| 130/130 [00:00<00:00, 71763.56it/s]
100%|██████████| 3500


['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
[

100%|██████████| 2034/2034 [00:00<00:00, 64440.02it/s]



['liverpools' 'england']
['autobuses' 'school']
['dematerialised' 'vanish']
['anaesthetics' 'drug']
['ukrainians' 'slavic']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['discoverys' 'disclosure']
['discoverys' 'self-discovery']
['nondescripts' 'person']
['subjoined' 'append']
['londoners' 'person']
['concurrencies' 'agreement']
['concurrencies' 'cooperation']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['subspaces' 'mathematical']


100%|██████████| 5846/5846 [00:33<00:00, 175.57it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76095.27it/s]
100%|██████████| 287/287 [00:00<00:00, 72120.62it/s]
100%|██████████| 771/771 [00:00<00:00, 76059.19it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76127.20it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77845.29it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78289.43it/s]
100%|██████████| 353/353 [00:00<00:00, 72684.80it/s]
100%|██████████| 252/252 [00:00<00:00, 73273.11it/s]
100%|██████████| 203/203 [00:00<00:00, 75422.42it/s]
100%|██████████| 153/153 [00:00<00:00, 77419.29it/s]
100%|██████████| 200/200 [00:00<00:00, 76128.58it/s]
100%|██████████| 65/65 [00:00<00:00, 66349.42it/s]
100%|██████████| 144/144 [00:00<00:00, 58655.90it/s]
100%|██████████| 30/30 [00:00<00:00, 48941.70it/s]
100%|██████████| 130/130 [00:00<00:00, 84799.30it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87306.50it/s]
  0%|          | 0/20

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 2034/2034 [00:00<00:00, 64537.03it/s]



['concurrencies' 'agreement']
['concurrencies' 'cooperation']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['subspaces' 'mathematical']


100%|██████████| 5846/5846 [00:33<00:00, 172.67it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76048.31it/s]
100%|██████████| 287/287 [00:00<00:00, 72090.38it/s]
100%|██████████| 771/771 [00:00<00:00, 76285.26it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85533.45it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75628.92it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89507.76it/s]
100%|██████████| 353/353 [00:00<00:00, 74341.70it/s]
100%|██████████| 252/252 [00:00<00:00, 76254.57it/s]
100%|██████████| 203/203 [00:00<00:00, 75953.94it/s]
100%|██████████| 153/153 [00:00<00:00, 75240.77it/s]
100%|██████████| 200/200 [00:00<00:00, 73103.34it/s]
100%|██████████| 65/65 [00:00<00:00, 73110.69it/s]
100%|██████████| 144/144 [00:00<00:00, 68416.38it/s]
100%|██████████| 30/30 [00:00<00:00, 48639.01it/s]
100%|██████████| 130/130 [00:00<00:00, 72344.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91818.69it/s]
100%|██████████| 2034

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['


100%|██████████| 5846/5846 [00:33<00:00, 175.07it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76502.34it/s]
100%|██████████| 287/287 [00:00<00:00, 70145.40it/s]
100%|██████████| 771/771 [00:00<00:00, 76761.50it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75620.05it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76580.32it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76419.86it/s]
100%|██████████| 353/353 [00:00<00:00, 72577.91it/s]
100%|██████████| 252/252 [00:00<00:00, 73242.64it/s]
100%|██████████| 203/203 [00:00<00:00, 73122.96it/s]
100%|██████████| 153/153 [00:00<00:00, 76323.56it/s]
100%|██████████| 200/200 [00:00<00:00, 72609.78it/s]
100%|██████████| 65/65 [00:00<00:00, 65222.43it/s]
100%|██████████| 144/144 [00:00<00:00, 57135.54it/s]
100%|██████████| 30/30 [00:00<00:00, 60845.80it/s]
100%|██████████| 130/130 [00:00<00:00, 70969.61it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84644.98it/s]
  0%|          | 0/2

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 2034/2034 [00:00<00:00, 62254.82it/s]



['syphons' 'tube']
['subserving' 'help']
['discoverys' 'disclosure']
['discoverys' 'self-discovery']
['nondescripts' 'person']
['subjoined' 'append']
['londoners' 'person']
['concurrencies' 'agreement']
['concurrencies' 'cooperation']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['subspaces' 'mathematical']


100%|██████████| 5846/5846 [00:33<00:00, 173.05it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77988.90it/s]
100%|██████████| 287/287 [00:00<00:00, 70088.22it/s]
100%|██████████| 771/771 [00:00<00:00, 92643.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76475.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77221.84it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76723.67it/s]
100%|██████████| 353/353 [00:00<00:00, 72802.74it/s]
100%|██████████| 252/252 [00:00<00:00, 73918.78it/s]
100%|██████████| 203/203 [00:00<00:00, 74374.89it/s]
100%|██████████| 153/153 [00:00<00:00, 72618.37it/s]
100%|██████████| 200/200 [00:00<00:00, 70706.41it/s]
100%|██████████| 65/65 [00:00<00:00, 68259.83it/s]
100%|██████████| 144/144 [00:00<00:00, 68892.41it/s]
100%|██████████| 30/30 [00:00<00:00, 58688.96it/s]
100%|██████████| 130/130 [00:00<00:00, 71612.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71231.33it/s]
  0%|          | 0/20

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 2034/2034 [00:00<00:00, 68857.31it/s]


['subsequences' 'result']
['liverpools' 'england']
['autobuses' 'school']
['dematerialised' 'vanish']
['anaesthetics' 'drug']
['ukrainians' 'slavic']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['discoverys' 'disclosure']
['discoverys' 'self-discovery']
['nondescripts' 'person']
['subjoined' 'append']
['londoners' 'person']
['concurrencies' 'agreement']
['concurrencies' 'cooperation']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['subspaces' 'mathematical']


100%|██████████| 5846/5846 [00:33<00:00, 174.87it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77738.58it/s]
100%|██████████| 287/287 [00:00<00:00, 68283.24it/s]
100%|██████████| 771/771 [00:00<00:00, 78156.62it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89021.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87051.26it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96516.19it/s]
100%|██████████| 353/353 [00:00<00:00, 76017.32it/s]
100%|██████████| 252/252 [00:00<00:00, 74946.08it/s]
100%|██████████| 203/203 [00:00<00:00, 76273.74it/s]
100%|██████████| 153/153 [00:00<00:00, 68429.14it/s]
100%|██████████| 200/200 [00:00<00:00, 76608.29it/s]
100%|██████████| 65/65 [00:00<00:00, 66903.01it/s]
100%|██████████| 144/144 [00:00<00:00, 60259.38it/s]
100%|██████████| 30/30 [00:00<00:00, 65707.11it/s]
100%|██████████| 130/130 [00:00<00:00, 70693.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85093.93it/s]
100%|██████████| 2034

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 5846/5846 [00:33<00:00, 173.24it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80596.08it/s]
100%|██████████| 287/287 [00:00<00:00, 71849.42it/s]
100%|██████████| 771/771 [00:00<00:00, 80695.92it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78595.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80481.70it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87996.70it/s]
100%|██████████| 353/353 [00:00<00:00, 76193.36it/s]
100%|██████████| 252/252 [00:00<00:00, 76819.87it/s]
100%|██████████| 203/203 [00:00<00:00, 77707.74it/s]
100%|██████████| 153/153 [00:00<00:00, 74810.97it/s]
100%|██████████| 200/200 [00:00<00:00, 78758.88it/s]
100%|██████████| 65/65 [00:00<00:00, 75856.92it/s]
100%|██████████| 144/144 [00:00<00:00, 60738.11it/s]
100%|██████████| 30/30 [00:00<00:00, 68609.12it/s]
100%|██████████| 130/130 [00:00<00:00, 70184.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80167.67it/s]
  0%|          | 0/2

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 2034/2034 [00:00<00:00, 65711.67it/s]





100%|██████████| 5846/5846 [00:33<00:00, 174.59it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80410.48it/s]
100%|██████████| 287/287 [00:00<00:00, 76173.21it/s]
100%|██████████| 771/771 [00:00<00:00, 81651.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94358.98it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79509.86it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78531.29it/s]
100%|██████████| 353/353 [00:00<00:00, 80628.94it/s]
100%|██████████| 252/252 [00:00<00:00, 74037.87it/s]
100%|██████████| 203/203 [00:00<00:00, 77792.94it/s]
100%|██████████| 153/153 [00:00<00:00, 73778.86it/s]
100%|██████████| 200/200 [00:00<00:00, 79807.90it/s]
100%|██████████| 65/65 [00:00<00:00, 71631.57it/s]
100%|██████████| 144/144 [00:00<00:00, 73450.05it/s]
100%|██████████| 30/30 [00:00<00:00, 68796.68it/s]
100%|██████████| 130/130 [00:00<00:00, 67692.06it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76204.65it/s]
  0%|          | 0/2

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 2034/2034 [00:00<00:00, 65361.77it/s]


['subspaces' 'mathematical']


100%|██████████| 5846/5846 [00:33<00:00, 173.01it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80159.74it/s]
100%|██████████| 287/287 [00:00<00:00, 71935.30it/s]
100%|██████████| 771/771 [00:00<00:00, 80467.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82988.15it/s]
100%|██████████| 1000/1000 [00:00<00:00, 98190.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85949.44it/s]
100%|██████████| 353/353 [00:00<00:00, 71130.88it/s]
100%|██████████| 252/252 [00:00<00:00, 76797.54it/s]
100%|██████████| 203/203 [00:00<00:00, 73597.00it/s]
100%|██████████| 153/153 [00:00<00:00, 79079.30it/s]
100%|██████████| 200/200 [00:00<00:00, 80327.57it/s]
100%|██████████| 65/65 [00:00<00:00, 76970.57it/s]
100%|██████████| 144/144 [00:00<00:00, 55228.58it/s]
100%|██████████| 30/30 [00:00<00:00, 40866.88it/s]
100%|██████████| 130/130 [00:00<00:00, 61299.55it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78467.35it/s]
  0%|          | 0/2

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 2034/2034 [00:00<00:00, 66145.24it/s]



['concurrencies' 'agreement']
['concurrencies' 'cooperation']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['subspaces' 'mathematical']


100%|██████████| 5846/5846 [00:33<00:00, 173.78it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79970.03it/s]
100%|██████████| 287/287 [00:00<00:00, 75722.79it/s]
100%|██████████| 771/771 [00:00<00:00, 80227.46it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79813.21it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81555.23it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77853.47it/s]
100%|██████████| 353/353 [00:00<00:00, 71869.78it/s]
100%|██████████| 252/252 [00:00<00:00, 76870.15it/s]
100%|██████████| 203/203 [00:00<00:00, 74032.15it/s]
100%|██████████| 153/153 [00:00<00:00, 76660.91it/s]
100%|██████████| 200/200 [00:00<00:00, 79175.16it/s]
100%|██████████| 65/65 [00:00<00:00, 76281.41it/s]
100%|██████████| 144/144 [00:00<00:00, 68540.60it/s]
100%|██████████| 30/30 [00:00<00:00, 31138.11it/s]
100%|██████████| 130/130 [00:00<00:00, 73189.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86513.62it/s]
  0%|          | 0/2

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 2034/2034 [00:00<00:00, 64697.56it/s]


['subjoined' 'append']
['londoners' 'person']
['concurrencies' 'agreement']
['concurrencies' 'cooperation']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['subspaces' 'mathematical']


100%|██████████| 5846/5846 [00:33<00:00, 172.38it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79460.47it/s]
100%|██████████| 287/287 [00:00<00:00, 77522.23it/s]
100%|██████████| 771/771 [00:00<00:00, 81901.74it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90521.29it/s]
100%|██████████| 1000/1000 [00:00<00:00, 97338.22it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85220.64it/s]
100%|██████████| 353/353 [00:00<00:00, 80488.68it/s]
100%|██████████| 252/252 [00:00<00:00, 76920.50it/s]
100%|██████████| 203/203 [00:00<00:00, 80560.48it/s]
100%|██████████| 153/153 [00:00<00:00, 78546.94it/s]
100%|██████████| 200/200 [00:00<00:00, 76622.29it/s]
100%|██████████| 65/65 [00:00<00:00, 75437.12it/s]
100%|██████████| 144/144 [00:00<00:00, 57919.04it/s]
100%|██████████| 30/30 [00:00<00:00, 56577.84it/s]
100%|██████████| 130/130 [00:00<00:00, 75604.48it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90979.35it/s]
100%|██████████| 203

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['

100%|██████████| 5846/5846 [00:33<00:00, 174.30it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80382.71it/s]
100%|██████████| 287/287 [00:00<00:00, 77100.19it/s]
100%|██████████| 771/771 [00:00<00:00, 80555.21it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76490.24it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88687.63it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77796.67it/s]
100%|██████████| 353/353 [00:00<00:00, 87206.34it/s]
100%|██████████| 252/252 [00:00<00:00, 76831.04it/s]
100%|██████████| 203/203 [00:00<00:00, 76246.41it/s]
100%|██████████| 153/153 [00:00<00:00, 76323.56it/s]
100%|██████████| 200/200 [00:00<00:00, 76287.81it/s]
100%|██████████| 65/65 [00:00<00:00, 64102.93it/s]
100%|██████████| 144/144 [00:00<00:00, 72324.25it/s]
100%|██████████| 30/30 [00:00<00:00, 42323.96it/s]
100%|██████████| 130/130 [00:00<00:00, 72720.66it/s]
100%|██████████| 3500/3500 [00:00<00:00, 98641.10it/s]
100%|██████████| 203

['reichstag' 'germany']
['trade' 'farley']
['shariff' 'deputy']
['organising' 'developed']
['requiring' 'organising']
['organising' 'shown']
['organising' 'produced']
['affect' 'organising']
['summonings' 'page']
['summonings' 'demand']
['virginals' 'harpsichord']
['hypertexts' 'database']
['capitalised' 'profit']
['capitalised' 'supply']
['antedating' 'chronologize']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['internationaler' 'foreign']
['traversals' 'travel']
['traversals' 'skiing']
['algebras' 'vector']
['decompositions' 'decay']
['decompositions' 'algebra']
['importances' 'standing']
['importances' 'deal']
['catalogued' 'compose']
['


100%|██████████| 5846/5846 [02:48<00:00, 34.80it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 53842.92it/s]
100%|██████████| 287/287 [00:00<00:00, 73079.48it/s]
100%|██████████| 771/771 [00:00<00:00, 77386.05it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83073.62it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77683.81it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81671.16it/s]
100%|██████████| 353/353 [00:00<00:00, 76953.71it/s]
100%|██████████| 252/252 [00:00<00:00, 74749.97it/s]
100%|██████████| 203/203 [00:00<00:00, 74799.59it/s]
100%|██████████| 153/153 [00:00<00:00, 72438.03it/s]
100%|██████████| 200/200 [00:00<00:00, 73927.98it/s]
100%|██████████| 65/65 [00:00<00:00, 65599.08it/s]
100%|██████████| 144/144 [00:00<00:00, 71604.00it/s]
100%|██████████| 30/30 [00:00<00:00, 54424.36it/s]
100%|██████████| 130/130 [00:00<00:00, 71322.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86531.98it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:39<00:00, 36.66it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76192.12it/s]
100%|██████████| 287/287 [00:00<00:00, 75117.96it/s]
100%|██████████| 771/771 [00:00<00:00, 79174.63it/s]
100%|██████████| 2000/2000 [00:00<00:00, 97647.55it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79871.73it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88137.85it/s]
100%|██████████| 353/353 [00:00<00:00, 93371.34it/s]
100%|██████████| 252/252 [00:00<00:00, 75524.45it/s]
100%|██████████| 203/203 [00:00<00:00, 67457.12it/s]
100%|██████████| 153/153 [00:00<00:00, 73098.13it/s]
100%|██████████| 200/200 [00:00<00:00, 73294.96it/s]
100%|██████████| 65/65 [00:00<00:00, 38194.14it/s]
100%|██████████| 144/144 [00:00<00:00, 72918.00it/s]
100%|██████████| 30/30 [00:00<00:00, 54589.64it/s]
100%|██████████| 130/130 [00:00<00:00, 70057.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90898.23it/s]
100%|██████████| 2034/

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:38<00:00, 36.81it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 82326.90it/s]
100%|██████████| 287/287 [00:00<00:00, 75047.71it/s]
100%|██████████| 771/771 [00:00<00:00, 74455.10it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74762.11it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76314.19it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83787.77it/s]
100%|██████████| 353/353 [00:00<00:00, 75951.03it/s]
100%|██████████| 252/252 [00:00<00:00, 77257.85it/s]
100%|██████████| 203/203 [00:00<00:00, 77552.03it/s]
100%|██████████| 153/153 [00:00<00:00, 75720.18it/s]
100%|██████████| 200/200 [00:00<00:00, 71114.00it/s]
100%|██████████| 65/65 [00:00<00:00, 55322.60it/s]
100%|██████████| 144/144 [00:00<00:00, 73836.16it/s]
100%|██████████| 30/30 [00:00<00:00, 53362.65it/s]
100%|██████████| 130/130 [00:00<00:00, 69646.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90830.74it/s]
100%|██████████| 2034/

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:37<00:00, 37.15it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 84664.07it/s]
100%|██████████| 287/287 [00:00<00:00, 74320.26it/s]
100%|██████████| 771/771 [00:00<00:00, 78056.64it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96747.72it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77646.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88034.25it/s]
100%|██████████| 353/353 [00:00<00:00, 74852.85it/s]
100%|██████████| 252/252 [00:00<00:00, 72803.73it/s]
100%|██████████| 203/203 [00:00<00:00, 73229.87it/s]
100%|██████████| 153/153 [00:00<00:00, 74308.54it/s]
100%|██████████| 200/200 [00:00<00:00, 76190.81it/s]
100%|██████████| 65/65 [00:00<00:00, 64512.48it/s]
100%|██████████| 144/144 [00:00<00:00, 75516.35it/s]
100%|██████████| 30/30 [00:00<00:00, 67144.67it/s]
100%|██████████| 130/130 [00:00<00:00, 71201.30it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88764.58it/s]
100%|██████████| 2034/

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:38<00:00, 36.89it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 73658.01it/s]
100%|██████████| 287/287 [00:00<00:00, 75442.80it/s]
100%|██████████| 771/771 [00:00<00:00, 91565.21it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91802.18it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85488.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89998.15it/s]
100%|██████████| 353/353 [00:00<00:00, 75986.11it/s]
100%|██████████| 252/252 [00:00<00:00, 73303.60it/s]
100%|██████████| 203/203 [00:00<00:00, 71997.61it/s]
100%|██████████| 153/153 [00:00<00:00, 75267.24it/s]
100%|██████████| 200/200 [00:00<00:00, 70415.58it/s]
100%|██████████| 65/65 [00:00<00:00, 68362.53it/s]
100%|██████████| 144/144 [00:00<00:00, 72168.69it/s]
100%|██████████| 30/30 [00:00<00:00, 65604.34it/s]
100%|██████████| 130/130 [00:00<00:00, 70156.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79634.94it/s]
100%|██████████| 2034/

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:37<00:00, 37.13it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 87509.08it/s]
100%|██████████| 287/287 [00:00<00:00, 73656.32it/s]
100%|██████████| 771/771 [00:00<00:00, 87763.14it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76025.78it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90236.96it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88210.14it/s]
100%|██████████| 353/353 [00:00<00:00, 74985.53it/s]
100%|██████████| 252/252 [00:00<00:00, 87403.01it/s]
100%|██████████| 203/203 [00:00<00:00, 76548.03it/s]
100%|██████████| 153/153 [00:00<00:00, 75179.07it/s]
100%|██████████| 200/200 [00:00<00:00, 73817.39it/s]
100%|██████████| 65/65 [00:00<00:00, 73346.72it/s]
100%|██████████| 144/144 [00:00<00:00, 76989.14it/s]
100%|██████████| 30/30 [00:00<00:00, 66966.00it/s]
100%|██████████| 130/130 [00:00<00:00, 54657.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83891.35it/s]
100%|██████████| 2034/

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:38<00:00, 36.87it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 90744.12it/s]
100%|██████████| 287/287 [00:00<00:00, 75409.71it/s]
100%|██████████| 771/771 [00:00<00:00, 75446.98it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96098.24it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76525.83it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80648.84it/s]
100%|██████████| 353/353 [00:00<00:00, 75605.85it/s]
100%|██████████| 252/252 [00:00<00:00, 72623.65it/s]
100%|██████████| 203/203 [00:00<00:00, 73267.68it/s]
100%|██████████| 153/153 [00:00<00:00, 75989.17it/s]
100%|██████████| 200/200 [00:00<00:00, 75207.17it/s]
100%|██████████| 65/65 [00:00<00:00, 64757.66it/s]
100%|██████████| 144/144 [00:00<00:00, 67977.46it/s]
100%|██████████| 30/30 [00:00<00:00, 55750.61it/s]
100%|██████████| 130/130 [00:00<00:00, 68311.14it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89895.19it/s]
100%|██████████| 2034/

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:37<00:00, 37.16it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 73159.02it/s]
100%|██████████| 287/287 [00:00<00:00, 73837.04it/s]
100%|██████████| 771/771 [00:00<00:00, 82103.44it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93628.08it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74929.06it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93061.99it/s]
100%|██████████| 353/353 [00:00<00:00, 74278.30it/s]
100%|██████████| 252/252 [00:00<00:00, 75740.92it/s]
100%|██████████| 203/203 [00:00<00:00, 74277.56it/s]
100%|██████████| 153/153 [00:00<00:00, 72684.17it/s]
100%|██████████| 200/200 [00:00<00:00, 81601.25it/s]
100%|██████████| 65/65 [00:00<00:00, 50863.76it/s]
100%|██████████| 144/144 [00:00<00:00, 77107.08it/s]
100%|██████████| 30/30 [00:00<00:00, 58416.49it/s]
100%|██████████| 130/130 [00:00<00:00, 76324.12it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90793.10it/s]
100%|██████████| 2034/

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:37<00:00, 37.03it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 84263.96it/s]
100%|██████████| 287/287 [00:00<00:00, 77938.83it/s]
100%|██████████| 771/771 [00:00<00:00, 77704.02it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81496.60it/s]
100%|██████████| 1000/1000 [00:00<00:00, 96469.57it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86870.37it/s]
100%|██████████| 353/353 [00:00<00:00, 68327.53it/s]
100%|██████████| 252/252 [00:00<00:00, 75063.18it/s]
100%|██████████| 203/203 [00:00<00:00, 74238.71it/s]
100%|██████████| 153/153 [00:00<00:00, 74481.03it/s]
100%|██████████| 200/200 [00:00<00:00, 71222.69it/s]
100%|██████████| 65/65 [00:00<00:00, 35374.30it/s]
100%|██████████| 144/144 [00:00<00:00, 76067.98it/s]
100%|██████████| 30/30 [00:00<00:00, 62508.26it/s]
100%|██████████| 130/130 [00:00<00:00, 74013.78it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82122.10it/s]
100%|██████████| 2034/

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:37<00:00, 37.12it/s]
INFO:root:The new embedding has 5805 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 84936.95it/s]
100%|██████████| 287/287 [00:00<00:00, 74926.26it/s]
100%|██████████| 771/771 [00:00<00:00, 89012.07it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91980.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85106.51it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87650.98it/s]
100%|██████████| 353/353 [00:00<00:00, 76806.00it/s]
100%|██████████| 252/252 [00:00<00:00, 68947.46it/s]
100%|██████████| 203/203 [00:00<00:00, 75089.84it/s]
100%|██████████| 153/153 [00:00<00:00, 78126.19it/s]
100%|██████████| 200/200 [00:00<00:00, 63229.12it/s]
100%|██████████| 65/65 [00:00<00:00, 65160.08it/s]
100%|██████████| 144/144 [00:00<00:00, 71190.45it/s]
100%|██████████| 30/30 [00:00<00:00, 66330.59it/s]
100%|██████████| 130/130 [00:00<00:00, 72029.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90276.63it/s]
100%|██████████| 2034/

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:37<00:00, 37.02it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 50939.87it/s]
100%|██████████| 287/287 [00:00<00:00, 76086.55it/s]
100%|██████████| 771/771 [00:00<00:00, 79862.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80538.11it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75906.76it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85157.77it/s]
100%|██████████| 353/353 [00:00<00:00, 77880.66it/s]
100%|██████████| 252/252 [00:00<00:00, 64551.40it/s]
100%|██████████| 203/203 [00:00<00:00, 76928.42it/s]
100%|██████████| 153/153 [00:00<00:00, 76505.55it/s]
100%|██████████| 200/200 [00:00<00:00, 76706.36it/s]
100%|██████████| 65/65 [00:00<00:00, 37907.36it/s]
100%|██████████| 144/144 [00:00<00:00, 78094.10it/s]
100%|██████████| 30/30 [00:00<00:00, 68385.39it/s]
100%|██████████| 130/130 [00:00<00:00, 72720.66it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83372.98it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:37<00:00, 37.09it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79977.66it/s]
100%|██████████| 287/287 [00:00<00:00, 74055.08it/s]
100%|██████████| 771/771 [00:00<00:00, 94060.74it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79187.12it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78534.72it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77951.86it/s]
100%|██████████| 353/353 [00:00<00:00, 77651.93it/s]
100%|██████████| 252/252 [00:00<00:00, 76397.88it/s]
100%|██████████| 203/203 [00:00<00:00, 73654.30it/s]
100%|██████████| 153/153 [00:00<00:00, 73281.78it/s]
100%|██████████| 200/200 [00:00<00:00, 72453.00it/s]
100%|██████████| 65/65 [00:00<00:00, 51236.56it/s]
100%|██████████| 144/144 [00:00<00:00, 78714.95it/s]
100%|██████████| 30/30 [00:00<00:00, 66260.73it/s]
100%|██████████| 130/130 [00:00<00:00, 78726.47it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77226.91it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:37<00:00, 37.10it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 75550.56it/s]
100%|██████████| 287/287 [00:00<00:00, 69409.29it/s]
100%|██████████| 771/771 [00:00<00:00, 80762.43it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90652.37it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80910.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78918.43it/s]
100%|██████████| 353/353 [00:00<00:00, 81570.67it/s]
100%|██████████| 252/252 [00:00<00:00, 78022.04it/s]
100%|██████████| 203/203 [00:00<00:00, 74019.27it/s]
100%|██████████| 153/153 [00:00<00:00, 80296.36it/s]
100%|██████████| 200/200 [00:00<00:00, 80296.81it/s]
100%|██████████| 65/65 [00:00<00:00, 58105.23it/s]
100%|██████████| 144/144 [00:00<00:00, 76871.55it/s]
100%|██████████| 30/30 [00:00<00:00, 67577.40it/s]
100%|██████████| 130/130 [00:00<00:00, 78095.03it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85056.46it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:37<00:00, 37.09it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76786.94it/s]
100%|██████████| 287/287 [00:00<00:00, 77762.61it/s]
100%|██████████| 771/771 [00:00<00:00, 77367.54it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81501.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76124.43it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79308.40it/s]
100%|██████████| 353/353 [00:00<00:00, 75440.20it/s]
100%|██████████| 252/252 [00:00<00:00, 78200.99it/s]
100%|██████████| 203/203 [00:00<00:00, 77277.52it/s]
100%|██████████| 153/153 [00:00<00:00, 74697.77it/s]
100%|██████████| 200/200 [00:00<00:00, 78899.62it/s]
100%|██████████| 65/65 [00:00<00:00, 77057.59it/s]
100%|██████████| 144/144 [00:00<00:00, 81355.03it/s]
100%|██████████| 30/30 [00:00<00:00, 50211.14it/s]
100%|██████████| 130/130 [00:00<00:00, 55855.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 57072.68it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:38<00:00, 36.88it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79334.10it/s]
100%|██████████| 287/287 [00:00<00:00, 46957.88it/s]
100%|██████████| 771/771 [00:00<00:00, 49636.35it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80376.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79087.08it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78286.51it/s]
100%|██████████| 353/353 [00:00<00:00, 74777.24it/s]
100%|██████████| 252/252 [00:00<00:00, 77229.62it/s]
100%|██████████| 203/203 [00:00<00:00, 74433.40it/s]
100%|██████████| 153/153 [00:00<00:00, 74671.69it/s]
100%|██████████| 200/200 [00:00<00:00, 73090.60it/s]
100%|██████████| 65/65 [00:00<00:00, 73386.21it/s]
100%|██████████| 144/144 [00:00<00:00, 74455.10it/s]
100%|██████████| 30/30 [00:00<00:00, 71049.76it/s]
100%|██████████| 130/130 [00:00<00:00, 74468.66it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78087.52it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [02:37<00:00, 37.06it/s]
INFO:root:The new embedding has 5805 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 72205.92it/s]
100%|██████████| 287/287 [00:00<00:00, 78780.45it/s]
100%|██████████| 771/771 [00:00<00:00, 80076.48it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82267.06it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81487.10it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78954.08it/s]
100%|██████████| 353/353 [00:00<00:00, 80040.51it/s]
100%|██████████| 252/252 [00:00<00:00, 79849.26it/s]
100%|██████████| 203/203 [00:00<00:00, 74642.21it/s]
100%|██████████| 153/153 [00:00<00:00, 75746.99it/s]
100%|██████████| 200/200 [00:00<00:00, 78456.86it/s]
100%|██████████| 65/65 [00:00<00:00, 68379.67it/s]
100%|██████████| 144/144 [00:00<00:00, 75262.28it/s]
100%|██████████| 30/30 [00:00<00:00, 70177.98it/s]
100%|██████████| 130/130 [00:00<00:00, 76292.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78181.51it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['reasoning' 're-argue']
['extravert' 'extroversive']
['deviationism' 'desertion']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['moderatorship' 'position']
['continence' 'self-discipline']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['kazakhstani' 'asian']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecuriti

100%|██████████| 5846/5846 [00:18<00:00, 310.30it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 85320.91it/s]
100%|██████████| 287/287 [00:00<00:00, 78451.85it/s]
100%|██████████| 771/771 [00:00<00:00, 79439.14it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77345.01it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84624.00it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75936.08it/s]
100%|██████████| 353/353 [00:00<00:00, 76965.71it/s]
100%|██████████| 252/252 [00:00<00:00, 79500.91it/s]
100%|██████████| 203/203 [00:00<00:00, 80166.06it/s]
100%|██████████| 153/153 [00:00<00:00, 80457.44it/s]
100%|██████████| 200/200 [00:00<00:00, 77236.06it/s]
100%|██████████| 65/65 [00:00<00:00, 67582.98it/s]
100%|██████████| 144/144 [00:00<00:00, 73764.02it/s]
100%|██████████| 30/30 [00:00<00:00, 65536.00it/s]
100%|██████████| 130/130 [00:00<00:00, 72048.03it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90956.80it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:17<00:00, 334.73it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 77274.08it/s]
100%|██████████| 287/287 [00:00<00:00, 68629.72it/s]
100%|██████████| 771/771 [00:00<00:00, 72988.05it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75688.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77839.51it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90279.04it/s]
100%|██████████| 353/353 [00:00<00:00, 76778.12it/s]
100%|██████████| 252/252 [00:00<00:00, 75266.30it/s]
100%|██████████| 203/203 [00:00<00:00, 70094.98it/s]
100%|██████████| 153/153 [00:00<00:00, 64134.37it/s]
100%|██████████| 200/200 [00:00<00:00, 74097.77it/s]
100%|██████████| 65/65 [00:00<00:00, 63021.21it/s]
100%|██████████| 144/144 [00:00<00:00, 64178.07it/s]
100%|██████████| 30/30 [00:00<00:00, 47180.02it/s]
100%|██████████| 130/130 [00:00<00:00, 70229.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72372.63it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:17<00:00, 329.43it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 63768.64it/s]
100%|██████████| 287/287 [00:00<00:00, 71182.38it/s]
100%|██████████| 771/771 [00:00<00:00, 74127.41it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77257.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72343.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74179.45it/s]
100%|██████████| 353/353 [00:00<00:00, 76658.86it/s]
100%|██████████| 252/252 [00:00<00:00, 75702.95it/s]
100%|██████████| 203/203 [00:00<00:00, 68033.86it/s]
100%|██████████| 153/153 [00:00<00:00, 73123.12it/s]
100%|██████████| 200/200 [00:00<00:00, 75880.67it/s]
100%|██████████| 65/65 [00:00<00:00, 67734.10it/s]
100%|██████████| 144/144 [00:00<00:00, 73791.05it/s]
100%|██████████| 30/30 [00:00<00:00, 59325.37it/s]
100%|██████████| 130/130 [00:00<00:00, 72749.77it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82073.43it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:17<00:00, 333.86it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 77754.45it/s]
100%|██████████| 287/287 [00:00<00:00, 64928.01it/s]
100%|██████████| 771/771 [00:00<00:00, 76997.27it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88671.69it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73243.76it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74915.68it/s]
100%|██████████| 353/353 [00:00<00:00, 78036.65it/s]
100%|██████████| 252/252 [00:00<00:00, 80604.33it/s]
100%|██████████| 203/203 [00:00<00:00, 73362.37it/s]
100%|██████████| 153/153 [00:00<00:00, 75003.33it/s]
100%|██████████| 200/200 [00:00<00:00, 75234.15it/s]
100%|██████████| 65/65 [00:00<00:00, 74918.87it/s]
100%|██████████| 144/144 [00:00<00:00, 78347.36it/s]
100%|██████████| 30/30 [00:00<00:00, 70099.79it/s]
100%|██████████| 130/130 [00:00<00:00, 62962.99it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75943.28it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:17<00:00, 328.39it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 77659.34it/s]
100%|██████████| 287/287 [00:00<00:00, 77657.26it/s]
100%|██████████| 771/771 [00:00<00:00, 83537.20it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77580.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79632.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 97372.12it/s]
100%|██████████| 353/353 [00:00<00:00, 77745.71it/s]
100%|██████████| 252/252 [00:00<00:00, 75298.47it/s]
100%|██████████| 203/203 [00:00<00:00, 76191.83it/s]
100%|██████████| 153/153 [00:00<00:00, 68759.08it/s]
100%|██████████| 200/200 [00:00<00:00, 75119.62it/s]
100%|██████████| 65/65 [00:00<00:00, 65725.59it/s]
100%|██████████| 144/144 [00:00<00:00, 74162.55it/s]
100%|██████████| 30/30 [00:00<00:00, 53317.42it/s]
100%|██████████| 130/130 [00:00<00:00, 74744.28it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81130.43it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:17<00:00, 335.94it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 80087.73it/s]
100%|██████████| 287/287 [00:00<00:00, 78487.66it/s]
100%|██████████| 771/771 [00:00<00:00, 95536.30it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78598.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72007.69it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76334.56it/s]
100%|██████████| 353/353 [00:00<00:00, 74435.14it/s]
100%|██████████| 252/252 [00:00<00:00, 75904.10it/s]
100%|██████████| 203/203 [00:00<00:00, 76410.64it/s]
100%|██████████| 153/153 [00:00<00:00, 73306.89it/s]
100%|██████████| 200/200 [00:00<00:00, 72346.77it/s]
100%|██████████| 65/65 [00:00<00:00, 75374.55it/s]
100%|██████████| 144/144 [00:00<00:00, 78154.73it/s]
100%|██████████| 30/30 [00:00<00:00, 69788.75it/s]
100%|██████████| 130/130 [00:00<00:00, 72701.27it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81780.81it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:17<00:00, 326.39it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 77361.11it/s]
100%|██████████| 287/287 [00:00<00:00, 73409.27it/s]
100%|██████████| 771/771 [00:00<00:00, 79550.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90233.07it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75784.70it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91825.97it/s]
100%|██████████| 353/353 [00:00<00:00, 76993.72it/s]
100%|██████████| 252/252 [00:00<00:00, 76084.41it/s]
100%|██████████| 203/203 [00:00<00:00, 77587.36it/s]
100%|██████████| 153/153 [00:00<00:00, 72774.84it/s]
100%|██████████| 200/200 [00:00<00:00, 63034.33it/s]
100%|██████████| 65/65 [00:00<00:00, 72604.46it/s]
100%|██████████| 144/144 [00:00<00:00, 75734.14it/s]
100%|██████████| 30/30 [00:00<00:00, 66260.73it/s]
100%|██████████| 130/130 [00:00<00:00, 61500.06it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75665.75it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:17<00:00, 336.12it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 80167.40it/s]
100%|██████████| 287/287 [00:00<00:00, 74842.41it/s]
100%|██████████| 771/771 [00:00<00:00, 87591.98it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95521.56it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78322.08it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96061.56it/s]
100%|██████████| 353/353 [00:00<00:00, 80023.20it/s]
100%|██████████| 252/252 [00:00<00:00, 75871.41it/s]
100%|██████████| 203/203 [00:00<00:00, 72593.04it/s]
100%|██████████| 153/153 [00:00<00:00, 71886.25it/s]
100%|██████████| 200/200 [00:00<00:00, 70474.74it/s]
100%|██████████| 65/65 [00:00<00:00, 73983.65it/s]
100%|██████████| 144/144 [00:00<00:00, 77993.26it/s]
100%|██████████| 30/30 [00:00<00:00, 58826.14it/s]
100%|██████████| 130/130 [00:00<00:00, 77462.64it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74046.37it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:17<00:00, 329.13it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 79016.93it/s]
100%|██████████| 287/287 [00:00<00:00, 72341.66it/s]
100%|██████████| 771/771 [00:00<00:00, 89554.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81409.60it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78483.29it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76502.56it/s]
100%|██████████| 353/353 [00:00<00:00, 78998.47it/s]
100%|██████████| 252/252 [00:00<00:00, 68947.46it/s]
100%|██████████| 203/203 [00:00<00:00, 73546.14it/s]
100%|██████████| 153/153 [00:00<00:00, 75391.04it/s]
100%|██████████| 200/200 [00:00<00:00, 71053.77it/s]
100%|██████████| 65/65 [00:00<00:00, 65836.70it/s]
100%|██████████| 144/144 [00:00<00:00, 75810.19it/s]
100%|██████████| 30/30 [00:00<00:00, 68985.26it/s]
100%|██████████| 130/130 [00:00<00:00, 77407.65it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73703.98it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:17<00:00, 333.12it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 77538.62it/s]
100%|██████████| 287/287 [00:00<00:00, 68167.24it/s]
100%|██████████| 771/771 [00:00<00:00, 88466.61it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82081.92it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76813.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87210.55it/s]
100%|██████████| 353/353 [00:00<00:00, 70686.02it/s]
100%|██████████| 252/252 [00:00<00:00, 76752.93it/s]
100%|██████████| 203/203 [00:00<00:00, 69178.07it/s]
100%|██████████| 153/153 [00:00<00:00, 79050.08it/s]
100%|██████████| 200/200 [00:00<00:00, 77179.21it/s]
100%|██████████| 65/65 [00:00<00:00, 65035.73it/s]
100%|██████████| 144/144 [00:00<00:00, 77752.29it/s]
100%|██████████| 30/30 [00:00<00:00, 48395.82it/s]
100%|██████████| 130/130 [00:00<00:00, 76036.75it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72793.59it/s]
100%|██████████| 2034

['monotony' 'unvariedness']




100%|██████████| 5846/5846 [00:22<00:00, 256.22it/s]
INFO:root:The new embedding has 5773 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75770.52it/s]
100%|██████████| 287/287 [00:00<00:00, 74412.14it/s]
100%|██████████| 771/771 [00:00<00:00, 86991.13it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94967.88it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93372.75it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88181.09it/s]
100%|██████████| 353/353 [00:00<00:00, 76236.51it/s]
100%|██████████| 252/252 [00:00<00:00, 73867.12it/s]
100%|██████████| 203/203 [00:00<00:00, 76178.20it/s]
100%|██████████| 153/153 [00:00<00:00, 72039.57it/s]
100%|██████████| 200/200 [00:00<00:00, 72017.58it/s]
100%|██████████| 65/65 [00:00<00:00, 66172.27it/s]
100%|██████████| 144/144 [00:00<00:00, 60983.42it/s]
100%|██████████| 30/30 [00:00<00:00, 38176.31it/s]
100%|██████████| 130/130 [00:00<00:00, 62687.92it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93842.50it/s]
100%|██████████| 2034

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['



100%|██████████| 5846/5846 [00:19<00:00, 295.05it/s]
INFO:root:The new embedding has 5773 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 78289.08it/s]
100%|██████████| 287/287 [00:00<00:00, 77552.20it/s]
100%|██████████| 771/771 [00:00<00:00, 73779.02it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92903.27it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77833.73it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82871.18it/s]
100%|██████████| 353/353 [00:00<00:00, 76861.82it/s]
100%|██████████| 252/252 [00:00<00:00, 78224.14it/s]
100%|██████████| 203/203 [00:00<00:00, 74990.64it/s]
100%|██████████| 153/153 [00:00<00:00, 77363.29it/s]
100%|██████████| 200/200 [00:00<00:00, 74320.97it/s]
100%|██████████| 65/65 [00:00<00:00, 65316.19it/s]
100%|██████████| 144/144 [00:00<00:00, 67536.60it/s]
100%|██████████| 30/30 [00:00<00:00, 47554.47it/s]
100%|██████████| 130/130 [00:00<00:00, 64973.73it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89131.60it/s]
100%|██████████| 2034

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['



100%|██████████| 5846/5846 [00:20<00:00, 286.73it/s]
INFO:root:The new embedding has 5773 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77838.23it/s]
100%|██████████| 287/287 [00:00<00:00, 75277.67it/s]
100%|██████████| 771/771 [00:00<00:00, 75843.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89586.47it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77310.08it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84083.40it/s]
100%|██████████| 353/353 [00:00<00:00, 76138.50it/s]
100%|██████████| 252/252 [00:00<00:00, 75871.41it/s]
100%|██████████| 203/203 [00:00<00:00, 75994.62it/s]
100%|██████████| 153/153 [00:00<00:00, 77823.01it/s]
100%|██████████| 200/200 [00:00<00:00, 74426.48it/s]
100%|██████████| 65/65 [00:00<00:00, 63431.77it/s]
100%|██████████| 144/144 [00:00<00:00, 69319.38it/s]
100%|██████████| 30/30 [00:00<00:00, 49325.41it/s]
100%|██████████| 130/130 [00:00<00:00, 75364.14it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86230.06it/s]
100%|██████████| 2034

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['

100%|██████████| 5846/5846 [00:19<00:00, 294.13it/s]
INFO:root:The new embedding has 5773 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 74656.74it/s]
100%|██████████| 287/287 [00:00<00:00, 75842.06it/s]
100%|██████████| 771/771 [00:00<00:00, 92275.88it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96131.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78473.01it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87560.71it/s]
100%|██████████| 353/353 [00:00<00:00, 75183.53it/s]
100%|██████████| 252/252 [00:00<00:00, 75540.64it/s]
100%|██████████| 203/203 [00:00<00:00, 77277.52it/s]
100%|██████████| 153/153 [00:00<00:00, 73702.60it/s]
100%|██████████| 200/200 [00:00<00:00, 68759.08it/s]
100%|██████████| 65/65 [00:00<00:00, 71518.82it/s]
100%|██████████| 144/144 [00:00<00:00, 80199.15it/s]
100%|██████████| 30/30 [00:00<00:00, 62199.27it/s]
100%|██████████| 130/130 [00:00<00:00, 62408.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83926.36it/s]
100%|██████████| 2034

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['



100%|██████████| 5846/5846 [00:20<00:00, 285.63it/s]
INFO:root:The new embedding has 5773 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76775.68it/s]
100%|██████████| 287/287 [00:00<00:00, 74196.58it/s]
100%|██████████| 771/771 [00:00<00:00, 74455.10it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87433.25it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77324.34it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80316.80it/s]
100%|██████████| 353/353 [00:00<00:00, 76111.10it/s]
100%|██████████| 252/252 [00:00<00:00, 75600.07it/s]
100%|██████████| 203/203 [00:00<00:00, 71888.19it/s]
100%|██████████| 153/153 [00:00<00:00, 77121.56it/s]
100%|██████████| 200/200 [00:00<00:00, 73071.50it/s]
100%|██████████| 65/65 [00:00<00:00, 72277.24it/s]
100%|██████████| 144/144 [00:00<00:00, 53115.80it/s]
100%|██████████| 30/30 [00:00<00:00, 34673.22it/s]
100%|██████████| 130/130 [00:00<00:00, 54466.04it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75946.03it/s]
100%|██████████| 2034

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['



100%|██████████| 5846/5846 [00:19<00:00, 293.53it/s]
INFO:root:The new embedding has 5773 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76836.22it/s]
100%|██████████| 287/287 [00:00<00:00, 74610.47it/s]
100%|██████████| 771/771 [00:00<00:00, 91242.27it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85678.47it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77149.39it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79939.21it/s]
100%|██████████| 353/353 [00:00<00:00, 75524.86it/s]
100%|██████████| 252/252 [00:00<00:00, 78177.86it/s]
100%|██████████| 203/203 [00:00<00:00, 77039.79it/s]
100%|██████████| 153/153 [00:00<00:00, 76651.76it/s]
100%|██████████| 200/200 [00:00<00:00, 75750.48it/s]
100%|██████████| 65/65 [00:00<00:00, 72954.18it/s]
100%|██████████| 144/144 [00:00<00:00, 65507.57it/s]
100%|██████████| 30/30 [00:00<00:00, 44321.63it/s]
100%|██████████| 130/130 [00:00<00:00, 38039.59it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77753.34it/s]
100%|██████████| 2034

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['

100%|██████████| 5846/5846 [00:20<00:00, 288.61it/s]
INFO:root:The new embedding has 5773 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 79226.09it/s]
100%|██████████| 287/287 [00:00<00:00, 74982.26it/s]
100%|██████████| 771/771 [00:00<00:00, 80627.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90286.49it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78077.14it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84749.39it/s]
100%|██████████| 353/353 [00:00<00:00, 77081.91it/s]
100%|██████████| 252/252 [00:00<00:00, 75379.02it/s]
100%|██████████| 203/203 [00:00<00:00, 76630.70it/s]
100%|██████████| 153/153 [00:00<00:00, 76350.80it/s]
100%|██████████| 200/200 [00:00<00:00, 75983.77it/s]
100%|██████████| 65/65 [00:00<00:00, 67282.76it/s]
100%|██████████| 144/144 [00:00<00:00, 76029.68it/s]
100%|██████████| 30/30 [00:00<00:00, 63358.07it/s]
100%|██████████| 130/130 [00:00<00:00, 64981.47it/s]
100%|██████████| 3500/3500 [00:00<00:00, 94482.72it/s]
100%|██████████| 2034

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['

100%|██████████| 5846/5846 [00:19<00:00, 294.53it/s]
INFO:root:The new embedding has 5773 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77363.96it/s]
100%|██████████| 287/287 [00:00<00:00, 74707.70it/s]
100%|██████████| 771/771 [00:00<00:00, 72994.64it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86409.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76914.55it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87154.37it/s]
100%|██████████| 353/353 [00:00<00:00, 76453.03it/s]
100%|██████████| 252/252 [00:00<00:00, 76558.35it/s]
100%|██████████| 203/203 [00:00<00:00, 76110.10it/s]
100%|██████████| 153/153 [00:00<00:00, 51861.04it/s]
100%|██████████| 200/200 [00:00<00:00, 74459.51it/s]
100%|██████████| 65/65 [00:00<00:00, 62400.95it/s]
100%|██████████| 144/144 [00:00<00:00, 76414.45it/s]
100%|██████████| 30/30 [00:00<00:00, 64860.37it/s]
100%|██████████| 130/130 [00:00<00:00, 68976.54it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92427.43it/s]
100%|██████████| 2034

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['



100%|██████████| 5846/5846 [00:20<00:00, 286.16it/s]
INFO:root:The new embedding has 5773 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75751.34it/s]
100%|██████████| 287/287 [00:00<00:00, 75348.35it/s]
100%|██████████| 771/771 [00:00<00:00, 77319.44it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91415.02it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78634.85it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85055.88it/s]
100%|██████████| 353/353 [00:00<00:00, 76861.82it/s]
100%|██████████| 252/252 [00:00<00:00, 76903.71it/s]
100%|██████████| 203/203 [00:00<00:00, 73129.24it/s]
100%|██████████| 153/153 [00:00<00:00, 73821.29it/s]
100%|██████████| 200/200 [00:00<00:00, 74645.03it/s]
100%|██████████| 65/65 [00:00<00:00, 69655.02it/s]
100%|██████████| 144/144 [00:00<00:00, 76424.11it/s]
100%|██████████| 30/30 [00:00<00:00, 59918.63it/s]
100%|██████████| 130/130 [00:00<00:00, 65214.63it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86172.36it/s]
100%|██████████| 2034

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['

100%|██████████| 5846/5846 [00:19<00:00, 294.64it/s]
INFO:root:The new embedding has 5773 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77896.11it/s]
100%|██████████| 287/287 [00:00<00:00, 74912.27it/s]
100%|██████████| 771/771 [00:00<00:00, 76382.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91564.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77830.84it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84886.61it/s]
100%|██████████| 353/353 [00:00<00:00, 77823.35it/s]
100%|██████████| 252/252 [00:00<00:00, 74755.26it/s]
100%|██████████| 203/203 [00:00<00:00, 73223.57it/s]
100%|██████████| 153/153 [00:00<00:00, 76927.42it/s]
100%|██████████| 200/200 [00:00<00:00, 73771.95it/s]
100%|██████████| 65/65 [00:00<00:00, 70138.86it/s]
100%|██████████| 144/144 [00:00<00:00, 71868.13it/s]
100%|██████████| 30/30 [00:00<00:00, 75618.46it/s]
100%|██████████| 130/130 [00:00<00:00, 71782.45it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88517.31it/s]
100%|██████████| 2034

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['



100%|██████████| 5846/5846 [00:20<00:00, 287.39it/s]
INFO:root:The new embedding has 5773 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80334.94it/s]
100%|██████████| 287/287 [00:00<00:00, 77169.39it/s]
100%|██████████| 771/771 [00:00<00:00, 80760.41it/s]
100%|██████████| 2000/2000 [00:00<00:00, 71877.51it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81354.33it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86174.29it/s]
100%|██████████| 353/353 [00:00<00:00, 77913.45it/s]
100%|██████████| 252/252 [00:00<00:00, 79921.71it/s]
100%|██████████| 203/203 [00:00<00:00, 77144.49it/s]
100%|██████████| 153/153 [00:00<00:00, 77983.78it/s]
100%|██████████| 200/200 [00:00<00:00, 76045.76it/s]
100%|██████████| 65/65 [00:00<00:00, 60597.86it/s]
100%|██████████| 144/144 [00:00<00:00, 77324.26it/s]
100%|██████████| 30/30 [00:00<00:00, 59691.23it/s]
100%|██████████| 130/130 [00:00<00:00, 70611.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77299.30it/s]
100%|██████████| 203

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['



100%|██████████| 5846/5846 [00:19<00:00, 293.64it/s]
INFO:root:The new embedding has 5773 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80709.41it/s]
100%|██████████| 287/287 [00:00<00:00, 77208.98it/s]
100%|██████████| 771/771 [00:00<00:00, 72102.75it/s]
100%|██████████| 2000/2000 [00:00<00:00, 69044.88it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80698.49it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81492.91it/s]
100%|██████████| 353/353 [00:00<00:00, 79324.37it/s]
100%|██████████| 252/252 [00:00<00:00, 77655.18it/s]
100%|██████████| 203/203 [00:00<00:00, 76307.91it/s]
100%|██████████| 153/153 [00:00<00:00, 73239.96it/s]
100%|██████████| 200/200 [00:00<00:00, 73371.89it/s]
100%|██████████| 65/65 [00:00<00:00, 64989.22it/s]
100%|██████████| 144/144 [00:00<00:00, 70566.63it/s]
100%|██████████| 30/30 [00:00<00:00, 60875.24it/s]
100%|██████████| 130/130 [00:00<00:00, 77341.78it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76685.53it/s]
100%|██████████| 203

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['



100%|██████████| 5846/5846 [00:20<00:00, 285.88it/s]
INFO:root:The new embedding has 5773 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77570.20it/s]
100%|██████████| 287/287 [00:00<00:00, 83950.43it/s]
100%|██████████| 771/771 [00:00<00:00, 78060.40it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75688.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78855.12it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77475.74it/s]
100%|██████████| 353/353 [00:00<00:00, 78300.77it/s]
100%|██████████| 252/252 [00:00<00:00, 78825.01it/s]
100%|██████████| 203/203 [00:00<00:00, 80476.72it/s]
100%|██████████| 153/153 [00:00<00:00, 77186.49it/s]
100%|██████████| 200/200 [00:00<00:00, 74851.50it/s]
100%|██████████| 65/65 [00:00<00:00, 69072.65it/s]
100%|██████████| 144/144 [00:00<00:00, 76511.25it/s]
100%|██████████| 30/30 [00:00<00:00, 68237.05it/s]
100%|██████████| 130/130 [00:00<00:00, 57113.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 58435.09it/s]
100%|██████████| 203

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['

100%|██████████| 5846/5846 [00:19<00:00, 294.47it/s]
INFO:root:The new embedding has 5773 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82012.68it/s]
100%|██████████| 287/287 [00:00<00:00, 77732.48it/s]
100%|██████████| 771/771 [00:00<00:00, 79770.30it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78886.27it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81609.18it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87183.35it/s]
100%|██████████| 353/353 [00:00<00:00, 79867.80it/s]
100%|██████████| 252/252 [00:00<00:00, 76914.90it/s]
100%|██████████| 203/203 [00:00<00:00, 81198.14it/s]
100%|██████████| 153/153 [00:00<00:00, 79628.80it/s]
100%|██████████| 200/200 [00:00<00:00, 71924.96it/s]
100%|██████████| 65/65 [00:00<00:00, 74795.54it/s]
100%|██████████| 144/144 [00:00<00:00, 68556.16it/s]
100%|██████████| 30/30 [00:00<00:00, 52780.67it/s]
100%|██████████| 130/130 [00:00<00:00, 76602.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80128.73it/s]
100%|██████████| 203

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['



100%|██████████| 5846/5846 [00:20<00:00, 287.50it/s]
INFO:root:The new embedding has 5773 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82283.25it/s]
100%|██████████| 287/287 [00:00<00:00, 75033.67it/s]
100%|██████████| 771/771 [00:00<00:00, 78821.47it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78996.21it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82205.79it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78920.90it/s]
100%|██████████| 353/353 [00:00<00:00, 78767.32it/s]
100%|██████████| 252/252 [00:00<00:00, 80844.78it/s]
100%|██████████| 203/203 [00:00<00:00, 78149.95it/s]
100%|██████████| 153/153 [00:00<00:00, 31809.68it/s]
100%|██████████| 200/200 [00:00<00:00, 74373.69it/s]
100%|██████████| 65/65 [00:00<00:00, 64650.17it/s]
100%|██████████| 144/144 [00:00<00:00, 76356.48it/s]
100%|██████████| 30/30 [00:00<00:00, 62260.82it/s]
100%|██████████| 130/130 [00:00<00:00, 77144.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78506.37it/s]
100%|██████████| 203

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['

100%|██████████| 5846/5846 [00:19<00:00, 294.79it/s]
INFO:root:The new embedding has 5773 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80161.27it/s]
100%|██████████| 287/287 [00:00<00:00, 79388.33it/s]
100%|██████████| 771/771 [00:00<00:00, 78825.31it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78000.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80407.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77269.73it/s]
100%|██████████| 353/353 [00:00<00:00, 80213.96it/s]
100%|██████████| 252/252 [00:00<00:00, 80647.38it/s]
100%|██████████| 203/203 [00:00<00:00, 72500.32it/s]
100%|██████████| 153/153 [00:00<00:00, 77065.99it/s]
100%|██████████| 200/200 [00:00<00:00, 73539.13it/s]
100%|██████████| 65/65 [00:00<00:00, 66268.78it/s]
100%|██████████| 144/144 [00:00<00:00, 69615.00it/s]
100%|██████████| 30/30 [00:00<00:00, 68459.80it/s]
100%|██████████| 130/130 [00:00<00:00, 63299.22it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79767.35it/s]
100%|██████████| 203

['undated' 'undatable']
['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['antifeminism' 'sexism']
['preliterate' 'noncivilized']
['unfeathered' 'unfledged']
['reasoning' 're-argue']
['summonings' 'page']
['summonings' 'demand']
['spoonful' 'containerful']
['hypertexts' 'database']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['antedating' 'chronologize']
['contrastive' 'antonymous']
['snookered' 'flim-flam']
['reenact' 're-create']
['amazings' 'surprise']
['amazings' 'stump']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['spoonfuls' 'containerful']
['cosigns' 'validate']
['cosigns' 'endorse']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['unquenchable' 'insatiate']
['lenience' 'mercifulness']
['unblock' 'unstuff']
['interdisciplinary' 'nonindulgent']
['measurements' 'viscometry']
['nonfunctional' 'run-down']
['globalise' 'widen']
['fluidity' 'changeableness']
['independences' 'independent']
['

100%|██████████| 5846/5846 [01:25<00:00, 68.21it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 82305.87it/s]
100%|██████████| 287/287 [00:00<00:00, 73328.78it/s]
100%|██████████| 771/771 [00:00<00:00, 82147.24it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80358.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94466.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78176.58it/s]
100%|██████████| 353/353 [00:00<00:00, 74185.25it/s]
100%|██████████| 252/252 [00:00<00:00, 71941.51it/s]
100%|██████████| 203/203 [00:00<00:00, 73635.19it/s]
100%|██████████| 153/153 [00:00<00:00, 75684.46it/s]
100%|██████████| 200/200 [00:00<00:00, 73326.99it/s]
100%|██████████| 65/65 [00:00<00:00, 68328.26it/s]
100%|██████████| 144/144 [00:00<00:00, 67438.56it/s]
100%|██████████| 30/30 [00:00<00:00, 63198.96it/s]
100%|██████████| 130/130 [00:00<00:00, 66422.16it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82061.96it/s]
100%|██████████| 2034/

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:52<00:00, 110.72it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 81494.28it/s]
100%|██████████| 287/287 [00:00<00:00, 74772.67it/s]
100%|██████████| 771/771 [00:00<00:00, 77745.12it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75173.47it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76514.66it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76889.17it/s]
100%|██████████| 353/353 [00:00<00:00, 76702.55it/s]
100%|██████████| 252/252 [00:00<00:00, 74723.55it/s]
100%|██████████| 203/203 [00:00<00:00, 73210.98it/s]
100%|██████████| 153/153 [00:00<00:00, 73660.30it/s]
100%|██████████| 200/200 [00:00<00:00, 75200.43it/s]
100%|██████████| 65/65 [00:00<00:00, 65980.10it/s]
100%|██████████| 144/144 [00:00<00:00, 71587.03it/s]
100%|██████████| 30/30 [00:00<00:00, 63135.53it/s]
100%|██████████| 130/130 [00:00<00:00, 72856.70it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90301.62it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:53<00:00, 110.08it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 85352.19it/s]
100%|██████████| 287/287 [00:00<00:00, 78728.92it/s]
100%|██████████| 771/771 [00:00<00:00, 96422.22it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74840.82it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78696.81it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78487.70it/s]
100%|██████████| 353/353 [00:00<00:00, 73752.89it/s]
100%|██████████| 252/252 [00:00<00:00, 77878.32it/s]
100%|██████████| 203/203 [00:00<00:00, 74825.88it/s]
100%|██████████| 153/153 [00:00<00:00, 75382.18it/s]
100%|██████████| 200/200 [00:00<00:00, 75818.94it/s]
100%|██████████| 65/65 [00:00<00:00, 65425.91it/s]
100%|██████████| 144/144 [00:00<00:00, 71409.29it/s]
100%|██████████| 30/30 [00:00<00:00, 57299.23it/s]
100%|██████████| 130/130 [00:00<00:00, 69230.51it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87337.66it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:52<00:00, 110.77it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75595.54it/s]
100%|██████████| 287/287 [00:00<00:00, 70473.93it/s]
100%|██████████| 771/771 [00:00<00:00, 77254.79it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74439.68it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72849.40it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76253.60it/s]
100%|██████████| 353/353 [00:00<00:00, 70236.68it/s]
100%|██████████| 252/252 [00:00<00:00, 73430.92it/s]
100%|██████████| 203/203 [00:00<00:00, 76144.13it/s]
100%|██████████| 153/153 [00:00<00:00, 76305.41it/s]
100%|██████████| 200/200 [00:00<00:00, 77342.87it/s]
100%|██████████| 65/65 [00:00<00:00, 73149.92it/s]
100%|██████████| 144/144 [00:00<00:00, 67423.51it/s]
100%|██████████| 30/30 [00:00<00:00, 61802.12it/s]
100%|██████████| 130/130 [00:00<00:00, 70374.23it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87848.81it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:53<00:00, 110.18it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 73925.72it/s]
100%|██████████| 287/287 [00:00<00:00, 87898.16it/s]
100%|██████████| 771/771 [00:00<00:00, 89467.65it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77579.63it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86384.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77849.62it/s]
100%|██████████| 353/353 [00:00<00:00, 82765.35it/s]
100%|██████████| 252/252 [00:00<00:00, 75175.29it/s]
100%|██████████| 203/203 [00:00<00:00, 74433.40it/s]
100%|██████████| 153/153 [00:00<00:00, 71846.00it/s]
100%|██████████| 200/200 [00:00<00:00, 68006.55it/s]
100%|██████████| 65/65 [00:00<00:00, 65253.65it/s]
100%|██████████| 144/144 [00:00<00:00, 73485.80it/s]
100%|██████████| 30/30 [00:00<00:00, 50942.96it/s]
100%|██████████| 130/130 [00:00<00:00, 70492.50it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92515.39it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:52<00:00, 110.81it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 78886.02it/s]
100%|██████████| 287/287 [00:00<00:00, 60649.20it/s]
100%|██████████| 771/771 [00:00<00:00, 85097.98it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82423.07it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85196.40it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91540.05it/s]
100%|██████████| 353/353 [00:00<00:00, 76453.03it/s]
100%|██████████| 252/252 [00:00<00:00, 74539.11it/s]
100%|██████████| 203/203 [00:00<00:00, 77665.21it/s]
100%|██████████| 153/153 [00:00<00:00, 73098.13it/s]
100%|██████████| 200/200 [00:00<00:00, 74811.45it/s]
100%|██████████| 65/65 [00:00<00:00, 63937.56it/s]
100%|██████████| 144/144 [00:00<00:00, 71383.97it/s]
100%|██████████| 30/30 [00:00<00:00, 54947.21it/s]
100%|██████████| 130/130 [00:00<00:00, 72162.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85448.07it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:53<00:00, 110.28it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 81260.37it/s]
100%|██████████| 287/287 [00:00<00:00, 71780.87it/s]
100%|██████████| 771/771 [00:00<00:00, 95479.89it/s]
100%|██████████| 2000/2000 [00:00<00:00, 97188.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76782.19it/s]
100%|██████████| 3000/3000 [00:00<00:00, 94566.41it/s]
100%|██████████| 353/353 [00:00<00:00, 77582.76it/s]
100%|██████████| 252/252 [00:00<00:00, 71868.13it/s]
100%|██████████| 203/203 [00:00<00:00, 85632.48it/s]
100%|██████████| 153/153 [00:00<00:00, 60643.41it/s]
100%|██████████| 200/200 [00:00<00:00, 75254.40it/s]
100%|██████████| 65/65 [00:00<00:00, 74064.05it/s]
100%|██████████| 144/144 [00:00<00:00, 77048.06it/s]
100%|██████████| 30/30 [00:00<00:00, 64100.42it/s]
100%|██████████| 130/130 [00:00<00:00, 73110.69it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78543.76it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:52<00:00, 110.31it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 79058.67it/s]
100%|██████████| 287/287 [00:00<00:00, 73324.31it/s]
100%|██████████| 771/771 [00:00<00:00, 75072.16it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75086.00it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88506.10it/s]
100%|██████████| 3000/3000 [00:00<00:00, 72439.65it/s]
100%|██████████| 353/353 [00:00<00:00, 76989.72it/s]
100%|██████████| 252/252 [00:00<00:00, 74612.78it/s]
100%|██████████| 203/203 [00:00<00:00, 66023.86it/s]
100%|██████████| 153/153 [00:00<00:00, 72519.89it/s]
100%|██████████| 200/200 [00:00<00:00, 74724.82it/s]
100%|██████████| 65/65 [00:00<00:00, 70812.92it/s]
100%|██████████| 144/144 [00:00<00:00, 73818.11it/s]
100%|██████████| 30/30 [00:00<00:00, 49344.75it/s]
100%|██████████| 130/130 [00:00<00:00, 66084.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91406.48it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:53<00:00, 109.37it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 87481.67it/s]
100%|██████████| 287/287 [00:00<00:00, 72042.93it/s]
100%|██████████| 771/771 [00:00<00:00, 87414.40it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76467.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80115.83it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79539.51it/s]
100%|██████████| 353/353 [00:00<00:00, 73734.53it/s]
100%|██████████| 252/252 [00:00<00:00, 75212.74it/s]
100%|██████████| 203/203 [00:00<00:00, 76424.35it/s]
100%|██████████| 153/153 [00:00<00:00, 71813.84it/s]
100%|██████████| 200/200 [00:00<00:00, 76322.52it/s]
100%|██████████| 65/65 [00:00<00:00, 65410.21it/s]
100%|██████████| 144/144 [00:00<00:00, 69295.52it/s]
100%|██████████| 30/30 [00:00<00:00, 48228.87it/s]
100%|██████████| 130/130 [00:00<00:00, 71247.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85609.52it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:53<00:00, 110.21it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 88430.65it/s]
100%|██████████| 287/287 [00:00<00:00, 71639.90it/s]
100%|██████████| 771/771 [00:00<00:00, 76136.19it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74680.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 96819.19it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91530.06it/s]
100%|██████████| 353/353 [00:00<00:00, 76750.26it/s]
100%|██████████| 252/252 [00:00<00:00, 74381.75it/s]
100%|██████████| 203/203 [00:00<00:00, 76376.36it/s]
100%|██████████| 153/153 [00:00<00:00, 73390.73it/s]
100%|██████████| 200/200 [00:00<00:00, 77065.76it/s]
100%|██████████| 65/65 [00:00<00:00, 63006.65it/s]
100%|██████████| 144/144 [00:00<00:00, 74722.23it/s]
100%|██████████| 30/30 [00:00<00:00, 65638.56it/s]
100%|██████████| 130/130 [00:00<00:00, 70365.15it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81575.40it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:53<00:00, 109.45it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 91888.37it/s]
100%|██████████| 287/287 [00:00<00:00, 65801.10it/s]
100%|██████████| 771/771 [00:00<00:00, 79318.33it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80907.86it/s]
100%|██████████| 1000/1000 [00:00<00:00, 71091.10it/s]
100%|██████████| 3000/3000 [00:00<00:00, 97256.22it/s]
100%|██████████| 353/353 [00:00<00:00, 79027.99it/s]
100%|██████████| 252/252 [00:00<00:00, 60222.47it/s]
100%|██████████| 203/203 [00:00<00:00, 77928.22it/s]
100%|██████████| 153/153 [00:00<00:00, 76927.42it/s]
100%|██████████| 200/200 [00:00<00:00, 70174.07it/s]
100%|██████████| 65/65 [00:00<00:00, 57480.45it/s]
100%|██████████| 144/144 [00:00<00:00, 61662.05it/s]
100%|██████████| 30/30 [00:00<00:00, 64362.72it/s]
100%|██████████| 130/130 [00:00<00:00, 79252.84it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86964.63it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:52<00:00, 110.78it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 73848.85it/s]
100%|██████████| 287/287 [00:00<00:00, 73552.81it/s]
100%|██████████| 771/771 [00:00<00:00, 80201.59it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77253.84it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78655.49it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75708.55it/s]
100%|██████████| 353/353 [00:00<00:00, 78821.83it/s]
100%|██████████| 252/252 [00:00<00:00, 77240.91it/s]
100%|██████████| 203/203 [00:00<00:00, 76997.98it/s]
100%|██████████| 153/153 [00:00<00:00, 77372.62it/s]
100%|██████████| 200/200 [00:00<00:00, 76392.02it/s]
100%|██████████| 65/65 [00:00<00:00, 69037.67it/s]
100%|██████████| 144/144 [00:00<00:00, 80156.57it/s]
100%|██████████| 30/30 [00:00<00:00, 67396.42it/s]
100%|██████████| 130/130 [00:00<00:00, 78128.60it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79840.67it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:53<00:00, 109.50it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 72596.24it/s]
100%|██████████| 287/287 [00:00<00:00, 77652.25it/s]
100%|██████████| 771/771 [00:00<00:00, 80887.68it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81601.25it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79236.48it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78957.55it/s]
100%|██████████| 353/353 [00:00<00:00, 79002.68it/s]
100%|██████████| 252/252 [00:00<00:00, 81656.72it/s]
100%|██████████| 203/203 [00:00<00:00, 75162.76it/s]
100%|██████████| 153/153 [00:00<00:00, 79471.02it/s]
100%|██████████| 200/200 [00:00<00:00, 80489.43it/s]
100%|██████████| 65/65 [00:00<00:00, 74124.46it/s]
100%|██████████| 144/144 [00:00<00:00, 74759.22it/s]
100%|██████████| 30/30 [00:00<00:00, 56073.58it/s]
100%|██████████| 130/130 [00:00<00:00, 72517.56it/s]
100%|██████████| 3500/3500 [00:00<00:00, 100290.79it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:52<00:00, 110.36it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77888.87it/s]
100%|██████████| 287/287 [00:00<00:00, 78339.53it/s]
100%|██████████| 771/771 [00:00<00:00, 78946.55it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79705.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77439.98it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79164.20it/s]
100%|██████████| 353/353 [00:00<00:00, 78905.85it/s]
100%|██████████| 252/252 [00:00<00:00, 77735.13it/s]
100%|██████████| 203/203 [00:00<00:00, 79071.67it/s]
100%|██████████| 153/153 [00:00<00:00, 77372.62it/s]
100%|██████████| 200/200 [00:00<00:00, 76004.42it/s]
100%|██████████| 65/65 [00:00<00:00, 69055.16it/s]
100%|██████████| 144/144 [00:00<00:00, 75905.46it/s]
100%|██████████| 30/30 [00:00<00:00, 69827.48it/s]
100%|██████████| 130/130 [00:00<00:00, 74397.53it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76791.43it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:53<00:00, 109.14it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 75308.86it/s]
100%|██████████| 287/287 [00:00<00:00, 73800.82it/s]
100%|██████████| 771/771 [00:00<00:00, 80623.49it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78648.12it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78208.17it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78197.96it/s]
100%|██████████| 353/353 [00:00<00:00, 79614.42it/s]
100%|██████████| 252/252 [00:00<00:00, 41783.86it/s]
100%|██████████| 203/203 [00:00<00:00, 75342.33it/s]
100%|██████████| 153/153 [00:00<00:00, 76441.75it/s]
100%|██████████| 200/200 [00:00<00:00, 78383.55it/s]
100%|██████████| 65/65 [00:00<00:00, 74407.69it/s]
100%|██████████| 144/144 [00:00<00:00, 72926.80it/s]
100%|██████████| 30/30 [00:00<00:00, 46707.17it/s]
100%|██████████| 130/130 [00:00<00:00, 66665.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77815.99it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:52<00:00, 110.68it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78874.14it/s]
100%|██████████| 287/287 [00:00<00:00, 78976.86it/s]
100%|██████████| 771/771 [00:00<00:00, 78118.86it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78251.94it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79348.91it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77604.27it/s]
100%|██████████| 353/353 [00:00<00:00, 49478.32it/s]
100%|██████████| 252/252 [00:00<00:00, 79208.98it/s]
100%|██████████| 203/203 [00:00<00:00, 74622.59it/s]
100%|██████████| 153/153 [00:00<00:00, 77964.83it/s]
100%|██████████| 200/200 [00:00<00:00, 75153.27it/s]
100%|██████████| 65/65 [00:00<00:00, 59293.12it/s]
100%|██████████| 144/144 [00:00<00:00, 73245.18it/s]
100%|██████████| 30/30 [00:00<00:00, 56705.33it/s]
100%|██████████| 130/130 [00:00<00:00, 72837.23it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74132.75it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 162.05it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 56559.67it/s]
100%|██████████| 287/287 [00:00<00:00, 56279.64it/s]
100%|██████████| 771/771 [00:00<00:00, 67328.93it/s]
100%|██████████| 2000/2000 [00:00<00:00, 55795.72it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79101.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 54658.17it/s]
100%|██████████| 353/353 [00:00<00:00, 56232.03it/s]
100%|██████████| 252/252 [00:00<00:00, 56380.47it/s]
100%|██████████| 203/203 [00:00<00:00, 54087.39it/s]
100%|██████████| 153/153 [00:00<00:00, 52795.43it/s]
100%|██████████| 200/200 [00:00<00:00, 54949.61it/s]
100%|██████████| 65/65 [00:00<00:00, 45773.97it/s]
100%|██████████| 144/144 [00:00<00:00, 55198.30it/s]
100%|██████████| 30/30 [00:00<00:00, 37583.37it/s]
100%|██████████| 130/130 [00:00<00:00, 56004.47it/s]
100%|██████████| 3500/3500 [00:00<00:00, 69615.66it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 170.45it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76116.00it/s]
100%|██████████| 287/287 [00:00<00:00, 78462.08it/s]
100%|██████████| 771/771 [00:00<00:00, 75278.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93492.43it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77186.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80690.73it/s]
100%|██████████| 353/353 [00:00<00:00, 76762.20it/s]
100%|██████████| 252/252 [00:00<00:00, 77269.14it/s]
100%|██████████| 203/203 [00:00<00:00, 67833.31it/s]
100%|██████████| 153/153 [00:00<00:00, 73173.15it/s]
100%|██████████| 200/200 [00:00<00:00, 84071.04it/s]
100%|██████████| 65/65 [00:00<00:00, 72219.80it/s]
100%|██████████| 144/144 [00:00<00:00, 70989.63it/s]
100%|██████████| 30/30 [00:00<00:00, 61711.19it/s]
100%|██████████| 130/130 [00:00<00:00, 69020.19it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76537.60it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.37it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76888.39it/s]
100%|██████████| 287/287 [00:00<00:00, 74055.08it/s]
100%|██████████| 771/771 [00:00<00:00, 73442.23it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89711.98it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77224.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84441.14it/s]
100%|██████████| 353/353 [00:00<00:00, 74192.69it/s]
100%|██████████| 252/252 [00:00<00:00, 77438.98it/s]
100%|██████████| 203/203 [00:00<00:00, 68493.58it/s]
100%|██████████| 153/153 [00:00<00:00, 64534.24it/s]
100%|██████████| 200/200 [00:00<00:00, 73973.62it/s]
100%|██████████| 65/65 [00:00<00:00, 66204.41it/s]
100%|██████████| 144/144 [00:00<00:00, 66937.80it/s]
100%|██████████| 30/30 [00:00<00:00, 66365.57it/s]
100%|██████████| 130/130 [00:00<00:00, 72759.48it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77316.80it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.24it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76389.37it/s]
100%|██████████| 287/287 [00:00<00:00, 75856.40it/s]
100%|██████████| 771/771 [00:00<00:00, 86774.05it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89990.11it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78273.85it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85483.48it/s]
100%|██████████| 353/353 [00:00<00:00, 75908.19it/s]
100%|██████████| 252/252 [00:00<00:00, 79970.08it/s]
100%|██████████| 203/203 [00:00<00:00, 78236.12it/s]
100%|██████████| 153/153 [00:00<00:00, 67056.27it/s]
100%|██████████| 200/200 [00:00<00:00, 71795.69it/s]
100%|██████████| 65/65 [00:00<00:00, 46397.17it/s]
100%|██████████| 144/144 [00:00<00:00, 72733.60it/s]
100%|██████████| 30/30 [00:00<00:00, 61530.13it/s]
100%|██████████| 130/130 [00:00<00:00, 67299.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75040.71it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 167.55it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76034.51it/s]
100%|██████████| 287/287 [00:00<00:00, 74467.38it/s]
100%|██████████| 771/771 [00:00<00:00, 68110.29it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93519.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77930.62it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87634.50it/s]
100%|██████████| 353/353 [00:00<00:00, 76370.21it/s]
100%|██████████| 252/252 [00:00<00:00, 74749.97it/s]
100%|██████████| 203/203 [00:00<00:00, 67698.47it/s]
100%|██████████| 153/153 [00:00<00:00, 68066.24it/s]
100%|██████████| 200/200 [00:00<00:00, 80807.32it/s]
100%|██████████| 65/65 [00:00<00:00, 51752.04it/s]
100%|██████████| 144/144 [00:00<00:00, 54757.91it/s]
100%|██████████| 30/30 [00:00<00:00, 51254.22it/s]
100%|██████████| 130/130 [00:00<00:00, 50463.63it/s]
100%|██████████| 3500/3500 [00:00<00:00, 67248.74it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.62it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 56947.86it/s]
100%|██████████| 287/287 [00:00<00:00, 55011.66it/s]
100%|██████████| 771/771 [00:00<00:00, 55552.26it/s]
100%|██████████| 2000/2000 [00:00<00:00, 55349.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 67873.39it/s]
100%|██████████| 3000/3000 [00:00<00:00, 59889.25it/s]
100%|██████████| 353/353 [00:00<00:00, 59516.39it/s]
100%|██████████| 252/252 [00:00<00:00, 75180.64it/s]
100%|██████████| 203/203 [00:00<00:00, 74918.06it/s]
100%|██████████| 153/153 [00:00<00:00, 72915.41it/s]
100%|██████████| 200/200 [00:00<00:00, 70374.23it/s]
100%|██████████| 65/65 [00:00<00:00, 64133.09it/s]
100%|██████████| 144/144 [00:00<00:00, 56658.52it/s]
100%|██████████| 30/30 [00:00<00:00, 57221.06it/s]
100%|██████████| 130/130 [00:00<00:00, 70419.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73472.32it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.73it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76963.24it/s]
100%|██████████| 287/287 [00:00<00:00, 74647.48it/s]
100%|██████████| 771/771 [00:00<00:00, 76206.16it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93444.52it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79100.50it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86518.55it/s]
100%|██████████| 353/353 [00:00<00:00, 76087.64it/s]
100%|██████████| 252/252 [00:00<00:00, 70567.81it/s]
100%|██████████| 203/203 [00:00<00:00, 75865.96it/s]
100%|██████████| 153/153 [00:00<00:00, 69256.26it/s]
100%|██████████| 200/200 [00:00<00:00, 73077.86it/s]
100%|██████████| 65/65 [00:00<00:00, 65567.52it/s]
100%|██████████| 144/144 [00:00<00:00, 66030.37it/s]
100%|██████████| 30/30 [00:00<00:00, 62168.54it/s]
100%|██████████| 130/130 [00:00<00:00, 75291.29it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93292.64it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.92it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76695.58it/s]
100%|██████████| 287/287 [00:00<00:00, 75770.46it/s]
100%|██████████| 771/771 [00:00<00:00, 78236.04it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85053.01it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78065.52it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79565.66it/s]
100%|██████████| 353/353 [00:00<00:00, 75061.56it/s]
100%|██████████| 252/252 [00:00<00:00, 79752.86it/s]
100%|██████████| 203/203 [00:00<00:00, 78939.71it/s]
100%|██████████| 153/153 [00:00<00:00, 75693.38it/s]
100%|██████████| 200/200 [00:00<00:00, 73046.05it/s]
100%|██████████| 65/65 [00:00<00:00, 50356.44it/s]
100%|██████████| 144/144 [00:00<00:00, 72874.01it/s]
100%|██████████| 30/30 [00:00<00:00, 51952.57it/s]
100%|██████████| 130/130 [00:00<00:00, 67449.22it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79272.85it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.61it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 78660.92it/s]
100%|██████████| 287/287 [00:00<00:00, 75235.33it/s]
100%|██████████| 771/771 [00:00<00:00, 75176.87it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88230.55it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79257.45it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83857.01it/s]
100%|██████████| 353/353 [00:00<00:00, 78562.52it/s]
100%|██████████| 252/252 [00:00<00:00, 74381.75it/s]
100%|██████████| 203/203 [00:00<00:00, 76914.52it/s]
100%|██████████| 153/153 [00:00<00:00, 74171.12it/s]
100%|██████████| 200/200 [00:00<00:00, 73623.03it/s]
100%|██████████| 65/65 [00:00<00:00, 63713.43it/s]
100%|██████████| 144/144 [00:00<00:00, 87685.80it/s]
100%|██████████| 30/30 [00:00<00:00, 67432.54it/s]
100%|██████████| 130/130 [00:00<00:00, 72479.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93601.96it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 170.60it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 78542.96it/s]
100%|██████████| 287/287 [00:00<00:00, 76614.39it/s]
100%|██████████| 771/771 [00:00<00:00, 76790.66it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92268.69it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78957.55it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85792.97it/s]
100%|██████████| 353/353 [00:00<00:00, 75444.04it/s]
100%|██████████| 252/252 [00:00<00:00, 76403.40it/s]
100%|██████████| 203/203 [00:00<00:00, 75920.08it/s]
100%|██████████| 153/153 [00:00<00:00, 74602.25it/s]
100%|██████████| 200/200 [00:00<00:00, 68400.26it/s]
100%|██████████| 65/65 [00:00<00:00, 67449.22it/s]
100%|██████████| 144/144 [00:00<00:00, 75905.46it/s]
100%|██████████| 30/30 [00:00<00:00, 67650.06it/s]
100%|██████████| 130/130 [00:00<00:00, 72556.16it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90090.48it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.05it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81445.17it/s]
100%|██████████| 287/287 [00:00<00:00, 78662.04it/s]
100%|██████████| 771/771 [00:00<00:00, 77240.03it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90681.77it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81477.60it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81822.52it/s]
100%|██████████| 353/353 [00:00<00:00, 77717.14it/s]
100%|██████████| 252/252 [00:00<00:00, 71561.58it/s]
100%|██████████| 203/203 [00:00<00:00, 75536.17it/s]
100%|██████████| 153/153 [00:00<00:00, 76478.19it/s]
100%|██████████| 200/200 [00:00<00:00, 74380.28it/s]
100%|██████████| 65/65 [00:00<00:00, 68294.03it/s]
100%|██████████| 144/144 [00:00<00:00, 80745.96it/s]
100%|██████████| 30/30 [00:00<00:00, 70730.25it/s]
100%|██████████| 130/130 [00:00<00:00, 74033.88it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78614.84it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 170.80it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81350.30it/s]
100%|██████████| 287/287 [00:00<00:00, 81688.74it/s]
100%|██████████| 771/771 [00:00<00:00, 82255.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79199.08it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81471.27it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78843.76it/s]
100%|██████████| 353/353 [00:00<00:00, 78805.05it/s]
100%|██████████| 252/252 [00:00<00:00, 74781.70it/s]
100%|██████████| 203/203 [00:00<00:00, 71888.19it/s]
100%|██████████| 153/153 [00:00<00:00, 78633.56it/s]
100%|██████████| 200/200 [00:00<00:00, 78589.17it/s]
100%|██████████| 65/65 [00:00<00:00, 71952.96it/s]
100%|██████████| 144/144 [00:00<00:00, 77702.27it/s]
100%|██████████| 30/30 [00:00<00:00, 71170.32it/s]
100%|██████████| 130/130 [00:00<00:00, 78465.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77578.71it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.90it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 89606.93it/s]
100%|██████████| 287/287 [00:00<00:00, 74476.60it/s]
100%|██████████| 771/771 [00:00<00:00, 104218.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95525.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93731.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 100050.98it/s]
100%|██████████| 353/353 [00:00<00:00, 84537.47it/s]
100%|██████████| 252/252 [00:00<00:00, 71042.12it/s]
100%|██████████| 203/203 [00:00<00:00, 65829.88it/s]
100%|██████████| 153/153 [00:00<00:00, 78116.68it/s]
100%|██████████| 200/200 [00:00<00:00, 71114.00it/s]
100%|██████████| 65/65 [00:00<00:00, 49175.64it/s]
100%|██████████| 144/144 [00:00<00:00, 66576.25it/s]
100%|██████████| 30/30 [00:00<00:00, 58963.97it/s]
100%|██████████| 130/130 [00:00<00:00, 68114.87it/s]
100%|██████████| 3500/3500 [00:00<00:00, 95346.76it/s]
100%|██████████| 2

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.93it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80365.75it/s]
100%|██████████| 287/287 [00:00<00:00, 77747.55it/s]
100%|██████████| 771/771 [00:00<00:00, 79190.14it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76317.66it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80925.81it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77182.05it/s]
100%|██████████| 353/353 [00:00<00:00, 76738.33it/s]
100%|██████████| 252/252 [00:00<00:00, 76370.28it/s]
100%|██████████| 203/203 [00:00<00:00, 74459.44it/s]
100%|██████████| 153/153 [00:00<00:00, 75720.18it/s]
100%|██████████| 200/200 [00:00<00:00, 58875.69it/s]
100%|██████████| 65/65 [00:00<00:00, 69566.15it/s]
100%|██████████| 144/144 [00:00<00:00, 75309.20it/s]
100%|██████████| 30/30 [00:00<00:00, 48526.46it/s]
100%|██████████| 130/130 [00:00<00:00, 72681.89it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78029.42it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 167.52it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80793.45it/s]
100%|██████████| 287/287 [00:00<00:00, 77457.39it/s]
100%|██████████| 771/771 [00:00<00:00, 80205.57it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76414.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80555.90it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78423.13it/s]
100%|██████████| 353/353 [00:00<00:00, 79154.73it/s]
100%|██████████| 252/252 [00:00<00:00, 78374.95it/s]
100%|██████████| 203/203 [00:00<00:00, 77750.32it/s]
100%|██████████| 153/153 [00:00<00:00, 74025.67it/s]
100%|██████████| 200/200 [00:00<00:00, 76031.98it/s]
100%|██████████| 65/65 [00:00<00:00, 66156.21it/s]
100%|██████████| 144/144 [00:00<00:00, 64253.17it/s]
100%|██████████| 30/30 [00:00<00:00, 56048.61it/s]
100%|██████████| 130/130 [00:00<00:00, 79588.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77125.48it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 170.97it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 73786.42it/s]
100%|██████████| 287/287 [00:00<00:00, 77427.49it/s]
100%|██████████| 771/771 [00:00<00:00, 78498.12it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87759.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79544.54it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76571.00it/s]
100%|██████████| 353/353 [00:00<00:00, 78662.70it/s]
100%|██████████| 252/252 [00:00<00:00, 77145.07it/s]
100%|██████████| 203/203 [00:00<00:00, 76410.64it/s]
100%|██████████| 153/153 [00:00<00:00, 72865.73it/s]
100%|██████████| 200/200 [00:00<00:00, 76973.83it/s]
100%|██████████| 65/65 [00:00<00:00, 61905.03it/s]
100%|██████████| 144/144 [00:00<00:00, 77403.53it/s]
100%|██████████| 30/30 [00:00<00:00, 62230.03it/s]
100%|██████████| 130/130 [00:00<00:00, 73258.03it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76795.04it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [01:35<00:00, 61.01it/s]
INFO:root:The new embedding has 5826 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 69099.25it/s]
100%|██████████| 287/287 [00:00<00:00, 99034.57it/s]
100%|██████████| 771/771 [00:00<00:00, 76154.12it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89164.63it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75698.53it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85662.14it/s]
100%|██████████| 353/353 [00:00<00:00, 76201.20it/s]
100%|██████████| 252/252 [00:00<00:00, 72803.73it/s]
100%|██████████| 203/203 [00:00<00:00, 73330.78it/s]
100%|██████████| 153/153 [00:00<00:00, 70971.97it/s]
100%|██████████| 200/200 [00:00<00:00, 72490.56it/s]
100%|██████████| 65/65 [00:00<00:00, 57809.53it/s]
100%|██████████| 144/144 [00:00<00:00, 65479.16it/s]
100%|██████████| 30/30 [00:00<00:00, 63743.22it/s]
100%|██████████| 130/130 [00:00<00:00, 73534.66it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82846.01it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 101.22it/s]
INFO:root:The new embedding has 5826 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 53279.46it/s]
100%|██████████| 287/287 [00:00<00:00, 73030.71it/s]
100%|██████████| 771/771 [00:00<00:00, 74010.35it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76443.54it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73537.84it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74086.86it/s]
100%|██████████| 353/353 [00:00<00:00, 72020.10it/s]
100%|██████████| 252/252 [00:00<00:00, 71760.79it/s]
100%|██████████| 203/203 [00:00<00:00, 72617.80it/s]
100%|██████████| 153/153 [00:00<00:00, 73139.79it/s]
100%|██████████| 200/200 [00:00<00:00, 75477.85it/s]
100%|██████████| 65/65 [00:00<00:00, 61876.93it/s]
100%|██████████| 144/144 [00:00<00:00, 76744.57it/s]
100%|██████████| 30/30 [00:00<00:00, 58012.50it/s]
100%|██████████| 130/130 [00:00<00:00, 69204.15it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87261.87it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:58<00:00, 100.35it/s]
INFO:root:The new embedding has 5826 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 55232.59it/s]
100%|██████████| 287/287 [00:00<00:00, 55269.30it/s]
100%|██████████| 771/771 [00:00<00:00, 54856.80it/s]
100%|██████████| 2000/2000 [00:00<00:00, 55906.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75107.51it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73673.90it/s]
100%|██████████| 353/353 [00:00<00:00, 55003.69it/s]
100%|██████████| 252/252 [00:00<00:00, 55251.68it/s]
100%|██████████| 203/203 [00:00<00:00, 76651.40it/s]
100%|██████████| 153/153 [00:00<00:00, 80396.96it/s]
100%|██████████| 200/200 [00:00<00:00, 70629.01it/s]
100%|██████████| 65/65 [00:00<00:00, 61820.81it/s]
100%|██████████| 144/144 [00:00<00:00, 72619.91it/s]
100%|██████████| 30/30 [00:00<00:00, 58908.76it/s]
100%|██████████| 130/130 [00:00<00:00, 66438.35it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92879.47it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 101.65it/s]
INFO:root:The new embedding has 5826 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77312.58it/s]
100%|██████████| 287/287 [00:00<00:00, 75353.07it/s]
100%|██████████| 771/771 [00:00<00:00, 75704.85it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75545.14it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78930.80it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77158.86it/s]
100%|██████████| 353/353 [00:00<00:00, 74274.57it/s]
100%|██████████| 252/252 [00:00<00:00, 75277.02it/s]
100%|██████████| 203/203 [00:00<00:00, 69710.47it/s]
100%|██████████| 153/153 [00:00<00:00, 72626.59it/s]
100%|██████████| 200/200 [00:00<00:00, 71838.73it/s]
100%|██████████| 65/65 [00:00<00:00, 65757.30it/s]
100%|██████████| 144/144 [00:00<00:00, 76979.32it/s]
100%|██████████| 30/30 [00:00<00:00, 61082.10it/s]
100%|██████████| 130/130 [00:00<00:00, 71257.12it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88194.51it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:58<00:00, 100.31it/s]
INFO:root:The new embedding has 5826 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 78096.47it/s]
100%|██████████| 287/287 [00:00<00:00, 74587.35it/s]
100%|██████████| 771/771 [00:00<00:00, 86527.93it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75862.14it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74239.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84432.64it/s]
100%|██████████| 353/353 [00:00<00:00, 74634.00it/s]
100%|██████████| 252/252 [00:00<00:00, 74126.14it/s]
100%|██████████| 203/203 [00:00<00:00, 82488.25it/s]
100%|██████████| 153/153 [00:00<00:00, 70745.07it/s]
100%|██████████| 200/200 [00:00<00:00, 73103.34it/s]
100%|██████████| 65/65 [00:00<00:00, 63137.97it/s]
100%|██████████| 144/144 [00:00<00:00, 71646.47it/s]
100%|██████████| 30/30 [00:00<00:00, 54851.40it/s]
100%|██████████| 130/130 [00:00<00:00, 69504.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80466.48it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 101.28it/s]
INFO:root:The new embedding has 5826 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75899.53it/s]
100%|██████████| 287/287 [00:00<00:00, 74972.92it/s]
100%|██████████| 771/771 [00:00<00:00, 75978.77it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76310.72it/s]
100%|██████████| 1000/1000 [00:00<00:00, 71422.80it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84854.55it/s]
100%|██████████| 353/353 [00:00<00:00, 74615.19it/s]
100%|██████████| 252/252 [00:00<00:00, 64673.84it/s]
100%|██████████| 203/203 [00:00<00:00, 71773.05it/s]
100%|██████████| 153/153 [00:00<00:00, 73660.30it/s]
100%|██████████| 200/200 [00:00<00:00, 72415.47it/s]
100%|██████████| 65/65 [00:00<00:00, 62159.09it/s]
100%|██████████| 144/144 [00:00<00:00, 73014.96it/s]
100%|██████████| 30/30 [00:00<00:00, 54027.10it/s]
100%|██████████| 130/130 [00:00<00:00, 73159.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78016.97it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:58<00:00, 100.02it/s]
INFO:root:The new embedding has 5826 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76292.01it/s]
100%|██████████| 287/287 [00:00<00:00, 73119.43it/s]
100%|██████████| 771/771 [00:00<00:00, 73792.49it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75974.13it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79009.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91875.58it/s]
100%|██████████| 353/353 [00:00<00:00, 52641.30it/s]
100%|██████████| 252/252 [00:00<00:00, 68871.09it/s]
100%|██████████| 203/203 [00:00<00:00, 76307.91it/s]
100%|██████████| 153/153 [00:00<00:00, 71019.09it/s]
100%|██████████| 200/200 [00:00<00:00, 73895.42it/s]
100%|██████████| 65/65 [00:00<00:00, 64118.01it/s]
100%|██████████| 144/144 [00:00<00:00, 77403.53it/s]
100%|██████████| 30/30 [00:00<00:00, 42409.54it/s]
100%|██████████| 130/130 [00:00<00:00, 55616.03it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75864.79it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 101.38it/s]
INFO:root:The new embedding has 5826 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 57449.13it/s]
100%|██████████| 287/287 [00:00<00:00, 55570.37it/s]
100%|██████████| 771/771 [00:00<00:00, 56635.11it/s]
100%|██████████| 2000/2000 [00:00<00:00, 62049.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93466.38it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80037.35it/s]
100%|██████████| 353/353 [00:00<00:00, 90911.78it/s]
100%|██████████| 252/252 [00:00<00:00, 74776.41it/s]
100%|██████████| 203/203 [00:00<00:00, 75255.76it/s]
100%|██████████| 153/153 [00:00<00:00, 74317.14it/s]
100%|██████████| 200/200 [00:00<00:00, 74638.38it/s]
100%|██████████| 65/65 [00:00<00:00, 68586.10it/s]
100%|██████████| 144/144 [00:00<00:00, 77264.91it/s]
100%|██████████| 30/30 [00:00<00:00, 56400.32it/s]
100%|██████████| 130/130 [00:00<00:00, 70474.28it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88318.67it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:58<00:00, 100.68it/s]
INFO:root:The new embedding has 5826 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 78103.74it/s]
100%|██████████| 287/287 [00:00<00:00, 74823.80it/s]
100%|██████████| 771/771 [00:00<00:00, 76736.00it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77083.46it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75234.15it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93168.80it/s]
100%|██████████| 353/353 [00:00<00:00, 75436.35it/s]
100%|██████████| 252/252 [00:00<00:00, 76730.64it/s]
100%|██████████| 203/203 [00:00<00:00, 72991.32it/s]
100%|██████████| 153/153 [00:00<00:00, 74481.03it/s]
100%|██████████| 200/200 [00:00<00:00, 73224.58it/s]
100%|██████████| 65/65 [00:00<00:00, 67818.35it/s]
100%|██████████| 144/144 [00:00<00:00, 74071.59it/s]
100%|██████████| 30/30 [00:00<00:00, 54050.31it/s]
100%|██████████| 130/130 [00:00<00:00, 74723.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77065.56it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 101.00it/s]
INFO:root:The new embedding has 5826 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 63071.77it/s]
100%|██████████| 287/287 [00:00<00:00, 72902.45it/s]
100%|██████████| 771/771 [00:00<00:00, 74945.15it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74811.45it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90668.05it/s]
100%|██████████| 3000/3000 [00:00<00:00, 72898.78it/s]
100%|██████████| 353/353 [00:00<00:00, 74211.28it/s]
100%|██████████| 252/252 [00:00<00:00, 73533.09it/s]
100%|██████████| 203/203 [00:00<00:00, 69133.14it/s]
100%|██████████| 153/153 [00:00<00:00, 71918.47it/s]
100%|██████████| 200/200 [00:00<00:00, 73179.87it/s]
100%|██████████| 65/65 [00:00<00:00, 65536.00it/s]
100%|██████████| 144/144 [00:00<00:00, 71519.22it/s]
100%|██████████| 30/30 [00:00<00:00, 52847.17it/s]
100%|██████████| 130/130 [00:00<00:00, 70003.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82245.40it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:58<00:00, 100.64it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 63098.36it/s]
100%|██████████| 287/287 [00:00<00:00, 77587.19it/s]
100%|██████████| 771/771 [00:00<00:00, 79372.84it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81809.75it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80748.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78963.99it/s]
100%|██████████| 353/353 [00:00<00:00, 78189.13it/s]
100%|██████████| 252/252 [00:00<00:00, 81524.46it/s]
100%|██████████| 203/203 [00:00<00:00, 80000.35it/s]
100%|██████████| 153/153 [00:00<00:00, 75373.33it/s]
100%|██████████| 200/200 [00:00<00:00, 77449.99it/s]
100%|██████████| 65/65 [00:00<00:00, 69887.15it/s]
100%|██████████| 144/144 [00:00<00:00, 77245.14it/s]
100%|██████████| 30/30 [00:00<00:00, 63905.09it/s]
100%|██████████| 130/130 [00:00<00:00, 56821.54it/s]
100%|██████████| 3500/3500 [00:00<00:00, 96198.37it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 101.14it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81708.81it/s]
100%|██████████| 287/287 [00:00<00:00, 77567.19it/s]
100%|██████████| 771/771 [00:00<00:00, 79845.15it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80128.07it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78620.11it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89658.92it/s]
100%|██████████| 353/353 [00:00<00:00, 77933.96it/s]
100%|██████████| 252/252 [00:00<00:00, 72365.10it/s]
100%|██████████| 203/203 [00:00<00:00, 80211.37it/s]
100%|██████████| 153/153 [00:00<00:00, 79030.60it/s]
100%|██████████| 200/200 [00:00<00:00, 63723.85it/s]
100%|██████████| 65/65 [00:00<00:00, 75249.73it/s]
100%|██████████| 144/144 [00:00<00:00, 75516.35it/s]
100%|██████████| 30/30 [00:00<00:00, 70690.52it/s]
100%|██████████| 130/130 [00:00<00:00, 55216.15it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77635.33it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:58<00:00, 100.65it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81771.00it/s]
100%|██████████| 287/287 [00:00<00:00, 78930.25it/s]
100%|██████████| 771/771 [00:00<00:00, 80507.08it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80902.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79081.11it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79411.51it/s]
100%|██████████| 353/353 [00:00<00:00, 47777.90it/s]
100%|██████████| 252/252 [00:00<00:00, 70605.52it/s]
100%|██████████| 203/203 [00:00<00:00, 76479.27it/s]
100%|██████████| 153/153 [00:00<00:00, 71557.60it/s]
100%|██████████| 200/200 [00:00<00:00, 78171.73it/s]
100%|██████████| 65/65 [00:00<00:00, 71443.86it/s]
100%|██████████| 144/144 [00:00<00:00, 76048.83it/s]
100%|██████████| 30/30 [00:00<00:00, 65570.15it/s]
100%|██████████| 130/130 [00:00<00:00, 77760.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75559.82it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:58<00:00, 100.64it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80331.86it/s]
100%|██████████| 287/287 [00:00<00:00, 76775.64it/s]
100%|██████████| 771/771 [00:00<00:00, 78852.22it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79162.46it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77987.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81459.14it/s]
100%|██████████| 353/353 [00:00<00:00, 77741.63it/s]
100%|██████████| 252/252 [00:00<00:00, 73769.17it/s]
100%|██████████| 203/203 [00:00<00:00, 75415.74it/s]
100%|██████████| 153/153 [00:00<00:00, 68429.14it/s]
100%|██████████| 200/200 [00:00<00:00, 72534.44it/s]
100%|██████████| 65/65 [00:00<00:00, 74693.08it/s]
100%|██████████| 144/144 [00:00<00:00, 75915.00it/s]
100%|██████████| 30/30 [00:00<00:00, 60205.32it/s]
100%|██████████| 130/130 [00:00<00:00, 77949.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86671.45it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:58<00:00, 100.08it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79376.18it/s]
100%|██████████| 287/287 [00:00<00:00, 77989.33it/s]
100%|██████████| 771/771 [00:00<00:00, 78637.46it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79360.92it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88080.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 104393.92it/s]
100%|██████████| 353/353 [00:00<00:00, 79678.68it/s]
100%|██████████| 252/252 [00:00<00:00, 74702.42it/s]
100%|██████████| 203/203 [00:00<00:00, 73967.83it/s]
100%|██████████| 153/153 [00:00<00:00, 75684.46it/s]
100%|██████████| 200/200 [00:00<00:00, 67340.52it/s]
100%|██████████| 65/65 [00:00<00:00, 68362.53it/s]
100%|██████████| 144/144 [00:00<00:00, 75327.98it/s]
100%|██████████| 30/30 [00:00<00:00, 50860.60it/s]
100%|██████████| 130/130 [00:00<00:00, 74499.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76475.79it/s]
100%|██████████| 20

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:57<00:00, 101.23it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81235.16it/s]
100%|██████████| 287/287 [00:00<00:00, 77913.61it/s]
100%|██████████| 771/771 [00:00<00:00, 79742.77it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81497.39it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83068.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 65846.03it/s]
100%|██████████| 353/353 [00:00<00:00, 58449.70it/s]
100%|██████████| 252/252 [00:00<00:00, 57609.67it/s]
100%|██████████| 203/203 [00:00<00:00, 57316.98it/s]
100%|██████████| 153/153 [00:00<00:00, 56376.04it/s]
100%|██████████| 200/200 [00:00<00:00, 57088.66it/s]
100%|██████████| 65/65 [00:00<00:00, 52835.22it/s]
100%|██████████| 144/144 [00:00<00:00, 55944.77it/s]
100%|██████████| 30/30 [00:00<00:00, 37718.56it/s]
100%|██████████| 130/130 [00:00<00:00, 68967.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78110.79it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:32<00:00, 178.13it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 82233.18it/s]
100%|██████████| 287/287 [00:00<00:00, 76284.24it/s]
100%|██████████| 771/771 [00:00<00:00, 78007.68it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77438.55it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85773.09it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91387.14it/s]
100%|██████████| 353/353 [00:00<00:00, 77631.57it/s]
100%|██████████| 252/252 [00:00<00:00, 77826.71it/s]
100%|██████████| 203/203 [00:00<00:00, 79181.97it/s]
100%|██████████| 153/153 [00:00<00:00, 75675.53it/s]
100%|██████████| 200/200 [00:00<00:00, 74340.73it/s]
100%|██████████| 65/65 [00:00<00:00, 48253.05it/s]
100%|██████████| 144/144 [00:00<00:00, 74080.68it/s]
100%|██████████| 30/30 [00:00<00:00, 66260.73it/s]
100%|██████████| 130/130 [00:00<00:00, 73753.49it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90718.48it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:13<00:00, 439.10it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 82252.56it/s]
100%|██████████| 287/287 [00:00<00:00, 75518.52it/s]
100%|██████████| 771/771 [00:00<00:00, 78149.07it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76291.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78742.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75490.98it/s]
100%|██████████| 353/353 [00:00<00:00, 76587.49it/s]
100%|██████████| 252/252 [00:00<00:00, 74407.93it/s]
100%|██████████| 203/203 [00:00<00:00, 73839.54it/s]
100%|██████████| 153/153 [00:00<00:00, 78768.69it/s]
100%|██████████| 200/200 [00:00<00:00, 75301.69it/s]
100%|██████████| 65/65 [00:00<00:00, 74428.00it/s]
100%|██████████| 144/144 [00:00<00:00, 72847.64it/s]
100%|██████████| 30/30 [00:00<00:00, 47215.43it/s]
100%|██████████| 130/130 [00:00<00:00, 69842.39it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92362.88it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:13<00:00, 428.80it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 75017.63it/s]
100%|██████████| 287/287 [00:00<00:00, 75277.67it/s]
100%|██████████| 771/771 [00:00<00:00, 93166.48it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76535.60it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78379.16it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73871.56it/s]
100%|██████████| 353/353 [00:00<00:00, 74148.10it/s]
100%|██████████| 252/252 [00:00<00:00, 75540.64it/s]
100%|██████████| 203/203 [00:00<00:00, 73066.48it/s]
100%|██████████| 153/153 [00:00<00:00, 72725.35it/s]
100%|██████████| 200/200 [00:00<00:00, 75573.05it/s]
100%|██████████| 65/65 [00:00<00:00, 67599.74it/s]
100%|██████████| 144/144 [00:00<00:00, 73325.21it/s]
100%|██████████| 30/30 [00:00<00:00, 55529.18it/s]
100%|██████████| 130/130 [00:00<00:00, 64443.86it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71769.01it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:13<00:00, 432.49it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 76086.97it/s]
100%|██████████| 287/287 [00:00<00:00, 74458.17it/s]
100%|██████████| 771/771 [00:00<00:00, 96267.22it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75281.41it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74131.82it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74842.15it/s]
100%|██████████| 353/353 [00:00<00:00, 74652.82it/s]
100%|██████████| 252/252 [00:00<00:00, 75508.26it/s]
100%|██████████| 203/203 [00:00<00:00, 74616.05it/s]
100%|██████████| 153/153 [00:00<00:00, 74076.94it/s]
100%|██████████| 200/200 [00:00<00:00, 72465.51it/s]
100%|██████████| 65/65 [00:00<00:00, 69037.67it/s]
100%|██████████| 144/144 [00:00<00:00, 78479.70it/s]
100%|██████████| 30/30 [00:00<00:00, 64067.78it/s]
100%|██████████| 130/130 [00:00<00:00, 74184.97it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89712.80it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:13<00:00, 426.34it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 75962.83it/s]
100%|██████████| 287/287 [00:00<00:00, 76284.24it/s]
100%|██████████| 771/771 [00:00<00:00, 74504.85it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77135.92it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89867.67it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75281.86it/s]
100%|██████████| 353/353 [00:00<00:00, 75505.60it/s]
100%|██████████| 252/252 [00:00<00:00, 72914.23it/s]
100%|██████████| 203/203 [00:00<00:00, 74038.58it/s]
100%|██████████| 153/153 [00:00<00:00, 73787.34it/s]
100%|██████████| 200/200 [00:00<00:00, 73901.93it/s]
100%|██████████| 65/65 [00:00<00:00, 65425.91it/s]
100%|██████████| 144/144 [00:00<00:00, 73262.95it/s]
100%|██████████| 30/30 [00:00<00:00, 64231.30it/s]
100%|██████████| 130/130 [00:00<00:00, 68715.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85494.35it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:13<00:00, 438.88it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 85359.14it/s]
100%|██████████| 287/287 [00:00<00:00, 73827.98it/s]
100%|██████████| 771/771 [00:00<00:00, 76728.71it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75382.21it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83448.81it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74645.47it/s]
100%|██████████| 353/353 [00:00<00:00, 76079.82it/s]
100%|██████████| 252/252 [00:00<00:00, 75346.78it/s]
100%|██████████| 203/203 [00:00<00:00, 72760.53it/s]
100%|██████████| 153/153 [00:00<00:00, 74576.24it/s]
100%|██████████| 200/200 [00:00<00:00, 54766.65it/s]
100%|██████████| 65/65 [00:00<00:00, 51352.38it/s]
100%|██████████| 144/144 [00:00<00:00, 71663.48it/s]
100%|██████████| 30/30 [00:00<00:00, 46916.15it/s]
100%|██████████| 130/130 [00:00<00:00, 66665.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71949.46it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:14<00:00, 415.39it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 80751.41it/s]
100%|██████████| 287/287 [00:00<00:00, 75183.64it/s]
100%|██████████| 771/771 [00:00<00:00, 77258.48it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75902.64it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83255.01it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91494.12it/s]
100%|██████████| 353/353 [00:00<00:00, 75845.98it/s]
100%|██████████| 252/252 [00:00<00:00, 77586.77it/s]
100%|██████████| 203/203 [00:00<00:00, 74122.37it/s]
100%|██████████| 153/153 [00:00<00:00, 69473.69it/s]
100%|██████████| 200/200 [00:00<00:00, 76699.35it/s]
100%|██████████| 65/65 [00:00<00:00, 67633.28it/s]
100%|██████████| 144/144 [00:00<00:00, 73557.40it/s]
100%|██████████| 30/30 [00:00<00:00, 52494.42it/s]
100%|██████████| 130/130 [00:00<00:00, 71406.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85478.92it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:13<00:00, 433.67it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 73387.10it/s]
100%|██████████| 287/287 [00:00<00:00, 75061.75it/s]
100%|██████████| 771/771 [00:00<00:00, 72763.05it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76005.11it/s]
100%|██████████| 1000/1000 [00:00<00:00, 67336.19it/s]
100%|██████████| 3000/3000 [00:00<00:00, 64427.31it/s]
100%|██████████| 353/353 [00:00<00:00, 55646.61it/s]
100%|██████████| 252/252 [00:00<00:00, 55156.53it/s]
100%|██████████| 203/203 [00:00<00:00, 55880.01it/s]
100%|██████████| 153/153 [00:00<00:00, 54255.03it/s]
100%|██████████| 200/200 [00:00<00:00, 52958.38it/s]
100%|██████████| 65/65 [00:00<00:00, 49131.33it/s]
100%|██████████| 144/144 [00:00<00:00, 48229.64it/s]
100%|██████████| 30/30 [00:00<00:00, 45623.32it/s]
100%|██████████| 130/130 [00:00<00:00, 63402.27it/s]
100%|██████████| 3500/3500 [00:00<00:00, 53395.25it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:13<00:00, 427.43it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 83584.87it/s]
100%|██████████| 287/287 [00:00<00:00, 74601.22it/s]
100%|██████████| 771/771 [00:00<00:00, 78077.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76118.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83993.59it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77482.42it/s]
100%|██████████| 353/353 [00:00<00:00, 77635.64it/s]
100%|██████████| 252/252 [00:00<00:00, 75583.85it/s]
100%|██████████| 203/203 [00:00<00:00, 78910.45it/s]
100%|██████████| 153/153 [00:00<00:00, 77738.16it/s]
100%|██████████| 200/200 [00:00<00:00, 73635.96it/s]
100%|██████████| 65/65 [00:00<00:00, 74529.73it/s]
100%|██████████| 144/144 [00:00<00:00, 73800.07it/s]
100%|██████████| 30/30 [00:00<00:00, 56098.58it/s]
100%|██████████| 130/130 [00:00<00:00, 72954.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88414.95it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:13<00:00, 442.82it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 75428.16it/s]
100%|██████████| 287/287 [00:00<00:00, 68790.52it/s]
100%|██████████| 771/771 [00:00<00:00, 76251.08it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77411.39it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77786.09it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78562.18it/s]
100%|██████████| 353/353 [00:00<00:00, 76619.19it/s]
100%|██████████| 252/252 [00:00<00:00, 78701.76it/s]
100%|██████████| 203/203 [00:00<00:00, 74070.79it/s]
100%|██████████| 153/153 [00:00<00:00, 74515.62it/s]
100%|██████████| 200/200 [00:00<00:00, 76025.09it/s]
100%|██████████| 65/65 [00:00<00:00, 68038.37it/s]
100%|██████████| 144/144 [00:00<00:00, 78786.82it/s]
100%|██████████| 30/30 [00:00<00:00, 60061.63it/s]
100%|██████████| 130/130 [00:00<00:00, 73475.21it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90755.49it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 173.36it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75648.77it/s]
100%|██████████| 287/287 [00:00<00:00, 67604.47it/s]
100%|██████████| 771/771 [00:00<00:00, 71615.73it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76597.10it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80349.11it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92572.46it/s]
100%|██████████| 353/353 [00:00<00:00, 76240.44it/s]
100%|██████████| 252/252 [00:00<00:00, 69231.98it/s]
100%|██████████| 203/203 [00:00<00:00, 73577.92it/s]
100%|██████████| 153/153 [00:00<00:00, 71685.49it/s]
100%|██████████| 200/200 [00:00<00:00, 82678.97it/s]
100%|██████████| 65/65 [00:00<00:00, 71669.23it/s]
100%|██████████| 144/144 [00:00<00:00, 70034.76it/s]
100%|██████████| 30/30 [00:00<00:00, 56023.65it/s]
100%|██████████| 130/130 [00:00<00:00, 68106.36it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80088.51it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 239.85it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76093.88it/s]
100%|██████████| 287/287 [00:00<00:00, 73516.87it/s]
100%|██████████| 771/771 [00:00<00:00, 86546.46it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95507.42it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76303.08it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91996.49it/s]
100%|██████████| 353/353 [00:00<00:00, 75046.34it/s]
100%|██████████| 252/252 [00:00<00:00, 75357.52it/s]
100%|██████████| 203/203 [00:00<00:00, 73820.33it/s]
100%|██████████| 153/153 [00:00<00:00, 65057.64it/s]
100%|██████████| 200/200 [00:00<00:00, 77072.84it/s]
100%|██████████| 65/65 [00:00<00:00, 64178.38it/s]
100%|██████████| 144/144 [00:00<00:00, 70798.24it/s]
100%|██████████| 30/30 [00:00<00:00, 52472.53it/s]
100%|██████████| 130/130 [00:00<00:00, 67482.61it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78389.00it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 232.87it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75307.51it/s]
100%|██████████| 287/287 [00:00<00:00, 73128.32it/s]
100%|██████████| 771/771 [00:00<00:00, 88057.08it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94091.21it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76838.46it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91260.54it/s]
100%|██████████| 353/353 [00:00<00:00, 76252.22it/s]
100%|██████████| 252/252 [00:00<00:00, 75137.88it/s]
100%|██████████| 203/203 [00:00<00:00, 69161.21it/s]
100%|██████████| 153/153 [00:00<00:00, 72299.29it/s]
100%|██████████| 200/200 [00:00<00:00, 78944.17it/s]
100%|██████████| 65/65 [00:00<00:00, 71839.20it/s]
100%|██████████| 144/144 [00:00<00:00, 71350.24it/s]
100%|██████████| 30/30 [00:00<00:00, 57985.77it/s]
100%|██████████| 130/130 [00:00<00:00, 69353.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74318.90it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 238.73it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75898.16it/s]
100%|██████████| 287/287 [00:00<00:00, 70490.44it/s]
100%|██████████| 771/771 [00:00<00:00, 82642.69it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92922.82it/s]
100%|██████████| 1000/1000 [00:00<00:00, 96170.96it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91379.17it/s]
100%|██████████| 353/353 [00:00<00:00, 73325.54it/s]
100%|██████████| 252/252 [00:00<00:00, 72803.73it/s]
100%|██████████| 203/203 [00:00<00:00, 56789.42it/s]
100%|██████████| 153/153 [00:00<00:00, 50509.92it/s]
100%|██████████| 200/200 [00:00<00:00, 47809.23it/s]
100%|██████████| 65/65 [00:00<00:00, 52753.44it/s]
100%|██████████| 144/144 [00:00<00:00, 45749.11it/s]
100%|██████████| 30/30 [00:00<00:00, 38037.82it/s]
100%|██████████| 130/130 [00:00<00:00, 56497.72it/s]
100%|██████████| 3500/3500 [00:00<00:00, 68086.51it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 236.00it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76796.79it/s]
100%|██████████| 287/287 [00:00<00:00, 71245.58it/s]
100%|██████████| 771/771 [00:00<00:00, 82130.55it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94206.39it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77207.62it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90165.83it/s]
100%|██████████| 353/353 [00:00<00:00, 76212.97it/s]
100%|██████████| 252/252 [00:00<00:00, 74633.85it/s]
100%|██████████| 203/203 [00:00<00:00, 71167.14it/s]
100%|██████████| 153/153 [00:00<00:00, 75196.69it/s]
100%|██████████| 200/200 [00:00<00:00, 67934.95it/s]
100%|██████████| 65/65 [00:00<00:00, 66560.00it/s]
100%|██████████| 144/144 [00:00<00:00, 71740.09it/s]
100%|██████████| 30/30 [00:00<00:00, 52017.00it/s]
100%|██████████| 130/130 [00:00<00:00, 66438.35it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77147.37it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 238.55it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77393.97it/s]
100%|██████████| 287/287 [00:00<00:00, 74196.58it/s]
100%|██████████| 771/771 [00:00<00:00, 74879.21it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77048.06it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76918.78it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92532.98it/s]
100%|██████████| 353/353 [00:00<00:00, 76917.73it/s]
100%|██████████| 252/252 [00:00<00:00, 70169.59it/s]
100%|██████████| 203/203 [00:00<00:00, 71555.90it/s]
100%|██████████| 153/153 [00:00<00:00, 71533.67it/s]
100%|██████████| 200/200 [00:00<00:00, 69247.22it/s]
100%|██████████| 65/65 [00:00<00:00, 68898.09it/s]
100%|██████████| 144/144 [00:00<00:00, 75318.59it/s]
100%|██████████| 30/30 [00:00<00:00, 63614.32it/s]
100%|██████████| 130/130 [00:00<00:00, 68863.29it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74695.54it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 235.64it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75633.75it/s]
100%|██████████| 287/287 [00:00<00:00, 69241.60it/s]
100%|██████████| 771/771 [00:00<00:00, 85156.24it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96064.13it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76471.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 94088.40it/s]
100%|██████████| 353/353 [00:00<00:00, 75656.07it/s]
100%|██████████| 252/252 [00:00<00:00, 74797.58it/s]
100%|██████████| 203/203 [00:00<00:00, 69443.25it/s]
100%|██████████| 153/153 [00:00<00:00, 73483.17it/s]
100%|██████████| 200/200 [00:00<00:00, 65260.68it/s]
100%|██████████| 65/65 [00:00<00:00, 69477.51it/s]
100%|██████████| 144/144 [00:00<00:00, 71140.14it/s]
100%|██████████| 30/30 [00:00<00:00, 62137.84it/s]
100%|██████████| 130/130 [00:00<00:00, 69521.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91875.58it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 237.43it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 74903.64it/s]
100%|██████████| 287/287 [00:00<00:00, 71499.48it/s]
100%|██████████| 771/771 [00:00<00:00, 72541.07it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94640.03it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75270.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85985.85it/s]
100%|██████████| 353/353 [00:00<00:00, 75313.56it/s]
100%|██████████| 252/252 [00:00<00:00, 69983.75it/s]
100%|██████████| 203/203 [00:00<00:00, 64926.32it/s]
100%|██████████| 153/153 [00:00<00:00, 69496.27it/s]
100%|██████████| 200/200 [00:00<00:00, 74724.82it/s]
100%|██████████| 65/65 [00:00<00:00, 49659.34it/s]
100%|██████████| 144/144 [00:00<00:00, 70931.27it/s]
100%|██████████| 30/30 [00:00<00:00, 46898.67it/s]
100%|██████████| 130/130 [00:00<00:00, 66236.58it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79171.53it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 234.04it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75382.02it/s]
100%|██████████| 287/287 [00:00<00:00, 72064.49it/s]
100%|██████████| 771/771 [00:00<00:00, 87527.97it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94061.67it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74758.11it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92508.49it/s]
100%|██████████| 353/353 [00:00<00:00, 73650.17it/s]
100%|██████████| 252/252 [00:00<00:00, 72618.66it/s]
100%|██████████| 203/203 [00:00<00:00, 65901.22it/s]
100%|██████████| 153/153 [00:00<00:00, 70706.09it/s]
100%|██████████| 200/200 [00:00<00:00, 71906.46it/s]
100%|██████████| 65/65 [00:00<00:00, 63832.77it/s]
100%|██████████| 144/144 [00:00<00:00, 73467.92it/s]
100%|██████████| 30/30 [00:00<00:00, 50351.79it/s]
100%|██████████| 130/130 [00:00<00:00, 69486.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75490.66it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 237.57it/s]
INFO:root:The new embedding has 5825 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76289.23it/s]
100%|██████████| 287/287 [00:00<00:00, 70219.05it/s]
100%|██████████| 771/771 [00:00<00:00, 82486.69it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90485.16it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77695.32it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90941.31it/s]
100%|██████████| 353/353 [00:00<00:00, 75072.98it/s]
100%|██████████| 252/252 [00:00<00:00, 73425.82it/s]
100%|██████████| 203/203 [00:00<00:00, 73769.17it/s]
100%|██████████| 153/153 [00:00<00:00, 71661.48it/s]
100%|██████████| 200/200 [00:00<00:00, 69505.41it/s]
100%|██████████| 65/65 [00:00<00:00, 71933.97it/s]
100%|██████████| 144/144 [00:00<00:00, 73728.00it/s]
100%|██████████| 30/30 [00:00<00:00, 47608.44it/s]
100%|██████████| 130/130 [00:00<00:00, 71678.65it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88765.12it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 236.01it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80957.35it/s]
100%|██████████| 287/287 [00:00<00:00, 76619.26it/s]
100%|██████████| 771/771 [00:00<00:00, 75517.45it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79050.56it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79284.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77545.45it/s]
100%|██████████| 353/353 [00:00<00:00, 79430.76it/s]
100%|██████████| 252/252 [00:00<00:00, 77240.91it/s]
100%|██████████| 203/203 [00:00<00:00, 76949.27it/s]
100%|██████████| 153/153 [00:00<00:00, 75541.91it/s]
100%|██████████| 200/200 [00:00<00:00, 77997.28it/s]
100%|██████████| 65/65 [00:00<00:00, 68845.90it/s]
100%|██████████| 144/144 [00:00<00:00, 57472.62it/s]
100%|██████████| 30/30 [00:00<00:00, 48210.39it/s]
100%|██████████| 130/130 [00:00<00:00, 56480.17it/s]
100%|██████████| 3500/3500 [00:00<00:00, 69927.38it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 239.21it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80106.10it/s]
100%|██████████| 287/287 [00:00<00:00, 77337.95it/s]
100%|██████████| 771/771 [00:00<00:00, 76231.31it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77853.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78932.29it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78152.31it/s]
100%|██████████| 353/353 [00:00<00:00, 73249.36it/s]
100%|██████████| 252/252 [00:00<00:00, 74712.99it/s]
100%|██████████| 203/203 [00:00<00:00, 74472.47it/s]
100%|██████████| 153/153 [00:00<00:00, 75161.46it/s]
100%|██████████| 200/200 [00:00<00:00, 78266.54it/s]
100%|██████████| 65/65 [00:00<00:00, 71219.90it/s]
100%|██████████| 144/144 [00:00<00:00, 74326.82it/s]
100%|██████████| 30/30 [00:00<00:00, 63389.98it/s]
100%|██████████| 130/130 [00:00<00:00, 72095.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 101176.93it/s]
100%|██████████| 20

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 233.99it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 86982.27it/s]
100%|██████████| 287/287 [00:00<00:00, 75005.62it/s]
100%|██████████| 771/771 [00:00<00:00, 74671.72it/s]
100%|██████████| 2000/2000 [00:00<00:00, 98866.30it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80664.35it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96199.63it/s]
100%|██████████| 353/353 [00:00<00:00, 76662.83it/s]
100%|██████████| 252/252 [00:00<00:00, 77524.18it/s]
100%|██████████| 203/203 [00:00<00:00, 79322.13it/s]
100%|██████████| 153/153 [00:00<00:00, 76332.64it/s]
100%|██████████| 200/200 [00:00<00:00, 75784.70it/s]
100%|██████████| 65/65 [00:00<00:00, 70538.10it/s]
100%|██████████| 144/144 [00:00<00:00, 70328.34it/s]
100%|██████████| 30/30 [00:00<00:00, 62446.21it/s]
100%|██████████| 130/130 [00:00<00:00, 74397.53it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73348.24it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 238.68it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78198.49it/s]
100%|██████████| 287/287 [00:00<00:00, 73827.98it/s]
100%|██████████| 771/771 [00:00<00:00, 72448.44it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96218.39it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78695.34it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92353.68it/s]
100%|██████████| 353/353 [00:00<00:00, 74811.24it/s]
100%|██████████| 252/252 [00:00<00:00, 77632.36it/s]
100%|██████████| 203/203 [00:00<00:00, 78178.65it/s]
100%|██████████| 153/153 [00:00<00:00, 78923.69it/s]
100%|██████████| 200/200 [00:00<00:00, 73791.41it/s]
100%|██████████| 65/65 [00:00<00:00, 75646.44it/s]
100%|██████████| 144/144 [00:00<00:00, 78807.38it/s]
100%|██████████| 30/30 [00:00<00:00, 63421.94it/s]
100%|██████████| 130/130 [00:00<00:00, 73833.38it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76609.09it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:25<00:00, 231.66it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80690.76it/s]
100%|██████████| 287/287 [00:00<00:00, 79002.77it/s]
100%|██████████| 771/771 [00:00<00:00, 77919.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79052.79it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81617.12it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77163.59it/s]
100%|██████████| 353/353 [00:00<00:00, 78859.62it/s]
100%|██████████| 252/252 [00:00<00:00, 78766.27it/s]
100%|██████████| 203/203 [00:00<00:00, 68022.99it/s]
100%|██████████| 153/153 [00:00<00:00, 68619.39it/s]
100%|██████████| 200/200 [00:00<00:00, 80574.47it/s]
100%|██████████| 65/65 [00:00<00:00, 75793.65it/s]
100%|██████████| 144/144 [00:00<00:00, 72997.31it/s]
100%|██████████| 30/30 [00:00<00:00, 68311.14it/s]
100%|██████████| 130/130 [00:00<00:00, 74275.92it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79185.62it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:24<00:00, 239.15it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81739.10it/s]
100%|██████████| 287/287 [00:00<00:00, 79236.79it/s]
100%|██████████| 771/771 [00:00<00:00, 90297.05it/s]
100%|██████████| 2000/2000 [00:00<00:00, 103070.61it/s]
100%|██████████| 1000/1000 [00:00<00:00, 102922.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 94227.20it/s]
100%|██████████| 353/353 [00:00<00:00, 79734.47it/s]
100%|██████████| 252/252 [00:00<00:00, 77603.86it/s]
100%|██████████| 203/203 [00:00<00:00, 77242.47it/s]
100%|██████████| 153/153 [00:00<00:00, 73508.42it/s]
100%|██████████| 200/200 [00:00<00:00, 74439.68it/s]
100%|██████████| 65/65 [00:00<00:00, 49840.91it/s]
100%|██████████| 144/144 [00:00<00:00, 74565.40it/s]
100%|██████████| 30/30 [00:00<00:00, 68909.70it/s]
100%|██████████| 130/130 [00:00<00:00, 74053.99it/s]
100%|██████████| 3500/3500 [00:00<00:00, 101807.03it/s]
100%|██████████| 

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']






100%|██████████| 5846/5846 [01:04<00:00, 91.26it/s]
INFO:root:The new embedding has 5721 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77554.41it/s]
100%|██████████| 287/287 [00:00<00:00, 75837.29it/s]
100%|██████████| 771/771 [00:00<00:00, 77664.83it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87784.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79402.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83120.81it/s]
100%|██████████| 353/353 [00:00<00:00, 77505.59it/s]
100%|██████████| 252/252 [00:00<00:00, 75991.42it/s]
100%|██████████| 203/203 [00:00<00:00, 73628.82it/s]
100%|██████████| 153/153 [00:00<00:00, 75012.10it/s]
100%|██████████| 200/200 [00:00<00:00, 74301.22it/s]
100%|██████████| 65/65 [00:00<00:00, 68345.39it/s]
100%|██████████| 144/144 [00:00<00:00, 73467.92it/s]
100%|██████████| 30/30 [00:00<00:00, 49695.55it/s]
100%|██████████| 130/130 [00:00<00:00, 76270.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90599.78it/s]
100%|██████████| 2034/

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:57<00:00, 101.23it/s]
INFO:root:The new embedding has 5721 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75839.09it/s]
100%|██████████| 287/287 [00:00<00:00, 74689.16it/s]
100%|██████████| 771/771 [00:00<00:00, 87527.97it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88460.37it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78656.96it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82746.93it/s]
100%|██████████| 353/353 [00:00<00:00, 77025.77it/s]
100%|██████████| 252/252 [00:00<00:00, 76243.57it/s]
100%|██████████| 203/203 [00:00<00:00, 75422.42it/s]
100%|██████████| 153/153 [00:00<00:00, 73306.89it/s]
100%|██████████| 200/200 [00:00<00:00, 85059.91it/s]
100%|██████████| 65/65 [00:00<00:00, 68932.94it/s]
100%|██████████| 144/144 [00:00<00:00, 71443.08it/s]
100%|██████████| 30/30 [00:00<00:00, 63840.24it/s]
100%|██████████| 130/130 [00:00<00:00, 62322.50it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90965.82it/s]
100%|██████████| 2034

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:57<00:00, 101.08it/s]
INFO:root:The new embedding has 5721 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76652.09it/s]
100%|██████████| 287/287 [00:00<00:00, 75456.98it/s]
100%|██████████| 771/771 [00:00<00:00, 83740.54it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86916.87it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79917.38it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89584.23it/s]
100%|██████████| 353/353 [00:00<00:00, 76228.66it/s]
100%|██████████| 252/252 [00:00<00:00, 54827.50it/s]
100%|██████████| 203/203 [00:00<00:00, 55378.45it/s]
100%|██████████| 153/153 [00:00<00:00, 54657.06it/s]
100%|██████████| 200/200 [00:00<00:00, 54460.87it/s]
100%|██████████| 65/65 [00:00<00:00, 68123.38it/s]
100%|██████████| 144/144 [00:00<00:00, 73059.12it/s]
100%|██████████| 30/30 [00:00<00:00, 24657.87it/s]
100%|██████████| 130/130 [00:00<00:00, 73883.40it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92559.72it/s]
100%|██████████| 2034

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:57<00:00, 100.99it/s]
INFO:root:The new embedding has 5721 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76267.01it/s]
100%|██████████| 287/287 [00:00<00:00, 82557.11it/s]
100%|██████████| 771/771 [00:00<00:00, 69252.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76537.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77408.53it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73452.84it/s]
100%|██████████| 353/353 [00:00<00:00, 74577.61it/s]
100%|██████████| 252/252 [00:00<00:00, 76051.56it/s]
100%|██████████| 203/203 [00:00<00:00, 75017.07it/s]
100%|██████████| 153/153 [00:00<00:00, 74239.76it/s]
100%|██████████| 200/200 [00:00<00:00, 74998.73it/s]
100%|██████████| 65/65 [00:00<00:00, 71462.58it/s]
100%|██████████| 144/144 [00:00<00:00, 68540.60it/s]
100%|██████████| 30/30 [00:00<00:00, 48639.01it/s]
100%|██████████| 130/130 [00:00<00:00, 71145.55it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84546.02it/s]
100%|██████████| 2034

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:58<00:00, 100.53it/s]
INFO:root:The new embedding has 5721 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75854.19it/s]
100%|██████████| 287/287 [00:00<00:00, 73760.13it/s]
100%|██████████| 771/771 [00:00<00:00, 83567.42it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89596.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76354.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88529.14it/s]
100%|██████████| 353/353 [00:00<00:00, 76185.52it/s]
100%|██████████| 252/252 [00:00<00:00, 76100.84it/s]
100%|██████████| 203/203 [00:00<00:00, 74799.59it/s]
100%|██████████| 153/153 [00:00<00:00, 72651.25it/s]
100%|██████████| 200/200 [00:00<00:00, 72023.77it/s]
100%|██████████| 65/65 [00:00<00:00, 60302.98it/s]
100%|██████████| 144/144 [00:00<00:00, 71123.38it/s]
100%|██████████| 30/30 [00:00<00:00, 41147.52it/s]
100%|██████████| 130/130 [00:00<00:00, 68405.41it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88456.50it/s]
100%|██████████| 2034

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:57<00:00, 100.98it/s]
INFO:root:The new embedding has 5721 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76833.40it/s]
100%|██████████| 287/287 [00:00<00:00, 77807.85it/s]
100%|██████████| 771/771 [00:00<00:00, 70491.74it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76911.02it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79122.88it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91759.00it/s]
100%|██████████| 353/353 [00:00<00:00, 78387.83it/s]
100%|██████████| 252/252 [00:00<00:00, 75931.37it/s]
100%|██████████| 203/203 [00:00<00:00, 78735.32it/s]
100%|██████████| 153/153 [00:00<00:00, 79392.37it/s]
100%|██████████| 200/200 [00:00<00:00, 77421.39it/s]
100%|██████████| 65/65 [00:00<00:00, 67549.49it/s]
100%|██████████| 144/144 [00:00<00:00, 67176.04it/s]
100%|██████████| 30/30 [00:00<00:00, 47608.44it/s]
100%|██████████| 130/130 [00:00<00:00, 81007.21it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92888.28it/s]
100%|██████████| 2034

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:58<00:00, 100.77it/s]
INFO:root:The new embedding has 5721 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77754.45it/s]
100%|██████████| 287/287 [00:00<00:00, 73918.65it/s]
100%|██████████| 771/771 [00:00<00:00, 89031.67it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94421.65it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78834.37it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82021.46it/s]
100%|██████████| 353/353 [00:00<00:00, 75721.85it/s]
100%|██████████| 252/252 [00:00<00:00, 77038.24it/s]
100%|██████████| 203/203 [00:00<00:00, 78365.74it/s]
100%|██████████| 153/153 [00:00<00:00, 77898.58it/s]
100%|██████████| 200/200 [00:00<00:00, 75559.43it/s]
100%|██████████| 65/65 [00:00<00:00, 53709.57it/s]
100%|██████████| 144/144 [00:00<00:00, 71190.45it/s]
100%|██████████| 30/30 [00:00<00:00, 56577.84it/s]
100%|██████████| 130/130 [00:00<00:00, 72623.80it/s]
100%|██████████| 3500/3500 [00:00<00:00, 95822.87it/s]
100%|██████████| 2034

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:58<00:00, 100.11it/s]
INFO:root:The new embedding has 5721 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76474.42it/s]
100%|██████████| 287/287 [00:00<00:00, 74036.86it/s]
100%|██████████| 771/771 [00:00<00:00, 72386.81it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94161.98it/s]
100%|██████████| 1000/1000 [00:00<00:00, 57639.40it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79587.81it/s]
100%|██████████| 353/353 [00:00<00:00, 56027.75it/s]
100%|██████████| 252/252 [00:00<00:00, 53172.58it/s]
100%|██████████| 203/203 [00:00<00:00, 81229.13it/s]
100%|██████████| 153/153 [00:00<00:00, 55240.47it/s]
100%|██████████| 200/200 [00:00<00:00, 77715.47it/s]
100%|██████████| 65/65 [00:00<00:00, 53847.47it/s]
100%|██████████| 144/144 [00:00<00:00, 54476.39it/s]
100%|██████████| 30/30 [00:00<00:00, 41887.19it/s]
100%|██████████| 130/130 [00:00<00:00, 51169.25it/s]
100%|██████████| 3500/3500 [00:00<00:00, 62975.65it/s]
100%|██████████| 2034

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:58<00:00, 100.47it/s]
INFO:root:The new embedding has 5721 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75173.75it/s]
100%|██████████| 287/287 [00:00<00:00, 73530.34it/s]
100%|██████████| 771/771 [00:00<00:00, 72469.54it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75913.63it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74664.96it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92745.09it/s]
100%|██████████| 353/353 [00:00<00:00, 76189.44it/s]
100%|██████████| 252/252 [00:00<00:00, 74818.76it/s]
100%|██████████| 203/203 [00:00<00:00, 68290.32it/s]
100%|██████████| 153/153 [00:00<00:00, 75613.12it/s]
100%|██████████| 200/200 [00:00<00:00, 75573.05it/s]
100%|██████████| 65/65 [00:00<00:00, 65441.61it/s]
100%|██████████| 144/144 [00:00<00:00, 68346.70it/s]
100%|██████████| 30/30 [00:00<00:00, 57403.80it/s]
100%|██████████| 130/130 [00:00<00:00, 70822.12it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93706.52it/s]
100%|██████████| 2034

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:57<00:00, 100.89it/s]
INFO:root:The new embedding has 5721 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76278.12it/s]
100%|██████████| 287/287 [00:00<00:00, 74758.74it/s]
100%|██████████| 771/771 [00:00<00:00, 86860.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93274.12it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75853.22it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85250.08it/s]
100%|██████████| 353/353 [00:00<00:00, 76366.27it/s]
100%|██████████| 252/252 [00:00<00:00, 74755.26it/s]
100%|██████████| 203/203 [00:00<00:00, 74219.29it/s]
100%|██████████| 153/153 [00:00<00:00, 72915.41it/s]
100%|██████████| 200/200 [00:00<00:00, 70138.86it/s]
100%|██████████| 65/65 [00:00<00:00, 68655.19it/s]
100%|██████████| 144/144 [00:00<00:00, 62517.31it/s]
100%|██████████| 30/30 [00:00<00:00, 64296.94it/s]
100%|██████████| 130/130 [00:00<00:00, 70365.15it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90127.54it/s]
100%|██████████| 2034

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:58<00:00, 100.40it/s]
INFO:root:The new embedding has 5721 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78730.38it/s]
100%|██████████| 287/287 [00:00<00:00, 77627.22it/s]
100%|██████████| 771/771 [00:00<00:00, 77136.86it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77033.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81420.66it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76696.55it/s]
100%|██████████| 353/353 [00:00<00:00, 78350.50it/s]
100%|██████████| 252/252 [00:00<00:00, 76276.58it/s]
100%|██████████| 203/203 [00:00<00:00, 73324.47it/s]
100%|██████████| 153/153 [00:00<00:00, 75729.11it/s]
100%|██████████| 200/200 [00:00<00:00, 76818.75it/s]
100%|██████████| 65/65 [00:00<00:00, 61458.47it/s]
100%|██████████| 144/144 [00:00<00:00, 69208.18it/s]
100%|██████████| 30/30 [00:00<00:00, 58963.97it/s]
100%|██████████| 130/130 [00:00<00:00, 72172.01it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75864.00it/s]
100%|██████████| 203

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:57<00:00, 101.22it/s]
INFO:root:The new embedding has 5721 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 93874.98it/s]
100%|██████████| 287/287 [00:00<00:00, 77742.52it/s]
100%|██████████| 771/771 [00:00<00:00, 77926.85it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95415.08it/s]
100%|██████████| 1000/1000 [00:00<00:00, 98068.79it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98214.99it/s]
100%|██████████| 353/353 [00:00<00:00, 85096.23it/s]
100%|██████████| 252/252 [00:00<00:00, 76569.44it/s]
100%|██████████| 203/203 [00:00<00:00, 76831.23it/s]
100%|██████████| 153/153 [00:00<00:00, 68494.88it/s]
100%|██████████| 200/200 [00:00<00:00, 87018.76it/s]
100%|██████████| 65/65 [00:00<00:00, 60329.67it/s]
100%|██████████| 144/144 [00:00<00:00, 65259.84it/s]
100%|██████████| 30/30 [00:00<00:00, 53430.62it/s]
100%|██████████| 130/130 [00:00<00:00, 69923.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86975.96it/s]
100%|██████████| 203

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:58<00:00, 100.01it/s]
INFO:root:The new embedding has 5721 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81131.35it/s]
100%|██████████| 287/287 [00:00<00:00, 79482.68it/s]
100%|██████████| 771/771 [00:00<00:00, 78175.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 100349.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81745.97it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81483.41it/s]
100%|██████████| 353/353 [00:00<00:00, 80703.66it/s]
100%|██████████| 252/252 [00:00<00:00, 79054.94it/s]
100%|██████████| 203/203 [00:00<00:00, 61878.18it/s]
100%|██████████| 153/153 [00:00<00:00, 73965.94it/s]
100%|██████████| 200/200 [00:00<00:00, 72944.42it/s]
100%|██████████| 65/65 [00:00<00:00, 69512.94it/s]
100%|██████████| 144/144 [00:00<00:00, 51675.20it/s]
100%|██████████| 30/30 [00:00<00:00, 48358.62it/s]
100%|██████████| 130/130 [00:00<00:00, 75001.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77298.48it/s]
100%|██████████| 20

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:57<00:00, 100.98it/s]
INFO:root:The new embedding has 5721 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80735.85it/s]
100%|██████████| 287/287 [00:00<00:00, 78080.38it/s]
100%|██████████| 771/771 [00:00<00:00, 79415.73it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85263.95it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81382.75it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93510.84it/s]
100%|██████████| 353/353 [00:00<00:00, 77150.19it/s]
100%|██████████| 252/252 [00:00<00:00, 79632.68it/s]
100%|██████████| 203/203 [00:00<00:00, 77892.57it/s]
100%|██████████| 153/153 [00:00<00:00, 80026.00it/s]
100%|██████████| 200/200 [00:00<00:00, 79982.91it/s]
100%|██████████| 65/65 [00:00<00:00, 75920.29it/s]
100%|██████████| 144/144 [00:00<00:00, 76773.84it/s]
100%|██████████| 30/30 [00:00<00:00, 69327.34it/s]
100%|██████████| 130/130 [00:00<00:00, 62955.72it/s]
100%|██████████| 3500/3500 [00:00<00:00, 57011.73it/s]
100%|██████████| 203

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:58<00:00, 100.32it/s]
INFO:root:The new embedding has 5721 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 64126.81it/s]
100%|██████████| 287/287 [00:00<00:00, 76888.43it/s]
100%|██████████| 771/771 [00:00<00:00, 76763.32it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79659.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81096.37it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79245.96it/s]
100%|██████████| 353/353 [00:00<00:00, 80005.91it/s]
100%|██████████| 252/252 [00:00<00:00, 78270.48it/s]
100%|██████████| 203/203 [00:00<00:00, 88821.58it/s]
100%|██████████| 153/153 [00:00<00:00, 74446.46it/s]
100%|██████████| 200/200 [00:00<00:00, 76980.89it/s]
100%|██████████| 65/65 [00:00<00:00, 75625.45it/s]
100%|██████████| 144/144 [00:00<00:00, 76754.32it/s]
100%|██████████| 30/30 [00:00<00:00, 63009.07it/s]
100%|██████████| 130/130 [00:00<00:00, 71546.98it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75807.98it/s]
100%|██████████| 203

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr





100%|██████████| 5846/5846 [00:58<00:00, 100.79it/s]
INFO:root:The new embedding has 5721 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 84599.12it/s]
100%|██████████| 287/287 [00:00<00:00, 81127.19it/s]
100%|██████████| 771/771 [00:00<00:00, 76617.82it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78921.89it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80473.98it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77720.75it/s]
100%|██████████| 353/353 [00:00<00:00, 41933.54it/s]
100%|██████████| 252/252 [00:00<00:00, 56446.71it/s]
100%|██████████| 203/203 [00:00<00:00, 73041.41it/s]
100%|██████████| 153/153 [00:00<00:00, 76542.05it/s]
100%|██████████| 200/200 [00:00<00:00, 69098.91it/s]
100%|██████████| 65/65 [00:00<00:00, 74184.97it/s]
100%|██████████| 144/144 [00:00<00:00, 76346.83it/s]
100%|██████████| 30/30 [00:00<00:00, 49152.00it/s]
100%|██████████| 130/130 [00:00<00:00, 75983.77it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77139.67it/s]
100%|██████████| 203

['squishing' 'squirt']
['circumcising' 'cut']
['circumcising' 'remove']
['blithering' 'chatter']
['retrying' 'hear']
['inabilities' 'insufficiency']
['inabilities' 'incomprehension']
['interwove' 'braid']
['unisons' 'concurrence']
['unisons' 'agreement']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['unzipping' 'unfasten']
['hypertexts' 'database']
['brained' 'kill']
['brained' 'hit']
['autografts' 'graft']
['sheikhdoms' 'domain']
['disfavoring' 'prejudice']
['anticyclones' 'high']
['companionships' 'friendship']
['postboxes' 'maildrop']
['snookered' 'play']
['snookered' 'flim-flam']
['papered' 'cover']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['combusts' 'blow']
['combusts' 'ablaze']
['baggers' 'machine']
['baggers' 'workman']
['retrials' 'trial']
['venders' 'selling']
['interlinks' 'intercommunicate']
['interlinks' 'connect']
['amazings' 'surprise']
['amazings' 'stump']
['cosponsoring' 'sponsor']
['noncitizens' 'tr

100%|██████████| 5846/5846 [00:44<00:00, 131.80it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75346.78it/s]
100%|██████████| 287/287 [00:00<00:00, 73882.36it/s]
100%|██████████| 771/771 [00:00<00:00, 76445.76it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75535.62it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93771.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78413.35it/s]
100%|██████████| 353/353 [00:00<00:00, 75663.80it/s]
100%|██████████| 252/252 [00:00<00:00, 72514.04it/s]
100%|██████████| 203/203 [00:00<00:00, 75409.06it/s]
100%|██████████| 153/153 [00:00<00:00, 72965.15it/s]
100%|██████████| 200/200 [00:00<00:00, 71617.93it/s]
100%|██████████| 65/65 [00:00<00:00, 63446.53it/s]
100%|██████████| 144/144 [00:00<00:00, 72865.22it/s]
100%|██████████| 30/30 [00:00<00:00, 50071.28it/s]
100%|██████████| 130/130 [00:00<00:00, 69699.54it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78500.50it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 160.36it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 72627.70it/s]
100%|██████████| 287/287 [00:00<00:00, 74954.25it/s]
100%|██████████| 771/771 [00:00<00:00, 75925.25it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75271.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83986.86it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91294.97it/s]
100%|██████████| 353/353 [00:00<00:00, 69170.26it/s]
100%|██████████| 252/252 [00:00<00:00, 72939.38it/s]
100%|██████████| 203/203 [00:00<00:00, 69032.25it/s]
100%|██████████| 153/153 [00:00<00:00, 69136.88it/s]
100%|██████████| 200/200 [00:00<00:00, 74658.31it/s]
100%|██████████| 65/65 [00:00<00:00, 62832.39it/s]
100%|██████████| 144/144 [00:00<00:00, 69896.98it/s]
100%|██████████| 30/30 [00:00<00:00, 57825.88it/s]
100%|██████████| 130/130 [00:00<00:00, 69151.49it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83424.62it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.00it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76491.17it/s]
100%|██████████| 287/287 [00:00<00:00, 65585.99it/s]
100%|██████████| 771/771 [00:00<00:00, 55432.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74488.60it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84996.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77990.03it/s]
100%|██████████| 353/353 [00:00<00:00, 76095.46it/s]
100%|██████████| 252/252 [00:00<00:00, 74350.35it/s]
100%|██████████| 203/203 [00:00<00:00, 72457.13it/s]
100%|██████████| 153/153 [00:00<00:00, 72144.86it/s]
100%|██████████| 200/200 [00:00<00:00, 72584.65it/s]
100%|██████████| 65/65 [00:00<00:00, 64148.18it/s]
100%|██████████| 144/144 [00:00<00:00, 61630.59it/s]
100%|██████████| 30/30 [00:00<00:00, 36503.95it/s]
100%|██████████| 130/130 [00:00<00:00, 49663.86it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92053.02it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 162.57it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 83428.43it/s]
100%|██████████| 287/287 [00:00<00:00, 74393.75it/s]
100%|██████████| 771/771 [00:00<00:00, 75559.80it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77764.46it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84190.85it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77010.10it/s]
100%|██████████| 353/353 [00:00<00:00, 75923.76it/s]
100%|██████████| 252/252 [00:00<00:00, 74660.21it/s]
100%|██████████| 203/203 [00:00<00:00, 72272.62it/s]
100%|██████████| 153/153 [00:00<00:00, 70226.36it/s]
100%|██████████| 200/200 [00:00<00:00, 72836.75it/s]
100%|██████████| 65/65 [00:00<00:00, 67516.04it/s]
100%|██████████| 144/144 [00:00<00:00, 70981.29it/s]
100%|██████████| 30/30 [00:00<00:00, 29488.90it/s]
100%|██████████| 130/130 [00:00<00:00, 67133.65it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93028.97it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 160.67it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76057.97it/s]
100%|██████████| 287/287 [00:00<00:00, 73782.73it/s]
100%|██████████| 771/771 [00:00<00:00, 85282.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75890.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 96111.46it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77674.21it/s]
100%|██████████| 353/353 [00:00<00:00, 88293.24it/s]
100%|██████████| 252/252 [00:00<00:00, 90038.73it/s]
100%|██████████| 203/203 [00:00<00:00, 77743.22it/s]
100%|██████████| 153/153 [00:00<00:00, 75962.18it/s]
100%|██████████| 200/200 [00:00<00:00, 73103.34it/s]
100%|██████████| 65/65 [00:00<00:00, 70084.77it/s]
100%|██████████| 144/144 [00:00<00:00, 72953.23it/s]
100%|██████████| 30/30 [00:00<00:00, 64527.75it/s]
100%|██████████| 130/130 [00:00<00:00, 73554.50it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84974.24it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 160.43it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77564.46it/s]
100%|██████████| 287/287 [00:00<00:00, 64847.56it/s]
100%|██████████| 771/771 [00:00<00:00, 75637.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78335.98it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83513.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92895.73it/s]
100%|██████████| 353/353 [00:00<00:00, 75386.42it/s]
100%|██████████| 252/252 [00:00<00:00, 71276.86it/s]
100%|██████████| 203/203 [00:00<00:00, 74368.39it/s]
100%|██████████| 153/153 [00:00<00:00, 73148.13it/s]
100%|██████████| 200/200 [00:00<00:00, 72328.06it/s]
100%|██████████| 65/65 [00:00<00:00, 64012.62it/s]
100%|██████████| 144/144 [00:00<00:00, 72445.70it/s]
100%|██████████| 30/30 [00:00<00:00, 51653.99it/s]
100%|██████████| 130/130 [00:00<00:00, 75667.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88306.98it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 160.70it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 90216.59it/s]
100%|██████████| 287/287 [00:00<00:00, 60836.17it/s]
100%|██████████| 771/771 [00:00<00:00, 75902.09it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77575.33it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76682.52it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80132.16it/s]
100%|██████████| 353/353 [00:00<00:00, 74875.56it/s]
100%|██████████| 252/252 [00:00<00:00, 76982.13it/s]
100%|██████████| 203/203 [00:00<00:00, 76417.49it/s]
100%|██████████| 153/153 [00:00<00:00, 73089.81it/s]
100%|██████████| 200/200 [00:00<00:00, 73384.73it/s]
100%|██████████| 65/65 [00:00<00:00, 72450.11it/s]
100%|██████████| 144/144 [00:00<00:00, 71073.17it/s]
100%|██████████| 30/30 [00:00<00:00, 28879.76it/s]
100%|██████████| 130/130 [00:00<00:00, 70075.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90364.44it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 162.77it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 66801.27it/s]
100%|██████████| 287/287 [00:00<00:00, 75899.45it/s]
100%|██████████| 771/771 [00:00<00:00, 76218.73it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74883.58it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84879.17it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79787.15it/s]
100%|██████████| 353/353 [00:00<00:00, 79567.35it/s]
100%|██████████| 252/252 [00:00<00:00, 76194.10it/s]
100%|██████████| 203/203 [00:00<00:00, 74511.57it/s]
100%|██████████| 153/153 [00:00<00:00, 71677.48it/s]
100%|██████████| 200/200 [00:00<00:00, 74327.56it/s]
100%|██████████| 65/65 [00:00<00:00, 65551.76it/s]
100%|██████████| 144/144 [00:00<00:00, 73041.45it/s]
100%|██████████| 30/30 [00:00<00:00, 52913.84it/s]
100%|██████████| 130/130 [00:00<00:00, 57932.38it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85459.01it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.46it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 94721.71it/s]
100%|██████████| 287/287 [00:00<00:00, 71772.31it/s]
100%|██████████| 771/771 [00:00<00:00, 81294.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75150.58it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73707.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91316.84it/s]
100%|██████████| 353/353 [00:00<00:00, 69472.10it/s]
100%|██████████| 252/252 [00:00<00:00, 69647.11it/s]
100%|██████████| 203/203 [00:00<00:00, 70571.38it/s]
100%|██████████| 153/153 [00:00<00:00, 68973.40it/s]
100%|██████████| 200/200 [00:00<00:00, 70533.99it/s]
100%|██████████| 65/65 [00:00<00:00, 61210.09it/s]
100%|██████████| 144/144 [00:00<00:00, 71434.63it/s]
100%|██████████| 30/30 [00:00<00:00, 54899.27it/s]
100%|██████████| 130/130 [00:00<00:00, 74195.06it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83443.59it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 162.98it/s]
INFO:root:The new embedding has 5844 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 73770.84it/s]
100%|██████████| 287/287 [00:00<00:00, 74781.96it/s]
100%|██████████| 771/771 [00:00<00:00, 77840.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76595.00it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82919.24it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86453.76it/s]
100%|██████████| 353/353 [00:00<00:00, 74939.99it/s]
100%|██████████| 252/252 [00:00<00:00, 75379.02it/s]
100%|██████████| 203/203 [00:00<00:00, 73438.31it/s]
100%|██████████| 153/153 [00:00<00:00, 73457.93it/s]
100%|██████████| 200/200 [00:00<00:00, 71186.42it/s]
100%|██████████| 65/65 [00:00<00:00, 67432.54it/s]
100%|██████████| 144/144 [00:00<00:00, 73174.19it/s]
100%|██████████| 30/30 [00:00<00:00, 59691.23it/s]
100%|██████████| 130/130 [00:00<00:00, 72373.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72193.25it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.42it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 88612.06it/s]
100%|██████████| 287/287 [00:00<00:00, 60239.47it/s]
100%|██████████| 771/771 [00:00<00:00, 80587.33it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81335.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88704.51it/s]
100%|██████████| 3000/3000 [00:00<00:00, 99820.81it/s]
100%|██████████| 353/353 [00:00<00:00, 77550.25it/s]
100%|██████████| 252/252 [00:00<00:00, 75180.64it/s]
100%|██████████| 203/203 [00:00<00:00, 67307.80it/s]
100%|██████████| 153/153 [00:00<00:00, 73056.52it/s]
100%|██████████| 200/200 [00:00<00:00, 74019.31it/s]
100%|██████████| 65/65 [00:00<00:00, 67382.54it/s]
100%|██████████| 144/144 [00:00<00:00, 78449.12it/s]
100%|██████████| 30/30 [00:00<00:00, 64627.18it/s]
100%|██████████| 130/130 [00:00<00:00, 76927.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81286.31it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.88it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 71527.99it/s]
100%|██████████| 287/287 [00:00<00:00, 74091.54it/s]
100%|██████████| 771/771 [00:00<00:00, 79380.64it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75571.00it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82315.50it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87893.43it/s]
100%|██████████| 353/353 [00:00<00:00, 78391.98it/s]
100%|██████████| 252/252 [00:00<00:00, 74407.93it/s]
100%|██████████| 203/203 [00:00<00:00, 76035.34it/s]
100%|██████████| 153/153 [00:00<00:00, 78211.88it/s]
100%|██████████| 200/200 [00:00<00:00, 76762.52it/s]
100%|██████████| 65/65 [00:00<00:00, 67650.06it/s]
100%|██████████| 144/144 [00:00<00:00, 74464.28it/s]
100%|██████████| 30/30 [00:00<00:00, 67432.54it/s]
100%|██████████| 130/130 [00:00<00:00, 73465.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90937.64it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 158.90it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 75181.84it/s]
100%|██████████| 287/287 [00:00<00:00, 74814.50it/s]
100%|██████████| 771/771 [00:00<00:00, 77887.43it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74537.58it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75067.19it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75490.98it/s]
100%|██████████| 353/353 [00:00<00:00, 79286.14it/s]
100%|██████████| 252/252 [00:00<00:00, 77535.55it/s]
100%|██████████| 203/203 [00:00<00:00, 78655.31it/s]
100%|██████████| 153/153 [00:00<00:00, 79108.54it/s]
100%|██████████| 200/200 [00:00<00:00, 79482.74it/s]
100%|██████████| 65/65 [00:00<00:00, 66301.01it/s]
100%|██████████| 144/144 [00:00<00:00, 72997.31it/s]
100%|██████████| 30/30 [00:00<00:00, 58963.97it/s]
100%|██████████| 130/130 [00:00<00:00, 75021.95it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78482.03it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 162.18it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 66376.92it/s]
100%|██████████| 287/287 [00:00<00:00, 60487.68it/s]
100%|██████████| 771/771 [00:00<00:00, 58615.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 56580.77it/s]
100%|██████████| 1000/1000 [00:00<00:00, 61246.81it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98355.48it/s]
100%|██████████| 353/353 [00:00<00:00, 77198.46it/s]
100%|██████████| 252/252 [00:00<00:00, 76803.13it/s]
100%|██████████| 203/203 [00:00<00:00, 65824.79it/s]
100%|██████████| 153/153 [00:00<00:00, 64573.21it/s]
100%|██████████| 200/200 [00:00<00:00, 72334.29it/s]
100%|██████████| 65/65 [00:00<00:00, 60302.98it/s]
100%|██████████| 144/144 [00:00<00:00, 71140.14it/s]
100%|██████████| 30/30 [00:00<00:00, 64760.23it/s]
100%|██████████| 130/130 [00:00<00:00, 72798.33it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74485.57it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.16it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78278.84it/s]
100%|██████████| 287/287 [00:00<00:00, 75827.73it/s]
100%|██████████| 771/771 [00:00<00:00, 80974.77it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76832.12it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85251.81it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78597.52it/s]
100%|██████████| 353/353 [00:00<00:00, 75586.55it/s]
100%|██████████| 252/252 [00:00<00:00, 77546.93it/s]
100%|██████████| 203/203 [00:00<00:00, 78954.35it/s]
100%|██████████| 153/153 [00:00<00:00, 76260.07it/s]
100%|██████████| 200/200 [00:00<00:00, 76156.22it/s]
100%|██████████| 65/65 [00:00<00:00, 69495.22it/s]
100%|██████████| 144/144 [00:00<00:00, 77912.77it/s]
100%|██████████| 30/30 [00:00<00:00, 55504.68it/s]
100%|██████████| 130/130 [00:00<00:00, 68924.22it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74282.42it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 162.00it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77128.99it/s]
100%|██████████| 287/287 [00:00<00:00, 78090.51it/s]
100%|██████████| 771/771 [00:00<00:00, 77043.13it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80115.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78036.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78319.15it/s]
100%|██████████| 353/353 [00:00<00:00, 79648.68it/s]
100%|██████████| 252/252 [00:00<00:00, 73476.86it/s]
100%|██████████| 203/203 [00:00<00:00, 78488.54it/s]
100%|██████████| 153/153 [00:00<00:00, 63081.54it/s]
100%|██████████| 200/200 [00:00<00:00, 76461.65it/s]
100%|██████████| 65/65 [00:00<00:00, 69107.67it/s]
100%|██████████| 144/144 [00:00<00:00, 78704.69it/s]
100%|██████████| 30/30 [00:00<00:00, 60875.24it/s]
100%|██████████| 130/130 [00:00<00:00, 29034.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76291.78it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [01:18<00:00, 74.23it/s] 
INFO:root:The new embedding has 5846 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 85482.79it/s]
100%|██████████| 287/287 [00:00<00:00, 75513.79it/s]
100%|██████████| 771/771 [00:00<00:00, 85318.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78439.26it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77176.37it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79161.21it/s]
100%|██████████| 353/353 [00:00<00:00, 77319.41it/s]
100%|██████████| 252/252 [00:00<00:00, 76029.68it/s]
100%|██████████| 203/203 [00:00<00:00, 77750.32it/s]
100%|██████████| 153/153 [00:00<00:00, 78691.42it/s]
100%|██████████| 200/200 [00:00<00:00, 74565.40it/s]
100%|██████████| 65/65 [00:00<00:00, 65630.66it/s]
100%|██████████| 144/144 [00:00<00:00, 75810.19it/s]
100%|██████████| 30/30 [00:00<00:00, 44651.92it/s]
100%|██████████| 130/130 [00:00<00:00, 73943.52it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93560.80it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 66.73it/s]
INFO:root:The new embedding has 5819 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76459.07it/s]
100%|██████████| 287/287 [00:00<00:00, 74856.37it/s]
100%|██████████| 771/771 [00:00<00:00, 75051.25it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81077.55it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85531.71it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77527.29it/s]
100%|██████████| 353/353 [00:00<00:00, 84421.79it/s]
100%|██████████| 252/252 [00:00<00:00, 75169.95it/s]
100%|██████████| 203/203 [00:00<00:00, 75974.28it/s]
100%|██████████| 153/153 [00:00<00:00, 76862.92it/s]
100%|██████████| 200/200 [00:00<00:00, 78106.22it/s]
100%|██████████| 65/65 [00:00<00:00, 73504.92it/s]
100%|██████████| 144/144 [00:00<00:00, 72979.67it/s]
100%|██████████| 30/30 [00:00<00:00, 60699.04it/s]
100%|██████████| 130/130 [00:00<00:00, 71593.95it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87835.15it/s]
100%|██████████| 2034/

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 66.86it/s]
INFO:root:The new embedding has 5819 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 87232.16it/s]
100%|██████████| 287/287 [00:00<00:00, 72955.47it/s]
100%|██████████| 771/771 [00:00<00:00, 76391.58it/s]
100%|██████████| 2000/2000 [00:00<00:00, 73571.37it/s]
100%|██████████| 1000/1000 [00:00<00:00, 71637.50it/s]
100%|██████████| 3000/3000 [00:00<00:00, 66331.98it/s]
100%|██████████| 353/353 [00:00<00:00, 78425.20it/s]
100%|██████████| 252/252 [00:00<00:00, 55539.10it/s]
100%|██████████| 203/203 [00:00<00:00, 56112.01it/s]
100%|██████████| 153/153 [00:00<00:00, 54872.04it/s]
100%|██████████| 200/200 [00:00<00:00, 50576.44it/s]
100%|██████████| 65/65 [00:00<00:00, 54233.09it/s]
100%|██████████| 144/144 [00:00<00:00, 54777.78it/s]
100%|██████████| 30/30 [00:00<00:00, 48228.87it/s]
100%|██████████| 130/130 [00:00<00:00, 51707.87it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85526.73it/s]
100%|██████████| 2034/

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 67.07it/s]
INFO:root:The new embedding has 5819 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 84517.21it/s]
100%|██████████| 287/287 [00:00<00:00, 71469.76it/s]
100%|██████████| 771/771 [00:00<00:00, 74601.10it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87410.47it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74537.58it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96471.05it/s]
100%|██████████| 353/353 [00:00<00:00, 77283.08it/s]
100%|██████████| 252/252 [00:00<00:00, 72949.45it/s]
100%|██████████| 203/203 [00:00<00:00, 65309.79it/s]
100%|██████████| 153/153 [00:00<00:00, 80740.88it/s]
100%|██████████| 200/200 [00:00<00:00, 89250.01it/s]
100%|██████████| 65/65 [00:00<00:00, 66755.57it/s]
100%|██████████| 144/144 [00:00<00:00, 61794.53it/s]
100%|██████████| 30/30 [00:00<00:00, 53092.46it/s]
100%|██████████| 130/130 [00:00<00:00, 69530.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86987.82it/s]
100%|██████████| 2034/

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 66.56it/s]
INFO:root:The new embedding has 5819 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 84981.74it/s]
100%|██████████| 287/287 [00:00<00:00, 81688.74it/s]
100%|██████████| 771/771 [00:00<00:00, 79122.32it/s]
100%|██████████| 2000/2000 [00:00<00:00, 73875.25it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88030.56it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75277.36it/s]
100%|██████████| 353/353 [00:00<00:00, 74237.33it/s]
100%|██████████| 252/252 [00:00<00:00, 69683.85it/s]
100%|██████████| 203/203 [00:00<00:00, 73337.10it/s]
100%|██████████| 153/153 [00:00<00:00, 89576.84it/s]
100%|██████████| 200/200 [00:00<00:00, 76080.25it/s]
100%|██████████| 65/65 [00:00<00:00, 71257.12it/s]
100%|██████████| 144/144 [00:00<00:00, 73458.99it/s]
100%|██████████| 30/30 [00:00<00:00, 66260.73it/s]
100%|██████████| 130/130 [00:00<00:00, 70283.52it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84791.17it/s]
100%|██████████| 2034/

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 66.61it/s]
INFO:root:The new embedding has 5819 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 72631.47it/s]
100%|██████████| 287/287 [00:00<00:00, 64214.51it/s]
100%|██████████| 771/771 [00:00<00:00, 76225.92it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76322.52it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82096.38it/s]
100%|██████████| 3000/3000 [00:00<00:00, 72391.72it/s]
100%|██████████| 353/353 [00:00<00:00, 70851.76it/s]
100%|██████████| 252/252 [00:00<00:00, 72828.82it/s]
100%|██████████| 203/203 [00:00<00:00, 72897.58it/s]
100%|██████████| 153/153 [00:00<00:00, 71200.32it/s]
100%|██████████| 200/200 [00:00<00:00, 72855.72it/s]
100%|██████████| 65/65 [00:00<00:00, 64436.25it/s]
100%|██████████| 144/144 [00:00<00:00, 72142.83it/s]
100%|██████████| 30/30 [00:00<00:00, 48620.22it/s]
100%|██████████| 130/130 [00:00<00:00, 69896.11it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83671.88it/s]
100%|██████████| 2034/

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:28<00:00, 66.21it/s]
INFO:root:The new embedding has 5819 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 80133.67it/s]
100%|██████████| 287/287 [00:00<00:00, 91848.41it/s]
100%|██████████| 771/771 [00:00<00:00, 84047.42it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75809.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89769.58it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74394.79it/s]
100%|██████████| 353/353 [00:00<00:00, 83418.18it/s]
100%|██████████| 252/252 [00:00<00:00, 68518.39it/s]
100%|██████████| 203/203 [00:00<00:00, 77537.90it/s]
100%|██████████| 153/153 [00:00<00:00, 79304.07it/s]
100%|██████████| 200/200 [00:00<00:00, 78251.94it/s]
100%|██████████| 65/65 [00:00<00:00, 68208.60it/s]
100%|██████████| 144/144 [00:00<00:00, 72900.40it/s]
100%|██████████| 30/30 [00:00<00:00, 55800.05it/s]
100%|██████████| 130/130 [00:00<00:00, 71313.04it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88740.44it/s]
100%|██████████| 2034/

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 67.16it/s]
INFO:root:The new embedding has 5819 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 78941.01it/s]
100%|██████████| 287/287 [00:00<00:00, 76216.62it/s]
100%|██████████| 771/771 [00:00<00:00, 76850.88it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76563.54it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90083.85it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89806.10it/s]
100%|██████████| 353/353 [00:00<00:00, 76698.58it/s]
100%|██████████| 252/252 [00:00<00:00, 69798.89it/s]
100%|██████████| 203/203 [00:00<00:00, 75609.96it/s]
100%|██████████| 153/153 [00:00<00:00, 75604.21it/s]
100%|██████████| 200/200 [00:00<00:00, 75539.02it/s]
100%|██████████| 65/65 [00:00<00:00, 67449.22it/s]
100%|██████████| 144/144 [00:00<00:00, 77107.08it/s]
100%|██████████| 30/30 [00:00<00:00, 69098.91it/s]
100%|██████████| 130/130 [00:00<00:00, 73893.42it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87419.32it/s]
100%|██████████| 2034/

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:28<00:00, 66.18it/s]
INFO:root:The new embedding has 5819 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 83929.77it/s]
100%|██████████| 287/287 [00:00<00:00, 68481.35it/s]
100%|██████████| 771/771 [00:00<00:00, 92954.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74961.87it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82894.66it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75527.68it/s]
100%|██████████| 353/353 [00:00<00:00, 86513.34it/s]
100%|██████████| 252/252 [00:00<00:00, 83952.71it/s]
100%|██████████| 203/203 [00:00<00:00, 72260.35it/s]
100%|██████████| 153/153 [00:00<00:00, 73223.24it/s]
100%|██████████| 200/200 [00:00<00:00, 67221.80it/s]
100%|██████████| 65/65 [00:00<00:00, 65004.71it/s]
100%|██████████| 144/144 [00:00<00:00, 74363.43it/s]
100%|██████████| 30/30 [00:00<00:00, 45722.79it/s]
100%|██████████| 130/130 [00:00<00:00, 62926.66it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81795.85it/s]
100%|██████████| 2034/

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 66.71it/s]
INFO:root:The new embedding has 5819 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 89446.25it/s]
100%|██████████| 287/287 [00:00<00:00, 72424.36it/s]
100%|██████████| 771/771 [00:00<00:00, 74638.98it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88303.93it/s]
100%|██████████| 1000/1000 [00:00<00:00, 71974.33it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95047.87it/s]
100%|██████████| 353/353 [00:00<00:00, 75038.74it/s]
100%|██████████| 252/252 [00:00<00:00, 75228.80it/s]
100%|██████████| 203/203 [00:00<00:00, 60613.92it/s]
100%|██████████| 153/153 [00:00<00:00, 72055.75it/s]
100%|██████████| 200/200 [00:00<00:00, 81159.13it/s]
100%|██████████| 65/65 [00:00<00:00, 67818.35it/s]
100%|██████████| 144/144 [00:00<00:00, 73271.84it/s]
100%|██████████| 30/30 [00:00<00:00, 62788.98it/s]
100%|██████████| 130/130 [00:00<00:00, 69530.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80444.44it/s]
100%|██████████| 2034/

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 66.99it/s]
INFO:root:The new embedding has 5819 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 59743.49it/s]
100%|██████████| 287/287 [00:00<00:00, 92292.05it/s]
100%|██████████| 771/771 [00:00<00:00, 81715.48it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76100.95it/s]
100%|██████████| 1000/1000 [00:00<00:00, 66614.32it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84489.33it/s]
100%|██████████| 353/353 [00:00<00:00, 79371.14it/s]
100%|██████████| 252/252 [00:00<00:00, 78766.27it/s]
100%|██████████| 203/203 [00:00<00:00, 80805.14it/s]
100%|██████████| 153/153 [00:00<00:00, 77606.54it/s]
100%|██████████| 200/200 [00:00<00:00, 79535.49it/s]
100%|██████████| 65/65 [00:00<00:00, 69090.16it/s]
100%|██████████| 144/144 [00:00<00:00, 75934.09it/s]
100%|██████████| 30/30 [00:00<00:00, 55578.23it/s]
100%|██████████| 130/130 [00:00<00:00, 75228.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77172.92it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 66.87it/s]
INFO:root:The new embedding has 5819 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76142.28it/s]
100%|██████████| 287/287 [00:00<00:00, 71883.75it/s]
100%|██████████| 771/771 [00:00<00:00, 80575.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80353.73it/s]
100%|██████████| 1000/1000 [00:00<00:00, 68788.40it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78883.30it/s]
100%|██████████| 353/353 [00:00<00:00, 79648.68it/s]
100%|██████████| 252/252 [00:00<00:00, 75681.27it/s]
100%|██████████| 203/203 [00:00<00:00, 60168.45it/s]
100%|██████████| 153/153 [00:00<00:00, 73265.04it/s]
100%|██████████| 200/200 [00:00<00:00, 83693.58it/s]
100%|██████████| 65/65 [00:00<00:00, 75520.71it/s]
100%|██████████| 144/144 [00:00<00:00, 76608.29it/s]
100%|██████████| 30/30 [00:00<00:00, 70099.79it/s]
100%|██████████| 130/130 [00:00<00:00, 78624.30it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79891.07it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 66.58it/s]
INFO:root:The new embedding has 5819 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80407.39it/s]
100%|██████████| 287/287 [00:00<00:00, 78400.76it/s]
100%|██████████| 771/771 [00:00<00:00, 80944.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78882.56it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80624.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79012.09it/s]
100%|██████████| 353/353 [00:00<00:00, 79988.62it/s]
100%|██████████| 252/252 [00:00<00:00, 77541.24it/s]
100%|██████████| 203/203 [00:00<00:00, 78648.04it/s]
100%|██████████| 153/153 [00:00<00:00, 75267.24it/s]
100%|██████████| 200/200 [00:00<00:00, 78317.69it/s]
100%|██████████| 65/65 [00:00<00:00, 68793.78it/s]
100%|██████████| 144/144 [00:00<00:00, 74787.00it/s]
100%|██████████| 30/30 [00:00<00:00, 57039.49it/s]
100%|██████████| 130/130 [00:00<00:00, 78207.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79148.48it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 67.09it/s]
INFO:root:The new embedding has 5819 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79822.26it/s]
100%|██████████| 287/287 [00:00<00:00, 64300.26it/s]
100%|██████████| 771/771 [00:00<00:00, 80911.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80167.89it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75355.80it/s]
100%|██████████| 3000/3000 [00:00<00:00, 94338.11it/s]
100%|██████████| 353/353 [00:00<00:00, 78809.25it/s]
100%|██████████| 252/252 [00:00<00:00, 78901.51it/s]
100%|██████████| 203/203 [00:00<00:00, 76396.92it/s]
100%|██████████| 153/153 [00:00<00:00, 79727.73it/s]
100%|██████████| 200/200 [00:00<00:00, 77285.87it/s]
100%|██████████| 65/65 [00:00<00:00, 75416.25it/s]
100%|██████████| 144/144 [00:00<00:00, 74299.39it/s]
100%|██████████| 30/30 [00:00<00:00, 63389.98it/s]
100%|██████████| 130/130 [00:00<00:00, 65717.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78812.79it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:27<00:00, 66.87it/s]
INFO:root:The new embedding has 5819 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78382.81it/s]
100%|██████████| 287/287 [00:00<00:00, 77522.23it/s]
100%|██████████| 771/771 [00:00<00:00, 92800.19it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79814.73it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77660.79it/s]
100%|██████████| 3000/3000 [00:00<00:00, 64258.53it/s]
100%|██████████| 353/353 [00:00<00:00, 78579.20it/s]
100%|██████████| 252/252 [00:00<00:00, 57188.87it/s]
100%|██████████| 203/203 [00:00<00:00, 45047.55it/s]
100%|██████████| 153/153 [00:00<00:00, 49020.59it/s]
100%|██████████| 200/200 [00:00<00:00, 60000.06it/s]
100%|██████████| 65/65 [00:00<00:00, 56281.95it/s]
100%|██████████| 144/144 [00:00<00:00, 58844.48it/s]
100%|██████████| 30/30 [00:00<00:00, 22314.08it/s]
100%|██████████| 130/130 [00:00<00:00, 59532.65it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79756.52it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [01:28<00:00, 66.40it/s]
INFO:root:The new embedding has 5819 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79379.19it/s]
100%|██████████| 287/287 [00:00<00:00, 62872.94it/s]
100%|██████████| 771/771 [00:00<00:00, 79851.06it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79308.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83820.70it/s]
100%|██████████| 3000/3000 [00:00<00:00, 104735.41it/s]
100%|██████████| 353/353 [00:00<00:00, 75038.74it/s]
100%|██████████| 252/252 [00:00<00:00, 59830.44it/s]
100%|██████████| 203/203 [00:00<00:00, 68548.72it/s]
100%|██████████| 153/153 [00:00<00:00, 56880.74it/s]
100%|██████████| 200/200 [00:00<00:00, 59940.04it/s]
100%|██████████| 65/65 [00:00<00:00, 58117.62it/s]
100%|██████████| 144/144 [00:00<00:00, 56478.38it/s]
100%|██████████| 30/30 [00:00<00:00, 48063.07it/s]
100%|██████████| 130/130 [00:00<00:00, 56981.87it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75432.47it/s]
100%|██████████| 203

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:34<00:00, 169.16it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77077.92it/s]
100%|██████████| 287/287 [00:00<00:00, 73521.36it/s]
100%|██████████| 771/771 [00:00<00:00, 76386.17it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91227.13it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79698.71it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85254.70it/s]
100%|██████████| 353/353 [00:00<00:00, 75263.79it/s]
100%|██████████| 252/252 [00:00<00:00, 75443.58it/s]
100%|██████████| 203/203 [00:00<00:00, 73961.41it/s]
100%|██████████| 153/153 [00:00<00:00, 70995.52it/s]
100%|██████████| 200/200 [00:00<00:00, 65296.24it/s]
100%|██████████| 65/65 [00:00<00:00, 52078.27it/s]
100%|██████████| 144/144 [00:00<00:00, 74879.71it/s]
100%|██████████| 30/30 [00:00<00:00, 64100.42it/s]
100%|██████████| 130/130 [00:00<00:00, 62933.92it/s]
100%|██████████| 3500/3500 [00:00<00:00, 70073.24it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 171.08it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77783.32it/s]
100%|██████████| 287/287 [00:00<00:00, 73328.78it/s]
100%|██████████| 771/771 [00:00<00:00, 76641.43it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81109.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77949.45it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80425.12it/s]
100%|██████████| 353/353 [00:00<00:00, 77254.86it/s]
100%|██████████| 252/252 [00:00<00:00, 76232.57it/s]
100%|██████████| 203/203 [00:00<00:00, 75215.88it/s]
100%|██████████| 153/153 [00:00<00:00, 73156.47it/s]
100%|██████████| 200/200 [00:00<00:00, 76643.29it/s]
100%|██████████| 65/65 [00:00<00:00, 68793.78it/s]
100%|██████████| 144/144 [00:00<00:00, 70989.63it/s]
100%|██████████| 30/30 [00:00<00:00, 57013.65it/s]
100%|██████████| 130/130 [00:00<00:00, 35422.56it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91105.26it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.01it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 84875.01it/s]
100%|██████████| 287/287 [00:00<00:00, 85610.22it/s]
100%|██████████| 771/771 [00:00<00:00, 89066.00it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90741.61it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76378.11it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80429.75it/s]
100%|██████████| 353/353 [00:00<00:00, 75367.23it/s]
100%|██████████| 252/252 [00:00<00:00, 75020.56it/s]
100%|██████████| 203/203 [00:00<00:00, 77643.96it/s]
100%|██████████| 153/153 [00:00<00:00, 75302.57it/s]
100%|██████████| 200/200 [00:00<00:00, 72215.98it/s]
100%|██████████| 65/65 [00:00<00:00, 55266.52it/s]
100%|██████████| 144/144 [00:00<00:00, 66738.10it/s]
100%|██████████| 30/30 [00:00<00:00, 58881.20it/s]
100%|██████████| 130/130 [00:00<00:00, 68285.48it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93417.32it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 171.29it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76488.38it/s]
100%|██████████| 287/287 [00:00<00:00, 77707.39it/s]
100%|██████████| 771/771 [00:00<00:00, 74668.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93226.44it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76457.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86513.79it/s]
100%|██████████| 353/353 [00:00<00:00, 74939.99it/s]
100%|██████████| 252/252 [00:00<00:00, 74470.84it/s]
100%|██████████| 203/203 [00:00<00:00, 75362.34it/s]
100%|██████████| 153/153 [00:00<00:00, 67479.34it/s]
100%|██████████| 200/200 [00:00<00:00, 62170.07it/s]
100%|██████████| 65/65 [00:00<00:00, 63773.04it/s]
100%|██████████| 144/144 [00:00<00:00, 55329.77it/s]
100%|██████████| 30/30 [00:00<00:00, 52714.34it/s]
100%|██████████| 130/130 [00:00<00:00, 75458.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77722.05it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.39it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76855.95it/s]
100%|██████████| 287/287 [00:00<00:00, 74954.25it/s]
100%|██████████| 771/771 [00:00<00:00, 75124.48it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82863.54it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77495.78it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90841.51it/s]
100%|██████████| 353/353 [00:00<00:00, 87216.62it/s]
100%|██████████| 252/252 [00:00<00:00, 74131.34it/s]
100%|██████████| 203/203 [00:00<00:00, 59181.46it/s]
100%|██████████| 153/153 [00:00<00:00, 66069.03it/s]
100%|██████████| 200/200 [00:00<00:00, 72843.07it/s]
100%|██████████| 65/65 [00:00<00:00, 62315.37it/s]
100%|██████████| 144/144 [00:00<00:00, 70814.84it/s]
100%|██████████| 30/30 [00:00<00:00, 61290.37it/s]
100%|██████████| 130/130 [00:00<00:00, 70365.15it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85557.13it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 170.98it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76912.38it/s]
100%|██████████| 287/287 [00:00<00:00, 74666.00it/s]
100%|██████████| 771/771 [00:00<00:00, 75782.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91524.73it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78257.78it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88115.01it/s]
100%|██████████| 353/353 [00:00<00:00, 51817.78it/s]
100%|██████████| 252/252 [00:00<00:00, 74834.65it/s]
100%|██████████| 203/203 [00:00<00:00, 79115.75it/s]
100%|██████████| 153/153 [00:00<00:00, 81489.33it/s]
100%|██████████| 200/200 [00:00<00:00, 54489.17it/s]
100%|██████████| 65/65 [00:00<00:00, 61045.62it/s]
100%|██████████| 144/144 [00:00<00:00, 71098.27it/s]
100%|██████████| 30/30 [00:00<00:00, 51170.85it/s]
100%|██████████| 130/130 [00:00<00:00, 62272.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78311.22it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.03it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77035.40it/s]
100%|██████████| 287/287 [00:00<00:00, 75485.37it/s]
100%|██████████| 771/771 [00:00<00:00, 92328.58it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92715.36it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79389.46it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88298.04it/s]
100%|██████████| 353/353 [00:00<00:00, 76726.40it/s]
100%|██████████| 252/252 [00:00<00:00, 76525.09it/s]
100%|██████████| 203/203 [00:00<00:00, 75731.01it/s]
100%|██████████| 153/153 [00:00<00:00, 66307.97it/s]
100%|██████████| 200/200 [00:00<00:00, 63961.94it/s]
100%|██████████| 65/65 [00:00<00:00, 63520.45it/s]
100%|██████████| 144/144 [00:00<00:00, 75506.91it/s]
100%|██████████| 30/30 [00:00<00:00, 54803.62it/s]
100%|██████████| 130/130 [00:00<00:00, 76174.84it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76622.29it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 171.16it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76133.98it/s]
100%|██████████| 287/287 [00:00<00:00, 74132.61it/s]
100%|██████████| 771/771 [00:00<00:00, 76400.60it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92630.39it/s]
100%|██████████| 1000/1000 [00:00<00:00, 56305.43it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85982.33it/s]
100%|██████████| 353/353 [00:00<00:00, 55467.33it/s]
100%|██████████| 252/252 [00:00<00:00, 53748.52it/s]
100%|██████████| 203/203 [00:00<00:00, 49419.22it/s]
100%|██████████| 153/153 [00:00<00:00, 53881.49it/s]
100%|██████████| 200/200 [00:00<00:00, 54127.04it/s]
100%|██████████| 65/65 [00:00<00:00, 52038.51it/s]
100%|██████████| 144/144 [00:00<00:00, 53950.85it/s]
100%|██████████| 30/30 [00:00<00:00, 48321.47it/s]
100%|██████████| 130/130 [00:00<00:00, 52881.34it/s]
100%|██████████| 3500/3500 [00:00<00:00, 59849.98it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.13it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75439.02it/s]
100%|██████████| 287/287 [00:00<00:00, 74800.55it/s]
100%|██████████| 771/771 [00:00<00:00, 73952.81it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87072.95it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77621.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88526.02it/s]
100%|██████████| 353/353 [00:00<00:00, 76252.22it/s]
100%|██████████| 252/252 [00:00<00:00, 74808.17it/s]
100%|██████████| 203/203 [00:00<00:00, 69347.10it/s]
100%|██████████| 153/153 [00:00<00:00, 83984.89it/s]
100%|██████████| 200/200 [00:00<00:00, 88815.33it/s]
100%|██████████| 65/65 [00:00<00:00, 64696.19it/s]
100%|██████████| 144/144 [00:00<00:00, 70018.52it/s]
100%|██████████| 30/30 [00:00<00:00, 54779.76it/s]
100%|██████████| 130/130 [00:00<00:00, 67075.84it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89981.70it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 170.83it/s]
INFO:root:The new embedding has 5843 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 78079.00it/s]
100%|██████████| 287/287 [00:00<00:00, 74014.10it/s]
100%|██████████| 771/771 [00:00<00:00, 72246.12it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79982.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77655.04it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91107.90it/s]
100%|██████████| 353/353 [00:00<00:00, 76782.10it/s]
100%|██████████| 252/252 [00:00<00:00, 78166.29it/s]
100%|██████████| 203/203 [00:00<00:00, 72897.58it/s]
100%|██████████| 153/153 [00:00<00:00, 69047.61it/s]
100%|██████████| 200/200 [00:00<00:00, 68450.49it/s]
100%|██████████| 65/65 [00:00<00:00, 63609.37it/s]
100%|██████████| 144/144 [00:00<00:00, 76734.82it/s]
100%|██████████| 30/30 [00:00<00:00, 52254.62it/s]
100%|██████████| 130/130 [00:00<00:00, 74448.32it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89856.12it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.33it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81140.78it/s]
100%|██████████| 287/287 [00:00<00:00, 79111.81it/s]
100%|██████████| 771/771 [00:00<00:00, 81408.97it/s]
100%|██████████| 2000/2000 [00:00<00:00, 97031.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81168.56it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91535.39it/s]
100%|██████████| 353/353 [00:00<00:00, 79142.04it/s]
100%|██████████| 252/252 [00:00<00:00, 78357.52it/s]
100%|██████████| 203/203 [00:00<00:00, 76069.30it/s]
100%|██████████| 153/153 [00:00<00:00, 78059.67it/s]
100%|██████████| 200/200 [00:00<00:00, 79648.77it/s]
100%|██████████| 65/65 [00:00<00:00, 47554.47it/s]
100%|██████████| 144/144 [00:00<00:00, 79148.18it/s]
100%|██████████| 30/30 [00:00<00:00, 70138.86it/s]
100%|██████████| 130/130 [00:00<00:00, 78207.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 102108.69it/s]
100%|██████████| 20

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 170.94it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81443.59it/s]
100%|██████████| 287/287 [00:00<00:00, 78899.21it/s]
100%|██████████| 771/771 [00:00<00:00, 81343.44it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81762.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80247.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82535.25it/s]
100%|██████████| 353/353 [00:00<00:00, 78876.42it/s]
100%|██████████| 252/252 [00:00<00:00, 80054.88it/s]
100%|██████████| 203/203 [00:00<00:00, 80697.92it/s]
100%|██████████| 153/153 [00:00<00:00, 76432.65it/s]
100%|██████████| 200/200 [00:00<00:00, 76903.26it/s]
100%|██████████| 65/65 [00:00<00:00, 69318.53it/s]
100%|██████████| 144/144 [00:00<00:00, 76163.91it/s]
100%|██████████| 30/30 [00:00<00:00, 56173.71it/s]
100%|██████████| 130/130 [00:00<00:00, 73584.28it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85513.28it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.28it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79406.26it/s]
100%|██████████| 287/287 [00:00<00:00, 78303.86it/s]
100%|██████████| 771/771 [00:00<00:00, 80716.06it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82306.62it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82000.08it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92411.33it/s]
100%|██████████| 353/353 [00:00<00:00, 78926.88it/s]
100%|██████████| 252/252 [00:00<00:00, 79704.74it/s]
100%|██████████| 203/203 [00:00<00:00, 81353.31it/s]
100%|██████████| 153/153 [00:00<00:00, 78884.88it/s]
100%|██████████| 200/200 [00:00<00:00, 69980.88it/s]
100%|██████████| 65/65 [00:00<00:00, 68379.67it/s]
100%|██████████| 144/144 [00:00<00:00, 77097.24it/s]
100%|██████████| 30/30 [00:00<00:00, 67468.70it/s]
100%|██████████| 130/130 [00:00<00:00, 74519.55it/s]
100%|██████████| 3500/3500 [00:00<00:00, 99918.08it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.96it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79175.20it/s]
100%|██████████| 287/287 [00:00<00:00, 77878.32it/s]
100%|██████████| 771/771 [00:00<00:00, 79370.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77998.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81199.98it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76834.23it/s]
100%|██████████| 353/353 [00:00<00:00, 80305.33it/s]
100%|██████████| 252/252 [00:00<00:00, 77410.62it/s]
100%|██████████| 203/203 [00:00<00:00, 68493.58it/s]
100%|██████████| 153/153 [00:00<00:00, 73508.42it/s]
100%|██████████| 200/200 [00:00<00:00, 75288.17it/s]
100%|██████████| 65/65 [00:00<00:00, 64850.09it/s]
100%|██████████| 144/144 [00:00<00:00, 74473.46it/s]
100%|██████████| 30/30 [00:00<00:00, 61711.19it/s]
100%|██████████| 130/130 [00:00<00:00, 77683.36it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75343.81it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.10it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80675.22it/s]
100%|██████████| 287/287 [00:00<00:00, 77482.32it/s]
100%|██████████| 771/771 [00:00<00:00, 81791.95it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83379.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79937.18it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91149.48it/s]
100%|██████████| 353/353 [00:00<00:00, 78658.52it/s]
100%|██████████| 252/252 [00:00<00:00, 80006.40it/s]
100%|██████████| 203/203 [00:00<00:00, 78983.65it/s]
100%|██████████| 153/153 [00:00<00:00, 70419.02it/s]
100%|██████████| 200/200 [00:00<00:00, 77392.82it/s]
100%|██████████| 65/65 [00:00<00:00, 38605.18it/s]
100%|██████████| 144/144 [00:00<00:00, 74436.75it/s]
100%|██████████| 30/30 [00:00<00:00, 51316.93it/s]
100%|██████████| 130/130 [00:00<00:00, 74356.95it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77879.15it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 170.99it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80296.45it/s]
100%|██████████| 287/287 [00:00<00:00, 78837.20it/s]
100%|██████████| 771/771 [00:00<00:00, 82634.24it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96847.13it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79556.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87664.42it/s]
100%|██████████| 353/353 [00:00<00:00, 79256.43it/s]
100%|██████████| 252/252 [00:00<00:00, 80444.83it/s]
100%|██████████| 203/203 [00:00<00:00, 76831.23it/s]
100%|██████████| 153/153 [00:00<00:00, 75953.19it/s]
100%|██████████| 200/200 [00:00<00:00, 75281.41it/s]
100%|██████████| 65/65 [00:00<00:00, 64927.31it/s]
100%|██████████| 144/144 [00:00<00:00, 66723.35it/s]
100%|██████████| 30/30 [00:00<00:00, 46500.04it/s]
100%|██████████| 130/130 [00:00<00:00, 71247.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 104832.14it/s]
100%|██████████| 20

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:26<00:00, 219.94it/s]
INFO:root:The new embedding has 5846 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 78398.94it/s]
100%|██████████| 287/287 [00:00<00:00, 75164.86it/s]
100%|██████████| 771/771 [00:00<00:00, 77930.60it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87165.24it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77974.08it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87197.85it/s]
100%|██████████| 353/353 [00:00<00:00, 77966.79it/s]
100%|██████████| 252/252 [00:00<00:00, 78444.75it/s]
100%|██████████| 203/203 [00:00<00:00, 79410.90it/s]
100%|██████████| 153/153 [00:00<00:00, 72799.60it/s]
100%|██████████| 200/200 [00:00<00:00, 70927.61it/s]
100%|██████████| 65/65 [00:00<00:00, 61806.79it/s]
100%|██████████| 144/144 [00:00<00:00, 72759.88it/s]
100%|██████████| 30/30 [00:00<00:00, 54565.97it/s]
100%|██████████| 130/130 [00:00<00:00, 63424.39it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85483.90it/s]
100%|██████████| 2034

100%|██████████| 130/130 [00:00<00:00, 76538.39it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90357.20it/s]
100%|██████████| 2034/2034 [00:00<00:00, 69177.80it/s]
  0%|          | 0/5846 [00:00<?, ?it/s]

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 176.01it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76028.99it/s]
100%|██████████| 287/287 [00:00<00:00, 74619.72it/s]
100%|██████████| 771/771 [00:00<00:00, 78292.86it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86849.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78948.63it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83047.85it/s]
100%|██████████| 353/353 [00:00<00:00, 72917.47it/s]
100%|██████████| 252/252 [00:00<00:00, 78602.26it/s]
100%|██████████| 203/203 [00:00<00:00, 73406.65it/s]
100%|██████████| 153/153 [00:00<00:00, 72331.89it/s]
100%|██████████| 200/200 [00:00<00:00, 74631.74it/s]
100%|██████████| 65/65 [00:00<00:00, 72915.15it/s]
100%|██████████| 144/144 [00:00<00:00, 71409.29it/s]
100%|██████████| 30/30 [00:00<00:00, 56884.77it/s]
100%|██████████| 130/130 [00:00<00:00, 70721.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87654.73it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 173.49it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 75082.15it/s]
100%|██████████| 287/287 [00:00<00:00, 75937.75it/s]
100%|██████████| 771/771 [00:00<00:00, 76909.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81928.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82656.16it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74387.76it/s]
100%|██████████| 353/353 [00:00<00:00, 77412.39it/s]
100%|██████████| 252/252 [00:00<00:00, 75271.66it/s]
100%|██████████| 203/203 [00:00<00:00, 70729.67it/s]
100%|██████████| 153/153 [00:00<00:00, 69518.85it/s]
100%|██████████| 200/200 [00:00<00:00, 74202.64it/s]
100%|██████████| 65/65 [00:00<00:00, 58092.85it/s]
100%|██████████| 144/144 [00:00<00:00, 76269.70it/s]
100%|██████████| 30/30 [00:00<00:00, 59549.99it/s]
100%|██████████| 130/130 [00:00<00:00, 69619.45it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78364.73it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 175.50it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77692.46it/s]
100%|██████████| 287/287 [00:00<00:00, 86038.54it/s]
100%|██████████| 771/771 [00:00<00:00, 79060.42it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87482.48it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78844.75it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82147.83it/s]
100%|██████████| 353/353 [00:00<00:00, 77529.94it/s]
100%|██████████| 252/252 [00:00<00:00, 75991.42it/s]
100%|██████████| 203/203 [00:00<00:00, 77333.67it/s]
100%|██████████| 153/153 [00:00<00:00, 70776.28it/s]
100%|██████████| 200/200 [00:00<00:00, 75288.17it/s]
100%|██████████| 65/65 [00:00<00:00, 74023.83it/s]
100%|██████████| 144/144 [00:00<00:00, 75610.89it/s]
100%|██████████| 30/30 [00:00<00:00, 66225.85it/s]
100%|██████████| 130/130 [00:00<00:00, 66454.54it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86847.84it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 174.38it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77181.56it/s]
100%|██████████| 287/287 [00:00<00:00, 73877.82it/s]
100%|██████████| 771/771 [00:00<00:00, 78391.55it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86004.37it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75480.56it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84547.24it/s]
100%|██████████| 353/353 [00:00<00:00, 78868.02it/s]
100%|██████████| 252/252 [00:00<00:00, 79102.28it/s]
100%|██████████| 203/203 [00:00<00:00, 65035.42it/s]
100%|██████████| 153/153 [00:00<00:00, 71358.67it/s]
100%|██████████| 200/200 [00:00<00:00, 64468.24it/s]
100%|██████████| 65/65 [00:00<00:00, 62832.39it/s]
100%|██████████| 144/144 [00:00<00:00, 70881.33it/s]
100%|██████████| 30/30 [00:00<00:00, 50635.46it/s]
100%|██████████| 130/130 [00:00<00:00, 73277.72it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93120.43it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 171.97it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76892.62it/s]
100%|██████████| 287/287 [00:00<00:00, 74605.84it/s]
100%|██████████| 771/771 [00:00<00:00, 76814.38it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87902.34it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77520.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82844.99it/s]
100%|██████████| 353/353 [00:00<00:00, 76267.93it/s]
100%|██████████| 252/252 [00:00<00:00, 76491.87it/s]
100%|██████████| 203/203 [00:00<00:00, 76103.30it/s]
100%|██████████| 153/153 [00:00<00:00, 74584.90it/s]
100%|██████████| 200/200 [00:00<00:00, 72565.81it/s]
100%|██████████| 65/65 [00:00<00:00, 65693.92it/s]
100%|██████████| 144/144 [00:00<00:00, 76048.83it/s]
100%|██████████| 30/30 [00:00<00:00, 59747.92it/s]
100%|██████████| 130/130 [00:00<00:00, 44980.99it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87622.82it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 173.53it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77403.98it/s]
100%|██████████| 287/287 [00:00<00:00, 79936.60it/s]
100%|██████████| 771/771 [00:00<00:00, 76614.19it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88030.56it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78269.46it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82221.91it/s]
100%|██████████| 353/353 [00:00<00:00, 75939.34it/s]
100%|██████████| 252/252 [00:00<00:00, 75223.44it/s]
100%|██████████| 203/203 [00:00<00:00, 75362.34it/s]
100%|██████████| 153/153 [00:00<00:00, 71176.63it/s]
100%|██████████| 200/200 [00:00<00:00, 73817.39it/s]
100%|██████████| 65/65 [00:00<00:00, 67150.19it/s]
100%|██████████| 144/144 [00:00<00:00, 70246.54it/s]
100%|██████████| 30/30 [00:00<00:00, 62260.82it/s]
100%|██████████| 130/130 [00:00<00:00, 70238.25it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91546.14it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 174.63it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76541.47it/s]
100%|██████████| 287/287 [00:00<00:00, 80379.62it/s]
100%|██████████| 771/771 [00:00<00:00, 72728.69it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88767.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73504.33it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80807.32it/s]
100%|██████████| 353/353 [00:00<00:00, 70160.13it/s]
100%|██████████| 252/252 [00:00<00:00, 74032.68it/s]
100%|██████████| 203/203 [00:00<00:00, 71760.95it/s]
100%|██████████| 153/153 [00:00<00:00, 72169.20it/s]
100%|██████████| 200/200 [00:00<00:00, 71906.46it/s]
100%|██████████| 65/65 [00:00<00:00, 71990.96it/s]
100%|██████████| 144/144 [00:00<00:00, 64465.77it/s]
100%|██████████| 30/30 [00:00<00:00, 61380.06it/s]
100%|██████████| 130/130 [00:00<00:00, 58167.22it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88637.56it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 174.09it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76556.85it/s]
100%|██████████| 287/287 [00:00<00:00, 75551.70it/s]
100%|██████████| 771/771 [00:00<00:00, 78130.19it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86875.46it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78508.26it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81767.22it/s]
100%|██████████| 353/353 [00:00<00:00, 75648.34it/s]
100%|██████████| 252/252 [00:00<00:00, 77507.12it/s]
100%|██████████| 203/203 [00:00<00:00, 74264.61it/s]
100%|██████████| 153/153 [00:00<00:00, 74550.25it/s]
100%|██████████| 200/200 [00:00<00:00, 74985.32it/s]
100%|██████████| 65/65 [00:00<00:00, 75146.02it/s]
100%|██████████| 144/144 [00:00<00:00, 78063.82it/s]
100%|██████████| 30/30 [00:00<00:00, 59269.49it/s]
100%|██████████| 130/130 [00:00<00:00, 76581.39it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90724.64it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 175.58it/s]
INFO:root:The new embedding has 5818 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77848.35it/s]
100%|██████████| 287/287 [00:00<00:00, 74930.92it/s]
100%|██████████| 771/771 [00:00<00:00, 77825.58it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84219.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76360.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80665.38it/s]
100%|██████████| 353/353 [00:00<00:00, 76001.71it/s]
100%|██████████| 252/252 [00:00<00:00, 74649.67it/s]
100%|██████████| 203/203 [00:00<00:00, 77193.45it/s]
100%|██████████| 153/153 [00:00<00:00, 76070.24it/s]
100%|██████████| 200/200 [00:00<00:00, 75072.56it/s]
100%|██████████| 65/65 [00:00<00:00, 66220.49it/s]
100%|██████████| 144/144 [00:00<00:00, 70947.94it/s]
100%|██████████| 30/30 [00:00<00:00, 57772.78it/s]
100%|██████████| 130/130 [00:00<00:00, 76238.75it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88894.12it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 172.59it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80095.38it/s]
100%|██████████| 287/287 [00:00<00:00, 79215.93it/s]
100%|██████████| 771/771 [00:00<00:00, 80541.17it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76747.07it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80874.32it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77511.05it/s]
100%|██████████| 353/353 [00:00<00:00, 78246.98it/s]
100%|██████████| 252/252 [00:00<00:00, 77184.50it/s]
100%|██████████| 203/203 [00:00<00:00, 78452.38it/s]
100%|██████████| 153/153 [00:00<00:00, 79698.03it/s]
100%|██████████| 200/200 [00:00<00:00, 75976.89it/s]
100%|██████████| 65/65 [00:00<00:00, 75146.02it/s]
100%|██████████| 144/144 [00:00<00:00, 76443.46it/s]
100%|██████████| 30/30 [00:00<00:00, 69365.56it/s]
100%|██████████| 130/130 [00:00<00:00, 75166.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93937.38it/s]
100%|██████████| 203

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 175.91it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81540.27it/s]
100%|██████████| 287/287 [00:00<00:00, 79941.91it/s]
100%|██████████| 771/771 [00:00<00:00, 80859.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82031.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82289.66it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82569.37it/s]
100%|██████████| 353/353 [00:00<00:00, 80813.78it/s]
100%|██████████| 252/252 [00:00<00:00, 80103.42it/s]
100%|██████████| 203/203 [00:00<00:00, 79760.54it/s]
100%|██████████| 153/153 [00:00<00:00, 79412.02it/s]
100%|██████████| 200/200 [00:00<00:00, 79845.88it/s]
100%|██████████| 65/65 [00:00<00:00, 75920.29it/s]
100%|██████████| 144/144 [00:00<00:00, 77274.79it/s]
100%|██████████| 30/30 [00:00<00:00, 69136.88it/s]
100%|██████████| 130/130 [00:00<00:00, 75541.63it/s]
100%|██████████| 3500/3500 [00:00<00:00, 96263.35it/s]
100%|██████████| 203

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 173.30it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80982.39it/s]
100%|██████████| 287/287 [00:00<00:00, 78795.92it/s]
100%|██████████| 771/771 [00:00<00:00, 79858.95it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84031.45it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81579.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84487.06it/s]
100%|██████████| 353/353 [00:00<00:00, 79053.30it/s]
100%|██████████| 252/252 [00:00<00:00, 81549.62it/s]
100%|██████████| 203/203 [00:00<00:00, 77277.52it/s]
100%|██████████| 153/153 [00:00<00:00, 74567.57it/s]
100%|██████████| 200/200 [00:00<00:00, 75963.13it/s]
100%|██████████| 65/65 [00:00<00:00, 70156.91it/s]
100%|██████████| 144/144 [00:00<00:00, 74991.28it/s]
100%|██████████| 30/30 [00:00<00:00, 55480.21it/s]
100%|██████████| 130/130 [00:00<00:00, 64650.17it/s]
100%|██████████| 3500/3500 [00:00<00:00, 96907.71it/s]
100%|██████████| 203

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 176.10it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78955.88it/s]
100%|██████████| 287/287 [00:00<00:00, 77278.38it/s]
100%|██████████| 771/771 [00:00<00:00, 79931.99it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80438.49it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80942.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79749.73it/s]
100%|██████████| 353/353 [00:00<00:00, 77287.12it/s]
100%|██████████| 252/252 [00:00<00:00, 77518.49it/s]
100%|██████████| 203/203 [00:00<00:00, 76035.34it/s]
100%|██████████| 153/153 [00:00<00:00, 79274.68it/s]
100%|██████████| 200/200 [00:00<00:00, 79460.15it/s]
100%|██████████| 65/65 [00:00<00:00, 78341.89it/s]
100%|██████████| 144/144 [00:00<00:00, 80908.21it/s]
100%|██████████| 30/30 [00:00<00:00, 64693.63it/s]
100%|██████████| 130/130 [00:00<00:00, 68004.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75535.33it/s]
100%|██████████| 203

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 172.27it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80098.44it/s]
100%|██████████| 287/287 [00:00<00:00, 76878.61it/s]
100%|██████████| 771/771 [00:00<00:00, 80247.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78942.69it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80996.14it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80875.36it/s]
100%|██████████| 353/353 [00:00<00:00, 77603.09it/s]
100%|██████████| 252/252 [00:00<00:00, 77832.45it/s]
100%|██████████| 203/203 [00:00<00:00, 75455.84it/s]
100%|██████████| 153/153 [00:00<00:00, 75666.61it/s]
100%|██████████| 200/200 [00:00<00:00, 75566.24it/s]
100%|██████████| 65/65 [00:00<00:00, 67067.59it/s]
100%|██████████| 144/144 [00:00<00:00, 51950.78it/s]
100%|██████████| 30/30 [00:00<00:00, 50291.41it/s]
100%|██████████| 130/130 [00:00<00:00, 72344.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 97271.79it/s]
100%|██████████| 203

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:33<00:00, 174.97it/s]
INFO:root:The new embedding has 5818 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 50905.21it/s]
100%|██████████| 287/287 [00:00<00:00, 57787.20it/s]
100%|██████████| 771/771 [00:00<00:00, 58002.41it/s]
100%|██████████| 2000/2000 [00:00<00:00, 98958.44it/s]
100%|██████████| 1000/1000 [00:00<00:00, 58528.98it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88765.83it/s]
100%|██████████| 353/353 [00:00<00:00, 57810.68it/s]
100%|██████████| 252/252 [00:00<00:00, 58004.86it/s]
100%|██████████| 203/203 [00:00<00:00, 58012.11it/s]
100%|██████████| 153/153 [00:00<00:00, 52025.01it/s]
100%|██████████| 200/200 [00:00<00:00, 92355.04it/s]
100%|██████████| 65/65 [00:00<00:00, 69887.15it/s]
100%|██████████| 144/144 [00:00<00:00, 80231.11it/s]
100%|██████████| 30/30 [00:00<00:00, 55849.59it/s]
100%|██████████| 130/130 [00:00<00:00, 79137.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 95426.09it/s]
100%|██████████| 203

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['secluding' 'isolate']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:18<00:00, 307.70it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 74400.90it/s]
100%|██████████| 287/287 [00:00<00:00, 75561.19it/s]
100%|██████████| 771/771 [00:00<00:00, 88319.22it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77011.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77949.45it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78660.90it/s]
100%|██████████| 353/353 [00:00<00:00, 67864.02it/s]
100%|██████████| 252/252 [00:00<00:00, 75405.91it/s]
100%|██████████| 203/203 [00:00<00:00, 77319.63it/s]
100%|██████████| 153/153 [00:00<00:00, 78817.06it/s]
100%|██████████| 200/200 [00:00<00:00, 75328.74it/s]
100%|██████████| 65/65 [00:00<00:00, 75499.80it/s]
100%|██████████| 144/144 [00:00<00:00, 78327.04it/s]
100%|██████████| 30/30 [00:00<00:00, 67722.88it/s]
100%|██████████| 130/130 [00:00<00:00, 74407.69it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91081.52it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:11<00:00, 488.16it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 77119.06it/s]
100%|██████████| 287/287 [00:00<00:00, 74283.57it/s]
100%|██████████| 771/771 [00:00<00:00, 73012.77it/s]
100%|██████████| 2000/2000 [00:00<00:00, 98424.34it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82325.19it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75238.20it/s]
100%|██████████| 353/353 [00:00<00:00, 75880.96it/s]
100%|██████████| 252/252 [00:00<00:00, 85026.52it/s]
100%|██████████| 203/203 [00:00<00:00, 91780.07it/s]
100%|██████████| 153/153 [00:00<00:00, 74689.07it/s]
100%|██████████| 200/200 [00:00<00:00, 74958.52it/s]
100%|██████████| 65/65 [00:00<00:00, 75353.72it/s]
100%|██████████| 144/144 [00:00<00:00, 67756.31it/s]
100%|██████████| 30/30 [00:00<00:00, 62883.12it/s]
100%|██████████| 130/130 [00:00<00:00, 70265.40it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82078.94it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:13<00:00, 436.60it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 75791.08it/s]
100%|██████████| 287/287 [00:00<00:00, 70210.86it/s]
100%|██████████| 771/771 [00:00<00:00, 73597.68it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96406.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75727.23it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91962.87it/s]
100%|██████████| 353/353 [00:00<00:00, 75764.47it/s]
100%|██████████| 252/252 [00:00<00:00, 73507.52it/s]
100%|██████████| 203/203 [00:00<00:00, 67005.88it/s]
100%|██████████| 153/153 [00:00<00:00, 73181.49it/s]
100%|██████████| 200/200 [00:00<00:00, 74831.47it/s]
100%|██████████| 65/65 [00:00<00:00, 30931.45it/s]
100%|██████████| 144/144 [00:00<00:00, 49088.08it/s]
100%|██████████| 30/30 [00:00<00:00, 54875.32it/s]
100%|██████████| 130/130 [00:00<00:00, 77894.22it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73275.02it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 465.73it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 79734.16it/s]
100%|██████████| 287/287 [00:00<00:00, 73485.46it/s]
100%|██████████| 771/771 [00:00<00:00, 76825.32it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77568.15it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85580.58it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77606.19it/s]
100%|██████████| 353/353 [00:00<00:00, 82904.38it/s]
100%|██████████| 252/252 [00:00<00:00, 74032.68it/s]
100%|██████████| 203/203 [00:00<00:00, 79196.70it/s]
100%|██████████| 153/153 [00:00<00:00, 74386.06it/s]
100%|██████████| 200/200 [00:00<00:00, 78508.26it/s]
100%|██████████| 65/65 [00:00<00:00, 75835.82it/s]
100%|██████████| 144/144 [00:00<00:00, 77453.16it/s]
100%|██████████| 30/30 [00:00<00:00, 69327.34it/s]
100%|██████████| 130/130 [00:00<00:00, 74367.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84305.68it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 474.66it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 77371.11it/s]
100%|██████████| 287/287 [00:00<00:00, 45890.94it/s]
100%|██████████| 771/771 [00:00<00:00, 48191.71it/s]
100%|██████████| 2000/2000 [00:00<00:00, 63038.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77884.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74690.66it/s]
100%|██████████| 353/353 [00:00<00:00, 81310.85it/s]
100%|██████████| 252/252 [00:00<00:00, 77145.07it/s]
100%|██████████| 203/203 [00:00<00:00, 77326.65it/s]
100%|██████████| 153/153 [00:00<00:00, 77908.04it/s]
100%|██████████| 200/200 [00:00<00:00, 78810.67it/s]
100%|██████████| 65/65 [00:00<00:00, 74306.29it/s]
100%|██████████| 144/144 [00:00<00:00, 75488.04it/s]
100%|██████████| 30/30 [00:00<00:00, 64826.96it/s]
100%|██████████| 130/130 [00:00<00:00, 72181.56it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90521.01it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 474.15it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 78010.68it/s]
100%|██████████| 287/287 [00:00<00:00, 80186.87it/s]
100%|██████████| 771/771 [00:00<00:00, 80293.19it/s]
100%|██████████| 2000/2000 [00:00<00:00, 73875.90it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72843.07it/s]
100%|██████████| 3000/3000 [00:00<00:00, 97989.36it/s]
100%|██████████| 353/353 [00:00<00:00, 73797.01it/s]
100%|██████████| 252/252 [00:00<00:00, 75573.05it/s]
100%|██████████| 203/203 [00:00<00:00, 57980.50it/s]
100%|██████████| 153/153 [00:00<00:00, 55778.23it/s]
100%|██████████| 200/200 [00:00<00:00, 77335.74it/s]
100%|██████████| 65/65 [00:00<00:00, 61583.41it/s]
100%|██████████| 144/144 [00:00<00:00, 76317.89it/s]
100%|██████████| 30/30 [00:00<00:00, 59325.37it/s]
100%|██████████| 130/130 [00:00<00:00, 76581.39it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85285.74it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 465.87it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 75883.04it/s]
100%|██████████| 287/287 [00:00<00:00, 72533.46it/s]
100%|██████████| 771/771 [00:00<00:00, 85875.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77538.76it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76782.19it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77031.32it/s]
100%|██████████| 353/353 [00:00<00:00, 69872.08it/s]
100%|██████████| 252/252 [00:00<00:00, 77128.18it/s]
100%|██████████| 203/203 [00:00<00:00, 75731.01it/s]
100%|██████████| 153/153 [00:00<00:00, 74602.25it/s]
100%|██████████| 200/200 [00:00<00:00, 73243.76it/s]
100%|██████████| 65/65 [00:00<00:00, 66284.89it/s]
100%|██████████| 144/144 [00:00<00:00, 71680.49it/s]
100%|██████████| 30/30 [00:00<00:00, 47411.12it/s]
100%|██████████| 130/130 [00:00<00:00, 71322.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89787.97it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:11<00:00, 489.70it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 74036.75it/s]
100%|██████████| 287/287 [00:00<00:00, 77036.05it/s]
100%|██████████| 771/771 [00:00<00:00, 85095.74it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78268.00it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78011.79it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98410.10it/s]
100%|██████████| 353/353 [00:00<00:00, 76619.19it/s]
100%|██████████| 252/252 [00:00<00:00, 69660.88it/s]
100%|██████████| 203/203 [00:00<00:00, 63102.62it/s]
100%|██████████| 153/153 [00:00<00:00, 58884.98it/s]
100%|██████████| 200/200 [00:00<00:00, 75471.06it/s]
100%|██████████| 65/65 [00:00<00:00, 73386.21it/s]
100%|██████████| 144/144 [00:00<00:00, 76029.68it/s]
100%|██████████| 30/30 [00:00<00:00, 67979.00it/s]
100%|██████████| 130/130 [00:00<00:00, 76818.75it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77913.04it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 471.91it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 79075.09it/s]
100%|██████████| 287/287 [00:00<00:00, 75057.07it/s]
100%|██████████| 771/771 [00:00<00:00, 89181.45it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78259.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79413.51it/s]
100%|██████████| 3000/3000 [00:00<00:00, 99145.18it/s]
100%|██████████| 353/353 [00:00<00:00, 76516.24it/s]
100%|██████████| 252/252 [00:00<00:00, 74776.41it/s]
100%|██████████| 203/203 [00:00<00:00, 62546.37it/s]
100%|██████████| 153/153 [00:00<00:00, 60643.41it/s]
100%|██████████| 200/200 [00:00<00:00, 69025.00it/s]
100%|██████████| 65/65 [00:00<00:00, 66156.21it/s]
100%|██████████| 144/144 [00:00<00:00, 72384.92it/s]
100%|██████████| 30/30 [00:00<00:00, 73670.44it/s]
100%|██████████| 130/130 [00:00<00:00, 67274.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72964.00it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:12<00:00, 486.38it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 77104.87it/s]
100%|██████████| 287/287 [00:00<00:00, 74444.36it/s]
100%|██████████| 771/771 [00:00<00:00, 74185.23it/s]
100%|██████████| 2000/2000 [00:00<00:00, 97797.82it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80018.01it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74317.46it/s]
100%|██████████| 353/353 [00:00<00:00, 67941.87it/s]
100%|██████████| 252/252 [00:00<00:00, 73800.07it/s]
100%|██████████| 203/203 [00:00<00:00, 75129.60it/s]
100%|██████████| 153/153 [00:00<00:00, 74437.83it/s]
100%|██████████| 200/200 [00:00<00:00, 78186.30it/s]
100%|██████████| 65/65 [00:00<00:00, 65996.07it/s]
100%|██████████| 144/144 [00:00<00:00, 76356.48it/s]
100%|██████████| 30/30 [00:00<00:00, 62977.54it/s]
100%|██████████| 130/130 [00:00<00:00, 72334.77it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86396.52it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:27<00:00, 209.52it/s]
INFO:root:The new embedding has 5813 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77015.58it/s]
100%|██████████| 287/287 [00:00<00:00, 68438.53it/s]
100%|██████████| 771/771 [00:00<00:00, 88406.15it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76152.77it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79179.64it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95162.88it/s]
100%|██████████| 353/353 [00:00<00:00, 74879.35it/s]
100%|██████████| 252/252 [00:00<00:00, 67002.51it/s]
100%|██████████| 203/203 [00:00<00:00, 66085.35it/s]
100%|██████████| 153/153 [00:00<00:00, 69647.11it/s]
100%|██████████| 200/200 [00:00<00:00, 73429.69it/s]
100%|██████████| 65/65 [00:00<00:00, 69406.76it/s]
100%|██████████| 144/144 [00:00<00:00, 71671.98it/s]
100%|██████████| 30/30 [00:00<00:00, 64893.82it/s]
100%|██████████| 130/130 [00:00<00:00, 74064.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71040.02it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 220.68it/s]
INFO:root:The new embedding has 5813 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76120.15it/s]
100%|██████████| 287/287 [00:00<00:00, 67362.35it/s]
100%|██████████| 771/771 [00:00<00:00, 87513.76it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75942.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76963.94it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93040.66it/s]
100%|██████████| 353/353 [00:00<00:00, 76453.03it/s]
100%|██████████| 252/252 [00:00<00:00, 74602.25it/s]
100%|██████████| 203/203 [00:00<00:00, 54035.90it/s]
100%|██████████| 153/153 [00:00<00:00, 61000.81it/s]
100%|██████████| 200/200 [00:00<00:00, 76170.05it/s]
100%|██████████| 65/65 [00:00<00:00, 72200.68it/s]
100%|██████████| 144/144 [00:00<00:00, 71910.92it/s]
100%|██████████| 30/30 [00:00<00:00, 49656.32it/s]
100%|██████████| 130/130 [00:00<00:00, 71182.70it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78470.29it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:27<00:00, 216.33it/s]
INFO:root:The new embedding has 5813 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76174.12it/s]
100%|██████████| 287/287 [00:00<00:00, 68932.33it/s]
100%|██████████| 771/771 [00:00<00:00, 80064.58it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74732.14it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81166.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93300.06it/s]
100%|██████████| 353/353 [00:00<00:00, 75594.27it/s]
100%|██████████| 252/252 [00:00<00:00, 68540.60it/s]
100%|██████████| 203/203 [00:00<00:00, 60198.23it/s]
100%|██████████| 153/153 [00:00<00:00, 62321.89it/s]
100%|██████████| 200/200 [00:00<00:00, 72817.78it/s]
100%|██████████| 65/65 [00:00<00:00, 70647.77it/s]
100%|██████████| 144/144 [00:00<00:00, 70773.35it/s]
100%|██████████| 30/30 [00:00<00:00, 32472.03it/s]
100%|██████████| 130/130 [00:00<00:00, 54960.14it/s]
100%|██████████| 3500/3500 [00:00<00:00, 69074.20it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 221.89it/s]
INFO:root:The new embedding has 5813 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76889.80it/s]
100%|██████████| 287/287 [00:00<00:00, 71969.70it/s]
100%|██████████| 771/771 [00:00<00:00, 73164.74it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85831.01it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77385.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93213.66it/s]
100%|██████████| 353/353 [00:00<00:00, 77384.06it/s]
100%|██████████| 252/252 [00:00<00:00, 74423.65it/s]
100%|██████████| 203/203 [00:00<00:00, 74361.90it/s]
100%|██████████| 153/153 [00:00<00:00, 75497.47it/s]
100%|██████████| 200/200 [00:00<00:00, 76875.07it/s]
100%|██████████| 65/65 [00:00<00:00, 72817.78it/s]
100%|██████████| 144/144 [00:00<00:00, 52049.27it/s]
100%|██████████| 30/30 [00:00<00:00, 59521.82it/s]
100%|██████████| 130/130 [00:00<00:00, 69967.86it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85034.78it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 218.72it/s]
INFO:root:The new embedding has 5813 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77459.79it/s]
100%|██████████| 287/287 [00:00<00:00, 80293.84it/s]
100%|██████████| 771/771 [00:00<00:00, 74570.13it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76100.95it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79396.98it/s]
100%|██████████| 3000/3000 [00:00<00:00, 94555.75it/s]
100%|██████████| 353/353 [00:00<00:00, 76091.55it/s]
100%|██████████| 252/252 [00:00<00:00, 77274.79it/s]
100%|██████████| 203/203 [00:00<00:00, 64391.11it/s]
100%|██████████| 153/153 [00:00<00:00, 55488.85it/s]
100%|██████████| 200/200 [00:00<00:00, 66444.42it/s]
100%|██████████| 65/65 [00:00<00:00, 66446.44it/s]
100%|██████████| 144/144 [00:00<00:00, 72272.32it/s]
100%|██████████| 30/30 [00:00<00:00, 60845.80it/s]
100%|██████████| 130/130 [00:00<00:00, 71210.59it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83522.40it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 220.94it/s]
INFO:root:The new embedding has 5813 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77692.46it/s]
100%|██████████| 287/287 [00:00<00:00, 68578.89it/s]
100%|██████████| 771/771 [00:00<00:00, 70772.51it/s]
100%|██████████| 2000/2000 [00:00<00:00, 98529.54it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76978.07it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89671.70it/s]
100%|██████████| 353/353 [00:00<00:00, 76571.64it/s]
100%|██████████| 252/252 [00:00<00:00, 73004.88it/s]
100%|██████████| 203/203 [00:00<00:00, 74109.47it/s]
100%|██████████| 153/153 [00:00<00:00, 72634.81it/s]
100%|██████████| 200/200 [00:00<00:00, 73320.58it/s]
100%|██████████| 65/65 [00:00<00:00, 65980.10it/s]
100%|██████████| 144/144 [00:00<00:00, 74777.74it/s]
100%|██████████| 30/30 [00:00<00:00, 64395.66it/s]
100%|██████████| 130/130 [00:00<00:00, 69292.10it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89825.33it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:27<00:00, 215.61it/s]
INFO:root:The new embedding has 5813 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76131.21it/s]
100%|██████████| 287/287 [00:00<00:00, 71686.83it/s]
100%|██████████| 771/771 [00:00<00:00, 80822.98it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76431.00it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81618.71it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93466.38it/s]
100%|██████████| 353/353 [00:00<00:00, 75974.41it/s]
100%|██████████| 252/252 [00:00<00:00, 72999.83it/s]
100%|██████████| 203/203 [00:00<00:00, 76997.98it/s]
100%|██████████| 153/153 [00:00<00:00, 71717.54it/s]
100%|██████████| 200/200 [00:00<00:00, 73862.89it/s]
100%|██████████| 65/65 [00:00<00:00, 68499.94it/s]
100%|██████████| 144/144 [00:00<00:00, 75365.58it/s]
100%|██████████| 30/30 [00:00<00:00, 54755.93it/s]
100%|██████████| 130/130 [00:00<00:00, 72672.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78950.97it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 221.68it/s]
INFO:root:The new embedding has 5813 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 77878.74it/s]
100%|██████████| 287/287 [00:00<00:00, 75799.08it/s]
100%|██████████| 771/771 [00:00<00:00, 73462.25it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87538.17it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77570.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90662.17it/s]
100%|██████████| 353/353 [00:00<00:00, 76567.68it/s]
100%|██████████| 252/252 [00:00<00:00, 76007.81it/s]
100%|██████████| 203/203 [00:00<00:00, 72960.04it/s]
100%|██████████| 153/153 [00:00<00:00, 72462.57it/s]
100%|██████████| 200/200 [00:00<00:00, 74163.27it/s]
100%|██████████| 65/65 [00:00<00:00, 45287.34it/s]
100%|██████████| 144/144 [00:00<00:00, 76822.66it/s]
100%|██████████| 30/30 [00:00<00:00, 66541.05it/s]
100%|██████████| 130/130 [00:00<00:00, 75011.63it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81700.70it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 217.79it/s]
INFO:root:The new embedding has 5813 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76704.01it/s]
100%|██████████| 287/287 [00:00<00:00, 52653.54it/s]
100%|██████████| 771/771 [00:00<00:00, 85781.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75997.54it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80200.08it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95147.05it/s]
100%|██████████| 353/353 [00:00<00:00, 75990.01it/s]
100%|██████████| 252/252 [00:00<00:00, 75325.30it/s]
100%|██████████| 203/203 [00:00<00:00, 70989.14it/s]
100%|██████████| 153/153 [00:00<00:00, 68218.19it/s]
100%|██████████| 200/200 [00:00<00:00, 76692.34it/s]
100%|██████████| 65/65 [00:00<00:00, 70428.77it/s]
100%|██████████| 144/144 [00:00<00:00, 76231.20it/s]
100%|██████████| 30/30 [00:00<00:00, 57852.47it/s]
100%|██████████| 130/130 [00:00<00:00, 63277.19it/s]
100%|██████████| 3500/3500 [00:00<00:00, 95192.19it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 221.08it/s]
INFO:root:The new embedding has 5813 word and vectors have 600 dimensions
100%|██████████| 999/999 [00:00<00:00, 76865.82it/s]
100%|██████████| 287/287 [00:00<00:00, 70801.39it/s]
100%|██████████| 771/771 [00:00<00:00, 70370.55it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78482.56it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83283.11it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93208.14it/s]
100%|██████████| 353/353 [00:00<00:00, 76107.19it/s]
100%|██████████| 252/252 [00:00<00:00, 75357.52it/s]
100%|██████████| 203/203 [00:00<00:00, 74277.56it/s]
100%|██████████| 153/153 [00:00<00:00, 75845.47it/s]
100%|██████████| 200/200 [00:00<00:00, 75688.97it/s]
100%|██████████| 65/65 [00:00<00:00, 55435.09it/s]
100%|██████████| 144/144 [00:00<00:00, 74473.46it/s]
100%|██████████| 30/30 [00:00<00:00, 65775.81it/s]
100%|██████████| 130/130 [00:00<00:00, 75867.47it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76820.36it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 217.80it/s]
INFO:root:The new embedding has 5813 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79113.90it/s]
100%|██████████| 287/287 [00:00<00:00, 71064.72it/s]
100%|██████████| 771/771 [00:00<00:00, 74025.60it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91706.84it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75465.63it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90245.37it/s]
100%|██████████| 353/353 [00:00<00:00, 58256.51it/s]
100%|██████████| 252/252 [00:00<00:00, 58664.85it/s]
100%|██████████| 203/203 [00:00<00:00, 65723.17it/s]
100%|██████████| 153/153 [00:00<00:00, 65150.10it/s]
100%|██████████| 200/200 [00:00<00:00, 77744.28it/s]
100%|██████████| 65/65 [00:00<00:00, 71593.95it/s]
100%|██████████| 144/144 [00:00<00:00, 77423.38it/s]
100%|██████████| 30/30 [00:00<00:00, 54073.54it/s]
100%|██████████| 130/130 [00:00<00:00, 77341.78it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77816.81it/s]
100%|██████████| 203

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 221.99it/s]
INFO:root:The new embedding has 5813 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82469.49it/s]
100%|██████████| 287/287 [00:00<00:00, 73995.90it/s]
100%|██████████| 771/771 [00:00<00:00, 78077.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81733.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79179.64it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95827.46it/s]
100%|██████████| 353/353 [00:00<00:00, 80519.32it/s]
100%|██████████| 252/252 [00:00<00:00, 80152.01it/s]
100%|██████████| 203/203 [00:00<00:00, 77885.45it/s]
100%|██████████| 153/153 [00:00<00:00, 72274.86it/s]
100%|██████████| 200/200 [00:00<00:00, 61360.60it/s]
100%|██████████| 65/65 [00:00<00:00, 66252.68it/s]
100%|██████████| 144/144 [00:00<00:00, 81147.36it/s]
100%|██████████| 30/30 [00:00<00:00, 57719.78it/s]
100%|██████████| 130/130 [00:00<00:00, 74631.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81865.64it/s]
100%|██████████| 203

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 217.79it/s]
INFO:root:The new embedding has 5813 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82019.10it/s]
100%|██████████| 287/287 [00:00<00:00, 64462.10it/s]
100%|██████████| 771/771 [00:00<00:00, 78101.88it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79939.47it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78643.69it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95790.25it/s]
100%|██████████| 353/353 [00:00<00:00, 78700.33it/s]
100%|██████████| 252/252 [00:00<00:00, 78045.09it/s]
100%|██████████| 203/203 [00:00<00:00, 70865.06it/s]
100%|██████████| 153/153 [00:00<00:00, 62558.83it/s]
100%|██████████| 200/200 [00:00<00:00, 63195.78it/s]
100%|██████████| 65/65 [00:00<00:00, 56456.77it/s]
100%|██████████| 144/144 [00:00<00:00, 66804.53it/s]
100%|██████████| 30/30 [00:00<00:00, 59861.62it/s]
100%|██████████| 130/130 [00:00<00:00, 66148.19it/s]
100%|██████████| 3500/3500 [00:00<00:00, 100709.10it/s]
100%|██████████| 20

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 220.99it/s]
INFO:root:The new embedding has 5813 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80628.65it/s]
100%|██████████| 287/287 [00:00<00:00, 73674.35it/s]
100%|██████████| 771/771 [00:00<00:00, 75759.83it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91133.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81752.34it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96691.22it/s]
100%|██████████| 353/353 [00:00<00:00, 78859.62it/s]
100%|██████████| 252/252 [00:00<00:00, 79339.78it/s]
100%|██████████| 203/203 [00:00<00:00, 77828.49it/s]
100%|██████████| 153/153 [00:00<00:00, 76862.92it/s]
100%|██████████| 200/200 [00:00<00:00, 70575.53it/s]
100%|██████████| 65/65 [00:00<00:00, 64527.75it/s]
100%|██████████| 144/144 [00:00<00:00, 78438.93it/s]
100%|██████████| 30/30 [00:00<00:00, 66400.59it/s]
100%|██████████| 130/130 [00:00<00:00, 68353.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78577.81it/s]
100%|██████████| 203

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 217.05it/s]
INFO:root:The new embedding has 5813 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79950.19it/s]
100%|██████████| 287/287 [00:00<00:00, 73818.93it/s]
100%|██████████| 771/771 [00:00<00:00, 87765.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 97910.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82493.59it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86729.66it/s]
100%|██████████| 353/353 [00:00<00:00, 80001.58it/s]
100%|██████████| 252/252 [00:00<00:00, 77838.18it/s]
100%|██████████| 203/203 [00:00<00:00, 77963.90it/s]
100%|██████████| 153/153 [00:00<00:00, 74837.14it/s]
100%|██████████| 200/200 [00:00<00:00, 67770.30it/s]
100%|██████████| 65/65 [00:00<00:00, 75270.50it/s]
100%|██████████| 144/144 [00:00<00:00, 76618.01it/s]
100%|██████████| 30/30 [00:00<00:00, 57143.11it/s]
100%|██████████| 130/130 [00:00<00:00, 79414.44it/s]
100%|██████████| 3500/3500 [00:00<00:00, 94139.18it/s]
100%|██████████| 203

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:26<00:00, 221.38it/s]
INFO:root:The new embedding has 5813 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80868.29it/s]
100%|██████████| 287/287 [00:00<00:00, 71031.17it/s]
100%|██████████| 771/771 [00:00<00:00, 80420.99it/s]
100%|██████████| 2000/2000 [00:00<00:00, 99826.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80707.81it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89537.06it/s]
100%|██████████| 353/353 [00:00<00:00, 77991.43it/s]
100%|██████████| 252/252 [00:00<00:00, 80518.37it/s]
100%|██████████| 203/203 [00:00<00:00, 81673.26it/s]
100%|██████████| 153/153 [00:00<00:00, 81118.51it/s]
100%|██████████| 200/200 [00:00<00:00, 75410.00it/s]
100%|██████████| 65/65 [00:00<00:00, 74877.71it/s]
100%|██████████| 144/144 [00:00<00:00, 77762.30it/s]
100%|██████████| 30/30 [00:00<00:00, 54923.23it/s]
100%|██████████| 130/130 [00:00<00:00, 75177.10it/s]
100%|██████████| 3500/3500 [00:00<00:00, 101489.60it/s]
100%|██████████| 20

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:39<00:00, 149.65it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 86520.67it/s]
100%|██████████| 287/287 [00:00<00:00, 77080.44it/s]
100%|██████████| 771/771 [00:00<00:00, 78073.60it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86166.92it/s]
100%|██████████| 1000/1000 [00:00<00:00, 99053.09it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82781.23it/s]
100%|██████████| 353/353 [00:00<00:00, 90263.32it/s]
100%|██████████| 252/252 [00:00<00:00, 76057.03it/s]
100%|██████████| 203/203 [00:00<00:00, 74045.02it/s]
100%|██████████| 153/153 [00:00<00:00, 78643.20it/s]
100%|██████████| 200/200 [00:00<00:00, 74182.95it/s]
100%|██████████| 65/65 [00:00<00:00, 65051.24it/s]
100%|██████████| 144/144 [00:00<00:00, 58271.08it/s]
100%|██████████| 30/30 [00:00<00:00, 40563.87it/s]
100%|██████████| 130/130 [00:00<00:00, 63535.25it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93289.68it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 172.75it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 77180.14it/s]
100%|██████████| 287/287 [00:00<00:00, 76893.34it/s]
100%|██████████| 771/771 [00:00<00:00, 77582.85it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81078.34it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78951.60it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80901.88it/s]
100%|██████████| 353/353 [00:00<00:00, 76107.19it/s]
100%|██████████| 252/252 [00:00<00:00, 76741.79it/s]
100%|██████████| 203/203 [00:00<00:00, 75791.68it/s]
100%|██████████| 153/153 [00:00<00:00, 74628.27it/s]
100%|██████████| 200/200 [00:00<00:00, 75818.94it/s]
100%|██████████| 65/65 [00:00<00:00, 65222.43it/s]
100%|██████████| 144/144 [00:00<00:00, 76154.30it/s]
100%|██████████| 30/30 [00:00<00:00, 54073.54it/s]
100%|██████████| 130/130 [00:00<00:00, 67274.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93673.64it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 175.03it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 78997.56it/s]
100%|██████████| 287/287 [00:00<00:00, 75240.03it/s]
100%|██████████| 771/771 [00:00<00:00, 77391.61it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85071.98it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77507.23it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82295.04it/s]
100%|██████████| 353/353 [00:00<00:00, 76782.10it/s]
100%|██████████| 252/252 [00:00<00:00, 75228.80it/s]
100%|██████████| 203/203 [00:00<00:00, 75542.87it/s]
100%|██████████| 153/153 [00:00<00:00, 71263.58it/s]
100%|██████████| 200/200 [00:00<00:00, 72906.38it/s]
100%|██████████| 65/65 [00:00<00:00, 60991.00it/s]
100%|██████████| 144/144 [00:00<00:00, 78144.62it/s]
100%|██████████| 30/30 [00:00<00:00, 67832.41it/s]
100%|██████████| 130/130 [00:00<00:00, 56662.11it/s]
100%|██████████| 3500/3500 [00:00<00:00, 94830.00it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 175.97it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 78820.72it/s]
100%|██████████| 287/287 [00:00<00:00, 77213.94it/s]
100%|██████████| 771/771 [00:00<00:00, 78817.63it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81742.78it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79783.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74914.78it/s]
100%|██████████| 353/353 [00:00<00:00, 77975.00it/s]
100%|██████████| 252/252 [00:00<00:00, 78660.76it/s]
100%|██████████| 203/203 [00:00<00:00, 74550.71it/s]
100%|██████████| 153/153 [00:00<00:00, 71295.25it/s]
100%|██████████| 200/200 [00:00<00:00, 60025.82it/s]
100%|██████████| 65/65 [00:00<00:00, 63050.36it/s]
100%|██████████| 144/144 [00:00<00:00, 75800.67it/s]
100%|██████████| 30/30 [00:00<00:00, 68015.74it/s]
100%|██████████| 130/130 [00:00<00:00, 73723.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77333.50it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 172.95it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 88537.16it/s]
100%|██████████| 287/287 [00:00<00:00, 77472.34it/s]
100%|██████████| 771/771 [00:00<00:00, 78572.50it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76717.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77375.69it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86049.36it/s]
100%|██████████| 353/353 [00:00<00:00, 78889.03it/s]
100%|██████████| 252/252 [00:00<00:00, 76597.19it/s]
100%|██████████| 203/203 [00:00<00:00, 76692.82it/s]
100%|██████████| 153/153 [00:00<00:00, 73491.58it/s]
100%|██████████| 200/200 [00:00<00:00, 72836.75it/s]
100%|██████████| 65/65 [00:00<00:00, 62644.71it/s]
100%|██████████| 144/144 [00:00<00:00, 76192.73it/s]
100%|██████████| 30/30 [00:00<00:00, 66541.05it/s]
100%|██████████| 130/130 [00:00<00:00, 69415.60it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76235.52it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 175.73it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 86570.73it/s]
100%|██████████| 287/287 [00:00<00:00, 77938.83it/s]
100%|██████████| 771/771 [00:00<00:00, 77293.57it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76490.24it/s]
100%|██████████| 1000/1000 [00:00<00:00, 102043.74it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85142.21it/s]
100%|██████████| 353/353 [00:00<00:00, 76358.40it/s]
100%|██████████| 252/252 [00:00<00:00, 75665.02it/s]
100%|██████████| 203/203 [00:00<00:00, 74931.24it/s]
100%|██████████| 153/153 [00:00<00:00, 73702.60it/s]
100%|██████████| 200/200 [00:00<00:00, 75133.08it/s]
100%|██████████| 65/65 [00:00<00:00, 58329.00it/s]
100%|██████████| 144/144 [00:00<00:00, 72315.59it/s]
100%|██████████| 30/30 [00:00<00:00, 65879.12it/s]
100%|██████████| 130/130 [00:00<00:00, 79426.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72510.26it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 174.69it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 92968.93it/s]
100%|██████████| 287/287 [00:00<00:00, 76795.23it/s]
100%|██████████| 771/771 [00:00<00:00, 78015.21it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77123.15it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79101.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80193.95it/s]
100%|██████████| 353/353 [00:00<00:00, 78872.22it/s]
100%|██████████| 252/252 [00:00<00:00, 77826.71it/s]
100%|██████████| 203/203 [00:00<00:00, 80083.12it/s]
100%|██████████| 153/153 [00:00<00:00, 76350.80it/s]
100%|██████████| 200/200 [00:00<00:00, 76510.47it/s]
100%|██████████| 65/65 [00:00<00:00, 65020.21it/s]
100%|██████████| 144/144 [00:00<00:00, 72611.18it/s]
100%|██████████| 30/30 [00:00<00:00, 65707.11it/s]
100%|██████████| 130/130 [00:00<00:00, 62587.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 94927.50it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 175.06it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 75998.65it/s]
100%|██████████| 287/287 [00:00<00:00, 75230.63it/s]
100%|██████████| 771/771 [00:00<00:00, 79019.85it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85897.81it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79221.52it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84831.67it/s]
100%|██████████| 353/353 [00:00<00:00, 78889.03it/s]
100%|██████████| 252/252 [00:00<00:00, 77672.30it/s]
100%|██████████| 203/203 [00:00<00:00, 76748.13it/s]
100%|██████████| 153/153 [00:00<00:00, 73048.21it/s]
100%|██████████| 200/200 [00:00<00:00, 65362.38it/s]
100%|██████████| 65/65 [00:00<00:00, 68637.91it/s]
100%|██████████| 144/144 [00:00<00:00, 71816.86it/s]
100%|██████████| 30/30 [00:00<00:00, 65741.44it/s]
100%|██████████| 130/130 [00:00<00:00, 47442.75it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72639.78it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 174.92it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 72767.70it/s]
100%|██████████| 287/287 [00:00<00:00, 59692.81it/s]
100%|██████████| 771/771 [00:00<00:00, 59666.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93511.19it/s]
100%|██████████| 1000/1000 [00:00<00:00, 58390.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83820.70it/s]
100%|██████████| 353/353 [00:00<00:00, 56777.59it/s]
100%|██████████| 252/252 [00:00<00:00, 56030.78it/s]
100%|██████████| 203/203 [00:00<00:00, 55872.68it/s]
100%|██████████| 153/153 [00:00<00:00, 47581.26it/s]
100%|██████████| 200/200 [00:00<00:00, 75805.24it/s]
100%|██████████| 65/65 [00:00<00:00, 53488.28it/s]
100%|██████████| 144/144 [00:00<00:00, 55934.41it/s]
100%|██████████| 30/30 [00:00<00:00, 44259.28it/s]
100%|██████████| 130/130 [00:00<00:00, 56797.87it/s]
100%|██████████| 3500/3500 [00:00<00:00, 66849.11it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 176.89it/s]
INFO:root:The new embedding has 5845 word and vectors have 400 dimensions
100%|██████████| 999/999 [00:00<00:00, 85980.95it/s]
100%|██████████| 287/287 [00:00<00:00, 76298.74it/s]
100%|██████████| 771/771 [00:00<00:00, 76530.79it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85128.10it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78508.26it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78214.97it/s]
100%|██████████| 353/353 [00:00<00:00, 76142.42it/s]
100%|██████████| 252/252 [00:00<00:00, 75465.13it/s]
100%|██████████| 203/203 [00:00<00:00, 79351.70it/s]
100%|██████████| 153/153 [00:00<00:00, 73081.48it/s]
100%|██████████| 200/200 [00:00<00:00, 68826.78it/s]
100%|██████████| 65/65 [00:00<00:00, 65066.77it/s]
100%|██████████| 144/144 [00:00<00:00, 53162.55it/s]
100%|██████████| 30/30 [00:00<00:00, 47680.61it/s]
100%|██████████| 130/130 [00:00<00:00, 73923.47it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73895.05it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [04:48<00:00, 20.24it/s]
INFO:root:The new embedding has 5819 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 57977.75it/s]
100%|██████████| 287/287 [00:00<00:00, 69349.31it/s]
100%|██████████| 771/771 [00:00<00:00, 82996.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84241.58it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75312.50it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86696.79it/s]
100%|██████████| 353/353 [00:00<00:00, 71803.56it/s]
100%|██████████| 252/252 [00:00<00:00, 60007.07it/s]
100%|██████████| 203/203 [00:00<00:00, 83238.22it/s]
100%|██████████| 153/153 [00:00<00:00, 68980.81it/s]
100%|██████████| 200/200 [00:00<00:00, 73077.86it/s]
100%|██████████| 65/65 [00:00<00:00, 69869.24it/s]
100%|██████████| 144/144 [00:00<00:00, 69856.56it/s]
100%|██████████| 30/30 [00:00<00:00, 37763.84it/s]
100%|██████████| 130/130 [00:00<00:00, 60773.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82861.91it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:21<00:00, 41.46it/s]
INFO:root:The new embedding has 5819 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 61481.83it/s]
100%|██████████| 287/287 [00:00<00:00, 71291.99it/s]
100%|██████████| 771/771 [00:00<00:00, 82333.39it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76806.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89081.30it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91666.75it/s]
100%|██████████| 353/353 [00:00<00:00, 78073.68it/s]
100%|██████████| 252/252 [00:00<00:00, 72010.12it/s]
100%|██████████| 203/203 [00:00<00:00, 70245.34it/s]
100%|██████████| 153/153 [00:00<00:00, 71066.28it/s]
100%|██████████| 200/200 [00:00<00:00, 70362.42it/s]
100%|██████████| 65/65 [00:00<00:00, 68072.35it/s]
100%|██████████| 144/144 [00:00<00:00, 67295.80it/s]
100%|██████████| 30/30 [00:00<00:00, 54260.08it/s]
100%|██████████| 130/130 [00:00<00:00, 72258.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85465.48it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:23<00:00, 40.88it/s]
INFO:root:The new embedding has 5819 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77724.16it/s]
100%|██████████| 287/287 [00:00<00:00, 80117.49it/s]
100%|██████████| 771/771 [00:00<00:00, 81668.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78996.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79072.17it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78339.15it/s]
100%|██████████| 353/353 [00:00<00:00, 79747.35it/s]
100%|██████████| 252/252 [00:00<00:00, 80006.40it/s]
100%|██████████| 203/203 [00:00<00:00, 77544.96it/s]
100%|██████████| 153/153 [00:00<00:00, 81385.99it/s]
100%|██████████| 200/200 [00:00<00:00, 78456.86it/s]
100%|██████████| 65/65 [00:00<00:00, 66657.64it/s]
100%|██████████| 144/144 [00:00<00:00, 77423.38it/s]
100%|██████████| 30/30 [00:00<00:00, 69711.42it/s]
100%|██████████| 130/130 [00:00<00:00, 73061.71it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93962.03it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [02:19<00:00, 41.96it/s]
INFO:root:The new embedding has 5819 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 50624.14it/s]
100%|██████████| 287/287 [00:00<00:00, 57224.06it/s]
100%|██████████| 771/771 [00:00<00:00, 80869.47it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81830.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79350.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79432.06it/s]
100%|██████████| 353/353 [00:00<00:00, 76722.42it/s]
100%|██████████| 252/252 [00:00<00:00, 75239.51it/s]
100%|██████████| 203/203 [00:00<00:00, 70048.85it/s]
100%|██████████| 153/153 [00:00<00:00, 79717.83it/s]
100%|██████████| 200/200 [00:00<00:00, 75369.34it/s]
100%|██████████| 65/65 [00:00<00:00, 69495.22it/s]
100%|██████████| 144/144 [00:00<00:00, 74117.04it/s]
100%|██████████| 30/30 [00:00<00:00, 57985.77it/s]
100%|██████████| 130/130 [00:00<00:00, 74356.95it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77699.43it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:46<00:00, 126.09it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 90653.81it/s]
100%|██████████| 287/287 [00:00<00:00, 83328.62it/s]
100%|██████████| 771/771 [00:00<00:00, 84444.66it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74395.45it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75414.06it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93665.37it/s]
100%|██████████| 353/353 [00:00<00:00, 78168.49it/s]
100%|██████████| 252/252 [00:00<00:00, 83979.39it/s]
100%|██████████| 203/203 [00:00<00:00, 83597.81it/s]
100%|██████████| 153/153 [00:00<00:00, 70504.12it/s]
100%|██████████| 200/200 [00:00<00:00, 71252.93it/s]
100%|██████████| 65/65 [00:00<00:00, 72086.13it/s]
100%|██████████| 144/144 [00:00<00:00, 72874.01it/s]
100%|██████████| 30/30 [00:00<00:00, 66788.28it/s]
100%|██████████| 130/130 [00:00<00:00, 66968.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79473.27it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:31<00:00, 184.43it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 75367.11it/s]
100%|██████████| 287/287 [00:00<00:00, 73923.19it/s]
100%|██████████| 771/771 [00:00<00:00, 82283.11it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94066.95it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93719.09it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89714.53it/s]
100%|██████████| 353/353 [00:00<00:00, 73789.65it/s]
100%|██████████| 252/252 [00:00<00:00, 74172.95it/s]
100%|██████████| 203/203 [00:00<00:00, 71399.89it/s]
100%|██████████| 153/153 [00:00<00:00, 75809.63it/s]
100%|██████████| 200/200 [00:00<00:00, 76447.72it/s]
100%|██████████| 65/65 [00:00<00:00, 54932.45it/s]
100%|██████████| 144/144 [00:00<00:00, 84272.33it/s]
100%|██████████| 30/30 [00:00<00:00, 52081.59it/s]
100%|██████████| 130/130 [00:00<00:00, 83873.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91776.21it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:32<00:00, 180.31it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 50357.05it/s]
100%|██████████| 287/287 [00:00<00:00, 56072.54it/s]
100%|██████████| 771/771 [00:00<00:00, 57389.94it/s]
100%|██████████| 2000/2000 [00:00<00:00, 57401.57it/s]
100%|██████████| 1000/1000 [00:00<00:00, 58912.90it/s]
100%|██████████| 3000/3000 [00:00<00:00, 57236.42it/s]
100%|██████████| 353/353 [00:00<00:00, 57114.89it/s]
100%|██████████| 252/252 [00:00<00:00, 55309.50it/s]
100%|██████████| 203/203 [00:00<00:00, 53953.72it/s]
100%|██████████| 153/153 [00:00<00:00, 99724.71it/s]
100%|██████████| 200/200 [00:00<00:00, 58108.95it/s]
100%|██████████| 65/65 [00:00<00:00, 54243.88it/s]
100%|██████████| 144/144 [00:00<00:00, 57200.47it/s]
100%|██████████| 30/30 [00:00<00:00, 50271.32it/s]
100%|██████████| 130/130 [00:00<00:00, 53477.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 56816.89it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:31<00:00, 184.53it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 58425.61it/s]
100%|██████████| 287/287 [00:00<00:00, 59339.70it/s]
100%|██████████| 771/771 [00:00<00:00, 56273.42it/s]
100%|██████████| 2000/2000 [00:00<00:00, 57906.78it/s]
100%|██████████| 1000/1000 [00:00<00:00, 58376.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 57703.10it/s]
100%|██████████| 353/353 [00:00<00:00, 58769.87it/s]
100%|██████████| 252/252 [00:00<00:00, 56525.19it/s]
100%|██████████| 203/203 [00:00<00:00, 55777.51it/s]
100%|██████████| 153/153 [00:00<00:00, 56336.45it/s]
100%|██████████| 200/200 [00:00<00:00, 62041.33it/s]
100%|██████████| 65/65 [00:00<00:00, 56398.38it/s]
100%|██████████| 144/144 [00:00<00:00, 60428.19it/s]
100%|██████████| 30/30 [00:00<00:00, 50963.60it/s]
100%|██████████| 130/130 [00:00<00:00, 61912.06it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88125.68it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 149.26it/s]
INFO:root:The new embedding has 5843 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 53946.90it/s]
100%|██████████| 287/287 [00:00<00:00, 53245.10it/s]
100%|██████████| 771/771 [00:00<00:00, 80734.20it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92343.85it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80007.32it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91072.29it/s]
100%|██████████| 353/353 [00:00<00:00, 81773.41it/s]
100%|██████████| 252/252 [00:00<00:00, 76342.69it/s]
100%|██████████| 203/203 [00:00<00:00, 85246.67it/s]
100%|██████████| 153/153 [00:00<00:00, 71693.50it/s]
100%|██████████| 200/200 [00:00<00:00, 86160.72it/s]
100%|██████████| 65/65 [00:00<00:00, 65284.90it/s]
100%|██████████| 144/144 [00:00<00:00, 71536.16it/s]
100%|██████████| 30/30 [00:00<00:00, 57985.77it/s]
100%|██████████| 130/130 [00:00<00:00, 80008.73it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90782.43it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 171.76it/s]
INFO:root:The new embedding has 5843 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 92344.02it/s]
100%|██████████| 287/287 [00:00<00:00, 71725.27it/s]
100%|██████████| 771/771 [00:00<00:00, 89482.51it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89440.32it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87045.84it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82718.64it/s]
100%|██████████| 353/353 [00:00<00:00, 72513.92it/s]
100%|██████████| 252/252 [00:00<00:00, 72939.38it/s]
100%|██████████| 203/203 [00:00<00:00, 70210.58it/s]
100%|██████████| 153/153 [00:00<00:00, 65242.83it/s]
100%|██████████| 200/200 [00:00<00:00, 74778.11it/s]
100%|██████████| 65/65 [00:00<00:00, 44605.65it/s]
100%|██████████| 144/144 [00:00<00:00, 69113.15it/s]
100%|██████████| 30/30 [00:00<00:00, 45639.87it/s]
100%|██████████| 130/130 [00:00<00:00, 64178.38it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79087.93it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.68it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80342.64it/s]
100%|██████████| 287/287 [00:00<00:00, 77632.22it/s]
100%|██████████| 771/771 [00:00<00:00, 78604.97it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77671.58it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80619.38it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76988.43it/s]
100%|██████████| 353/353 [00:00<00:00, 81123.74it/s]
100%|██████████| 252/252 [00:00<00:00, 79423.25it/s]
100%|██████████| 203/203 [00:00<00:00, 70723.79it/s]
100%|██████████| 153/153 [00:00<00:00, 73677.21it/s]
100%|██████████| 200/200 [00:00<00:00, 78603.90it/s]
100%|██████████| 65/65 [00:00<00:00, 74306.29it/s]
100%|██████████| 144/144 [00:00<00:00, 68385.39it/s]
100%|██████████| 30/30 [00:00<00:00, 64296.94it/s]
100%|██████████| 130/130 [00:00<00:00, 77672.30it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76164.72it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 171.22it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80218.05it/s]
100%|██████████| 287/287 [00:00<00:00, 77597.19it/s]
100%|██████████| 771/771 [00:00<00:00, 81400.77it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82485.48it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86806.24it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78325.49it/s]
100%|██████████| 353/353 [00:00<00:00, 79375.40it/s]
100%|██████████| 252/252 [00:00<00:00, 78538.02it/s]
100%|██████████| 203/203 [00:00<00:00, 74290.53it/s]
100%|██████████| 153/153 [00:00<00:00, 73273.41it/s]
100%|██████████| 200/200 [00:00<00:00, 73597.19it/s]
100%|██████████| 65/65 [00:00<00:00, 61639.10it/s]
100%|██████████| 144/144 [00:00<00:00, 72393.60it/s]
100%|██████████| 30/30 [00:00<00:00, 64494.68it/s]
100%|██████████| 130/130 [00:00<00:00, 78703.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75915.00it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [04:21<00:00, 22.40it/s]
INFO:root:The new embedding has 5824 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 61886.83it/s]
100%|██████████| 287/287 [00:00<00:00, 91194.34it/s]
100%|██████████| 771/771 [00:00<00:00, 90516.95it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87514.43it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75496.87it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80618.35it/s]
100%|██████████| 353/353 [00:00<00:00, 74148.10it/s]
100%|██████████| 252/252 [00:00<00:00, 72939.38it/s]
100%|██████████| 203/203 [00:00<00:00, 71363.99it/s]
100%|██████████| 153/153 [00:00<00:00, 76278.20it/s]
100%|██████████| 200/200 [00:00<00:00, 70256.35it/s]
100%|██████████| 65/65 [00:00<00:00, 69283.29it/s]
100%|██████████| 144/144 [00:00<00:00, 80648.92it/s]
100%|██████████| 30/30 [00:00<00:00, 40368.66it/s]
100%|██████████| 130/130 [00:00<00:00, 68482.73it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71522.50it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [03:14<00:00, 29.98it/s]
INFO:root:The new embedding has 5824 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 81487.94it/s]
100%|██████████| 287/287 [00:00<00:00, 82022.71it/s]
100%|██████████| 771/771 [00:00<00:00, 80261.31it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77770.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90756.33it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76846.90it/s]
100%|██████████| 353/353 [00:00<00:00, 87801.06it/s]
100%|██████████| 252/252 [00:00<00:00, 70775.72it/s]
100%|██████████| 203/203 [00:00<00:00, 71131.47it/s]
100%|██████████| 153/153 [00:00<00:00, 70473.15it/s]
100%|██████████| 200/200 [00:00<00:00, 75498.23it/s]
100%|██████████| 65/65 [00:00<00:00, 70647.77it/s]
100%|██████████| 144/144 [00:00<00:00, 69057.83it/s]
100%|██████████| 30/30 [00:00<00:00, 66121.45it/s]
100%|██████████| 130/130 [00:00<00:00, 55339.44it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89819.83it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [03:16<00:00, 29.75it/s]
INFO:root:The new embedding has 5824 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 62962.77it/s]
100%|██████████| 287/287 [00:00<00:00, 78734.07it/s]
100%|██████████| 771/771 [00:00<00:00, 82166.03it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80222.33it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81463.36it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81804.43it/s]
100%|██████████| 353/353 [00:00<00:00, 79511.80it/s]
100%|██████████| 252/252 [00:00<00:00, 78590.57it/s]
100%|██████████| 203/203 [00:00<00:00, 78669.84it/s]
100%|██████████| 153/153 [00:00<00:00, 76341.72it/s]
100%|██████████| 200/200 [00:00<00:00, 76741.45it/s]
100%|██████████| 65/65 [00:00<00:00, 70776.16it/s]
100%|██████████| 144/144 [00:00<00:00, 80135.30it/s]
100%|██████████| 30/30 [00:00<00:00, 60640.54it/s]
100%|██████████| 130/130 [00:00<00:00, 75374.55it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83699.07it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [03:15<00:00, 29.90it/s]
INFO:root:The new embedding has 5824 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81475.26it/s]
100%|██████████| 287/287 [00:00<00:00, 79226.36it/s]
100%|██████████| 771/771 [00:00<00:00, 78069.83it/s]
100%|██████████| 2000/2000 [00:00<00:00, 59576.49it/s]
100%|██████████| 1000/1000 [00:00<00:00, 62341.02it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78606.84it/s]
100%|██████████| 353/353 [00:00<00:00, 79687.26it/s]
100%|██████████| 252/252 [00:00<00:00, 75692.11it/s]
100%|██████████| 203/203 [00:00<00:00, 75616.67it/s]
100%|██████████| 153/153 [00:00<00:00, 75998.17it/s]
100%|██████████| 200/200 [00:00<00:00, 77564.57it/s]
100%|██████████| 65/65 [00:00<00:00, 74367.09it/s]
100%|██████████| 144/144 [00:00<00:00, 75103.18it/s]
100%|██████████| 30/30 [00:00<00:00, 55164.02it/s]
100%|██████████| 130/130 [00:00<00:00, 78533.71it/s]
100%|██████████| 3500/3500 [00:00<00:00, 95212.57it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['moderatorship' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:30<00:00, 191.09it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 62860.76it/s]
100%|██████████| 287/287 [00:00<00:00, 75537.48it/s]
100%|██████████| 771/771 [00:00<00:00, 91487.49it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74734.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93849.10it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76346.60it/s]
100%|██████████| 353/353 [00:00<00:00, 74607.68it/s]
100%|██████████| 252/252 [00:00<00:00, 74230.26it/s]
100%|██████████| 203/203 [00:00<00:00, 73267.68it/s]
100%|██████████| 153/153 [00:00<00:00, 72601.94it/s]
100%|██████████| 200/200 [00:00<00:00, 73468.28it/s]
100%|██████████| 65/65 [00:00<00:00, 65536.00it/s]
100%|██████████| 144/144 [00:00<00:00, 71714.53it/s]
100%|██████████| 30/30 [00:00<00:00, 55406.92it/s]
100%|██████████| 130/130 [00:00<00:00, 69433.28it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89784.68it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:27<00:00, 215.16it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 78880.08it/s]
100%|██████████| 287/287 [00:00<00:00, 72990.86it/s]
100%|██████████| 771/771 [00:00<00:00, 90055.65it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74778.11it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88580.87it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76098.65it/s]
100%|██████████| 353/353 [00:00<00:00, 73734.53it/s]
100%|██████████| 252/252 [00:00<00:00, 75105.85it/s]
100%|██████████| 203/203 [00:00<00:00, 72254.22it/s]
100%|██████████| 153/153 [00:00<00:00, 77587.78it/s]
100%|██████████| 200/200 [00:00<00:00, 74591.93it/s]
100%|██████████| 65/65 [00:00<00:00, 72973.70it/s]
100%|██████████| 144/144 [00:00<00:00, 76540.33it/s]
100%|██████████| 30/30 [00:00<00:00, 65433.76it/s]
100%|██████████| 130/130 [00:00<00:00, 60618.07it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89157.59it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 174.84it/s]
INFO:root:The new embedding has 5825 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 87595.06it/s]
100%|██████████| 287/287 [00:00<00:00, 70210.86it/s]
100%|██████████| 771/771 [00:00<00:00, 88242.10it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88449.17it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72100.53it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86432.38it/s]
100%|██████████| 353/353 [00:00<00:00, 73054.19it/s]
100%|██████████| 252/252 [00:00<00:00, 73805.22it/s]
100%|██████████| 203/203 [00:00<00:00, 72779.19it/s]
100%|██████████| 153/153 [00:00<00:00, 72783.09it/s]
100%|██████████| 200/200 [00:00<00:00, 70274.01it/s]
100%|██████████| 65/65 [00:00<00:00, 60476.88it/s]
100%|██████████| 144/144 [00:00<00:00, 60921.91it/s]
100%|██████████| 30/30 [00:00<00:00, 32913.71it/s]
100%|██████████| 130/130 [00:00<00:00, 65261.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80898.39it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:30<00:00, 190.44it/s]
INFO:root:The new embedding has 5825 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 91928.69it/s]
100%|██████████| 287/287 [00:00<00:00, 77144.66it/s]
100%|██████████| 771/771 [00:00<00:00, 84796.74it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94573.87it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78129.50it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87837.60it/s]
100%|██████████| 353/353 [00:00<00:00, 74679.17it/s]
100%|██████████| 252/252 [00:00<00:00, 74298.09it/s]
100%|██████████| 203/203 [00:00<00:00, 75322.34it/s]
100%|██████████| 153/153 [00:00<00:00, 74000.06it/s]
100%|██████████| 200/200 [00:00<00:00, 68860.68it/s]
100%|██████████| 65/65 [00:00<00:00, 61625.17it/s]
100%|██████████| 144/144 [00:00<00:00, 70393.91it/s]
100%|██████████| 30/30 [00:00<00:00, 84110.37it/s]
100%|██████████| 130/130 [00:00<00:00, 61458.47it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93136.98it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:31<00:00, 187.11it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 100318.66it/s]
100%|██████████| 287/287 [00:00<00:00, 74842.41it/s]
100%|██████████| 771/771 [00:00<00:00, 78167.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77322.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 103440.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96123.94it/s]
100%|██████████| 353/353 [00:00<00:00, 73639.18it/s]
100%|██████████| 252/252 [00:00<00:00, 86494.65it/s]
100%|██████████| 203/203 [00:00<00:00, 72704.61it/s]
100%|██████████| 153/153 [00:00<00:00, 80346.63it/s]
100%|██████████| 200/200 [00:00<00:00, 57681.41it/s]
100%|██████████| 65/65 [00:00<00:00, 40648.54it/s]
100%|██████████| 144/144 [00:00<00:00, 58730.04it/s]
100%|██████████| 30/30 [00:00<00:00, 43630.07it/s]
100%|██████████| 130/130 [00:00<00:00, 57444.11it/s]
100%|██████████| 3500/3500 [00:00<00:00, 56969.69it/s]
100%|██████████| 2

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:30<00:00, 190.58it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78379.87it/s]
100%|██████████| 287/287 [00:00<00:00, 77812.88it/s]
100%|██████████| 771/771 [00:00<00:00, 75937.73it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80050.84it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81313.33it/s]
100%|██████████| 3000/3000 [00:00<00:00, 100023.94it/s]
100%|██████████| 353/353 [00:00<00:00, 78416.89it/s]
100%|██████████| 252/252 [00:00<00:00, 80322.56it/s]
100%|██████████| 203/203 [00:00<00:00, 77566.16it/s]
100%|██████████| 153/153 [00:00<00:00, 76789.34it/s]
100%|██████████| 200/200 [00:00<00:00, 76748.47it/s]
100%|██████████| 65/65 [00:00<00:00, 66560.00it/s]
100%|██████████| 144/144 [00:00<00:00, 73050.29it/s]
100%|██████████| 30/30 [00:00<00:00, 61082.10it/s]
100%|██████████| 130/130 [00:00<00:00, 78308.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90291.07it/s]
100%|██████████| 20

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['sanctify' 'lustrate']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['incoordination' 'unskillfulness']
['caesarism' 'autocracy']
['mildness' 'balminess']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [01:09<00:00, 83.51it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 71849.34it/s]
100%|██████████| 287/287 [00:00<00:00, 79205.50it/s]
100%|██████████| 771/771 [00:00<00:00, 79374.79it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95528.09it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79139.30it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92858.71it/s]
100%|██████████| 353/353 [00:00<00:00, 72627.75it/s]
100%|██████████| 252/252 [00:00<00:00, 85981.01it/s]
100%|██████████| 203/203 [00:00<00:00, 77249.47it/s]
100%|██████████| 153/153 [00:00<00:00, 80538.22it/s]
100%|██████████| 200/200 [00:00<00:00, 70825.80it/s]
100%|██████████| 65/65 [00:00<00:00, 63387.53it/s]
100%|██████████| 144/144 [00:00<00:00, 77028.41it/s]
100%|██████████| 30/30 [00:00<00:00, 55775.32it/s]
100%|██████████| 130/130 [00:00<00:00, 72701.27it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79478.86it/s]
100%|██████████| 2034/

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 151.44it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 82772.50it/s]
100%|██████████| 287/287 [00:00<00:00, 73678.86it/s]
100%|██████████| 771/771 [00:00<00:00, 73388.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83308.75it/s]
100%|██████████| 1000/1000 [00:00<00:00, 96449.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89457.49it/s]
100%|██████████| 353/353 [00:00<00:00, 84828.08it/s]
100%|██████████| 252/252 [00:00<00:00, 72459.35it/s]
100%|██████████| 203/203 [00:00<00:00, 72772.97it/s]
100%|██████████| 153/153 [00:00<00:00, 71121.41it/s]
100%|██████████| 200/200 [00:00<00:00, 71605.70it/s]
100%|██████████| 65/65 [00:00<00:00, 64284.31it/s]
100%|██████████| 144/144 [00:00<00:00, 70574.87it/s]
100%|██████████| 30/30 [00:00<00:00, 60004.35it/s]
100%|██████████| 130/130 [00:00<00:00, 73386.21it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86023.90it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 149.29it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80028.07it/s]
100%|██████████| 287/287 [00:00<00:00, 76839.35it/s]
100%|██████████| 771/771 [00:00<00:00, 78969.68it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76259.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81002.39it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89695.35it/s]
100%|██████████| 353/353 [00:00<00:00, 80523.70it/s]
100%|██████████| 252/252 [00:00<00:00, 81329.99it/s]
100%|██████████| 203/203 [00:00<00:00, 81097.60it/s]
100%|██████████| 153/153 [00:00<00:00, 76560.31it/s]
100%|██████████| 200/200 [00:00<00:00, 79520.41it/s]
100%|██████████| 65/65 [00:00<00:00, 66706.57it/s]
100%|██████████| 144/144 [00:00<00:00, 64735.24it/s]
100%|██████████| 30/30 [00:00<00:00, 56859.07it/s]
100%|██████████| 130/130 [00:00<00:00, 83526.27it/s]
100%|██████████| 3500/3500 [00:00<00:00, 98326.61it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 149.97it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 75769.15it/s]
100%|██████████| 287/287 [00:00<00:00, 77323.05it/s]
100%|██████████| 771/771 [00:00<00:00, 81612.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79735.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80229.23it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78945.66it/s]
100%|██████████| 353/353 [00:00<00:00, 78404.43it/s]
100%|██████████| 252/252 [00:00<00:00, 77786.62it/s]
100%|██████████| 203/203 [00:00<00:00, 71906.40it/s]
100%|██████████| 153/153 [00:00<00:00, 79767.37it/s]
100%|██████████| 200/200 [00:00<00:00, 80885.24it/s]
100%|██████████| 65/65 [00:00<00:00, 77014.06it/s]
100%|██████████| 144/144 [00:00<00:00, 73378.66it/s]
100%|██████████| 30/30 [00:00<00:00, 63710.95it/s]
100%|██████████| 130/130 [00:00<00:00, 77440.64it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81017.59it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 153.72it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 73415.39it/s]
100%|██████████| 287/287 [00:00<00:00, 42641.35it/s]
100%|██████████| 771/771 [00:00<00:00, 82097.19it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89901.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73692.88it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91332.08it/s]
100%|██████████| 353/353 [00:00<00:00, 74818.80it/s]
100%|██████████| 252/252 [00:00<00:00, 72853.92it/s]
100%|██████████| 203/203 [00:00<00:00, 79255.67it/s]
100%|██████████| 153/153 [00:00<00:00, 83384.68it/s]
100%|██████████| 200/200 [00:00<00:00, 70179.94it/s]
100%|██████████| 65/65 [00:00<00:00, 63713.43it/s]
100%|██████████| 144/144 [00:00<00:00, 68563.94it/s]
100%|██████████| 30/30 [00:00<00:00, 46125.04it/s]
100%|██████████| 130/130 [00:00<00:00, 78817.51it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77923.80it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 166.10it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 83330.54it/s]
100%|██████████| 287/287 [00:00<00:00, 73638.30it/s]
100%|██████████| 771/771 [00:00<00:00, 83762.23it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94465.24it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75829.91it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85498.58it/s]
100%|██████████| 353/353 [00:00<00:00, 84005.07it/s]
100%|██████████| 252/252 [00:00<00:00, 72588.74it/s]
100%|██████████| 203/203 [00:00<00:00, 71531.86it/s]
100%|██████████| 153/153 [00:00<00:00, 71902.35it/s]
100%|██████████| 200/200 [00:00<00:00, 68283.34it/s]
100%|██████████| 65/65 [00:00<00:00, 56632.69it/s]
100%|██████████| 144/144 [00:00<00:00, 56064.21it/s]
100%|██████████| 30/30 [00:00<00:00, 56223.91it/s]
100%|██████████| 130/130 [00:00<00:00, 66870.19it/s]
100%|██████████| 3500/3500 [00:00<00:00, 70340.17it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 162.76it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 84844.08it/s]
100%|██████████| 287/287 [00:00<00:00, 78426.30it/s]
100%|██████████| 771/771 [00:00<00:00, 81928.72it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78756.66it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81878.42it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83708.62it/s]
100%|██████████| 353/353 [00:00<00:00, 78964.76it/s]
100%|██████████| 252/252 [00:00<00:00, 79982.19it/s]
100%|██████████| 203/203 [00:00<00:00, 72673.58it/s]
100%|██████████| 153/153 [00:00<00:00, 75249.59it/s]
100%|██████████| 200/200 [00:00<00:00, 74209.20it/s]
100%|██████████| 65/65 [00:00<00:00, 68568.85it/s]
100%|██████████| 144/144 [00:00<00:00, 74208.11it/s]
100%|██████████| 30/30 [00:00<00:00, 67288.30it/s]
100%|██████████| 130/130 [00:00<00:00, 66870.19it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78051.82it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 166.48it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 66271.94it/s]
100%|██████████| 287/287 [00:00<00:00, 81429.02it/s]
100%|██████████| 771/771 [00:00<00:00, 90522.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79013.33it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81736.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78431.92it/s]
100%|██████████| 353/353 [00:00<00:00, 80955.18it/s]
100%|██████████| 252/252 [00:00<00:00, 75127.20it/s]
100%|██████████| 203/203 [00:00<00:00, 69443.25it/s]
100%|██████████| 153/153 [00:00<00:00, 73073.16it/s]
100%|██████████| 200/200 [00:00<00:00, 76253.14it/s]
100%|██████████| 65/65 [00:00<00:00, 75856.92it/s]
100%|██████████| 144/144 [00:00<00:00, 79923.22it/s]
100%|██████████| 30/30 [00:00<00:00, 59719.56it/s]
100%|██████████| 130/130 [00:00<00:00, 79449.15it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76651.09it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [02:41<00:00, 36.14it/s]
INFO:root:The new embedding has 5826 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 48791.99it/s]
100%|██████████| 287/287 [00:00<00:00, 75537.48it/s]
100%|██████████| 771/771 [00:00<00:00, 74886.14it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85512.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 97043.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77687.64it/s]
100%|██████████| 353/353 [00:00<00:00, 92202.60it/s]
100%|██████████| 252/252 [00:00<00:00, 88545.25it/s]
100%|██████████| 203/203 [00:00<00:00, 81853.85it/s]
100%|██████████| 153/153 [00:00<00:00, 73441.12it/s]
100%|██████████| 200/200 [00:00<00:00, 73830.38it/s]
100%|██████████| 65/65 [00:00<00:00, 70120.82it/s]
100%|██████████| 144/144 [00:00<00:00, 71714.53it/s]
100%|██████████| 30/30 [00:00<00:00, 53340.03it/s]
100%|██████████| 130/130 [00:00<00:00, 65175.65it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83700.98it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [01:12<00:00, 80.87it/s]
INFO:root:The new embedding has 5826 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 74761.98it/s]
100%|██████████| 287/287 [00:00<00:00, 89049.06it/s]
100%|██████████| 771/771 [00:00<00:00, 74186.93it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96093.84it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88366.25it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87114.55it/s]
100%|██████████| 353/353 [00:00<00:00, 54051.89it/s]
100%|██████████| 252/252 [00:00<00:00, 51353.83it/s]
100%|██████████| 203/203 [00:00<00:00, 54688.40it/s]
100%|██████████| 153/153 [00:00<00:00, 77785.27it/s]
100%|██████████| 200/200 [00:00<00:00, 54099.11it/s]
100%|██████████| 65/65 [00:00<00:00, 53667.28it/s]
100%|██████████| 144/144 [00:00<00:00, 55805.21it/s]
100%|██████████| 30/30 [00:00<00:00, 50251.25it/s]
100%|██████████| 130/130 [00:00<00:00, 55502.80it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75469.70it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [01:13<00:00, 79.91it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 83347.12it/s]
100%|██████████| 287/287 [00:00<00:00, 80170.85it/s]
100%|██████████| 771/771 [00:00<00:00, 80147.92it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78437.06it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81118.32it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78045.18it/s]
100%|██████████| 353/353 [00:00<00:00, 80444.95it/s]
100%|██████████| 252/252 [00:00<00:00, 80267.66it/s]
100%|██████████| 203/203 [00:00<00:00, 78164.30it/s]
100%|██████████| 153/153 [00:00<00:00, 78904.28it/s]
100%|██████████| 200/200 [00:00<00:00, 78581.81it/s]
100%|██████████| 65/65 [00:00<00:00, 67599.74it/s]
100%|██████████| 144/144 [00:00<00:00, 77087.40it/s]
100%|██████████| 30/30 [00:00<00:00, 58579.66it/s]
100%|██████████| 130/130 [00:00<00:00, 75552.10it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77722.88it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [01:12<00:00, 80.97it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82415.96it/s]
100%|██████████| 287/287 [00:00<00:00, 73954.98it/s]
100%|██████████| 771/771 [00:00<00:00, 74825.50it/s]
100%|██████████| 2000/2000 [00:00<00:00, 98409.33it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84336.44it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91726.89it/s]
100%|██████████| 353/353 [00:00<00:00, 79988.62it/s]
100%|██████████| 252/252 [00:00<00:00, 77331.33it/s]
100%|██████████| 203/203 [00:00<00:00, 76824.30it/s]
100%|██████████| 153/153 [00:00<00:00, 76798.53it/s]
100%|██████████| 200/200 [00:00<00:00, 76475.59it/s]
100%|██████████| 65/65 [00:00<00:00, 71462.58it/s]
100%|██████████| 144/144 [00:00<00:00, 72865.22it/s]
100%|██████████| 30/30 [00:00<00:00, 47771.12it/s]
100%|██████████| 130/130 [00:00<00:00, 74478.83it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79329.40it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [01:05<00:00, 88.81it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 77655.02it/s]
100%|██████████| 287/287 [00:00<00:00, 77233.75it/s]
100%|██████████| 771/771 [00:00<00:00, 90418.24it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82577.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84202.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74333.26it/s]
100%|██████████| 353/353 [00:00<00:00, 84857.25it/s]
100%|██████████| 252/252 [00:00<00:00, 71411.70it/s]
100%|██████████| 203/203 [00:00<00:00, 63927.00it/s]
100%|██████████| 153/153 [00:00<00:00, 71042.68it/s]
100%|██████████| 200/200 [00:00<00:00, 72938.07it/s]
100%|██████████| 65/65 [00:00<00:00, 72837.23it/s]
100%|██████████| 144/144 [00:00<00:00, 70789.94it/s]
100%|██████████| 30/30 [00:00<00:00, 65095.25it/s]
100%|██████████| 130/130 [00:00<00:00, 69923.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91472.55it/s]
100%|██████████| 2034/

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:24<00:00, 235.61it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 63303.31it/s]
100%|██████████| 287/287 [00:00<00:00, 73057.31it/s]
100%|██████████| 771/771 [00:00<00:00, 75505.11it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76130.65it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93113.64it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82807.38it/s]
100%|██████████| 353/353 [00:00<00:00, 85672.34it/s]
100%|██████████| 252/252 [00:00<00:00, 73415.61it/s]
100%|██████████| 203/203 [00:00<00:00, 74309.98it/s]
100%|██████████| 153/153 [00:00<00:00, 68988.23it/s]
100%|██████████| 200/200 [00:00<00:00, 72786.19it/s]
100%|██████████| 65/65 [00:00<00:00, 71556.37it/s]
100%|██████████| 144/144 [00:00<00:00, 74620.68it/s]
100%|██████████| 30/30 [00:00<00:00, 63009.07it/s]
100%|██████████| 130/130 [00:00<00:00, 61382.36it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86776.99it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:38<00:00, 153.56it/s]
INFO:root:The new embedding has 5828 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 64930.73it/s]
100%|██████████| 287/287 [00:00<00:00, 90733.79it/s]
100%|██████████| 771/771 [00:00<00:00, 85898.17it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81495.81it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92229.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93943.69it/s]
100%|██████████| 353/353 [00:00<00:00, 72153.48it/s]
100%|██████████| 252/252 [00:00<00:00, 78108.53it/s]
100%|██████████| 203/203 [00:00<00:00, 69352.75it/s]
100%|██████████| 153/153 [00:00<00:00, 70995.52it/s]
100%|██████████| 200/200 [00:00<00:00, 68534.38it/s]
100%|██████████| 65/65 [00:00<00:00, 73405.97it/s]
100%|██████████| 144/144 [00:00<00:00, 69160.63it/s]
100%|██████████| 30/30 [00:00<00:00, 62539.32it/s]
100%|██████████| 130/130 [00:00<00:00, 60956.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88399.51it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:26<00:00, 216.86it/s]
INFO:root:The new embedding has 5828 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 87097.98it/s]
100%|██████████| 287/287 [00:00<00:00, 68971.82it/s]
100%|██████████| 771/771 [00:00<00:00, 83979.75it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94263.55it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81892.81it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93777.06it/s]
100%|██████████| 353/353 [00:00<00:00, 75374.91it/s]
100%|██████████| 252/252 [00:00<00:00, 72969.60it/s]
100%|██████████| 203/203 [00:00<00:00, 69801.91it/s]
100%|██████████| 153/153 [00:00<00:00, 67578.82it/s]
100%|██████████| 200/200 [00:00<00:00, 75038.98it/s]
100%|██████████| 65/65 [00:00<00:00, 63343.35it/s]
100%|██████████| 144/144 [00:00<00:00, 70723.63it/s]
100%|██████████| 30/30 [00:00<00:00, 38106.94it/s]
100%|██████████| 130/130 [00:00<00:00, 66220.49it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88585.14it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:27<00:00, 216.29it/s]
INFO:root:The new embedding has 5828 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79855.72it/s]
100%|██████████| 287/287 [00:00<00:00, 72446.15it/s]
100%|██████████| 771/771 [00:00<00:00, 79562.27it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77549.51it/s]
100%|██████████| 1000/1000 [00:00<00:00, 61224.46it/s]
100%|██████████| 3000/3000 [00:00<00:00, 58775.58it/s]
100%|██████████| 353/353 [00:00<00:00, 73804.36it/s]
100%|██████████| 252/252 [00:00<00:00, 77348.31it/s]
100%|██████████| 203/203 [00:00<00:00, 77186.45it/s]
100%|██████████| 153/153 [00:00<00:00, 72307.44it/s]
100%|██████████| 200/200 [00:00<00:00, 78157.16it/s]
100%|██████████| 65/65 [00:00<00:00, 71858.13it/s]
100%|██████████| 144/144 [00:00<00:00, 76695.84it/s]
100%|██████████| 30/30 [00:00<00:00, 68796.68it/s]
100%|██████████| 130/130 [00:00<00:00, 41064.88it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76561.55it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:26<00:00, 216.54it/s]
INFO:root:The new embedding has 5828 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79931.89it/s]
100%|██████████| 287/287 [00:00<00:00, 67993.97it/s]
100%|██████████| 771/771 [00:00<00:00, 89287.33it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80074.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79327.90it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79321.90it/s]
100%|██████████| 353/353 [00:00<00:00, 75776.10it/s]
100%|██████████| 252/252 [00:00<00:00, 74930.14it/s]
100%|██████████| 203/203 [00:00<00:00, 75690.61it/s]
100%|██████████| 153/153 [00:00<00:00, 74723.86it/s]
100%|██████████| 200/200 [00:00<00:00, 70658.76it/s]
100%|██████████| 65/65 [00:00<00:00, 66060.03it/s]
100%|██████████| 144/144 [00:00<00:00, 78438.93it/s]
100%|██████████| 30/30 [00:00<00:00, 71453.22it/s]
100%|██████████| 130/130 [00:00<00:00, 79229.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90486.98it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:42<00:00, 137.04it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 53982.35it/s]
100%|██████████| 287/287 [00:00<00:00, 53816.40it/s]
100%|██████████| 771/771 [00:00<00:00, 53715.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 53624.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 54859.06it/s]
100%|██████████| 3000/3000 [00:00<00:00, 71992.04it/s]
100%|██████████| 353/353 [00:00<00:00, 73216.76it/s]
100%|██████████| 252/252 [00:00<00:00, 73872.28it/s]
100%|██████████| 203/203 [00:00<00:00, 73148.09it/s]
100%|██████████| 153/153 [00:00<00:00, 73863.78it/s]
100%|██████████| 200/200 [00:00<00:00, 74858.18it/s]
100%|██████████| 65/65 [00:00<00:00, 67953.58it/s]
100%|██████████| 144/144 [00:00<00:00, 72926.80it/s]
100%|██████████| 30/30 [00:00<00:00, 67613.71it/s]
100%|██████████| 130/130 [00:00<00:00, 63145.28it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71747.96it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 139.55it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 78804.42it/s]
100%|██████████| 287/287 [00:00<00:00, 73355.59it/s]
100%|██████████| 771/771 [00:00<00:00, 77812.47it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93648.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76033.36it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88148.35it/s]
100%|██████████| 353/353 [00:00<00:00, 72885.17it/s]
100%|██████████| 252/252 [00:00<00:00, 71431.01it/s]
100%|██████████| 203/203 [00:00<00:00, 65819.71it/s]
100%|██████████| 153/153 [00:00<00:00, 67986.92it/s]
100%|██████████| 200/200 [00:00<00:00, 77961.04it/s]
100%|██████████| 65/65 [00:00<00:00, 67018.13it/s]
100%|██████████| 144/144 [00:00<00:00, 68782.57it/s]
100%|██████████| 30/30 [00:00<00:00, 52341.56it/s]
100%|██████████| 130/130 [00:00<00:00, 69450.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89638.30it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.86it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81156.49it/s]
100%|██████████| 287/287 [00:00<00:00, 80551.74it/s]
100%|██████████| 771/771 [00:00<00:00, 79256.12it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79775.26it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82162.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79619.03it/s]
100%|██████████| 353/353 [00:00<00:00, 80458.06it/s]
100%|██████████| 252/252 [00:00<00:00, 77456.00it/s]
100%|██████████| 203/203 [00:00<00:00, 66706.65it/s]
100%|██████████| 153/153 [00:00<00:00, 79589.30it/s]
100%|██████████| 200/200 [00:00<00:00, 80243.05it/s]
100%|██████████| 65/65 [00:00<00:00, 76089.80it/s]
100%|██████████| 144/144 [00:00<00:00, 79659.69it/s]
100%|██████████| 30/30 [00:00<00:00, 66121.45it/s]
100%|██████████| 130/130 [00:00<00:00, 76959.71it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78142.39it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 139.53it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81235.16it/s]
100%|██████████| 287/287 [00:00<00:00, 78764.98it/s]
100%|██████████| 771/771 [00:00<00:00, 81003.17it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79801.82it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81816.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78830.92it/s]
100%|██████████| 353/353 [00:00<00:00, 81377.89it/s]
100%|██████████| 252/252 [00:00<00:00, 78282.08it/s]
100%|██████████| 203/203 [00:00<00:00, 73967.83it/s]
100%|██████████| 153/153 [00:00<00:00, 68729.63it/s]
100%|██████████| 200/200 [00:00<00:00, 75716.29it/s]
100%|██████████| 65/65 [00:00<00:00, 68055.36it/s]
100%|██████████| 144/144 [00:00<00:00, 74777.74it/s]
100%|██████████| 30/30 [00:00<00:00, 57351.47it/s]
100%|██████████| 130/130 [00:00<00:00, 71839.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78407.84it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 151.65it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 87043.70it/s]
100%|██████████| 287/287 [00:00<00:00, 71703.91it/s]
100%|██████████| 771/771 [00:00<00:00, 90939.49it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91155.75it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92121.77it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90121.27it/s]
100%|██████████| 353/353 [00:00<00:00, 81503.32it/s]
100%|██████████| 252/252 [00:00<00:00, 69821.95it/s]
100%|██████████| 203/203 [00:00<00:00, 71906.40it/s]
100%|██████████| 153/153 [00:00<00:00, 73123.12it/s]
100%|██████████| 200/200 [00:00<00:00, 71679.13it/s]
100%|██████████| 65/65 [00:00<00:00, 63862.68it/s]
100%|██████████| 144/144 [00:00<00:00, 69042.04it/s]
100%|██████████| 30/30 [00:00<00:00, 60611.33it/s]
100%|██████████| 130/130 [00:00<00:00, 60282.98it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86285.81it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 166.60it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 84034.13it/s]
100%|██████████| 287/287 [00:00<00:00, 70453.31it/s]
100%|██████████| 771/771 [00:00<00:00, 90443.53it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92635.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91763.02it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90111.59it/s]
100%|██████████| 353/353 [00:00<00:00, 78028.42it/s]
100%|██████████| 252/252 [00:00<00:00, 71785.15it/s]
100%|██████████| 203/203 [00:00<00:00, 73299.22it/s]
100%|██████████| 153/153 [00:00<00:00, 74576.24it/s]
100%|██████████| 200/200 [00:00<00:00, 70051.01it/s]
100%|██████████| 65/65 [00:00<00:00, 61890.98it/s]
100%|██████████| 144/144 [00:00<00:00, 70673.97it/s]
100%|██████████| 30/30 [00:00<00:00, 46968.69it/s]
100%|██████████| 130/130 [00:00<00:00, 64989.22it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90531.06it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 164.20it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79851.16it/s]
100%|██████████| 287/287 [00:00<00:00, 80144.16it/s]
100%|██████████| 771/771 [00:00<00:00, 87181.10it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89385.05it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93037.22it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79587.81it/s]
100%|██████████| 353/353 [00:00<00:00, 71339.95it/s]
100%|██████████| 252/252 [00:00<00:00, 77952.99it/s]
100%|██████████| 203/203 [00:00<00:00, 79093.70it/s]
100%|██████████| 153/153 [00:00<00:00, 76624.30it/s]
100%|██████████| 200/200 [00:00<00:00, 73173.48it/s]
100%|██████████| 65/65 [00:00<00:00, 67717.28it/s]
100%|██████████| 144/144 [00:00<00:00, 76910.71it/s]
100%|██████████| 30/30 [00:00<00:00, 61082.10it/s]
100%|██████████| 130/130 [00:00<00:00, 77617.01it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90233.91it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 166.82it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77416.85it/s]
100%|██████████| 287/287 [00:00<00:00, 80827.59it/s]
100%|██████████| 771/771 [00:00<00:00, 79289.16it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79424.79it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83616.83it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79618.53it/s]
100%|██████████| 353/353 [00:00<00:00, 80615.77it/s]
100%|██████████| 252/252 [00:00<00:00, 81292.46it/s]
100%|██████████| 203/203 [00:00<00:00, 71955.02it/s]
100%|██████████| 153/153 [00:00<00:00, 76414.45it/s]
100%|██████████| 200/200 [00:00<00:00, 79249.96it/s]
100%|██████████| 65/65 [00:00<00:00, 70265.40it/s]
100%|██████████| 144/144 [00:00<00:00, 78114.30it/s]
100%|██████████| 30/30 [00:00<00:00, 53498.78it/s]
100%|██████████| 130/130 [00:00<00:00, 73120.49it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79785.12it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 144.69it/s]
INFO:root:The new embedding has 5846 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 88666.43it/s]
100%|██████████| 287/287 [00:00<00:00, 74823.80it/s]
100%|██████████| 771/771 [00:00<00:00, 90870.50it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82213.04it/s]
100%|██████████| 1000/1000 [00:00<00:00, 97157.84it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82554.21it/s]
100%|██████████| 353/353 [00:00<00:00, 75141.56it/s]
100%|██████████| 252/252 [00:00<00:00, 75422.05it/s]
100%|██████████| 203/203 [00:00<00:00, 76713.55it/s]
100%|██████████| 153/153 [00:00<00:00, 76982.79it/s]
100%|██████████| 200/200 [00:00<00:00, 67584.66it/s]
100%|██████████| 65/65 [00:00<00:00, 64087.86it/s]
100%|██████████| 144/144 [00:00<00:00, 64923.12it/s]
100%|██████████| 30/30 [00:00<00:00, 60993.27it/s]
100%|██████████| 130/130 [00:00<00:00, 65804.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 68328.95it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:47<00:00, 123.66it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 83536.55it/s]
100%|██████████| 287/287 [00:00<00:00, 72796.64it/s]
100%|██████████| 771/771 [00:00<00:00, 87992.39it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87207.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77320.06it/s]
100%|██████████| 3000/3000 [00:00<00:00, 94380.57it/s]
100%|██████████| 353/353 [00:00<00:00, 81959.00it/s]
100%|██████████| 252/252 [00:00<00:00, 76931.70it/s]
100%|██████████| 203/203 [00:00<00:00, 81462.28it/s]
100%|██████████| 153/153 [00:00<00:00, 71862.10it/s]
100%|██████████| 200/200 [00:00<00:00, 69765.54it/s]
100%|██████████| 65/65 [00:00<00:00, 66188.34it/s]
100%|██████████| 144/144 [00:00<00:00, 71291.29it/s]
100%|██████████| 30/30 [00:00<00:00, 60262.99it/s]
100%|██████████| 130/130 [00:00<00:00, 69081.40it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90242.23it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:47<00:00, 123.25it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76492.56it/s]
100%|██████████| 287/287 [00:00<00:00, 74315.67it/s]
100%|██████████| 771/771 [00:00<00:00, 77164.46it/s]
100%|██████████| 2000/2000 [00:00<00:00, 103178.37it/s]
100%|██████████| 1000/1000 [00:00<00:00, 95679.54it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98830.58it/s]
100%|██████████| 353/353 [00:00<00:00, 78851.22it/s]
100%|██████████| 252/252 [00:00<00:00, 67331.16it/s]
100%|██████████| 203/203 [00:00<00:00, 78035.35it/s]
100%|██████████| 153/153 [00:00<00:00, 62970.12it/s]
100%|██████████| 200/200 [00:00<00:00, 67786.73it/s]
100%|██████████| 65/65 [00:00<00:00, 60624.81it/s]
100%|██████████| 144/144 [00:00<00:00, 62980.16it/s]
100%|██████████| 30/30 [00:00<00:00, 48733.20it/s]
100%|██████████| 130/130 [00:00<00:00, 74929.16it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79753.05it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:46<00:00, 124.87it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76063.49it/s]
100%|██████████| 287/287 [00:00<00:00, 77318.08it/s]
100%|██████████| 771/771 [00:00<00:00, 79486.00it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79601.15it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79290.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78858.09it/s]
100%|██████████| 353/353 [00:00<00:00, 80598.22it/s]
100%|██████████| 252/252 [00:00<00:00, 79280.27it/s]
100%|██████████| 203/203 [00:00<00:00, 76734.29it/s]
100%|██████████| 153/153 [00:00<00:00, 77428.63it/s]
100%|██████████| 200/200 [00:00<00:00, 80939.87it/s]
100%|██████████| 65/65 [00:00<00:00, 69958.88it/s]
100%|██████████| 144/144 [00:00<00:00, 75554.14it/s]
100%|██████████| 30/30 [00:00<00:00, 57195.05it/s]
100%|██████████| 130/130 [00:00<00:00, 76313.44it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77326.98it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 165.28it/s]
INFO:root:The new embedding has 5843 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 79292.06it/s]
100%|██████████| 287/287 [00:00<00:00, 71119.30it/s]
100%|██████████| 771/771 [00:00<00:00, 80697.94it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91986.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92919.74it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88057.67it/s]
100%|██████████| 353/353 [00:00<00:00, 73697.83it/s]
100%|██████████| 252/252 [00:00<00:00, 73374.84it/s]
100%|██████████| 203/203 [00:00<00:00, 65415.16it/s]
100%|██████████| 153/153 [00:00<00:00, 61984.79it/s]
100%|██████████| 200/200 [00:00<00:00, 88468.76it/s]
100%|██████████| 65/65 [00:00<00:00, 64497.22it/s]
100%|██████████| 144/144 [00:00<00:00, 70864.69it/s]
100%|██████████| 30/30 [00:00<00:00, 39681.21it/s]
100%|██████████| 130/130 [00:00<00:00, 72277.24it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84662.07it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.36it/s]
INFO:root:The new embedding has 5843 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 72803.10it/s]
100%|██████████| 287/287 [00:00<00:00, 78672.33it/s]
100%|██████████| 771/771 [00:00<00:00, 90697.19it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92052.01it/s]
100%|██████████| 1000/1000 [00:00<00:00, 96310.08it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88038.57it/s]
100%|██████████| 353/353 [00:00<00:00, 86716.02it/s]
100%|██████████| 252/252 [00:00<00:00, 72290.86it/s]
100%|██████████| 203/203 [00:00<00:00, 72953.79it/s]
100%|██████████| 153/153 [00:00<00:00, 71342.80it/s]
100%|██████████| 200/200 [00:00<00:00, 73797.91it/s]
100%|██████████| 65/65 [00:00<00:00, 60143.34it/s]
100%|██████████| 144/144 [00:00<00:00, 84757.20it/s]
100%|██████████| 30/30 [00:00<00:00, 62137.84it/s]
100%|██████████| 130/130 [00:00<00:00, 60416.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90138.06it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 165.46it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81649.90it/s]
100%|██████████| 287/287 [00:00<00:00, 79756.53it/s]
100%|██████████| 771/771 [00:00<00:00, 79947.80it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78916.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 60663.05it/s]
100%|██████████| 3000/3000 [00:00<00:00, 59631.55it/s]
100%|██████████| 353/353 [00:00<00:00, 54287.73it/s]
100%|██████████| 252/252 [00:00<00:00, 57823.98it/s]
100%|██████████| 203/203 [00:00<00:00, 58398.06it/s]
100%|██████████| 153/153 [00:00<00:00, 57108.53it/s]
100%|██████████| 200/200 [00:00<00:00, 58571.48it/s]
100%|██████████| 65/65 [00:00<00:00, 56880.82it/s]
100%|██████████| 144/144 [00:00<00:00, 58378.10it/s]
100%|██████████| 30/30 [00:00<00:00, 53498.78it/s]
100%|██████████| 130/130 [00:00<00:00, 60490.30it/s]
100%|██████████| 3500/3500 [00:00<00:00, 58107.80it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.09it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80122.95it/s]
100%|██████████| 287/287 [00:00<00:00, 78451.85it/s]
100%|██████████| 771/771 [00:00<00:00, 79687.75it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77114.64it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81722.08it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77774.07it/s]
100%|██████████| 353/353 [00:00<00:00, 80910.94it/s]
100%|██████████| 252/252 [00:00<00:00, 77958.74it/s]
100%|██████████| 203/203 [00:00<00:00, 71688.45it/s]
100%|██████████| 153/153 [00:00<00:00, 76232.90it/s]
100%|██████████| 200/200 [00:00<00:00, 77543.06it/s]
100%|██████████| 65/65 [00:00<00:00, 56880.82it/s]
100%|██████████| 144/144 [00:00<00:00, 76087.15it/s]
100%|██████████| 30/30 [00:00<00:00, 52847.17it/s]
100%|██████████| 130/130 [00:00<00:00, 78533.71it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77080.13it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 164.99it/s]
INFO:root:The new embedding has 5846 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 77855.58it/s]
100%|██████████| 287/287 [00:00<00:00, 74740.17it/s]
100%|██████████| 771/771 [00:00<00:00, 82583.59it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91195.39it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78543.55it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90544.74it/s]
100%|██████████| 353/353 [00:00<00:00, 77242.76it/s]
100%|██████████| 252/252 [00:00<00:00, 74418.41it/s]
100%|██████████| 203/203 [00:00<00:00, 76824.30it/s]
100%|██████████| 153/153 [00:00<00:00, 64057.55it/s]
100%|██████████| 200/200 [00:00<00:00, 86418.13it/s]
100%|██████████| 65/65 [00:00<00:00, 66333.27it/s]
100%|██████████| 144/144 [00:00<00:00, 57626.16it/s]
100%|██████████| 30/30 [00:00<00:00, 53137.30it/s]
100%|██████████| 130/130 [00:00<00:00, 70319.77it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86448.41it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 163.49it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 92092.35it/s]
100%|██████████| 287/287 [00:00<00:00, 89719.40it/s]
100%|██████████| 771/771 [00:00<00:00, 92896.16it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88108.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90349.70it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85823.99it/s]
100%|██████████| 353/353 [00:00<00:00, 77892.96it/s]
100%|██████████| 252/252 [00:00<00:00, 85300.99it/s]
100%|██████████| 203/203 [00:00<00:00, 71718.64it/s]
100%|██████████| 153/153 [00:00<00:00, 70776.28it/s]
100%|██████████| 200/200 [00:00<00:00, 82491.97it/s]
100%|██████████| 65/65 [00:00<00:00, 46067.89it/s]
100%|██████████| 144/144 [00:00<00:00, 85561.66it/s]
100%|██████████| 30/30 [00:00<00:00, 52604.15it/s]
100%|██████████| 130/130 [00:00<00:00, 81127.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 65213.14it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 158.52it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 75715.75it/s]
100%|██████████| 287/287 [00:00<00:00, 73602.28it/s]
100%|██████████| 771/771 [00:00<00:00, 63653.89it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85375.89it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90116.75it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89485.49it/s]
100%|██████████| 353/353 [00:00<00:00, 74248.50it/s]
100%|██████████| 252/252 [00:00<00:00, 75234.15it/s]
100%|██████████| 203/203 [00:00<00:00, 71220.72it/s]
100%|██████████| 153/153 [00:00<00:00, 71862.10it/s]
100%|██████████| 200/200 [00:00<00:00, 73468.28it/s]
100%|██████████| 65/65 [00:00<00:00, 64148.18it/s]
100%|██████████| 144/144 [00:00<00:00, 70922.94it/s]
100%|██████████| 30/30 [00:00<00:00, 62820.33it/s]
100%|██████████| 130/130 [00:00<00:00, 71210.59it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82674.78it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 151.66it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 58345.07it/s]
100%|██████████| 287/287 [00:00<00:00, 76560.79it/s]
100%|██████████| 771/771 [00:00<00:00, 80825.00it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85994.67it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72338.04it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91392.45it/s]
100%|██████████| 353/353 [00:00<00:00, 78872.22it/s]
100%|██████████| 252/252 [00:00<00:00, 72924.29it/s]
100%|██████████| 203/203 [00:00<00:00, 76171.38it/s]
100%|██████████| 153/153 [00:00<00:00, 76088.28it/s]
100%|██████████| 200/200 [00:00<00:00, 79309.90it/s]
100%|██████████| 65/65 [00:00<00:00, 63743.22it/s]
100%|██████████| 144/144 [00:00<00:00, 76443.46it/s]
100%|██████████| 30/30 [00:00<00:00, 59130.23it/s]
100%|██████████| 130/130 [00:00<00:00, 73743.51it/s]
100%|██████████| 3500/3500 [00:00<00:00, 99486.06it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:30<00:00, 194.63it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 79009.48it/s]
100%|██████████| 287/287 [00:00<00:00, 97211.12it/s]
100%|██████████| 771/771 [00:00<00:00, 76527.16it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84915.25it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77149.39it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75140.26it/s]
100%|██████████| 353/353 [00:00<00:00, 76702.55it/s]
100%|██████████| 252/252 [00:00<00:00, 76747.36it/s]
100%|██████████| 203/203 [00:00<00:00, 69499.94it/s]
100%|██████████| 153/153 [00:00<00:00, 75989.17it/s]
100%|██████████| 200/200 [00:00<00:00, 64123.28it/s]
100%|██████████| 65/65 [00:00<00:00, 54222.31it/s]
100%|██████████| 144/144 [00:00<00:00, 73085.65it/s]
100%|██████████| 30/30 [00:00<00:00, 59465.56it/s]
100%|██████████| 130/130 [00:00<00:00, 53667.28it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87998.90it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:28<00:00, 206.52it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 70382.98it/s]
100%|██████████| 287/287 [00:00<00:00, 74772.67it/s]
100%|██████████| 771/771 [00:00<00:00, 86269.40it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81111.26it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83266.58it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87828.40it/s]
100%|██████████| 353/353 [00:00<00:00, 91169.29it/s]
100%|██████████| 252/252 [00:00<00:00, 73040.19it/s]
100%|██████████| 203/203 [00:00<00:00, 79410.90it/s]
100%|██████████| 153/153 [00:00<00:00, 66342.24it/s]
100%|██████████| 200/200 [00:00<00:00, 75321.97it/s]
100%|██████████| 65/65 [00:00<00:00, 62358.13it/s]
100%|██████████| 144/144 [00:00<00:00, 45631.59it/s]
100%|██████████| 30/30 [00:00<00:00, 34971.96it/s]
100%|██████████| 130/130 [00:00<00:00, 59872.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75800.94it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:41<00:00, 142.58it/s]
INFO:root:The new embedding has 5832 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 86511.74it/s]
100%|██████████| 287/287 [00:00<00:00, 54961.43it/s]
100%|██████████| 771/771 [00:00<00:00, 90428.35it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79704.01it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84152.00it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88404.12it/s]
100%|██████████| 353/353 [00:00<00:00, 71803.56it/s]
100%|██████████| 252/252 [00:00<00:00, 51576.86it/s]
100%|██████████| 203/203 [00:00<00:00, 66208.69it/s]
100%|██████████| 153/153 [00:00<00:00, 72348.20it/s]
100%|██████████| 200/200 [00:00<00:00, 54446.73it/s]
100%|██████████| 65/65 [00:00<00:00, 53751.92it/s]
100%|██████████| 144/144 [00:00<00:00, 83055.52it/s]
100%|██████████| 30/30 [00:00<00:00, 58443.62it/s]
100%|██████████| 130/130 [00:00<00:00, 71500.07it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79557.26it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 148.80it/s]
INFO:root:The new embedding has 5832 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 89522.69it/s]
100%|██████████| 287/287 [00:00<00:00, 70075.98it/s]
100%|██████████| 771/771 [00:00<00:00, 87599.10it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80935.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 70973.21it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78598.50it/s]
100%|██████████| 353/353 [00:00<00:00, 63092.40it/s]
100%|██████████| 252/252 [00:00<00:00, 87129.22it/s]
100%|██████████| 203/203 [00:00<00:00, 74707.70it/s]
100%|██████████| 153/153 [00:00<00:00, 68030.16it/s]
100%|██████████| 200/200 [00:00<00:00, 85729.26it/s]
100%|██████████| 65/65 [00:00<00:00, 73445.52it/s]
100%|██████████| 144/144 [00:00<00:00, 70295.60it/s]
100%|██████████| 30/30 [00:00<00:00, 27968.24it/s]
100%|██████████| 130/130 [00:00<00:00, 65599.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88720.06it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 148.54it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 59146.42it/s]
100%|██████████| 287/287 [00:00<00:00, 75932.96it/s]
100%|██████████| 771/771 [00:00<00:00, 82977.74it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88479.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72516.88it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91119.78it/s]
100%|██████████| 353/353 [00:00<00:00, 71388.11it/s]
100%|██████████| 252/252 [00:00<00:00, 54014.95it/s]
100%|██████████| 203/203 [00:00<00:00, 78035.35it/s]
100%|██████████| 153/153 [00:00<00:00, 71797.77it/s]
100%|██████████| 200/200 [00:00<00:00, 79294.91it/s]
100%|██████████| 65/65 [00:00<00:00, 69107.67it/s]
100%|██████████| 144/144 [00:00<00:00, 71544.63it/s]
100%|██████████| 30/30 [00:00<00:00, 58254.22it/s]
100%|██████████| 130/130 [00:00<00:00, 77760.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86106.14it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 148.29it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 89240.51it/s]
100%|██████████| 287/287 [00:00<00:00, 78508.14it/s]
100%|██████████| 771/771 [00:00<00:00, 87565.89it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90808.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93752.60it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88998.76it/s]
100%|██████████| 353/353 [00:00<00:00, 74468.83it/s]
100%|██████████| 252/252 [00:00<00:00, 75958.65it/s]
100%|██████████| 203/203 [00:00<00:00, 77608.58it/s]
100%|██████████| 153/153 [00:00<00:00, 72478.94it/s]
100%|██████████| 200/200 [00:00<00:00, 74519.04it/s]
100%|██████████| 65/65 [00:00<00:00, 74960.07it/s]
100%|██████████| 144/144 [00:00<00:00, 79044.60it/s]
100%|██████████| 30/30 [00:00<00:00, 71820.27it/s]
100%|██████████| 130/130 [00:00<00:00, 68655.19it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90286.63it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.85it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 78816.28it/s]
100%|██████████| 287/287 [00:00<00:00, 71258.23it/s]
100%|██████████| 771/771 [00:00<00:00, 91793.93it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89085.09it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76963.94it/s]
100%|██████████| 3000/3000 [00:00<00:00, 72873.44it/s]
100%|██████████| 353/353 [00:00<00:00, 68195.35it/s]
100%|██████████| 252/252 [00:00<00:00, 51221.93it/s]
100%|██████████| 203/203 [00:00<00:00, 64410.60it/s]
100%|██████████| 153/153 [00:00<00:00, 61633.55it/s]
100%|██████████| 200/200 [00:00<00:00, 39301.95it/s]
100%|██████████| 65/65 [00:00<00:00, 45804.73it/s]
100%|██████████| 144/144 [00:00<00:00, 45909.07it/s]
100%|██████████| 30/30 [00:00<00:00, 36002.61it/s]
100%|██████████| 130/130 [00:00<00:00, 33267.82it/s]
100%|██████████| 3500/3500 [00:00<00:00, 60403.33it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 172.66it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 84512.10it/s]
100%|██████████| 287/287 [00:00<00:00, 72172.51it/s]
100%|██████████| 771/771 [00:00<00:00, 84752.29it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88955.66it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93202.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88790.26it/s]
100%|██████████| 353/353 [00:00<00:00, 76778.12it/s]
100%|██████████| 252/252 [00:00<00:00, 75610.89it/s]
100%|██████████| 203/203 [00:00<00:00, 72543.56it/s]
100%|██████████| 153/153 [00:00<00:00, 61954.87it/s]
100%|██████████| 200/200 [00:00<00:00, 69928.38it/s]
100%|██████████| 65/65 [00:00<00:00, 62948.46it/s]
100%|██████████| 144/144 [00:00<00:00, 75972.30it/s]
100%|██████████| 30/30 [00:00<00:00, 64660.39it/s]
100%|██████████| 130/130 [00:00<00:00, 70776.16it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84843.11it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:47<00:00, 122.34it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 80359.59it/s]
100%|██████████| 287/287 [00:00<00:00, 87840.43it/s]
100%|██████████| 771/771 [00:00<00:00, 83931.80it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91816.25it/s]
100%|██████████| 1000/1000 [00:00<00:00, 96980.37it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91689.46it/s]
100%|██████████| 353/353 [00:00<00:00, 75694.75it/s]
100%|██████████| 252/252 [00:00<00:00, 73960.16it/s]
100%|██████████| 203/203 [00:00<00:00, 77263.49it/s]
100%|██████████| 153/153 [00:00<00:00, 72940.27it/s]
100%|██████████| 200/200 [00:00<00:00, 72912.72it/s]
100%|██████████| 65/65 [00:00<00:00, 65900.35it/s]
100%|██████████| 144/144 [00:00<00:00, 70287.42it/s]
100%|██████████| 30/30 [00:00<00:00, 64133.09it/s]
100%|██████████| 130/130 [00:00<00:00, 74703.32it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81933.26it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:33<00:00, 174.52it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 86397.58it/s]
100%|██████████| 287/287 [00:00<00:00, 78651.76it/s]
100%|██████████| 771/771 [00:00<00:00, 85691.04it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91100.31it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86146.57it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87204.50it/s]
100%|██████████| 353/353 [00:00<00:00, 91298.59it/s]
100%|██████████| 252/252 [00:00<00:00, 79149.66it/s]
100%|██████████| 203/203 [00:00<00:00, 88645.88it/s]
100%|██████████| 153/153 [00:00<00:00, 64192.11it/s]
100%|██████████| 200/200 [00:00<00:00, 67836.07it/s]
100%|██████████| 65/65 [00:00<00:00, 45590.26it/s]
100%|██████████| 144/144 [00:00<00:00, 63456.58it/s]
100%|██████████| 30/30 [00:00<00:00, 50091.21it/s]
100%|██████████| 130/130 [00:00<00:00, 56252.92it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74256.50it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 164.29it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 72290.63it/s]
100%|██████████| 287/287 [00:00<00:00, 99608.21it/s]
100%|██████████| 771/771 [00:00<00:00, 80841.17it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81243.24it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83076.91it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90445.16it/s]
100%|██████████| 353/353 [00:00<00:00, 79358.38it/s]
100%|██████████| 252/252 [00:00<00:00, 79441.16it/s]
100%|██████████| 203/203 [00:00<00:00, 76348.97it/s]
100%|██████████| 153/153 [00:00<00:00, 76780.15it/s]
100%|██████████| 200/200 [00:00<00:00, 76246.21it/s]
100%|██████████| 65/65 [00:00<00:00, 69142.72it/s]
100%|██████████| 144/144 [00:00<00:00, 77126.78it/s]
100%|██████████| 30/30 [00:00<00:00, 71412.67it/s]
100%|██████████| 130/130 [00:00<00:00, 64087.86it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76595.10it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:33<00:00, 174.06it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 83680.02it/s]
100%|██████████| 287/287 [00:00<00:00, 77447.42it/s]
100%|██████████| 771/771 [00:00<00:00, 77885.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84336.44it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81179.55it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92003.22it/s]
100%|██████████| 353/353 [00:00<00:00, 80135.81it/s]
100%|██████████| 252/252 [00:00<00:00, 67963.26it/s]
100%|██████████| 203/203 [00:00<00:00, 77700.65it/s]
100%|██████████| 153/153 [00:00<00:00, 78470.10it/s]
100%|██████████| 200/200 [00:00<00:00, 78303.07it/s]
100%|██████████| 65/65 [00:00<00:00, 64973.73it/s]
100%|██████████| 144/144 [00:00<00:00, 63657.23it/s]
100%|██████████| 30/30 [00:00<00:00, 54684.54it/s]
100%|██████████| 130/130 [00:00<00:00, 79310.48it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85554.14it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 147.17it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 54312.62it/s]
100%|██████████| 287/287 [00:00<00:00, 53720.33it/s]
100%|██████████| 771/771 [00:00<00:00, 54178.53it/s]
100%|██████████| 2000/2000 [00:00<00:00, 53987.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 55726.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 53918.06it/s]
100%|██████████| 353/353 [00:00<00:00, 54373.46it/s]
100%|██████████| 252/252 [00:00<00:00, 53073.79it/s]
100%|██████████| 203/203 [00:00<00:00, 54422.74it/s]
100%|██████████| 153/153 [00:00<00:00, 54783.04it/s]
100%|██████████| 200/200 [00:00<00:00, 54859.77it/s]
100%|██████████| 65/65 [00:00<00:00, 52855.71it/s]
100%|██████████| 144/144 [00:00<00:00, 51267.28it/s]
100%|██████████| 30/30 [00:00<00:00, 46534.44it/s]
100%|██████████| 130/130 [00:00<00:00, 67885.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90176.26it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 164.58it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 73940.07it/s]
100%|██████████| 287/287 [00:00<00:00, 72942.21it/s]
100%|██████████| 771/771 [00:00<00:00, 83614.95it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75306.42it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76713.38it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74095.15it/s]
100%|██████████| 353/353 [00:00<00:00, 74140.68it/s]
100%|██████████| 252/252 [00:00<00:00, 74183.37it/s]
100%|██████████| 203/203 [00:00<00:00, 72217.45it/s]
100%|██████████| 153/153 [00:00<00:00, 72750.09it/s]
100%|██████████| 200/200 [00:00<00:00, 74268.33it/s]
100%|██████████| 65/65 [00:00<00:00, 64896.40it/s]
100%|██████████| 144/144 [00:00<00:00, 71825.40it/s]
100%|██████████| 30/30 [00:00<00:00, 51442.81it/s]
100%|██████████| 130/130 [00:00<00:00, 73061.71it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77064.34it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 163.42it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82292.94it/s]
100%|██████████| 287/287 [00:00<00:00, 80401.10it/s]
100%|██████████| 771/771 [00:00<00:00, 83287.62it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81479.18it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83050.59it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82442.78it/s]
100%|██████████| 353/353 [00:00<00:00, 80686.07it/s]
100%|██████████| 252/252 [00:00<00:00, 78143.18it/s]
100%|██████████| 203/203 [00:00<00:00, 80030.43it/s]
100%|██████████| 153/153 [00:00<00:00, 76862.92it/s]
100%|██████████| 200/200 [00:00<00:00, 77939.31it/s]
100%|██████████| 65/65 [00:00<00:00, 68534.38it/s]
100%|██████████| 144/144 [00:00<00:00, 80799.97it/s]
100%|██████████| 30/30 [00:00<00:00, 68052.53it/s]
100%|██████████| 130/130 [00:00<00:00, 73653.86it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78095.42it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 165.62it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78717.07it/s]
100%|██████████| 287/287 [00:00<00:00, 78987.22it/s]
100%|██████████| 771/771 [00:00<00:00, 81431.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80521.10it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80212.35it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84283.90it/s]
100%|██████████| 353/353 [00:00<00:00, 80633.34it/s]
100%|██████████| 252/252 [00:00<00:00, 78972.25it/s]
100%|██████████| 203/203 [00:00<00:00, 78279.28it/s]
100%|██████████| 153/153 [00:00<00:00, 76124.38it/s]
100%|██████████| 200/200 [00:00<00:00, 72384.23it/s]
100%|██████████| 65/65 [00:00<00:00, 69318.53it/s]
100%|██████████| 144/144 [00:00<00:00, 77983.19it/s]
100%|██████████| 30/30 [00:00<00:00, 69365.56it/s]
100%|██████████| 130/130 [00:00<00:00, 72808.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84531.42it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [04:00<00:00, 24.26it/s]
INFO:root:The new embedding has 5826 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 63938.93it/s]
100%|██████████| 287/287 [00:00<00:00, 66061.09it/s]
100%|██████████| 771/771 [00:00<00:00, 67921.45it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87972.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76590.11it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82680.60it/s]
100%|██████████| 353/353 [00:00<00:00, 62288.15it/s]
100%|██████████| 252/252 [00:00<00:00, 72648.61it/s]
100%|██████████| 203/203 [00:00<00:00, 69099.47it/s]
100%|██████████| 153/153 [00:00<00:00, 69316.11it/s]
100%|██████████| 200/200 [00:00<00:00, 74638.38it/s]
100%|██████████| 65/65 [00:00<00:00, 76196.13it/s]
100%|██████████| 144/144 [00:00<00:00, 96807.14it/s]
100%|██████████| 30/30 [00:00<00:00, 66121.45it/s]
100%|██████████| 130/130 [00:00<00:00, 62508.26it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81827.31it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [02:48<00:00, 34.74it/s]
INFO:root:The new embedding has 5826 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 68027.89it/s]
100%|██████████| 287/287 [00:00<00:00, 53871.79it/s]
100%|██████████| 771/771 [00:00<00:00, 54386.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 66575.73it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76482.57it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73164.12it/s]
100%|██████████| 353/353 [00:00<00:00, 74551.32it/s]
100%|██████████| 252/252 [00:00<00:00, 74115.74it/s]
100%|██████████| 203/203 [00:00<00:00, 76451.80it/s]
100%|██████████| 153/153 [00:00<00:00, 76459.97it/s]
100%|██████████| 200/200 [00:00<00:00, 73084.23it/s]
100%|██████████| 65/65 [00:00<00:00, 62400.95it/s]
100%|██████████| 144/144 [00:00<00:00, 71039.73it/s]
100%|██████████| 30/30 [00:00<00:00, 53249.73it/s]
100%|██████████| 130/130 [00:00<00:00, 73120.49it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86398.04it/s]
100%|██████████| 2034/

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [02:58<00:00, 32.67it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 58292.31it/s]
100%|██████████| 287/287 [00:00<00:00, 77021.26it/s]
100%|██████████| 771/771 [00:00<00:00, 80593.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 100696.32it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78071.33it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88566.53it/s]
100%|██████████| 353/353 [00:00<00:00, 78396.13it/s]
100%|██████████| 252/252 [00:00<00:00, 77495.76it/s]
100%|██████████| 203/203 [00:00<00:00, 76789.66it/s]
100%|██████████| 153/153 [00:00<00:00, 73567.41it/s]
100%|██████████| 200/200 [00:00<00:00, 76517.45it/s]
100%|██████████| 65/65 [00:00<00:00, 67084.09it/s]
100%|██████████| 144/144 [00:00<00:00, 76637.45it/s]
100%|██████████| 30/30 [00:00<00:00, 58497.96it/s]
100%|██████████| 130/130 [00:00<00:00, 55775.32it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93102.13it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [02:53<00:00, 33.64it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79149.77it/s]
100%|██████████| 287/287 [00:00<00:00, 77898.48it/s]
100%|██████████| 771/771 [00:00<00:00, 76819.85it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83059.64it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91630.71it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88089.10it/s]
100%|██████████| 353/353 [00:00<00:00, 80506.19it/s]
100%|██████████| 252/252 [00:00<00:00, 77930.00it/s]
100%|██████████| 203/203 [00:00<00:00, 80889.58it/s]
100%|██████████| 153/153 [00:00<00:00, 75470.84it/s]
100%|██████████| 200/200 [00:00<00:00, 72710.48it/s]
100%|██████████| 65/65 [00:00<00:00, 59357.67it/s]
100%|██████████| 144/144 [00:00<00:00, 78459.31it/s]
100%|██████████| 30/30 [00:00<00:00, 60757.66it/s]
100%|██████████| 130/130 [00:00<00:00, 78578.98it/s]
100%|██████████| 3500/3500 [00:00<00:00, 98015.42it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:32<00:00, 178.93it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 73303.65it/s]
100%|██████████| 287/287 [00:00<00:00, 72524.72it/s]
100%|██████████| 771/771 [00:00<00:00, 73392.23it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92621.18it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81085.39it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89607.20it/s]
100%|██████████| 353/353 [00:00<00:00, 74092.44it/s]
100%|██████████| 252/252 [00:00<00:00, 77353.97it/s]
100%|██████████| 203/203 [00:00<00:00, 73820.33it/s]
100%|██████████| 153/153 [00:00<00:00, 71765.66it/s]
100%|██████████| 200/200 [00:00<00:00, 71514.13it/s]
100%|██████████| 65/65 [00:00<00:00, 65709.75it/s]
100%|██████████| 144/144 [00:00<00:00, 75019.22it/s]
100%|██████████| 30/30 [00:00<00:00, 62851.71it/s]
100%|██████████| 130/130 [00:00<00:00, 68534.38it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90503.71it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:29<00:00, 199.83it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 85617.28it/s]
100%|██████████| 287/287 [00:00<00:00, 74123.48it/s]
100%|██████████| 771/771 [00:00<00:00, 91183.09it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88542.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89092.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91202.99it/s]
100%|██████████| 353/353 [00:00<00:00, 91734.16it/s]
100%|██████████| 252/252 [00:00<00:00, 77122.55it/s]
100%|██████████| 203/203 [00:00<00:00, 74799.59it/s]
100%|██████████| 153/153 [00:00<00:00, 67879.05it/s]
100%|██████████| 200/200 [00:00<00:00, 60646.39it/s]
100%|██████████| 65/65 [00:00<00:00, 64375.39it/s]
100%|██████████| 144/144 [00:00<00:00, 64610.59it/s]
100%|██████████| 30/30 [00:00<00:00, 34072.33it/s]
100%|██████████| 130/130 [00:00<00:00, 59584.69it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91578.69it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:36<00:00, 161.30it/s]
INFO:root:The new embedding has 5825 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 86023.32it/s]
100%|██████████| 287/287 [00:00<00:00, 74578.11it/s]
100%|██████████| 771/771 [00:00<00:00, 75982.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94373.85it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90078.04it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83274.29it/s]
100%|██████████| 353/353 [00:00<00:00, 70679.27it/s]
100%|██████████| 252/252 [00:00<00:00, 74723.55it/s]
100%|██████████| 203/203 [00:00<00:00, 75382.36it/s]
100%|██████████| 153/153 [00:00<00:00, 76853.71it/s]
100%|██████████| 200/200 [00:00<00:00, 73506.91it/s]
100%|██████████| 65/65 [00:00<00:00, 66012.05it/s]
100%|██████████| 144/144 [00:00<00:00, 71748.61it/s]
100%|██████████| 30/30 [00:00<00:00, 63389.98it/s]
100%|██████████| 130/130 [00:00<00:00, 69815.56it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77150.21it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:33<00:00, 176.68it/s]
INFO:root:The new embedding has 5825 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 93853.95it/s]
100%|██████████| 287/287 [00:00<00:00, 78528.62it/s]
100%|██████████| 771/771 [00:00<00:00, 96167.02it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88090.65it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83055.52it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88218.80it/s]
100%|██████████| 353/353 [00:00<00:00, 73471.09it/s]
100%|██████████| 252/252 [00:00<00:00, 55823.63it/s]
100%|██████████| 203/203 [00:00<00:00, 80958.80it/s]
100%|██████████| 153/153 [00:00<00:00, 72039.57it/s]
100%|██████████| 200/200 [00:00<00:00, 74268.33it/s]
100%|██████████| 65/65 [00:00<00:00, 68362.53it/s]
100%|██████████| 144/144 [00:00<00:00, 63496.61it/s]
100%|██████████| 30/30 [00:00<00:00, 54353.83it/s]
100%|██████████| 130/130 [00:00<00:00, 69116.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84747.11it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:32<00:00, 179.79it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 73889.22it/s]
100%|██████████| 287/287 [00:00<00:00, 78263.13it/s]
100%|██████████| 771/771 [00:00<00:00, 79072.02it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80502.56it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82046.60it/s]
100%|██████████| 3000/3000 [00:00<00:00, 103462.58it/s]
100%|██████████| 353/353 [00:00<00:00, 76726.40it/s]
100%|██████████| 252/252 [00:00<00:00, 74292.87it/s]
100%|██████████| 203/203 [00:00<00:00, 95261.10it/s]
100%|██████████| 153/153 [00:00<00:00, 73500.00it/s]
100%|██████████| 200/200 [00:00<00:00, 76038.87it/s]
100%|██████████| 65/65 [00:00<00:00, 66140.16it/s]
100%|██████████| 144/144 [00:00<00:00, 81071.11it/s]
100%|██████████| 30/30 [00:00<00:00, 55800.05it/s]
100%|██████████| 130/130 [00:00<00:00, 72479.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 97152.05it/s]
100%|██████████| 20

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:32<00:00, 177.43it/s]
INFO:root:The new embedding has 5825 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80605.38it/s]
100%|██████████| 287/287 [00:00<00:00, 77677.31it/s]
100%|██████████| 771/771 [00:00<00:00, 77545.64it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95393.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81436.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80956.53it/s]
100%|██████████| 353/353 [00:00<00:00, 78842.82it/s]
100%|██████████| 252/252 [00:00<00:00, 78649.05it/s]
100%|██████████| 203/203 [00:00<00:00, 76198.65it/s]
100%|██████████| 153/153 [00:00<00:00, 72552.69it/s]
100%|██████████| 200/200 [00:00<00:00, 74978.62it/s]
100%|██████████| 65/65 [00:00<00:00, 75709.46it/s]
100%|██████████| 144/144 [00:00<00:00, 79471.02it/s]
100%|██████████| 30/30 [00:00<00:00, 65844.65it/s]
100%|██████████| 130/130 [00:00<00:00, 76656.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77696.55it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['antedating' 'chronologize']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:45<00:00, 129.23it/s]
INFO:root:The new embedding has 5827 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 73766.94it/s]
100%|██████████| 287/287 [00:00<00:00, 71546.23it/s]
100%|██████████| 771/771 [00:00<00:00, 73755.47it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82780.14it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74970.58it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73455.41it/s]
100%|██████████| 353/353 [00:00<00:00, 73489.32it/s]
100%|██████████| 252/252 [00:00<00:00, 71897.46it/s]
100%|██████████| 203/203 [00:00<00:00, 71423.85it/s]
100%|██████████| 153/153 [00:00<00:00, 53575.60it/s]
100%|██████████| 200/200 [00:00<00:00, 65174.49it/s]
100%|██████████| 65/65 [00:00<00:00, 67067.59it/s]
100%|██████████| 144/144 [00:00<00:00, 62829.48it/s]
100%|██████████| 30/30 [00:00<00:00, 43705.84it/s]
100%|██████████| 130/130 [00:00<00:00, 71829.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87797.85it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 139.39it/s]
INFO:root:The new embedding has 5827 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 93121.83it/s]
100%|██████████| 287/287 [00:00<00:00, 73195.02it/s]
100%|██████████| 771/771 [00:00<00:00, 92267.99it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80442.34it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79815.49it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93016.59it/s]
100%|██████████| 353/353 [00:00<00:00, 74375.31it/s]
100%|██████████| 252/252 [00:00<00:00, 73222.35it/s]
100%|██████████| 203/203 [00:00<00:00, 73910.04it/s]
100%|██████████| 153/153 [00:00<00:00, 70956.27it/s]
100%|██████████| 200/200 [00:00<00:00, 73681.23it/s]
100%|██████████| 65/65 [00:00<00:00, 65804.91it/s]
100%|██████████| 144/144 [00:00<00:00, 69929.35it/s]
100%|██████████| 30/30 [00:00<00:00, 67686.46it/s]
100%|██████████| 130/130 [00:00<00:00, 61520.88it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89539.34it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.90it/s]
INFO:root:The new embedding has 5827 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 83551.54it/s]
100%|██████████| 287/287 [00:00<00:00, 80165.51it/s]
100%|██████████| 771/771 [00:00<00:00, 81380.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80879.00it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81792.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81099.50it/s]
100%|██████████| 353/353 [00:00<00:00, 80348.91it/s]
100%|██████████| 252/252 [00:00<00:00, 78966.35it/s]
100%|██████████| 203/203 [00:00<00:00, 81051.28it/s]
100%|██████████| 153/153 [00:00<00:00, 81118.51it/s]
100%|██████████| 200/200 [00:00<00:00, 81545.72it/s]
100%|██████████| 65/65 [00:00<00:00, 76302.76it/s]
100%|██████████| 144/144 [00:00<00:00, 79148.18it/s]
100%|██████████| 30/30 [00:00<00:00, 70138.86it/s]
100%|██████████| 130/130 [00:00<00:00, 75364.14it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82134.96it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 144.65it/s]
INFO:root:The new embedding has 5827 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 66680.08it/s]
100%|██████████| 287/287 [00:00<00:00, 78176.73it/s]
100%|██████████| 771/771 [00:00<00:00, 80527.13it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81746.77it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82347.82it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81065.02it/s]
100%|██████████| 353/353 [00:00<00:00, 80179.21it/s]
100%|██████████| 252/252 [00:00<00:00, 78854.42it/s]
100%|██████████| 203/203 [00:00<00:00, 77495.56it/s]
100%|██████████| 153/153 [00:00<00:00, 76982.79it/s]
100%|██████████| 200/200 [00:00<00:00, 76790.63it/s]
100%|██████████| 65/65 [00:00<00:00, 69797.69it/s]
100%|██████████| 144/144 [00:00<00:00, 80273.76it/s]
100%|██████████| 30/30 [00:00<00:00, 64893.82it/s]
100%|██████████| 130/130 [00:00<00:00, 78556.33it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82024.36it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['bestowals' 'giving']
['bestowals' 'gift']
['preposed' 'put']
['transmigrated' 'immigrate']
['dissociations' 'compartmentalization']
['dissociations' 'separation']
['independences' 'independent']
['independences' 'victory']
['traversals' 'travel']
['traversals' 'skiing']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['dematerialised' 'vanish']
['princedoms' 'domain']
['princedoms' 'rank']
['syphons' 'draw']
['syphons' 'tube']
['subserving' 'help']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:33<00:00, 176.59it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 81386.64it/s]
100%|██████████| 287/287 [00:00<00:00, 72664.81it/s]
100%|██████████| 771/771 [00:00<00:00, 85666.07it/s]
100%|██████████| 2000/2000 [00:00<00:00, 69955.20it/s]
100%|██████████| 1000/1000 [00:00<00:00, 66354.02it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73304.78it/s]
100%|██████████| 353/353 [00:00<00:00, 73083.04it/s]
100%|██████████| 252/252 [00:00<00:00, 74602.25it/s]
100%|██████████| 203/203 [00:00<00:00, 72574.47it/s]
100%|██████████| 153/153 [00:00<00:00, 72601.94it/s]
100%|██████████| 200/200 [00:00<00:00, 71508.04it/s]
100%|██████████| 65/65 [00:00<00:00, 69195.37it/s]
100%|██████████| 144/144 [00:00<00:00, 73432.19it/s]
100%|██████████| 30/30 [00:00<00:00, 57013.65it/s]
100%|██████████| 130/130 [00:00<00:00, 71154.84it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80313.29it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:32<00:00, 178.25it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 74117.94it/s]
100%|██████████| 287/287 [00:00<00:00, 84754.29it/s]
100%|██████████| 771/771 [00:00<00:00, 93110.14it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84451.06it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75989.27it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74004.07it/s]
100%|██████████| 353/353 [00:00<00:00, 74263.40it/s]
100%|██████████| 252/252 [00:00<00:00, 74749.97it/s]
100%|██████████| 203/203 [00:00<00:00, 73533.44it/s]
100%|██████████| 153/153 [00:00<00:00, 73023.27it/s]
100%|██████████| 200/200 [00:00<00:00, 73941.01it/s]
100%|██████████| 65/65 [00:00<00:00, 61306.44it/s]
100%|██████████| 144/144 [00:00<00:00, 70698.79it/s]
100%|██████████| 30/30 [00:00<00:00, 54424.36it/s]
100%|██████████| 130/130 [00:00<00:00, 77418.65it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88472.49it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:33<00:00, 174.26it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82844.51it/s]
100%|██████████| 287/287 [00:00<00:00, 80267.07it/s]
100%|██████████| 771/771 [00:00<00:00, 98095.26it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86166.92it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76000.29it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79396.47it/s]
100%|██████████| 353/353 [00:00<00:00, 77876.57it/s]
100%|██████████| 252/252 [00:00<00:00, 77212.70it/s]
100%|██████████| 203/203 [00:00<00:00, 75940.40it/s]
100%|██████████| 153/153 [00:00<00:00, 62687.17it/s]
100%|██████████| 200/200 [00:00<00:00, 55494.89it/s]
100%|██████████| 65/65 [00:00<00:00, 48832.13it/s]
100%|██████████| 144/144 [00:00<00:00, 74657.57it/s]
100%|██████████| 30/30 [00:00<00:00, 55750.61it/s]
100%|██████████| 130/130 [00:00<00:00, 72105.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90883.04it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:32<00:00, 180.54it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79758.44it/s]
100%|██████████| 287/287 [00:00<00:00, 78868.19it/s]
100%|██████████| 771/771 [00:00<00:00, 80416.99it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81336.98it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81173.27it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79702.24it/s]
100%|██████████| 353/353 [00:00<00:00, 78729.62it/s]
100%|██████████| 252/252 [00:00<00:00, 78813.26it/s]
100%|██████████| 203/203 [00:00<00:00, 78401.82it/s]
100%|██████████| 153/153 [00:00<00:00, 76761.78it/s]
100%|██████████| 200/200 [00:00<00:00, 78332.32it/s]
100%|██████████| 65/65 [00:00<00:00, 70410.58it/s]
100%|██████████| 144/144 [00:00<00:00, 81256.53it/s]
100%|██████████| 30/30 [00:00<00:00, 69595.75it/s]
100%|██████████| 130/130 [00:00<00:00, 79739.62it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78950.97it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:29<00:00, 199.32it/s]
INFO:root:The new embedding has 5846 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 63079.36it/s]
100%|██████████| 287/287 [00:00<00:00, 74656.74it/s]
100%|██████████| 771/771 [00:00<00:00, 76075.29it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76012.00it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77784.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73814.36it/s]
100%|██████████| 353/353 [00:00<00:00, 75313.56it/s]
100%|██████████| 252/252 [00:00<00:00, 77038.24it/s]
100%|██████████| 203/203 [00:00<00:00, 74688.04it/s]
100%|██████████| 153/153 [00:00<00:00, 77691.10it/s]
100%|██████████| 200/200 [00:00<00:00, 72471.78it/s]
100%|██████████| 65/65 [00:00<00:00, 73663.81it/s]
100%|██████████| 144/144 [00:00<00:00, 71443.08it/s]
100%|██████████| 30/30 [00:00<00:00, 60993.27it/s]
100%|██████████| 130/130 [00:00<00:00, 71154.84it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78273.22it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 153.62it/s]
INFO:root:The new embedding has 5837 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 83431.76it/s]
100%|██████████| 287/287 [00:00<00:00, 80697.54it/s]
100%|██████████| 771/771 [00:00<00:00, 84143.64it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89909.09it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92769.71it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89935.12it/s]
100%|██████████| 353/353 [00:00<00:00, 81584.16it/s]
100%|██████████| 252/252 [00:00<00:00, 76419.97it/s]
100%|██████████| 203/203 [00:00<00:00, 73412.98it/s]
100%|██████████| 153/153 [00:00<00:00, 78508.50it/s]
100%|██████████| 200/200 [00:00<00:00, 70215.18it/s]
100%|██████████| 65/65 [00:00<00:00, 74286.04it/s]
100%|██████████| 144/144 [00:00<00:00, 84912.10it/s]
100%|██████████| 30/30 [00:00<00:00, 57247.10it/s]
100%|██████████| 130/130 [00:00<00:00, 57932.38it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86288.85it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 149.88it/s]
INFO:root:The new embedding has 5837 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82414.34it/s]
100%|██████████| 287/287 [00:00<00:00, 79404.04it/s]
100%|██████████| 771/771 [00:00<00:00, 83238.31it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81928.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82693.64it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81169.60it/s]
100%|██████████| 353/353 [00:00<00:00, 80235.70it/s]
100%|██████████| 252/252 [00:00<00:00, 81890.80it/s]
100%|██████████| 203/203 [00:00<00:00, 77679.38it/s]
100%|██████████| 153/153 [00:00<00:00, 31197.30it/s]
100%|██████████| 200/200 [00:00<00:00, 57127.54it/s]
100%|██████████| 65/65 [00:00<00:00, 55378.79it/s]
100%|██████████| 144/144 [00:00<00:00, 57407.07it/s]
100%|██████████| 30/30 [00:00<00:00, 29803.20it/s]
100%|██████████| 130/130 [00:00<00:00, 57644.52it/s]
100%|██████████| 3500/3500 [00:00<00:00, 58267.86it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 151.61it/s]
INFO:root:The new embedding has 5837 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 60006.15it/s]
100%|██████████| 287/287 [00:00<00:00, 58654.45it/s]
100%|██████████| 771/771 [00:00<00:00, 59630.26it/s]
100%|██████████| 2000/2000 [00:00<00:00, 60024.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 60634.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85732.18it/s]
100%|██████████| 353/353 [00:00<00:00, 80375.08it/s]
100%|██████████| 252/252 [00:00<00:00, 78989.96it/s]
100%|██████████| 203/203 [00:00<00:00, 79181.97it/s]
100%|██████████| 153/153 [00:00<00:00, 77344.64it/s]
100%|██████████| 200/200 [00:00<00:00, 78648.12it/s]
100%|██████████| 65/65 [00:00<00:00, 66755.57it/s]
100%|██████████| 144/144 [00:00<00:00, 76959.71it/s]
100%|██████████| 30/30 [00:00<00:00, 65331.84it/s]
100%|██████████| 130/130 [00:00<00:00, 73564.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79087.50it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 155.50it/s]
INFO:root:The new embedding has 5843 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 93433.30it/s]
100%|██████████| 287/287 [00:00<00:00, 73973.16it/s]
100%|██████████| 771/771 [00:00<00:00, 95669.14it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75315.89it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85605.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75528.59it/s]
100%|██████████| 353/353 [00:00<00:00, 74551.32it/s]
100%|██████████| 252/252 [00:00<00:00, 73497.30it/s]
100%|██████████| 203/203 [00:00<00:00, 74038.58it/s]
100%|██████████| 153/153 [00:00<00:00, 76106.32it/s]
100%|██████████| 200/200 [00:00<00:00, 76790.63it/s]
100%|██████████| 65/65 [00:00<00:00, 72993.24it/s]
100%|██████████| 144/144 [00:00<00:00, 75215.41it/s]
100%|██████████| 30/30 [00:00<00:00, 57143.11it/s]
100%|██████████| 130/130 [00:00<00:00, 69592.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81277.31it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 163.22it/s]
INFO:root:The new embedding has 5843 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 91423.23it/s]
100%|██████████| 287/287 [00:00<00:00, 74679.90it/s]
100%|██████████| 771/771 [00:00<00:00, 77519.62it/s]
100%|██████████| 2000/2000 [00:00<00:00, 97811.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91016.30it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90112.88it/s]
100%|██████████| 353/353 [00:00<00:00, 78475.08it/s]
100%|██████████| 252/252 [00:00<00:00, 92118.23it/s]
100%|██████████| 203/203 [00:00<00:00, 73743.61it/s]
100%|██████████| 153/153 [00:00<00:00, 75461.96it/s]
100%|██████████| 200/200 [00:00<00:00, 57162.58it/s]
100%|██████████| 65/65 [00:00<00:00, 64558.31it/s]
100%|██████████| 144/144 [00:00<00:00, 71996.64it/s]
100%|██████████| 30/30 [00:00<00:00, 68909.70it/s]
100%|██████████| 130/130 [00:00<00:00, 59813.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87928.27it/s]
100%|██████████| 2034

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.26it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 66590.01it/s]
100%|██████████| 287/287 [00:00<00:00, 78976.86it/s]
100%|██████████| 771/771 [00:00<00:00, 74962.53it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81289.69it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81800.18it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88957.24it/s]
100%|██████████| 353/353 [00:00<00:00, 66142.03it/s]
100%|██████████| 252/252 [00:00<00:00, 65047.98it/s]
100%|██████████| 203/203 [00:00<00:00, 62253.69it/s]
100%|██████████| 153/153 [00:00<00:00, 47328.60it/s]
100%|██████████| 200/200 [00:00<00:00, 67693.74it/s]
100%|██████████| 65/65 [00:00<00:00, 55729.71it/s]
100%|██████████| 144/144 [00:00<00:00, 60591.87it/s]
100%|██████████| 30/30 [00:00<00:00, 39506.79it/s]
100%|██████████| 130/130 [00:00<00:00, 67390.87it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85768.58it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 162.67it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76304.51it/s]
100%|██████████| 287/287 [00:00<00:00, 76888.43it/s]
100%|██████████| 771/771 [00:00<00:00, 84183.07it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81491.06it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81939.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76766.26it/s]
100%|██████████| 353/353 [00:00<00:00, 78280.07it/s]
100%|██████████| 252/252 [00:00<00:00, 73415.61it/s]
100%|██████████| 203/203 [00:00<00:00, 76506.76it/s]
100%|██████████| 153/153 [00:00<00:00, 53755.11it/s]
100%|██████████| 200/200 [00:00<00:00, 70338.82it/s]
100%|██████████| 65/65 [00:00<00:00, 66044.03it/s]
100%|██████████| 144/144 [00:00<00:00, 72900.40it/s]
100%|██████████| 30/30 [00:00<00:00, 50696.66it/s]
100%|██████████| 130/130 [00:00<00:00, 69512.94it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85891.52it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.51it/s]
INFO:root:The new embedding has 5846 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 77806.43it/s]
100%|██████████| 287/287 [00:00<00:00, 74791.25it/s]
100%|██████████| 771/771 [00:00<00:00, 76643.24it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95963.03it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77535.89it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76030.14it/s]
100%|██████████| 353/353 [00:00<00:00, 76746.28it/s]
100%|██████████| 252/252 [00:00<00:00, 76641.62it/s]
100%|██████████| 203/203 [00:00<00:00, 74006.41it/s]
100%|██████████| 153/153 [00:00<00:00, 74968.28it/s]
100%|██████████| 200/200 [00:00<00:00, 73558.47it/s]
100%|██████████| 65/65 [00:00<00:00, 75063.26it/s]
100%|██████████| 144/144 [00:00<00:00, 73584.28it/s]
100%|██████████| 30/30 [00:00<00:00, 53476.04it/s]
100%|██████████| 130/130 [00:00<00:00, 73081.29it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74341.11it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 152.76it/s]
INFO:root:The new embedding has 5837 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 83325.57it/s]
100%|██████████| 287/287 [00:00<00:00, 63392.77it/s]
100%|██████████| 771/771 [00:00<00:00, 89311.99it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86304.33it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75803.87it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90594.28it/s]
100%|██████████| 353/353 [00:00<00:00, 73628.19it/s]
100%|██████████| 252/252 [00:00<00:00, 71653.76it/s]
100%|██████████| 203/203 [00:00<00:00, 85315.00it/s]
100%|██████████| 153/153 [00:00<00:00, 69981.30it/s]
100%|██████████| 200/200 [00:00<00:00, 72178.70it/s]
100%|██████████| 65/65 [00:00<00:00, 72701.27it/s]
100%|██████████| 144/144 [00:00<00:00, 81420.84it/s]
100%|██████████| 30/30 [00:00<00:00, 52582.16it/s]
100%|██████████| 130/130 [00:00<00:00, 57197.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82324.27it/s]
100%|██████████| 2034

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 154.80it/s]
INFO:root:The new embedding has 5837 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81740.69it/s]
100%|██████████| 287/287 [00:00<00:00, 80849.30it/s]
100%|██████████| 771/771 [00:00<00:00, 79764.40it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79553.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80766.86it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80104.61it/s]
100%|██████████| 353/353 [00:00<00:00, 86015.76it/s]
100%|██████████| 252/252 [00:00<00:00, 80267.66it/s]
100%|██████████| 203/203 [00:00<00:00, 78430.70it/s]
100%|██████████| 153/153 [00:00<00:00, 82230.72it/s]
100%|██████████| 200/200 [00:00<00:00, 78266.54it/s]
100%|██████████| 65/65 [00:00<00:00, 69142.72it/s]
100%|██████████| 144/144 [00:00<00:00, 76000.98it/s]
100%|██████████| 30/30 [00:00<00:00, 55725.92it/s]
100%|██████████| 130/130 [00:00<00:00, 71896.03it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91977.47it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 160.90it/s]
INFO:root:The new embedding has 5837 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81546.61it/s]
100%|██████████| 287/287 [00:00<00:00, 79018.33it/s]
100%|██████████| 771/771 [00:00<00:00, 80964.63it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80586.85it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81552.06it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80146.96it/s]
100%|██████████| 353/353 [00:00<00:00, 79481.93it/s]
100%|██████████| 252/252 [00:00<00:00, 77717.99it/s]
100%|██████████| 203/203 [00:00<00:00, 77467.36it/s]
100%|██████████| 153/153 [00:00<00:00, 74420.56it/s]
100%|██████████| 200/200 [00:00<00:00, 78193.59it/s]
100%|██████████| 65/65 [00:00<00:00, 65884.43it/s]
100%|██████████| 144/144 [00:00<00:00, 76404.78it/s]
100%|██████████| 30/30 [00:00<00:00, 63550.06it/s]
100%|██████████| 130/130 [00:00<00:00, 75218.58it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78281.57it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:31<00:00, 187.95it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 79208.12it/s]
100%|██████████| 287/287 [00:00<00:00, 70577.23it/s]
100%|██████████| 771/771 [00:00<00:00, 83496.21it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92934.15it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79804.86it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88084.79it/s]
100%|██████████| 353/353 [00:00<00:00, 71824.45it/s]
100%|██████████| 252/252 [00:00<00:00, 70123.04it/s]
100%|██████████| 203/203 [00:00<00:00, 75623.39it/s]
100%|██████████| 153/153 [00:00<00:00, 73048.21it/s]
100%|██████████| 200/200 [00:00<00:00, 67427.12it/s]
100%|██████████| 65/65 [00:00<00:00, 73923.47it/s]
100%|██████████| 144/144 [00:00<00:00, 76910.71it/s]
100%|██████████| 30/30 [00:00<00:00, 55529.18it/s]
100%|██████████| 130/130 [00:00<00:00, 73435.63it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79383.45it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:29<00:00, 201.01it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 74565.07it/s]
100%|██████████| 287/287 [00:00<00:00, 78682.61it/s]
100%|██████████| 771/771 [00:00<00:00, 74740.76it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77422.11it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78209.63it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74575.13it/s]
100%|██████████| 353/353 [00:00<00:00, 75221.73it/s]
100%|██████████| 252/252 [00:00<00:00, 74612.78it/s]
100%|██████████| 203/203 [00:00<00:00, 73788.34it/s]
100%|██████████| 153/153 [00:00<00:00, 72824.39it/s]
100%|██████████| 200/200 [00:00<00:00, 72836.75it/s]
100%|██████████| 65/65 [00:00<00:00, 63225.83it/s]
100%|██████████| 144/144 [00:00<00:00, 73271.84it/s]
100%|██████████| 30/30 [00:00<00:00, 58146.54it/s]
100%|██████████| 130/130 [00:00<00:00, 69521.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73735.82it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:29<00:00, 196.25it/s]
INFO:root:The new embedding has 5813 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 83998.75it/s]
100%|██████████| 287/287 [00:00<00:00, 70350.37it/s]
100%|██████████| 771/771 [00:00<00:00, 79002.48it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95050.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76555.16it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90222.08it/s]
100%|██████████| 353/353 [00:00<00:00, 73870.64it/s]
100%|██████████| 252/252 [00:00<00:00, 73944.63it/s]
100%|██████████| 203/203 [00:00<00:00, 73698.93it/s]
100%|██████████| 153/153 [00:00<00:00, 70341.83it/s]
100%|██████████| 200/200 [00:00<00:00, 65834.31it/s]
100%|██████████| 65/65 [00:00<00:00, 62760.07it/s]
100%|██████████| 144/144 [00:00<00:00, 74944.75it/s]
100%|██████████| 30/30 [00:00<00:00, 40213.84it/s]
100%|██████████| 130/130 [00:00<00:00, 66108.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71908.93it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:27<00:00, 209.60it/s]
INFO:root:The new embedding has 5813 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 86408.27it/s]
100%|██████████| 287/287 [00:00<00:00, 71789.44it/s]
100%|██████████| 771/771 [00:00<00:00, 74001.89it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92323.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76619.49it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73418.55it/s]
100%|██████████| 353/353 [00:00<00:00, 75348.06it/s]
100%|██████████| 252/252 [00:00<00:00, 72563.82it/s]
100%|██████████| 203/203 [00:00<00:00, 72537.38it/s]
100%|██████████| 153/153 [00:00<00:00, 68648.75it/s]
100%|██████████| 200/200 [00:00<00:00, 70981.62it/s]
100%|██████████| 65/65 [00:00<00:00, 64284.31it/s]
100%|██████████| 144/144 [00:00<00:00, 71291.29it/s]
100%|██████████| 30/30 [00:00<00:00, 65264.07it/s]
100%|██████████| 130/130 [00:00<00:00, 71219.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82890.45it/s]
100%|██████████| 2034

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:29<00:00, 197.64it/s]
INFO:root:The new embedding has 5813 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82146.13it/s]
100%|██████████| 287/287 [00:00<00:00, 73119.43it/s]
100%|██████████| 771/771 [00:00<00:00, 81009.25it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81391.43it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81313.33it/s]
100%|██████████| 3000/3000 [00:00<00:00, 97061.16it/s]
100%|██████████| 353/353 [00:00<00:00, 78321.48it/s]
100%|██████████| 252/252 [00:00<00:00, 80549.05it/s]
100%|██████████| 203/203 [00:00<00:00, 53105.70it/s]
100%|██████████| 153/153 [00:00<00:00, 75908.27it/s]
100%|██████████| 200/200 [00:00<00:00, 80597.69it/s]
100%|██████████| 65/65 [00:00<00:00, 54679.05it/s]
100%|██████████| 144/144 [00:00<00:00, 76115.91it/s]
100%|██████████| 30/30 [00:00<00:00, 56679.78it/s]
100%|██████████| 130/130 [00:00<00:00, 79437.58it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72125.15it/s]
100%|██████████| 203

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:28<00:00, 204.58it/s]
INFO:root:The new embedding has 5813 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79915.12it/s]
100%|██████████| 287/287 [00:00<00:00, 79127.41it/s]
100%|██████████| 771/771 [00:00<00:00, 81200.46it/s]
100%|██████████| 2000/2000 [00:00<00:00, 68900.27it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83555.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84791.65it/s]
100%|██████████| 353/353 [00:00<00:00, 79103.99it/s]
100%|██████████| 252/252 [00:00<00:00, 78334.29it/s]
100%|██████████| 203/203 [00:00<00:00, 78430.70it/s]
100%|██████████| 153/153 [00:00<00:00, 77335.32it/s]
100%|██████████| 200/200 [00:00<00:00, 79967.66it/s]
100%|██████████| 65/65 [00:00<00:00, 77188.49it/s]
100%|██████████| 144/144 [00:00<00:00, 80455.54it/s]
100%|██████████| 30/30 [00:00<00:00, 70809.86it/s]
100%|██████████| 130/130 [00:00<00:00, 76377.58it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80457.22it/s]
100%|██████████| 203

['provincialism' 'narrow-mindedness']
['unsighted' 'color-blind']
['preliterate' 'noncivilized']
['reasoning' 're-argue']
['extravert' 'extroversive']
['illiberal' 'narrow-minded']
['snookered' 'flim-flam']
['reenact' 're-create']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['nonfunctional' 'run-down']
['fulfillments' 'self-fulfillment']
['continence' 'self-discipline']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['mccarthyism' 'witch-hunt']
['inconvertible' 'incommutable']
['defrauding' 'short-change']
['caesarism' 'autocracy']
['fashionable' 'up-to-date']
['methodically' 'know-how']
['autosuggestion' 'self-improvement']
['conjoins' 'cross-link']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['indexical' 'cross-index']
['discoverys' 'self-discovery']
['replacements' 'stand-in']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['inva

100%|██████████| 5846/5846 [00:27<00:00, 211.14it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 76037.27it/s]
100%|██████████| 287/287 [00:00<00:00, 73270.76it/s]
100%|██████████| 771/771 [00:00<00:00, 76554.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77074.26it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77882.87it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75737.26it/s]
100%|██████████| 353/353 [00:00<00:00, 76611.27it/s]
100%|██████████| 252/252 [00:00<00:00, 76243.57it/s]
100%|██████████| 203/203 [00:00<00:00, 74609.51it/s]
100%|██████████| 153/153 [00:00<00:00, 75073.53it/s]
100%|██████████| 200/200 [00:00<00:00, 75450.69it/s]
100%|██████████| 65/65 [00:00<00:00, 64360.19it/s]
100%|██████████| 144/144 [00:00<00:00, 73629.13it/s]
100%|██████████| 30/30 [00:00<00:00, 59130.23it/s]
100%|██████████| 130/130 [00:00<00:00, 71257.12it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74286.18it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:23<00:00, 246.74it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 84952.45it/s]
100%|██████████| 287/287 [00:00<00:00, 66014.00it/s]
100%|██████████| 771/771 [00:00<00:00, 94415.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85935.65it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75386.95it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85255.28it/s]
100%|██████████| 353/353 [00:00<00:00, 76778.12it/s]
100%|██████████| 252/252 [00:00<00:00, 77456.00it/s]
100%|██████████| 203/203 [00:00<00:00, 74174.03it/s]
100%|██████████| 153/153 [00:00<00:00, 73719.53it/s]
100%|██████████| 200/200 [00:00<00:00, 74904.97it/s]
100%|██████████| 65/65 [00:00<00:00, 64942.77it/s]
100%|██████████| 144/144 [00:00<00:00, 75886.39it/s]
100%|██████████| 30/30 [00:00<00:00, 67979.00it/s]
100%|██████████| 130/130 [00:00<00:00, 73179.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87812.03it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:45<00:00, 127.14it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 74950.54it/s]
100%|██████████| 287/287 [00:00<00:00, 72406.93it/s]
100%|██████████| 771/771 [00:00<00:00, 84468.93it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74238.75it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75528.14it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83054.98it/s]
100%|██████████| 353/353 [00:00<00:00, 75436.35it/s]
100%|██████████| 252/252 [00:00<00:00, 73268.03it/s]
100%|██████████| 203/203 [00:00<00:00, 73724.45it/s]
100%|██████████| 153/153 [00:00<00:00, 70643.83it/s]
100%|██████████| 200/200 [00:00<00:00, 73571.37it/s]
100%|██████████| 65/65 [00:00<00:00, 72837.23it/s]
100%|██████████| 144/144 [00:00<00:00, 74464.28it/s]
100%|██████████| 30/30 [00:00<00:00, 66682.10it/s]
100%|██████████| 130/130 [00:00<00:00, 60209.75it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86591.19it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.09it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 90720.54it/s]
100%|██████████| 287/287 [00:00<00:00, 72757.04it/s]
100%|██████████| 771/771 [00:00<00:00, 85854.84it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76136.18it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77737.08it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74998.28it/s]
100%|██████████| 353/353 [00:00<00:00, 74634.00it/s]
100%|██████████| 252/252 [00:00<00:00, 77775.17it/s]
100%|██████████| 203/203 [00:00<00:00, 75249.11it/s]
100%|██████████| 153/153 [00:00<00:00, 76405.35it/s]
100%|██████████| 200/200 [00:00<00:00, 77823.62it/s]
100%|██████████| 65/65 [00:00<00:00, 70923.45it/s]
100%|██████████| 144/144 [00:00<00:00, 72515.28it/s]
100%|██████████| 30/30 [00:00<00:00, 62415.24it/s]
100%|██████████| 130/130 [00:00<00:00, 54877.17it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80755.09it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 133.61it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78788.12it/s]
100%|██████████| 287/287 [00:00<00:00, 62410.06it/s]
100%|██████████| 771/771 [00:00<00:00, 78183.08it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91484.81it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78426.06it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98150.64it/s]
100%|██████████| 353/353 [00:00<00:00, 77643.78it/s]
100%|██████████| 252/252 [00:00<00:00, 76530.64it/s]
100%|██████████| 203/203 [00:00<00:00, 73571.56it/s]
100%|██████████| 153/153 [00:00<00:00, 75764.88it/s]
100%|██████████| 200/200 [00:00<00:00, 79332.40it/s]
100%|██████████| 65/65 [00:00<00:00, 63402.27it/s]
100%|██████████| 144/144 [00:00<00:00, 78245.86it/s]
100%|██████████| 30/30 [00:00<00:00, 71130.08it/s]
100%|██████████| 130/130 [00:00<00:00, 78050.32it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72551.47it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 128.89it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 75437.67it/s]
100%|██████████| 287/287 [00:00<00:00, 75822.96it/s]
100%|██████████| 771/771 [00:00<00:00, 54188.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90916.67it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94385.53it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82282.13it/s]
100%|██████████| 353/353 [00:00<00:00, 85267.76it/s]
100%|██████████| 252/252 [00:00<00:00, 79072.69it/s]
100%|██████████| 203/203 [00:00<00:00, 78121.27it/s]
100%|██████████| 153/153 [00:00<00:00, 58766.35it/s]
100%|██████████| 200/200 [00:00<00:00, 76538.39it/s]
100%|██████████| 65/65 [00:00<00:00, 74877.71it/s]
100%|██████████| 144/144 [00:00<00:00, 64069.14it/s]
100%|██████████| 30/30 [00:00<00:00, 53498.78it/s]
100%|██████████| 130/130 [00:00<00:00, 50552.52it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77726.17it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:50<00:00, 116.16it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 78920.19it/s]
100%|██████████| 287/287 [00:00<00:00, 68105.53it/s]
100%|██████████| 771/771 [00:00<00:00, 88401.31it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79997.41it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86329.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87383.15it/s]
100%|██████████| 353/353 [00:00<00:00, 72128.87it/s]
100%|██████████| 252/252 [00:00<00:00, 89082.56it/s]
100%|██████████| 203/203 [00:00<00:00, 59234.99it/s]
100%|██████████| 153/153 [00:00<00:00, 75568.60it/s]
100%|██████████| 200/200 [00:00<00:00, 82727.89it/s]
100%|██████████| 65/65 [00:00<00:00, 68191.54it/s]
100%|██████████| 144/144 [00:00<00:00, 74171.65it/s]
100%|██████████| 30/30 [00:00<00:00, 54283.49it/s]
100%|██████████| 130/130 [00:00<00:00, 83667.26it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78190.67it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.63it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 84219.92it/s]
100%|██████████| 287/287 [00:00<00:00, 71469.76it/s]
100%|██████████| 771/771 [00:00<00:00, 80481.03it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85651.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90521.29it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89342.53it/s]
100%|██████████| 353/353 [00:00<00:00, 79915.22it/s]
100%|██████████| 252/252 [00:00<00:00, 72999.83it/s]
100%|██████████| 203/203 [00:00<00:00, 68898.18it/s]
100%|██████████| 153/153 [00:00<00:00, 83384.68it/s]
100%|██████████| 200/200 [00:00<00:00, 79264.93it/s]
100%|██████████| 65/65 [00:00<00:00, 74023.83it/s]
100%|██████████| 144/144 [00:00<00:00, 69775.85it/s]
100%|██████████| 30/30 [00:00<00:00, 61410.01it/s]
100%|██████████| 130/130 [00:00<00:00, 69239.30it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82338.12it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.32it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77942.48it/s]
100%|██████████| 287/287 [00:00<00:00, 75679.95it/s]
100%|██████████| 771/771 [00:00<00:00, 74342.13it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92562.93it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79399.98it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87744.50it/s]
100%|██████████| 353/353 [00:00<00:00, 74547.57it/s]
100%|██████████| 252/252 [00:00<00:00, 68235.29it/s]
100%|██████████| 203/203 [00:00<00:00, 56815.94it/s]
100%|██████████| 153/153 [00:00<00:00, 55517.65it/s]
100%|██████████| 200/200 [00:00<00:00, 57088.66it/s]
100%|██████████| 65/65 [00:00<00:00, 43069.47it/s]
100%|██████████| 144/144 [00:00<00:00, 76424.11it/s]
100%|██████████| 30/30 [00:00<00:00, 59861.62it/s]
100%|██████████| 130/130 [00:00<00:00, 53201.24it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86385.84it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 164.24it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 86556.42it/s]
100%|██████████| 287/287 [00:00<00:00, 74605.84it/s]
100%|██████████| 771/771 [00:00<00:00, 76761.50it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94313.37it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88554.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90014.25it/s]
100%|██████████| 353/353 [00:00<00:00, 81057.12it/s]
100%|██████████| 252/252 [00:00<00:00, 72683.58it/s]
100%|██████████| 203/203 [00:00<00:00, 67655.44it/s]
100%|██████████| 153/153 [00:00<00:00, 50717.50it/s]
100%|██████████| 200/200 [00:00<00:00, 49902.49it/s]
100%|██████████| 65/65 [00:00<00:00, 67666.86it/s]
100%|██████████| 144/144 [00:00<00:00, 74281.12it/s]
100%|██████████| 30/30 [00:00<00:00, 53704.28it/s]
100%|██████████| 130/130 [00:00<00:00, 58915.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79352.13it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:47<00:00, 124.03it/s]
INFO:root:The new embedding has 5846 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 75060.63it/s]
100%|██████████| 287/287 [00:00<00:00, 95272.28it/s]
100%|██████████| 771/771 [00:00<00:00, 76576.09it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76886.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79158.72it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75912.26it/s]
100%|██████████| 353/353 [00:00<00:00, 76730.37it/s]
100%|██████████| 252/252 [00:00<00:00, 75751.78it/s]
100%|██████████| 203/203 [00:00<00:00, 74951.03it/s]
100%|██████████| 153/153 [00:00<00:00, 71693.50it/s]
100%|██████████| 200/200 [00:00<00:00, 74084.68it/s]
100%|██████████| 65/65 [00:00<00:00, 70960.37it/s]
100%|██████████| 144/144 [00:00<00:00, 71476.90it/s]
100%|██████████| 30/30 [00:00<00:00, 61440.00it/s]
100%|██████████| 130/130 [00:00<00:00, 70785.35it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81518.32it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 132.58it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 93550.12it/s]
100%|██████████| 287/287 [00:00<00:00, 74068.75it/s]
100%|██████████| 771/771 [00:00<00:00, 90598.09it/s]
100%|██████████| 2000/2000 [00:00<00:00, 99540.87it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83506.96it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93318.74it/s]
100%|██████████| 353/353 [00:00<00:00, 74229.89it/s]
100%|██████████| 252/252 [00:00<00:00, 72999.83it/s]
100%|██████████| 203/203 [00:00<00:00, 72642.58it/s]
100%|██████████| 153/153 [00:00<00:00, 72601.94it/s]
100%|██████████| 200/200 [00:00<00:00, 74051.98it/s]
100%|██████████| 65/65 [00:00<00:00, 64269.16it/s]
100%|██████████| 144/144 [00:00<00:00, 72619.91it/s]
100%|██████████| 30/30 [00:00<00:00, 64527.75it/s]
100%|██████████| 130/130 [00:00<00:00, 60963.72it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93557.82it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 131.29it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 64382.01it/s]
100%|██████████| 287/287 [00:00<00:00, 81866.52it/s]
100%|██████████| 771/771 [00:00<00:00, 82124.30it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82128.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82576.42it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86015.24it/s]
100%|██████████| 353/353 [00:00<00:00, 82341.88it/s]
100%|██████████| 252/252 [00:00<00:00, 79807.05it/s]
100%|██████████| 203/203 [00:00<00:00, 77814.27it/s]
100%|██████████| 153/153 [00:00<00:00, 79658.45it/s]
100%|██████████| 200/200 [00:00<00:00, 76924.42it/s]
100%|██████████| 65/65 [00:00<00:00, 67936.65it/s]
100%|██████████| 144/144 [00:00<00:00, 79210.46it/s]
100%|██████████| 30/30 [00:00<00:00, 63009.07it/s]
100%|██████████| 130/130 [00:00<00:00, 76057.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74455.73it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 131.47it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80546.50it/s]
100%|██████████| 287/287 [00:00<00:00, 74795.90it/s]
100%|██████████| 771/771 [00:00<00:00, 78167.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84004.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80467.81it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80114.30it/s]
100%|██████████| 353/353 [00:00<00:00, 80418.73it/s]
100%|██████████| 252/252 [00:00<00:00, 80530.64it/s]
100%|██████████| 203/203 [00:00<00:00, 80835.82it/s]
100%|██████████| 153/153 [00:00<00:00, 76514.67it/s]
100%|██████████| 200/200 [00:00<00:00, 78662.87it/s]
100%|██████████| 65/65 [00:00<00:00, 69248.10it/s]
100%|██████████| 144/144 [00:00<00:00, 76608.29it/s]
100%|██████████| 30/30 [00:00<00:00, 69595.75it/s]
100%|██████████| 130/130 [00:00<00:00, 74970.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71316.45it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 156.60it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 67144.89it/s]
100%|██████████| 287/287 [00:00<00:00, 73199.47it/s]
100%|██████████| 771/771 [00:00<00:00, 75894.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 70306.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78363.05it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80845.74it/s]
100%|██████████| 353/353 [00:00<00:00, 60907.04it/s]
100%|██████████| 252/252 [00:00<00:00, 76051.56it/s]
100%|██████████| 203/203 [00:00<00:00, 54070.22it/s]
100%|██████████| 153/153 [00:00<00:00, 55652.46it/s]
100%|██████████| 200/200 [00:00<00:00, 65387.86it/s]
100%|██████████| 65/65 [00:00<00:00, 61736.81it/s]
100%|██████████| 144/144 [00:00<00:00, 63731.11it/s]
100%|██████████| 30/30 [00:00<00:00, 22824.07it/s]
100%|██████████| 130/130 [00:00<00:00, 44536.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 68285.72it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 151.48it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 72798.04it/s]
100%|██████████| 287/287 [00:00<00:00, 62686.31it/s]
100%|██████████| 771/771 [00:00<00:00, 91697.62it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95803.02it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75428.98it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78089.25it/s]
100%|██████████| 353/353 [00:00<00:00, 74502.56it/s]
100%|██████████| 252/252 [00:00<00:00, 74728.83it/s]
100%|██████████| 203/203 [00:00<00:00, 73469.99it/s]
100%|██████████| 153/153 [00:00<00:00, 74248.35it/s]
100%|██████████| 200/200 [00:00<00:00, 74538.90it/s]
100%|██████████| 65/65 [00:00<00:00, 72430.86it/s]
100%|██████████| 144/144 [00:00<00:00, 69176.47it/s]
100%|██████████| 30/30 [00:00<00:00, 66823.75it/s]
100%|██████████| 130/130 [00:00<00:00, 60316.32it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82535.79it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 155.42it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80676.78it/s]
100%|██████████| 287/287 [00:00<00:00, 78400.76it/s]
100%|██████████| 771/771 [00:00<00:00, 79644.57it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82309.85it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81806.56it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90455.57it/s]
100%|██████████| 353/353 [00:00<00:00, 80261.79it/s]
100%|██████████| 252/252 [00:00<00:00, 78930.97it/s]
100%|██████████| 203/203 [00:00<00:00, 79603.94it/s]
100%|██████████| 153/153 [00:00<00:00, 78402.99it/s]
100%|██████████| 200/200 [00:00<00:00, 79512.87it/s]
100%|██████████| 65/65 [00:00<00:00, 69833.44it/s]
100%|██████████| 144/144 [00:00<00:00, 77205.65it/s]
100%|██████████| 30/30 [00:00<00:00, 65196.44it/s]
100%|██████████| 130/130 [00:00<00:00, 75698.95it/s]
100%|██████████| 3500/3500 [00:00<00:00, 96669.04it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 164.24it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 93370.84it/s]
100%|██████████| 287/287 [00:00<00:00, 76405.28it/s]
100%|██████████| 771/771 [00:00<00:00, 81610.31it/s]
100%|██████████| 2000/2000 [00:00<00:00, 99021.52it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78810.67it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78070.84it/s]
100%|██████████| 353/353 [00:00<00:00, 79264.91it/s]
100%|██████████| 252/252 [00:00<00:00, 65801.20it/s]
100%|██████████| 203/203 [00:00<00:00, 65779.03it/s]
100%|██████████| 153/153 [00:00<00:00, 63455.80it/s]
100%|██████████| 200/200 [00:00<00:00, 78951.60it/s]
100%|██████████| 65/65 [00:00<00:00, 63997.60it/s]
100%|██████████| 144/144 [00:00<00:00, 71089.90it/s]
100%|██████████| 30/30 [00:00<00:00, 68422.58it/s]
100%|██████████| 130/130 [00:00<00:00, 75001.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92793.16it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 157.48it/s]
INFO:root:The new embedding has 5846 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 90137.02it/s]
100%|██████████| 287/287 [00:00<00:00, 70793.06it/s]
100%|██████████| 771/771 [00:00<00:00, 73111.81it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87102.79it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82768.70it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92390.98it/s]
100%|██████████| 353/353 [00:00<00:00, 76413.57it/s]
100%|██████████| 252/252 [00:00<00:00, 77269.14it/s]
100%|██████████| 203/203 [00:00<00:00, 74251.65it/s]
100%|██████████| 153/153 [00:00<00:00, 65858.84it/s]
100%|██████████| 200/200 [00:00<00:00, 63377.21it/s]
100%|██████████| 65/65 [00:00<00:00, 38947.11it/s]
100%|██████████| 144/144 [00:00<00:00, 75981.86it/s]
100%|██████████| 30/30 [00:00<00:00, 68089.35it/s]
100%|██████████| 130/130 [00:00<00:00, 74296.16it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91660.46it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.76it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 87872.45it/s]
100%|██████████| 287/287 [00:00<00:00, 73226.18it/s]
100%|██████████| 771/771 [00:00<00:00, 89102.81it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90662.17it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75603.01it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87484.01it/s]
100%|██████████| 353/353 [00:00<00:00, 73767.59it/s]
100%|██████████| 252/252 [00:00<00:00, 73105.87it/s]
100%|██████████| 203/203 [00:00<00:00, 73884.39it/s]
100%|██████████| 153/153 [00:00<00:00, 74977.04it/s]
100%|██████████| 200/200 [00:00<00:00, 73778.43it/s]
100%|██████████| 65/65 [00:00<00:00, 72778.90it/s]
100%|██████████| 144/144 [00:00<00:00, 72437.01it/s]
100%|██████████| 30/30 [00:00<00:00, 51296.01it/s]
100%|██████████| 130/130 [00:00<00:00, 70519.86it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89714.44it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 166.37it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81184.80it/s]
100%|██████████| 287/287 [00:00<00:00, 78513.26it/s]
100%|██████████| 771/771 [00:00<00:00, 82007.67it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82121.29it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83293.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 101787.85it/s]
100%|██████████| 353/353 [00:00<00:00, 79575.91it/s]
100%|██████████| 252/252 [00:00<00:00, 79001.76it/s]
100%|██████████| 203/203 [00:00<00:00, 78611.74it/s]
100%|██████████| 153/153 [00:00<00:00, 76368.98it/s]
100%|██████████| 200/200 [00:00<00:00, 79040.87it/s]
100%|██████████| 65/65 [00:00<00:00, 71164.12it/s]
100%|██████████| 144/144 [00:00<00:00, 79976.14it/s]
100%|██████████| 30/30 [00:00<00:00, 69212.94it/s]
100%|██████████| 130/130 [00:00<00:00, 79530.27it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79569.33it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 161.29it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77528.58it/s]
100%|██████████| 287/287 [00:00<00:00, 74356.99it/s]
100%|██████████| 771/771 [00:00<00:00, 80657.68it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82143.01it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82696.90it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79771.97it/s]
100%|██████████| 353/353 [00:00<00:00, 80305.33it/s]
100%|██████████| 252/252 [00:00<00:00, 82011.53it/s]
100%|██████████| 203/203 [00:00<00:00, 76699.73it/s]
100%|██████████| 153/153 [00:00<00:00, 81551.47it/s]
100%|██████████| 200/200 [00:00<00:00, 75915.00it/s]
100%|██████████| 65/65 [00:00<00:00, 66853.79it/s]
100%|██████████| 144/144 [00:00<00:00, 77057.89it/s]
100%|██████████| 30/30 [00:00<00:00, 52560.20it/s]
100%|██████████| 130/130 [00:00<00:00, 79472.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89388.86it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:58<00:00, 99.64it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 74435.26it/s]
100%|██████████| 287/287 [00:00<00:00, 75780.00it/s]
100%|██████████| 771/771 [00:00<00:00, 86430.80it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75301.69it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76218.50it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73419.84it/s]
100%|██████████| 353/353 [00:00<00:00, 74833.93it/s]
100%|██████████| 252/252 [00:00<00:00, 73400.32it/s]
100%|██████████| 203/203 [00:00<00:00, 72654.98it/s]
100%|██████████| 153/153 [00:00<00:00, 75135.06it/s]
100%|██████████| 200/200 [00:00<00:00, 73713.60it/s]
100%|██████████| 65/65 [00:00<00:00, 65599.08it/s]
100%|██████████| 144/144 [00:00<00:00, 74445.92it/s]
100%|██████████| 30/30 [00:00<00:00, 64826.96it/s]
100%|██████████| 130/130 [00:00<00:00, 72507.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72528.17it/s]
100%|██████████| 2034/

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:24<00:00, 242.55it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 87668.37it/s]
100%|██████████| 287/287 [00:00<00:00, 72524.72it/s]
100%|██████████| 771/771 [00:00<00:00, 88563.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87330.39it/s]
100%|██████████| 1000/1000 [00:00<00:00, 95113.25it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84633.11it/s]
100%|██████████| 353/353 [00:00<00:00, 76036.84it/s]
100%|██████████| 252/252 [00:00<00:00, 74048.24it/s]
100%|██████████| 203/203 [00:00<00:00, 75189.31it/s]
100%|██████████| 153/153 [00:00<00:00, 75073.53it/s]
100%|██████████| 200/200 [00:00<00:00, 71654.63it/s]
100%|██████████| 65/65 [00:00<00:00, 69726.28it/s]
100%|██████████| 144/144 [00:00<00:00, 74574.61it/s]
100%|██████████| 30/30 [00:00<00:00, 66295.64it/s]
100%|██████████| 130/130 [00:00<00:00, 71471.95it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72062.13it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:35<00:00, 163.21it/s]
INFO:root:The new embedding has 5832 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 92191.63it/s]
100%|██████████| 287/287 [00:00<00:00, 90095.45it/s]
100%|██████████| 771/771 [00:00<00:00, 92614.15it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96138.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73834.28it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82231.58it/s]
100%|██████████| 353/353 [00:00<00:00, 86080.77it/s]
100%|██████████| 252/252 [00:00<00:00, 72216.77it/s]
100%|██████████| 203/203 [00:00<00:00, 72303.30it/s]
100%|██████████| 153/153 [00:00<00:00, 75791.72it/s]
100%|██████████| 200/200 [00:00<00:00, 74738.13it/s]
100%|██████████| 65/65 [00:00<00:00, 61639.10it/s]
100%|██████████| 144/144 [00:00<00:00, 73530.53it/s]
100%|██████████| 30/30 [00:00<00:00, 65433.76it/s]
100%|██████████| 130/130 [00:00<00:00, 71025.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90781.31it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:30<00:00, 192.37it/s]
INFO:root:The new embedding has 5832 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 90941.07it/s]
100%|██████████| 287/287 [00:00<00:00, 79075.43it/s]
100%|██████████| 771/771 [00:00<00:00, 88439.99it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95505.25it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75392.38it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91026.83it/s]
100%|██████████| 353/353 [00:00<00:00, 89176.01it/s]
100%|██████████| 252/252 [00:00<00:00, 75052.52it/s]
100%|██████████| 203/203 [00:00<00:00, 70501.26it/s]
100%|██████████| 153/153 [00:00<00:00, 71295.25it/s]
100%|██████████| 200/200 [00:00<00:00, 70421.49it/s]
100%|██████████| 65/65 [00:00<00:00, 62116.60it/s]
100%|██████████| 144/144 [00:00<00:00, 68657.47it/s]
100%|██████████| 30/30 [00:00<00:00, 59918.63it/s]
100%|██████████| 130/130 [00:00<00:00, 67399.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81425.18it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:33<00:00, 176.67it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 60592.75it/s]
100%|██████████| 287/287 [00:00<00:00, 77189.18it/s]
100%|██████████| 771/771 [00:00<00:00, 88169.93it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79877.05it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79252.95it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79760.34it/s]
100%|██████████| 353/353 [00:00<00:00, 78242.84it/s]
100%|██████████| 252/252 [00:00<00:00, 80444.83it/s]
100%|██████████| 203/203 [00:00<00:00, 85212.54it/s]
100%|██████████| 153/153 [00:00<00:00, 74420.56it/s]
100%|██████████| 200/200 [00:00<00:00, 76966.77it/s]
100%|██████████| 65/65 [00:00<00:00, 66690.25it/s]
100%|██████████| 144/144 [00:00<00:00, 76520.94it/s]
100%|██████████| 30/30 [00:00<00:00, 67869.00it/s]
100%|██████████| 130/130 [00:00<00:00, 74195.06it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79893.68it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:32<00:00, 181.85it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 70231.97it/s]
100%|██████████| 287/287 [00:00<00:00, 79819.99it/s]
100%|██████████| 771/771 [00:00<00:00, 71669.70it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74858.18it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76597.10it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79901.14it/s]
100%|██████████| 353/353 [00:00<00:00, 79678.68it/s]
100%|██████████| 252/252 [00:00<00:00, 79566.74it/s]
100%|██████████| 203/203 [00:00<00:00, 77060.70it/s]
100%|██████████| 153/153 [00:00<00:00, 71629.48it/s]
100%|██████████| 200/200 [00:00<00:00, 79527.95it/s]
100%|██████████| 65/65 [00:00<00:00, 76452.54it/s]
100%|██████████| 144/144 [00:00<00:00, 72988.49it/s]
100%|██████████| 30/30 [00:00<00:00, 62477.22it/s]
100%|██████████| 130/130 [00:00<00:00, 79669.71it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71707.66it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:28<00:00, 207.15it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 87966.53it/s]
100%|██████████| 287/287 [00:00<00:00, 74055.08it/s]
100%|██████████| 771/771 [00:00<00:00, 75434.66it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76437.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75529.50it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76222.19it/s]
100%|██████████| 353/353 [00:00<00:00, 76142.42it/s]
100%|██████████| 252/252 [00:00<00:00, 74718.27it/s]
100%|██████████| 203/203 [00:00<00:00, 75717.54it/s]
100%|██████████| 153/153 [00:00<00:00, 74111.16it/s]
100%|██████████| 200/200 [00:00<00:00, 75227.41it/s]
100%|██████████| 65/65 [00:00<00:00, 69160.26it/s]
100%|██████████| 144/144 [00:00<00:00, 73006.14it/s]
100%|██████████| 30/30 [00:00<00:00, 67108.86it/s]
100%|██████████| 130/130 [00:00<00:00, 68715.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93684.40it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:27<00:00, 212.30it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 73313.91it/s]
100%|██████████| 287/287 [00:00<00:00, 73525.85it/s]
100%|██████████| 771/771 [00:00<00:00, 75323.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96251.51it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74850.17it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74248.17it/s]
100%|██████████| 353/353 [00:00<00:00, 75896.52it/s]
100%|██████████| 252/252 [00:00<00:00, 76608.29it/s]
100%|██████████| 203/203 [00:00<00:00, 74773.31it/s]
100%|██████████| 153/153 [00:00<00:00, 78202.35it/s]
100%|██████████| 200/200 [00:00<00:00, 75866.94it/s]
100%|██████████| 65/65 [00:00<00:00, 64133.09it/s]
100%|██████████| 144/144 [00:00<00:00, 72979.67it/s]
100%|██████████| 30/30 [00:00<00:00, 68089.35it/s]
100%|██████████| 130/130 [00:00<00:00, 73100.89it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74557.45it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:42<00:00, 138.83it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 87032.85it/s]
100%|██████████| 287/287 [00:00<00:00, 88825.65it/s]
100%|██████████| 771/771 [00:00<00:00, 87679.85it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94432.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86984.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73403.13it/s]
100%|██████████| 353/353 [00:00<00:00, 72076.20it/s]
100%|██████████| 252/252 [00:00<00:00, 72201.97it/s]
100%|██████████| 203/203 [00:00<00:00, 72723.24it/s]
100%|██████████| 153/153 [00:00<00:00, 71121.41it/s]
100%|██████████| 200/200 [00:00<00:00, 69713.35it/s]
100%|██████████| 65/65 [00:00<00:00, 62258.45it/s]
100%|██████████| 144/144 [00:00<00:00, 70798.24it/s]
100%|██████████| 30/30 [00:00<00:00, 51909.70it/s]
100%|██████████| 130/130 [00:00<00:00, 72556.16it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87898.79it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 139.50it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 90696.98it/s]
100%|██████████| 287/287 [00:00<00:00, 87827.61it/s]
100%|██████████| 771/771 [00:00<00:00, 96287.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94720.17it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75361.22it/s]
100%|██████████| 3000/3000 [00:00<00:00, 94479.78it/s]
100%|██████████| 353/353 [00:00<00:00, 82396.87it/s]
100%|██████████| 252/252 [00:00<00:00, 73055.34it/s]
100%|██████████| 203/203 [00:00<00:00, 70378.88it/s]
100%|██████████| 153/153 [00:00<00:00, 71105.65it/s]
100%|██████████| 200/200 [00:00<00:00, 70891.64it/s]
100%|██████████| 65/65 [00:00<00:00, 62861.37it/s]
100%|██████████| 144/144 [00:00<00:00, 73405.42it/s]
100%|██████████| 30/30 [00:00<00:00, 53957.60it/s]
100%|██████████| 130/130 [00:00<00:00, 67158.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93136.39it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 136.64it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79557.03it/s]
100%|██████████| 287/287 [00:00<00:00, 75637.15it/s]
100%|██████████| 771/771 [00:00<00:00, 78582.05it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81341.71it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80670.55it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80149.00it/s]
100%|██████████| 353/353 [00:00<00:00, 79850.57it/s]
100%|██████████| 252/252 [00:00<00:00, 77223.98it/s]
100%|██████████| 203/203 [00:00<00:00, 80143.42it/s]
100%|██████████| 153/153 [00:00<00:00, 80366.75it/s]
100%|██████████| 200/200 [00:00<00:00, 75321.97it/s]
100%|██████████| 65/65 [00:00<00:00, 74857.16it/s]
100%|██████████| 144/144 [00:00<00:00, 73755.01it/s]
100%|██████████| 30/30 [00:00<00:00, 57039.49it/s]
100%|██████████| 130/130 [00:00<00:00, 72076.61it/s]
100%|██████████| 3500/3500 [00:00<00:00, 95161.34it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 132.97it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 90528.46it/s]
100%|██████████| 287/287 [00:00<00:00, 41480.54it/s]
100%|██████████| 771/771 [00:00<00:00, 77228.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93645.85it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87945.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92072.56it/s]
100%|██████████| 353/353 [00:00<00:00, 73086.65it/s]
100%|██████████| 252/252 [00:00<00:00, 75757.21it/s]
100%|██████████| 203/203 [00:00<00:00, 72847.68it/s]
100%|██████████| 153/153 [00:00<00:00, 71773.68it/s]
100%|██████████| 200/200 [00:00<00:00, 59561.26it/s]
100%|██████████| 65/65 [00:00<00:00, 75478.89it/s]
100%|██████████| 144/144 [00:00<00:00, 78869.13it/s]
100%|██████████| 30/30 [00:00<00:00, 62820.33it/s]
100%|██████████| 130/130 [00:00<00:00, 75499.80it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91065.70it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 131.61it/s]
INFO:root:The new embedding has 5846 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 74390.33it/s]
100%|██████████| 287/287 [00:00<00:00, 72928.95it/s]
100%|██████████| 771/771 [00:00<00:00, 73505.67it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74249.27it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75038.98it/s]
100%|██████████| 3000/3000 [00:00<00:00, 72903.84it/s]
100%|██████████| 353/353 [00:00<00:00, 72107.79it/s]
100%|██████████| 252/252 [00:00<00:00, 71455.15it/s]
100%|██████████| 203/203 [00:00<00:00, 64842.26it/s]
100%|██████████| 153/153 [00:00<00:00, 72948.56it/s]
100%|██████████| 200/200 [00:00<00:00, 75112.89it/s]
100%|██████████| 65/65 [00:00<00:00, 59448.27it/s]
100%|██████████| 144/144 [00:00<00:00, 40329.85it/s]
100%|██████████| 30/30 [00:00<00:00, 44699.51it/s]
100%|██████████| 130/130 [00:00<00:00, 72498.27it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82663.60it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:39<00:00, 149.66it/s]
INFO:root:The new embedding has 5819 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 94255.08it/s]
100%|██████████| 287/287 [00:00<00:00, 72502.88it/s]
100%|██████████| 771/771 [00:00<00:00, 90888.38it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92401.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76999.27it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84919.84it/s]
100%|██████████| 353/353 [00:00<00:00, 74630.24it/s]
100%|██████████| 252/252 [00:00<00:00, 74734.12it/s]
100%|██████████| 203/203 [00:00<00:00, 72260.35it/s]
100%|██████████| 153/153 [00:00<00:00, 69114.54it/s]
100%|██████████| 200/200 [00:00<00:00, 68759.08it/s]
100%|██████████| 65/65 [00:00<00:00, 69160.26it/s]
100%|██████████| 144/144 [00:00<00:00, 73638.11it/s]
100%|██████████| 30/30 [00:00<00:00, 62015.34it/s]
100%|██████████| 130/130 [00:00<00:00, 79137.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91527.30it/s]
100%|██████████| 2034

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:38<00:00, 151.18it/s]
INFO:root:The new embedding has 5819 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78112.48it/s]
100%|██████████| 287/287 [00:00<00:00, 75381.38it/s]
100%|██████████| 771/771 [00:00<00:00, 82191.09it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92680.54it/s]
100%|██████████| 1000/1000 [00:00<00:00, 100626.27it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86717.10it/s]
100%|██████████| 353/353 [00:00<00:00, 81900.06it/s]
100%|██████████| 252/252 [00:00<00:00, 78253.10it/s]
100%|██████████| 203/203 [00:00<00:00, 77319.63it/s]
100%|██████████| 153/153 [00:00<00:00, 55570.53it/s]
100%|██████████| 200/200 [00:00<00:00, 72528.17it/s]
100%|██████████| 65/65 [00:00<00:00, 76302.76it/s]
100%|██████████| 144/144 [00:00<00:00, 78276.28it/s]
100%|██████████| 30/30 [00:00<00:00, 70138.86it/s]
100%|██████████| 130/130 [00:00<00:00, 67018.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72290.66it/s]
100%|██████████| 20

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:39<00:00, 149.31it/s]
INFO:root:The new embedding has 5819 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79576.67it/s]
100%|██████████| 287/287 [00:00<00:00, 75381.38it/s]
100%|██████████| 771/771 [00:00<00:00, 79333.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80675.98it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81947.21it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80027.68it/s]
100%|██████████| 353/353 [00:00<00:00, 77827.44it/s]
100%|██████████| 252/252 [00:00<00:00, 97505.96it/s]
100%|██████████| 203/203 [00:00<00:00, 77333.67it/s]
100%|██████████| 153/153 [00:00<00:00, 79157.33it/s]
100%|██████████| 200/200 [00:00<00:00, 74242.04it/s]
100%|██████████| 65/65 [00:00<00:00, 71631.57it/s]
100%|██████████| 144/144 [00:00<00:00, 66262.18it/s]
100%|██████████| 30/30 [00:00<00:00, 64198.53it/s]
100%|██████████| 130/130 [00:00<00:00, 77133.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78800.94it/s]
100%|██████████| 203

['squishing' 'squirt']
['blithering' 'chatter']
['conjurors' 'enchantress']
['anterooms' 'building']
['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['autografts' 'graft']
['disfavoring' 'prejudice']
['companionships' 'friendship']
['snookered' 'play']
['snookered' 'flim-flam']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['swooshing' 'sound']
['feminised' 'change']
['liverpools' 'england']
['glistens' 'spangle']
['glistens' 'brightness']
['transfusing' 'pour']
['transfusing' 'lend']
['copilots' 'pilot']
['positioners' 'actuator']
['interlayers' 'layer']
['censorships' 'deletion']
['censorships' 'censoring']
['rompers' 'garment']
['rompers' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['reviles' 'abuse']


100%|██████████| 5846/5846 [00:45<00:00, 128.73it/s]
INFO:root:The new embedding has 5846 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 73699.47it/s]
100%|██████████| 287/287 [00:00<00:00, 75038.35it/s]
100%|██████████| 771/771 [00:00<00:00, 81575.31it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86521.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91265.84it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79710.32it/s]
100%|██████████| 353/353 [00:00<00:00, 63826.76it/s]
100%|██████████| 252/252 [00:00<00:00, 73615.03it/s]
100%|██████████| 203/203 [00:00<00:00, 69065.84it/s]
100%|██████████| 153/153 [00:00<00:00, 65791.32it/s]
100%|██████████| 200/200 [00:00<00:00, 70855.71it/s]
100%|██████████| 65/65 [00:00<00:00, 68898.09it/s]
100%|██████████| 144/144 [00:00<00:00, 87571.38it/s]
100%|██████████| 30/30 [00:00<00:00, 62045.92it/s]
100%|██████████| 130/130 [00:00<00:00, 72817.78it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72761.11it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:56<00:00, 103.09it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 71262.79it/s]
100%|██████████| 287/287 [00:00<00:00, 74132.61it/s]
100%|██████████| 771/771 [00:00<00:00, 80744.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84291.52it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73248.88it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93316.66it/s]
100%|██████████| 353/353 [00:00<00:00, 74148.10it/s]
100%|██████████| 252/252 [00:00<00:00, 69789.67it/s]
100%|██████████| 203/203 [00:00<00:00, 75960.72it/s]
100%|██████████| 153/153 [00:00<00:00, 74446.46it/s]
100%|██████████| 200/200 [00:00<00:00, 73448.98it/s]
100%|██████████| 65/65 [00:00<00:00, 65082.30it/s]
100%|██████████| 144/144 [00:00<00:00, 74262.85it/s]
100%|██████████| 30/30 [00:00<00:00, 66576.25it/s]
100%|██████████| 130/130 [00:00<00:00, 62130.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87194.49it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:55<00:00, 104.68it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 85333.07it/s]
100%|██████████| 287/287 [00:00<00:00, 77627.22it/s]
100%|██████████| 771/771 [00:00<00:00, 81639.15it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91999.52it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80874.32it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90778.60it/s]
100%|██████████| 353/353 [00:00<00:00, 58549.09it/s]
100%|██████████| 252/252 [00:00<00:00, 62512.69it/s]
100%|██████████| 203/203 [00:00<00:00, 77629.81it/s]
100%|██████████| 153/153 [00:00<00:00, 76725.07it/s]
100%|██████████| 200/200 [00:00<00:00, 76741.45it/s]
100%|██████████| 65/65 [00:00<00:00, 74795.54it/s]
100%|██████████| 144/144 [00:00<00:00, 76979.32it/s]
100%|██████████| 30/30 [00:00<00:00, 61111.76it/s]
100%|██████████| 130/130 [00:00<00:00, 70675.25it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76639.09it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:55<00:00, 105.02it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 92835.04it/s]
100%|██████████| 287/287 [00:00<00:00, 77233.75it/s]
100%|██████████| 771/771 [00:00<00:00, 79715.25it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89415.54it/s]
100%|██████████| 1000/1000 [00:00<00:00, 71739.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79531.47it/s]
100%|██████████| 353/353 [00:00<00:00, 80964.04it/s]
100%|██████████| 252/252 [00:00<00:00, 77603.86it/s]
100%|██████████| 203/203 [00:00<00:00, 78873.90it/s]
100%|██████████| 153/153 [00:00<00:00, 76908.98it/s]
100%|██████████| 200/200 [00:00<00:00, 76868.03it/s]
100%|██████████| 65/65 [00:00<00:00, 73943.52it/s]
100%|██████████| 144/144 [00:00<00:00, 74198.99it/s]
100%|██████████| 30/30 [00:00<00:00, 65638.56it/s]
100%|██████████| 130/130 [00:00<00:00, 72507.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77651.34it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [01:29<00:00, 65.26it/s]
INFO:root:The new embedding has 5846 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 74212.46it/s]
100%|██████████| 287/287 [00:00<00:00, 92533.27it/s]
100%|██████████| 771/771 [00:00<00:00, 98447.65it/s]
100%|██████████| 2000/2000 [00:00<00:00, 98160.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76153.46it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92257.53it/s]
100%|██████████| 353/353 [00:00<00:00, 74151.82it/s]
100%|██████████| 252/252 [00:00<00:00, 73898.11it/s]
100%|██████████| 203/203 [00:00<00:00, 70776.70it/s]
100%|██████████| 153/153 [00:00<00:00, 63411.91it/s]
100%|██████████| 200/200 [00:00<00:00, 60554.45it/s]
100%|██████████| 65/65 [00:00<00:00, 60882.04it/s]
100%|██████████| 144/144 [00:00<00:00, 69391.06it/s]
100%|██████████| 30/30 [00:00<00:00, 37752.51it/s]
100%|██████████| 130/130 [00:00<00:00, 72759.48it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78467.35it/s]
100%|██████████| 2034/

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 153.50it/s]
INFO:root:The new embedding has 5844 word and vectors have 900 dimensions
100%|██████████| 999/999 [00:00<00:00, 97755.87it/s]
100%|██████████| 287/287 [00:00<00:00, 73279.68it/s]
100%|██████████| 771/771 [00:00<00:00, 93929.60it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92773.81it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76267.01it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79152.75it/s]
100%|██████████| 353/353 [00:00<00:00, 74159.24it/s]
100%|██████████| 252/252 [00:00<00:00, 75475.91it/s]
100%|██████████| 203/203 [00:00<00:00, 74498.53it/s]
100%|██████████| 153/153 [00:00<00:00, 73838.28it/s]
100%|██████████| 200/200 [00:00<00:00, 74347.32it/s]
100%|██████████| 65/65 [00:00<00:00, 65980.10it/s]
100%|██████████| 144/144 [00:00<00:00, 72480.47it/s]
100%|██████████| 30/30 [00:00<00:00, 68089.35it/s]
100%|██████████| 130/130 [00:00<00:00, 89460.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84968.33it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 155.43it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 60620.80it/s]
100%|██████████| 287/287 [00:00<00:00, 78075.32it/s]
100%|██████████| 771/771 [00:00<00:00, 81808.50it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80560.54it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82582.92it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79742.65it/s]
100%|██████████| 353/353 [00:00<00:00, 79027.99it/s]
100%|██████████| 252/252 [00:00<00:00, 79650.69it/s]
100%|██████████| 203/203 [00:00<00:00, 77821.38it/s]
100%|██████████| 153/153 [00:00<00:00, 75872.37it/s]
100%|██████████| 200/200 [00:00<00:00, 77292.99it/s]
100%|██████████| 65/65 [00:00<00:00, 58429.01it/s]
100%|██████████| 144/144 [00:00<00:00, 73944.63it/s]
100%|██████████| 30/30 [00:00<00:00, 57221.06it/s]
100%|██████████| 130/130 [00:00<00:00, 75562.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 94018.60it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 161.28it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 65050.68it/s]
100%|██████████| 287/287 [00:00<00:00, 81983.60it/s]
100%|██████████| 771/771 [00:00<00:00, 81575.31it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89379.33it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80667.45it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92363.85it/s]
100%|██████████| 353/353 [00:00<00:00, 80506.19it/s]
100%|██████████| 252/252 [00:00<00:00, 77861.11it/s]
100%|██████████| 203/203 [00:00<00:00, 76506.76it/s]
100%|██████████| 153/153 [00:00<00:00, 77335.32it/s]
100%|██████████| 200/200 [00:00<00:00, 76959.71it/s]
100%|██████████| 65/65 [00:00<00:00, 66952.30it/s]
100%|██████████| 144/144 [00:00<00:00, 75791.16it/s]
100%|██████████| 30/30 [00:00<00:00, 54947.21it/s]
100%|██████████| 130/130 [00:00<00:00, 71062.10it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80082.83it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:25<00:00, 226.36it/s]
INFO:root:The new embedding has 5846 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 77667.98it/s]
100%|██████████| 287/287 [00:00<00:00, 74416.74it/s]
100%|██████████| 771/771 [00:00<00:00, 76997.27it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83247.57it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81640.95it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85931.83it/s]
100%|██████████| 353/353 [00:00<00:00, 62960.93it/s]
100%|██████████| 252/252 [00:00<00:00, 78398.21it/s]
100%|██████████| 203/203 [00:00<00:00, 72260.35it/s]
100%|██████████| 153/153 [00:00<00:00, 71113.53it/s]
100%|██████████| 200/200 [00:00<00:00, 67475.93it/s]
100%|██████████| 65/65 [00:00<00:00, 45129.91it/s]
100%|██████████| 144/144 [00:00<00:00, 67093.95it/s]
100%|██████████| 30/30 [00:00<00:00, 65501.88it/s]
100%|██████████| 130/130 [00:00<00:00, 61632.14it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81754.85it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 173.93it/s]
INFO:root:The new embedding has 5845 word and vectors have 700 dimensions
100%|██████████| 999/999 [00:00<00:00, 63166.85it/s]
100%|██████████| 287/287 [00:00<00:00, 74675.26it/s]
100%|██████████| 771/771 [00:00<00:00, 76603.30it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76613.89it/s]
100%|██████████| 1000/1000 [00:00<00:00, 65398.05it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74423.39it/s]
100%|██████████| 353/353 [00:00<00:00, 74698.01it/s]
100%|██████████| 252/252 [00:00<00:00, 75116.52it/s]
100%|██████████| 203/203 [00:00<00:00, 71961.10it/s]
100%|██████████| 153/153 [00:00<00:00, 77447.32it/s]
100%|██████████| 200/200 [00:00<00:00, 75328.74it/s]
100%|██████████| 65/65 [00:00<00:00, 65206.83it/s]
100%|██████████| 144/144 [00:00<00:00, 73165.33it/s]
100%|██████████| 30/30 [00:00<00:00, 68200.07it/s]
100%|██████████| 130/130 [00:00<00:00, 74621.53it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73782.51it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:50<00:00, 115.40it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 87714.25it/s]
100%|██████████| 287/287 [00:00<00:00, 68766.94it/s]
100%|██████████| 771/771 [00:00<00:00, 82432.03it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89528.14it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77267.36it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78751.98it/s]
100%|██████████| 353/353 [00:00<00:00, 84580.94it/s]
100%|██████████| 252/252 [00:00<00:00, 70174.25it/s]
100%|██████████| 203/203 [00:00<00:00, 71298.25it/s]
100%|██████████| 153/153 [00:00<00:00, 74776.10it/s]
100%|██████████| 200/200 [00:00<00:00, 73895.42it/s]
100%|██████████| 65/65 [00:00<00:00, 69869.24it/s]
100%|██████████| 144/144 [00:00<00:00, 66480.99it/s]
100%|██████████| 30/30 [00:00<00:00, 61802.12it/s]
100%|██████████| 130/130 [00:00<00:00, 41338.86it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84998.34it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 169.72it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 89970.58it/s]
100%|██████████| 287/287 [00:00<00:00, 76024.08it/s]
100%|██████████| 771/771 [00:00<00:00, 88466.61it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93088.84it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89428.88it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80060.27it/s]
100%|██████████| 353/353 [00:00<00:00, 84177.00it/s]
100%|██████████| 252/252 [00:00<00:00, 72593.72it/s]
100%|██████████| 203/203 [00:00<00:00, 71760.95it/s]
100%|██████████| 153/153 [00:00<00:00, 72331.89it/s]
100%|██████████| 200/200 [00:00<00:00, 72085.66it/s]
100%|██████████| 65/65 [00:00<00:00, 64865.52it/s]
100%|██████████| 144/144 [00:00<00:00, 64362.72it/s]
100%|██████████| 30/30 [00:00<00:00, 64660.39it/s]
100%|██████████| 130/130 [00:00<00:00, 66309.07it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89940.90it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 163.62it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 60583.11it/s]
100%|██████████| 287/287 [00:00<00:00, 76211.79it/s]
100%|██████████| 771/771 [00:00<00:00, 79145.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76982.31it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79058.75it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95989.75it/s]
100%|██████████| 353/353 [00:00<00:00, 74864.20it/s]
100%|██████████| 252/252 [00:00<00:00, 79698.73it/s]
100%|██████████| 203/203 [00:00<00:00, 78830.08it/s]
100%|██████████| 153/153 [00:00<00:00, 77936.42it/s]
100%|██████████| 200/200 [00:00<00:00, 81355.91it/s]
100%|██████████| 65/65 [00:00<00:00, 54788.94it/s]
100%|██████████| 144/144 [00:00<00:00, 79754.36it/s]
100%|██████████| 30/30 [00:00<00:00, 56476.27it/s]
100%|██████████| 130/130 [00:00<00:00, 63365.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 95789.73it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.26it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77767.44it/s]
100%|██████████| 287/287 [00:00<00:00, 78656.90it/s]
100%|██████████| 771/771 [00:00<00:00, 77885.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81126.17it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81368.54it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86948.40it/s]
100%|██████████| 353/353 [00:00<00:00, 78884.83it/s]
100%|██████████| 252/252 [00:00<00:00, 78783.89it/s]
100%|██████████| 203/203 [00:00<00:00, 77835.61it/s]
100%|██████████| 153/153 [00:00<00:00, 78585.42it/s]
100%|██████████| 200/200 [00:00<00:00, 78530.31it/s]
100%|██████████| 65/65 [00:00<00:00, 76927.13it/s]
100%|██████████| 144/144 [00:00<00:00, 31580.64it/s]
100%|██████████| 30/30 [00:00<00:00, 51067.01it/s]
100%|██████████| 130/130 [00:00<00:00, 78341.89it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91966.52it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.84it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 90038.24it/s]
100%|██████████| 287/287 [00:00<00:00, 59704.65it/s]
100%|██████████| 771/771 [00:00<00:00, 79985.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86563.49it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83025.93it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83470.95it/s]
100%|██████████| 353/353 [00:00<00:00, 65798.12it/s]
100%|██████████| 252/252 [00:00<00:00, 76719.50it/s]
100%|██████████| 203/203 [00:00<00:00, 74232.23it/s]
100%|██████████| 153/153 [00:00<00:00, 79264.89it/s]
100%|██████████| 200/200 [00:00<00:00, 75403.22it/s]
100%|██████████| 65/65 [00:00<00:00, 71631.57it/s]
100%|██████████| 144/144 [00:00<00:00, 70814.84it/s]
100%|██████████| 30/30 [00:00<00:00, 49675.93it/s]
100%|██████████| 130/130 [00:00<00:00, 64072.80it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82408.84it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 162.44it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 89984.10it/s]
100%|██████████| 287/287 [00:00<00:00, 78217.37it/s]
100%|██████████| 771/771 [00:00<00:00, 89681.03it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95016.29it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80577.57it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88196.54it/s]
100%|██████████| 353/353 [00:00<00:00, 84162.65it/s]
100%|██████████| 252/252 [00:00<00:00, 76658.30it/s]
100%|██████████| 203/203 [00:00<00:00, 75737.74it/s]
100%|██████████| 153/153 [00:00<00:00, 73542.12it/s]
100%|██████████| 200/200 [00:00<00:00, 73122.45it/s]
100%|██████████| 65/65 [00:00<00:00, 62458.14it/s]
100%|██████████| 144/144 [00:00<00:00, 68556.16it/s]
100%|██████████| 30/30 [00:00<00:00, 58416.49it/s]
100%|██████████| 130/130 [00:00<00:00, 68336.82it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90562.89it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 158.58it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81705.63it/s]
100%|██████████| 287/287 [00:00<00:00, 80811.31it/s]
100%|██████████| 771/771 [00:00<00:00, 80519.11it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81257.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81422.24it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80003.26it/s]
100%|██████████| 353/353 [00:00<00:00, 78629.28it/s]
100%|██████████| 252/252 [00:00<00:00, 77620.96it/s]
100%|██████████| 203/203 [00:00<00:00, 78800.90it/s]
100%|██████████| 153/153 [00:00<00:00, 76160.52it/s]
100%|██████████| 200/200 [00:00<00:00, 76426.82it/s]
100%|██████████| 65/65 [00:00<00:00, 72915.15it/s]
100%|██████████| 144/144 [00:00<00:00, 78063.82it/s]
100%|██████████| 30/30 [00:00<00:00, 69557.28it/s]
100%|██████████| 130/130 [00:00<00:00, 77429.64it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92858.90it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 163.95it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 64145.46it/s]
100%|██████████| 287/287 [00:00<00:00, 81236.69it/s]
100%|██████████| 771/771 [00:00<00:00, 81443.82it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83085.14it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81050.92it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79167.69it/s]
100%|██████████| 353/353 [00:00<00:00, 80760.89it/s]
100%|██████████| 252/252 [00:00<00:00, 81669.34it/s]
100%|██████████| 203/203 [00:00<00:00, 79812.87it/s]
100%|██████████| 153/153 [00:00<00:00, 74880.81it/s]
100%|██████████| 200/200 [00:00<00:00, 78033.56it/s]
100%|██████████| 65/65 [00:00<00:00, 76516.91it/s]
100%|██████████| 144/144 [00:00<00:00, 50277.18it/s]
100%|██████████| 30/30 [00:00<00:00, 27455.62it/s]
100%|██████████| 130/130 [00:00<00:00, 69186.59it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74512.04it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [04:51<00:00, 20.08it/s]
INFO:root:The new embedding has 5826 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 52529.36it/s]
100%|██████████| 287/287 [00:00<00:00, 60971.75it/s]
100%|██████████| 771/771 [00:00<00:00, 74957.31it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77983.51it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74982.64it/s]
100%|██████████| 3000/3000 [00:00<00:00, 70569.20it/s]
100%|██████████| 353/353 [00:00<00:00, 73467.44it/s]
100%|██████████| 252/252 [00:00<00:00, 66555.29it/s]
100%|██████████| 203/203 [00:00<00:00, 61698.82it/s]
100%|██████████| 153/153 [00:00<00:00, 58739.45it/s]
100%|██████████| 200/200 [00:00<00:00, 70849.73it/s]
100%|██████████| 65/65 [00:00<00:00, 60557.48it/s]
100%|██████████| 144/144 [00:00<00:00, 64041.97it/s]
100%|██████████| 30/30 [00:00<00:00, 37572.15it/s]
100%|██████████| 130/130 [00:00<00:00, 63277.19it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74155.22it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [02:51<00:00, 34.02it/s]
INFO:root:The new embedding has 5826 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 52705.12it/s]
100%|██████████| 287/287 [00:00<00:00, 83041.20it/s]
100%|██████████| 771/771 [00:00<00:00, 90720.09it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92922.82it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90456.87it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88037.33it/s]
100%|██████████| 353/353 [00:00<00:00, 80664.09it/s]
100%|██████████| 252/252 [00:00<00:00, 72192.10it/s]
100%|██████████| 203/203 [00:00<00:00, 69290.67it/s]
100%|██████████| 153/153 [00:00<00:00, 68429.14it/s]
100%|██████████| 200/200 [00:00<00:00, 68939.91it/s]
100%|██████████| 65/65 [00:00<00:00, 68072.35it/s]
100%|██████████| 144/144 [00:00<00:00, 70873.01it/s]
100%|██████████| 30/30 [00:00<00:00, 58661.59it/s]
100%|██████████| 130/130 [00:00<00:00, 85263.41it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87733.31it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [02:52<00:00, 33.96it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 55356.63it/s]
100%|██████████| 287/287 [00:00<00:00, 73458.55it/s]
100%|██████████| 771/771 [00:00<00:00, 81259.63it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79118.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79848.92it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79877.30it/s]
100%|██████████| 353/353 [00:00<00:00, 76551.85it/s]
100%|██████████| 252/252 [00:00<00:00, 78836.77it/s]
100%|██████████| 203/203 [00:00<00:00, 79152.53it/s]
100%|██████████| 153/153 [00:00<00:00, 63790.11it/s]
100%|██████████| 200/200 [00:00<00:00, 62760.80it/s]
100%|██████████| 65/65 [00:00<00:00, 74836.61it/s]
100%|██████████| 144/144 [00:00<00:00, 73980.86it/s]
100%|██████████| 30/30 [00:00<00:00, 63905.09it/s]
100%|██████████| 130/130 [00:00<00:00, 71981.45it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78035.64it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [02:50<00:00, 34.30it/s]
INFO:root:The new embedding has 5826 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78650.58it/s]
100%|██████████| 287/287 [00:00<00:00, 75741.85it/s]
100%|██████████| 771/771 [00:00<00:00, 62130.08it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81357.49it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84617.17it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88408.47it/s]
100%|██████████| 353/353 [00:00<00:00, 80620.16it/s]
100%|██████████| 252/252 [00:00<00:00, 82504.46it/s]
100%|██████████| 203/203 [00:00<00:00, 78149.95it/s]
100%|██████████| 153/153 [00:00<00:00, 75899.29it/s]
100%|██████████| 200/200 [00:00<00:00, 75675.31it/s]
100%|██████████| 65/65 [00:00<00:00, 68915.51it/s]
100%|██████████| 144/144 [00:00<00:00, 74787.00it/s]
100%|██████████| 30/30 [00:00<00:00, 67396.42it/s]
100%|██████████| 130/130 [00:00<00:00, 74529.73it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77584.45it/s]
100%|██████████| 2034

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['extravert' 'extroversive']
['deviationism' 'desertion']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['kazakhstani' 'asian']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['latinist' 'classicist']


100%|██████████| 5846/5846 [00:35<00:00, 166.59it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 91101.22it/s]
100%|██████████| 287/287 [00:00<00:00, 80740.84it/s]
100%|██████████| 771/771 [00:00<00:00, 79548.57it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93281.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74978.62it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90997.21it/s]
100%|██████████| 353/353 [00:00<00:00, 72421.70it/s]
100%|██████████| 252/252 [00:00<00:00, 75068.51it/s]
100%|██████████| 203/203 [00:00<00:00, 73546.14it/s]
100%|██████████| 153/153 [00:00<00:00, 70372.68it/s]
100%|██████████| 200/200 [00:00<00:00, 71289.27it/s]
100%|██████████| 65/65 [00:00<00:00, 61375.45it/s]
100%|██████████| 144/144 [00:00<00:00, 72185.94it/s]
100%|██████████| 30/30 [00:00<00:00, 61832.49it/s]
100%|██████████| 130/130 [00:00<00:00, 66284.89it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90855.47it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:30<00:00, 193.39it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 82072.11it/s]
100%|██████████| 287/287 [00:00<00:00, 89927.18it/s]
100%|██████████| 771/771 [00:00<00:00, 91180.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96468.46it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81510.85it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84642.79it/s]
100%|██████████| 353/353 [00:00<00:00, 72156.99it/s]
100%|██████████| 252/252 [00:00<00:00, 82330.94it/s]
100%|██████████| 203/203 [00:00<00:00, 71167.14it/s]
100%|██████████| 153/153 [00:00<00:00, 69376.06it/s]
100%|██████████| 200/200 [00:00<00:00, 71368.11it/s]
100%|██████████| 65/65 [00:00<00:00, 69424.44it/s]
100%|██████████| 144/144 [00:00<00:00, 72865.22it/s]
100%|██████████| 30/30 [00:00<00:00, 53681.37it/s]
100%|██████████| 130/130 [00:00<00:00, 62130.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90680.93it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:40<00:00, 143.87it/s]
INFO:root:The new embedding has 5828 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 88520.33it/s]
100%|██████████| 287/287 [00:00<00:00, 77492.29it/s]
100%|██████████| 771/771 [00:00<00:00, 86042.16it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90417.87it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89750.37it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89336.82it/s]
100%|██████████| 353/353 [00:00<00:00, 71862.80it/s]
100%|██████████| 252/252 [00:00<00:00, 63397.59it/s]
100%|██████████| 203/203 [00:00<00:00, 69088.26it/s]
100%|██████████| 153/153 [00:00<00:00, 72931.98it/s]
100%|██████████| 200/200 [00:00<00:00, 74426.48it/s]
100%|██████████| 65/65 [00:00<00:00, 50996.96it/s]
100%|██████████| 144/144 [00:00<00:00, 66088.17it/s]
100%|██████████| 30/30 [00:00<00:00, 45872.81it/s]
100%|██████████| 130/130 [00:00<00:00, 61389.27it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87224.54it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:32<00:00, 179.58it/s]
INFO:root:The new embedding has 5828 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 92055.93it/s]
100%|██████████| 287/287 [00:00<00:00, 87216.73it/s]
100%|██████████| 771/771 [00:00<00:00, 89623.87it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93766.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88329.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78842.28it/s]
100%|██████████| 353/353 [00:00<00:00, 78040.76it/s]
100%|██████████| 252/252 [00:00<00:00, 76514.02it/s]
100%|██████████| 203/203 [00:00<00:00, 80805.14it/s]
100%|██████████| 153/153 [00:00<00:00, 78278.67it/s]
100%|██████████| 200/200 [00:00<00:00, 70807.87it/s]
100%|██████████| 65/65 [00:00<00:00, 64087.86it/s]
100%|██████████| 144/144 [00:00<00:00, 70731.91it/s]
100%|██████████| 30/30 [00:00<00:00, 53340.03it/s]
100%|██████████| 130/130 [00:00<00:00, 68225.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88854.84it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:33<00:00, 173.46it/s]
INFO:root:The new embedding has 5828 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 71907.29it/s]
100%|██████████| 287/287 [00:00<00:00, 75475.91it/s]
100%|██████████| 771/771 [00:00<00:00, 85210.10it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79981.39it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81777.85it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79556.11it/s]
100%|██████████| 353/353 [00:00<00:00, 76746.28it/s]
100%|██████████| 252/252 [00:00<00:00, 78497.19it/s]
100%|██████████| 203/203 [00:00<00:00, 76623.80it/s]
100%|██████████| 153/153 [00:00<00:00, 75595.30it/s]
100%|██████████| 200/200 [00:00<00:00, 76889.17it/s]
100%|██████████| 65/65 [00:00<00:00, 65646.46it/s]
100%|██████████| 144/144 [00:00<00:00, 78643.20it/s]
100%|██████████| 30/30 [00:00<00:00, 62076.53it/s]
100%|██████████| 130/130 [00:00<00:00, 74499.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80618.50it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:33<00:00, 176.71it/s]
INFO:root:The new embedding has 5828 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 62283.31it/s]
100%|██████████| 287/287 [00:00<00:00, 72511.61it/s]
100%|██████████| 771/771 [00:00<00:00, 84997.33it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88239.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94850.84it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96531.74it/s]
100%|██████████| 353/353 [00:00<00:00, 79439.28it/s]
100%|██████████| 252/252 [00:00<00:00, 77872.59it/s]
100%|██████████| 203/203 [00:00<00:00, 80736.18it/s]
100%|██████████| 153/153 [00:00<00:00, 74994.57it/s]
100%|██████████| 200/200 [00:00<00:00, 75382.89it/s]
100%|██████████| 65/65 [00:00<00:00, 77849.73it/s]
100%|██████████| 144/144 [00:00<00:00, 80487.71it/s]
100%|██████████| 30/30 [00:00<00:00, 64660.39it/s]
100%|██████████| 130/130 [00:00<00:00, 49438.71it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78898.35it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
['constrict' 'astringe']


100%|██████████| 5846/5846 [00:47<00:00, 123.31it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 24861.07it/s]
100%|██████████| 287/287 [00:00<00:00, 52036.71it/s]
100%|██████████| 771/771 [00:00<00:00, 63104.86it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93984.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86290.12it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89964.69it/s]
100%|██████████| 353/353 [00:00<00:00, 81119.29it/s]
100%|██████████| 252/252 [00:00<00:00, 71731.56it/s]
100%|██████████| 203/203 [00:00<00:00, 71779.10it/s]
100%|██████████| 153/153 [00:00<00:00, 68795.94it/s]
100%|██████████| 200/200 [00:00<00:00, 86125.34it/s]
100%|██████████| 65/65 [00:00<00:00, 60383.11it/s]
100%|██████████| 144/144 [00:00<00:00, 81541.75it/s]
100%|██████████| 30/30 [00:00<00:00, 64826.96it/s]
100%|██████████| 130/130 [00:00<00:00, 81956.94it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86883.31it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 147.63it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 90374.21it/s]
100%|██████████| 287/287 [00:00<00:00, 85506.84it/s]
100%|██████████| 771/771 [00:00<00:00, 89808.05it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90765.17it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83849.19it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80866.00it/s]
100%|██████████| 353/353 [00:00<00:00, 53535.92it/s]
100%|██████████| 252/252 [00:00<00:00, 53891.02it/s]
100%|██████████| 203/203 [00:00<00:00, 53112.33it/s]
100%|██████████| 153/153 [00:00<00:00, 51186.77it/s]
100%|██████████| 200/200 [00:00<00:00, 53403.41it/s]
100%|██████████| 65/65 [00:00<00:00, 50375.05it/s]
100%|██████████| 144/144 [00:00<00:00, 74547.00it/s]
100%|██████████| 30/30 [00:00<00:00, 50051.36it/s]
100%|██████████| 130/130 [00:00<00:00, 64291.89it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82580.83it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 144.67it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 52232.73it/s]
100%|██████████| 287/287 [00:00<00:00, 74219.45it/s]
100%|██████████| 771/771 [00:00<00:00, 77696.56it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92148.08it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80938.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80781.38it/s]
100%|██████████| 353/353 [00:00<00:00, 87196.07it/s]
100%|██████████| 252/252 [00:00<00:00, 78045.09it/s]
100%|██████████| 203/203 [00:00<00:00, 79925.25it/s]
100%|██████████| 153/153 [00:00<00:00, 73457.93it/s]
100%|██████████| 200/200 [00:00<00:00, 74006.25it/s]
100%|██████████| 65/65 [00:00<00:00, 66903.01it/s]
100%|██████████| 144/144 [00:00<00:00, 73782.04it/s]
100%|██████████| 30/30 [00:00<00:00, 69442.12it/s]
100%|██████████| 130/130 [00:00<00:00, 72507.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 101003.59it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 143.24it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 63304.27it/s]
100%|██████████| 287/287 [00:00<00:00, 76487.82it/s]
100%|██████████| 771/771 [00:00<00:00, 83931.80it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83510.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87129.02it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77847.69it/s]
100%|██████████| 353/353 [00:00<00:00, 77680.45it/s]
100%|██████████| 252/252 [00:00<00:00, 78235.72it/s]
100%|██████████| 203/203 [00:00<00:00, 77906.83it/s]
100%|██████████| 153/153 [00:00<00:00, 76523.79it/s]
100%|██████████| 200/200 [00:00<00:00, 77917.59it/s]
100%|██████████| 65/65 [00:00<00:00, 70428.77it/s]
100%|██████████| 144/144 [00:00<00:00, 77018.59it/s]
100%|██████████| 30/30 [00:00<00:00, 67001.66it/s]
100%|██████████| 130/130 [00:00<00:00, 75343.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78698.29it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.08it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 90162.24it/s]
100%|██████████| 287/287 [00:00<00:00, 74384.55it/s]
100%|██████████| 771/771 [00:00<00:00, 83339.13it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92104.57it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88262.12it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87755.51it/s]
100%|██████████| 353/353 [00:00<00:00, 68800.62it/s]
100%|██████████| 252/252 [00:00<00:00, 73222.35it/s]
100%|██████████| 203/203 [00:00<00:00, 70812.02it/s]
100%|██████████| 153/153 [00:00<00:00, 69278.69it/s]
100%|██████████| 200/200 [00:00<00:00, 76267.01it/s]
100%|██████████| 65/65 [00:00<00:00, 65035.73it/s]
100%|██████████| 144/144 [00:00<00:00, 67581.94it/s]
100%|██████████| 30/30 [00:00<00:00, 55043.36it/s]
100%|██████████| 130/130 [00:00<00:00, 65441.61it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78633.79it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 162.70it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 71105.58it/s]
100%|██████████| 287/287 [00:00<00:00, 82574.10it/s]
100%|██████████| 771/771 [00:00<00:00, 87122.38it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91856.47it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84753.96it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82014.51it/s]
100%|██████████| 353/353 [00:00<00:00, 86919.65it/s]
100%|██████████| 252/252 [00:00<00:00, 51990.39it/s]
100%|██████████| 203/203 [00:00<00:00, 76768.89it/s]
100%|██████████| 153/153 [00:00<00:00, 62140.85it/s]
100%|██████████| 200/200 [00:00<00:00, 70397.85it/s]
100%|██████████| 65/65 [00:00<00:00, 55065.59it/s]
100%|██████████| 144/144 [00:00<00:00, 57260.12it/s]
100%|██████████| 30/30 [00:00<00:00, 56936.25it/s]
100%|██████████| 130/130 [00:00<00:00, 64935.04it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79414.37it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 156.05it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 50250.16it/s]
100%|██████████| 287/287 [00:00<00:00, 79529.95it/s]
100%|██████████| 771/771 [00:00<00:00, 81082.38it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78578.13it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88015.78it/s]
100%|██████████| 3000/3000 [00:00<00:00, 103268.13it/s]
100%|██████████| 353/353 [00:00<00:00, 75842.09it/s]
100%|██████████| 252/252 [00:00<00:00, 42290.43it/s]
100%|██████████| 203/203 [00:00<00:00, 53712.07it/s]
100%|██████████| 153/153 [00:00<00:00, 67238.95it/s]
100%|██████████| 200/200 [00:00<00:00, 73448.98it/s]
100%|██████████| 65/65 [00:00<00:00, 70960.37it/s]
100%|██████████| 144/144 [00:00<00:00, 74053.43it/s]
100%|██████████| 30/30 [00:00<00:00, 58362.30it/s]
100%|██████████| 130/130 [00:00<00:00, 75125.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87126.18it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 167.00it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79507.21it/s]
100%|██████████| 287/287 [00:00<00:00, 76062.51it/s]
100%|██████████| 771/771 [00:00<00:00, 77926.85it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92535.36it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82089.95it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92685.66it/s]
100%|██████████| 353/353 [00:00<00:00, 77721.22it/s]
100%|██████████| 252/252 [00:00<00:00, 79286.22it/s]
100%|██████████| 203/203 [00:00<00:00, 76596.23it/s]
100%|██████████| 153/153 [00:00<00:00, 72372.68it/s]
100%|██████████| 200/200 [00:00<00:00, 67688.28it/s]
100%|██████████| 65/65 [00:00<00:00, 59036.33it/s]
100%|██████████| 144/144 [00:00<00:00, 80348.51it/s]
100%|██████████| 30/30 [00:00<00:00, 68871.99it/s]
100%|██████████| 130/130 [00:00<00:00, 77805.30it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78546.28it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 167.69it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 84386.15it/s]
100%|██████████| 287/287 [00:00<00:00, 78569.63it/s]
100%|██████████| 771/771 [00:00<00:00, 86802.00it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93974.21it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81340.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92572.46it/s]
100%|██████████| 353/353 [00:00<00:00, 77856.09it/s]
100%|██████████| 252/252 [00:00<00:00, 73055.34it/s]
100%|██████████| 203/203 [00:00<00:00, 83968.81it/s]
100%|██████████| 153/153 [00:00<00:00, 68995.65it/s]
100%|██████████| 200/200 [00:00<00:00, 63281.59it/s]
100%|██████████| 65/65 [00:00<00:00, 57432.01it/s]
100%|██████████| 144/144 [00:00<00:00, 66819.31it/s]
100%|██████████| 30/30 [00:00<00:00, 58092.85it/s]
100%|██████████| 130/130 [00:00<00:00, 67885.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81847.38it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.94it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 91962.99it/s]
100%|██████████| 287/287 [00:00<00:00, 89253.74it/s]
100%|██████████| 771/771 [00:00<00:00, 92717.71it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94642.16it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93721.18it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82971.18it/s]
100%|██████████| 353/353 [00:00<00:00, 73101.08it/s]
100%|██████████| 252/252 [00:00<00:00, 71931.71it/s]
100%|██████████| 203/203 [00:00<00:00, 70071.90it/s]
100%|██████████| 153/153 [00:00<00:00, 71910.41it/s]
100%|██████████| 200/200 [00:00<00:00, 71881.82it/s]
100%|██████████| 65/65 [00:00<00:00, 63653.92it/s]
100%|██████████| 144/144 [00:00<00:00, 73782.04it/s]
100%|██████████| 30/30 [00:00<00:00, 66017.38it/s]
100%|██████████| 130/130 [00:00<00:00, 66503.17it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85559.13it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.34it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 92500.99it/s]
100%|██████████| 287/287 [00:00<00:00, 78186.88it/s]
100%|██████████| 771/771 [00:00<00:00, 79750.63it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78259.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80497.15it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87469.41it/s]
100%|██████████| 353/353 [00:00<00:00, 87175.54it/s]
100%|██████████| 252/252 [00:00<00:00, 80807.69it/s]
100%|██████████| 203/203 [00:00<00:00, 80705.57it/s]
100%|██████████| 153/153 [00:00<00:00, 81365.35it/s]
100%|██████████| 200/200 [00:00<00:00, 79800.30it/s]
100%|██████████| 65/65 [00:00<00:00, 74124.46it/s]
100%|██████████| 144/144 [00:00<00:00, 77136.63it/s]
100%|██████████| 30/30 [00:00<00:00, 56375.05it/s]
100%|██████████| 130/130 [00:00<00:00, 74898.29it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87610.79it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.02it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 96499.61it/s]
100%|██████████| 287/287 [00:00<00:00, 75357.78it/s]
100%|██████████| 771/771 [00:00<00:00, 81019.40it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79221.52it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77402.82it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79083.60it/s]
100%|██████████| 353/353 [00:00<00:00, 79941.11it/s]
100%|██████████| 252/252 [00:00<00:00, 79066.77it/s]
100%|██████████| 203/203 [00:00<00:00, 77892.57it/s]
100%|██████████| 153/153 [00:00<00:00, 76578.58it/s]
100%|██████████| 200/200 [00:00<00:00, 77737.08it/s]
100%|██████████| 65/65 [00:00<00:00, 70519.86it/s]
100%|██████████| 144/144 [00:00<00:00, 79565.25it/s]
100%|██████████| 30/30 [00:00<00:00, 69136.88it/s]
100%|██████████| 130/130 [00:00<00:00, 78218.26it/s]
100%|██████████| 3500/3500 [00:00<00:00, 70425.21it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 146.64it/s]
INFO:root:The new embedding has 5843 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 90618.52it/s]
100%|██████████| 287/287 [00:00<00:00, 80719.19it/s]
100%|██████████| 771/771 [00:00<00:00, 95081.25it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94569.61it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94951.76it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89864.46it/s]
100%|██████████| 353/353 [00:00<00:00, 89004.47it/s]
100%|██████████| 252/252 [00:00<00:00, 71204.84it/s]
100%|██████████| 203/203 [00:00<00:00, 69664.84it/s]
100%|██████████| 153/153 [00:00<00:00, 82601.17it/s]
100%|██████████| 200/200 [00:00<00:00, 88319.73it/s]
100%|██████████| 65/65 [00:00<00:00, 64390.59it/s]
100%|██████████| 144/144 [00:00<00:00, 66576.25it/s]
100%|██████████| 30/30 [00:00<00:00, 42930.44it/s]
100%|██████████| 130/130 [00:00<00:00, 73110.69it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87993.62it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 163.24it/s]
INFO:root:The new embedding has 5843 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 92439.77it/s]
100%|██████████| 287/287 [00:00<00:00, 79894.16it/s]
100%|██████████| 771/771 [00:00<00:00, 85127.10it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81036.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72656.32it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87957.95it/s]
100%|██████████| 353/353 [00:00<00:00, 74114.70it/s]
100%|██████████| 252/252 [00:00<00:00, 71966.00it/s]
100%|██████████| 203/203 [00:00<00:00, 71202.85it/s]
100%|██████████| 153/153 [00:00<00:00, 64612.21it/s]
100%|██████████| 200/200 [00:00<00:00, 70338.82it/s]
100%|██████████| 65/65 [00:00<00:00, 70174.97it/s]
100%|██████████| 144/144 [00:00<00:00, 68978.96it/s]
100%|██████████| 30/30 [00:00<00:00, 43736.23it/s]
100%|██████████| 130/130 [00:00<00:00, 78760.58it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89333.37it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.31it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 83834.05it/s]
100%|██████████| 287/287 [00:00<00:00, 75207.13it/s]
100%|██████████| 771/771 [00:00<00:00, 81055.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84348.31it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82133.35it/s]
100%|██████████| 3000/3000 [00:00<00:00, 97411.32it/s]
100%|██████████| 353/353 [00:00<00:00, 78708.70it/s]
100%|██████████| 252/252 [00:00<00:00, 86149.21it/s]
100%|██████████| 203/203 [00:00<00:00, 79027.63it/s]
100%|██████████| 153/153 [00:00<00:00, 77223.65it/s]
100%|██████████| 200/200 [00:00<00:00, 77421.39it/s]
100%|██████████| 65/65 [00:00<00:00, 68157.44it/s]
100%|██████████| 144/144 [00:00<00:00, 78235.72it/s]
100%|██████████| 30/30 [00:00<00:00, 61380.06it/s]
100%|██████████| 130/130 [00:00<00:00, 76057.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78393.18it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 163.25it/s]
INFO:root:The new embedding has 5843 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 88773.51it/s]
100%|██████████| 287/287 [00:00<00:00, 69872.61it/s]
100%|██████████| 771/771 [00:00<00:00, 93984.20it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89458.45it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76626.49it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79992.07it/s]
100%|██████████| 353/353 [00:00<00:00, 78683.60it/s]
100%|██████████| 252/252 [00:00<00:00, 72959.52it/s]
100%|██████████| 203/203 [00:00<00:00, 71107.71it/s]
100%|██████████| 153/153 [00:00<00:00, 75899.29it/s]
100%|██████████| 200/200 [00:00<00:00, 73934.50it/s]
100%|██████████| 65/65 [00:00<00:00, 64742.28it/s]
100%|██████████| 144/144 [00:00<00:00, 72203.20it/s]
100%|██████████| 30/30 [00:00<00:00, 63517.98it/s]
100%|██████████| 130/130 [00:00<00:00, 73843.38it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87741.18it/s]
100%|██████████| 203

['monsignori' 'priest']
['nondescripts' 'person']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 164.45it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 82609.32it/s]
100%|██████████| 287/287 [00:00<00:00, 85671.14it/s]
100%|██████████| 771/771 [00:00<00:00, 86449.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88037.95it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89229.12it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92769.71it/s]
100%|██████████| 353/353 [00:00<00:00, 69131.50it/s]
100%|██████████| 252/252 [00:00<00:00, 83594.16it/s]
100%|██████████| 203/203 [00:00<00:00, 64635.52it/s]
100%|██████████| 153/153 [00:00<00:00, 68290.79it/s]
100%|██████████| 200/200 [00:00<00:00, 70963.61it/s]
100%|██████████| 65/65 [00:00<00:00, 58216.90it/s]
100%|██████████| 144/144 [00:00<00:00, 64617.50it/s]
100%|██████████| 30/30 [00:00<00:00, 62045.92it/s]
100%|██████████| 130/130 [00:00<00:00, 65868.51it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87207.44it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 155.61it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 80299.53it/s]
100%|██████████| 287/287 [00:00<00:00, 74018.65it/s]
100%|██████████| 771/771 [00:00<00:00, 85345.03it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79882.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72622.35it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92216.28it/s]
100%|██████████| 353/353 [00:00<00:00, 90805.85it/s]
100%|██████████| 252/252 [00:00<00:00, 88323.27it/s]
100%|██████████| 203/203 [00:00<00:00, 78582.71it/s]
100%|██████████| 153/153 [00:00<00:00, 66062.23it/s]
100%|██████████| 200/200 [00:00<00:00, 68094.88it/s]
100%|██████████| 65/65 [00:00<00:00, 55604.68it/s]
100%|██████████| 144/144 [00:00<00:00, 62731.59it/s]
100%|██████████| 30/30 [00:00<00:00, 41228.41it/s]
100%|██████████| 130/130 [00:00<00:00, 71229.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84666.46it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 153.55it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80330.32it/s]
100%|██████████| 287/287 [00:00<00:00, 68778.73it/s]
100%|██████████| 771/771 [00:00<00:00, 58888.60it/s]
100%|██████████| 2000/2000 [00:00<00:00, 59399.31it/s]
100%|██████████| 1000/1000 [00:00<00:00, 59455.72it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78744.09it/s]
100%|██████████| 353/353 [00:00<00:00, 74382.78it/s]
100%|██████████| 252/252 [00:00<00:00, 76825.45it/s]
100%|██████████| 203/203 [00:00<00:00, 57885.90it/s]
100%|██████████| 153/153 [00:00<00:00, 57343.27it/s]
100%|██████████| 200/200 [00:00<00:00, 55513.26it/s]
100%|██████████| 65/65 [00:00<00:00, 54624.28it/s]
100%|██████████| 144/144 [00:00<00:00, 57379.80it/s]
100%|██████████| 30/30 [00:00<00:00, 43904.09it/s]
100%|██████████| 130/130 [00:00<00:00, 56803.78it/s]
100%|██████████| 3500/3500 [00:00<00:00, 57743.47it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 155.92it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77255.56it/s]
100%|██████████| 287/287 [00:00<00:00, 80540.96it/s]
100%|██████████| 771/771 [00:00<00:00, 79256.12it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80953.15it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79514.38it/s]
100%|██████████| 3000/3000 [00:00<00:00, 99042.17it/s]
100%|██████████| 353/353 [00:00<00:00, 80694.86it/s]
100%|██████████| 252/252 [00:00<00:00, 77849.64it/s]
100%|██████████| 203/203 [00:00<00:00, 81205.89it/s]
100%|██████████| 153/153 [00:00<00:00, 76945.86it/s]
100%|██████████| 200/200 [00:00<00:00, 80350.65it/s]
100%|██████████| 65/65 [00:00<00:00, 76818.75it/s]
100%|██████████| 144/144 [00:00<00:00, 105461.81it/s]
100%|██████████| 30/30 [00:00<00:00, 70217.14it/s]
100%|██████████| 130/130 [00:00<00:00, 76484.71it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78833.10it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 171.02it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 93468.73it/s]
100%|██████████| 287/287 [00:00<00:00, 73570.79it/s]
100%|██████████| 771/771 [00:00<00:00, 93196.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90222.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85825.74it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78475.46it/s]
100%|██████████| 353/353 [00:00<00:00, 71650.66it/s]
100%|██████████| 252/252 [00:00<00:00, 73558.68it/s]
100%|██████████| 203/203 [00:00<00:00, 73223.57it/s]
100%|██████████| 153/153 [00:00<00:00, 71287.33it/s]
100%|██████████| 200/200 [00:00<00:00, 72553.26it/s]
100%|██████████| 65/65 [00:00<00:00, 64390.59it/s]
100%|██████████| 144/144 [00:00<00:00, 72751.12it/s]
100%|██████████| 30/30 [00:00<00:00, 64067.78it/s]
100%|██████████| 130/130 [00:00<00:00, 63915.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91475.40it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 176.47it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 92849.44it/s]
100%|██████████| 287/287 [00:00<00:00, 82966.80it/s]
100%|██████████| 771/771 [00:00<00:00, 94398.47it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83531.90it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74393.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90755.68it/s]
100%|██████████| 353/353 [00:00<00:00, 75990.01it/s]
100%|██████████| 252/252 [00:00<00:00, 85660.48it/s]
100%|██████████| 203/203 [00:00<00:00, 74537.66it/s]
100%|██████████| 153/153 [00:00<00:00, 68174.71it/s]
100%|██████████| 200/200 [00:00<00:00, 71101.95it/s]
100%|██████████| 65/65 [00:00<00:00, 62017.69it/s]
100%|██████████| 144/144 [00:00<00:00, 69375.12it/s]
100%|██████████| 30/30 [00:00<00:00, 61893.32it/s]
100%|██████████| 130/130 [00:00<00:00, 69204.15it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87332.47it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:36<00:00, 160.93it/s]
INFO:root:The new embedding has 5832 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 89137.99it/s]
100%|██████████| 287/287 [00:00<00:00, 72787.84it/s]
100%|██████████| 771/771 [00:00<00:00, 91974.07it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84261.89it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81498.18it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90643.23it/s]
100%|██████████| 353/353 [00:00<00:00, 77538.06it/s]
100%|██████████| 252/252 [00:00<00:00, 64539.57it/s]
100%|██████████| 203/203 [00:00<00:00, 85135.86it/s]
100%|██████████| 153/153 [00:00<00:00, 69443.62it/s]
100%|██████████| 200/200 [00:00<00:00, 70115.41it/s]
100%|██████████| 65/65 [00:00<00:00, 62962.99it/s]
100%|██████████| 144/144 [00:00<00:00, 84995.75it/s]
100%|██████████| 30/30 [00:00<00:00, 63517.98it/s]
100%|██████████| 130/130 [00:00<00:00, 78308.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89444.41it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 166.98it/s]
INFO:root:The new embedding has 5832 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 92662.59it/s]
100%|██████████| 287/287 [00:00<00:00, 70022.99it/s]
100%|██████████| 771/771 [00:00<00:00, 88309.58it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92393.69it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86831.40it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87746.95it/s]
100%|██████████| 353/353 [00:00<00:00, 77323.44it/s]
100%|██████████| 252/252 [00:00<00:00, 72162.53it/s]
100%|██████████| 203/203 [00:00<00:00, 71018.74it/s]
100%|██████████| 153/153 [00:00<00:00, 69722.78it/s]
100%|██████████| 200/200 [00:00<00:00, 70097.84it/s]
100%|██████████| 65/65 [00:00<00:00, 63402.27it/s]
100%|██████████| 144/144 [00:00<00:00, 67794.34it/s]
100%|██████████| 30/30 [00:00<00:00, 64693.63it/s]
100%|██████████| 130/130 [00:00<00:00, 70611.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88618.30it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 162.77it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80918.27it/s]
100%|██████████| 287/287 [00:00<00:00, 68442.42it/s]
100%|██████████| 771/771 [00:00<00:00, 75982.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79243.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81201.56it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80772.05it/s]
100%|██████████| 353/353 [00:00<00:00, 78197.39it/s]
100%|██████████| 252/252 [00:00<00:00, 78282.08it/s]
100%|██████████| 203/203 [00:00<00:00, 79351.70it/s]
100%|██████████| 153/153 [00:00<00:00, 80135.93it/s]
100%|██████████| 200/200 [00:00<00:00, 76440.75it/s]
100%|██████████| 65/65 [00:00<00:00, 74428.00it/s]
100%|██████████| 144/144 [00:00<00:00, 74666.80it/s]
100%|██████████| 30/30 [00:00<00:00, 59747.92it/s]
100%|██████████| 130/130 [00:00<00:00, 74336.68it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86832.94it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 167.68it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 85388.72it/s]
100%|██████████| 287/287 [00:00<00:00, 61564.22it/s]
100%|██████████| 771/771 [00:00<00:00, 71704.66it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95670.81it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79698.71it/s]
100%|██████████| 3000/3000 [00:00<00:00, 94684.54it/s]
100%|██████████| 353/353 [00:00<00:00, 77733.47it/s]
100%|██████████| 252/252 [00:00<00:00, 79084.52it/s]
100%|██████████| 203/203 [00:00<00:00, 76225.94it/s]
100%|██████████| 153/153 [00:00<00:00, 75117.47it/s]
100%|██████████| 200/200 [00:00<00:00, 76371.16it/s]
100%|██████████| 65/65 [00:00<00:00, 66919.43it/s]
100%|██████████| 144/144 [00:00<00:00, 74620.68it/s]
100%|██████████| 30/30 [00:00<00:00, 64329.82it/s]
100%|██████████| 130/130 [00:00<00:00, 62024.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90312.18it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 168.76it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 91631.16it/s]
100%|██████████| 287/287 [00:00<00:00, 69433.31it/s]
100%|██████████| 771/771 [00:00<00:00, 94230.68it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94985.09it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75137.11it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81413.81it/s]
100%|██████████| 353/353 [00:00<00:00, 82890.46it/s]
100%|██████████| 252/252 [00:00<00:00, 71926.82it/s]
100%|██████████| 203/203 [00:00<00:00, 71155.25it/s]
100%|██████████| 153/153 [00:00<00:00, 69032.76it/s]
100%|██████████| 200/200 [00:00<00:00, 70688.53it/s]
100%|██████████| 65/65 [00:00<00:00, 71164.12it/s]
100%|██████████| 144/144 [00:00<00:00, 69791.98it/s]
100%|██████████| 30/30 [00:00<00:00, 57430.00it/s]
100%|██████████| 130/130 [00:00<00:00, 81846.22it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77816.81it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 172.29it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 85564.83it/s]
100%|██████████| 287/287 [00:00<00:00, 86657.93it/s]
100%|██████████| 771/771 [00:00<00:00, 75978.77it/s]
100%|██████████| 2000/2000 [00:00<00:00, 71252.33it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73469.57it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92166.30it/s]
100%|██████████| 353/353 [00:00<00:00, 71786.15it/s]
100%|██████████| 252/252 [00:00<00:00, 73779.46it/s]
100%|██████████| 203/203 [00:00<00:00, 73393.99it/s]
100%|██████████| 153/153 [00:00<00:00, 70854.42it/s]
100%|██████████| 200/200 [00:00<00:00, 73218.19it/s]
100%|██████████| 65/65 [00:00<00:00, 70356.07it/s]
100%|██████████| 144/144 [00:00<00:00, 74253.72it/s]
100%|██████████| 30/30 [00:00<00:00, 67759.35it/s]
100%|██████████| 130/130 [00:00<00:00, 74275.92it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90633.34it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:57<00:00, 102.15it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 67557.35it/s]
100%|██████████| 287/287 [00:00<00:00, 72831.88it/s]
100%|██████████| 771/771 [00:00<00:00, 89120.00it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79418.77it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91032.10it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90399.68it/s]
100%|██████████| 353/353 [00:00<00:00, 59060.57it/s]
100%|██████████| 252/252 [00:00<00:00, 87780.47it/s]
100%|██████████| 203/203 [00:00<00:00, 72910.06it/s]
100%|██████████| 153/153 [00:00<00:00, 74776.10it/s]
100%|██████████| 200/200 [00:00<00:00, 71593.48it/s]
100%|██████████| 65/65 [00:00<00:00, 60116.82it/s]
100%|██████████| 144/144 [00:00<00:00, 68161.58it/s]
100%|██████████| 30/30 [00:00<00:00, 55602.79it/s]
100%|██████████| 130/130 [00:00<00:00, 67357.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84142.84it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 128.92it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 88412.00it/s]
100%|██████████| 287/287 [00:00<00:00, 81722.01it/s]
100%|██████████| 771/771 [00:00<00:00, 87258.73it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88889.68it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81594.90it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85531.13it/s]
100%|██████████| 353/353 [00:00<00:00, 68318.07it/s]
100%|██████████| 252/252 [00:00<00:00, 79120.04it/s]
100%|██████████| 203/203 [00:00<00:00, 67892.81it/s]
100%|██████████| 153/153 [00:00<00:00, 38037.37it/s]
100%|██████████| 200/200 [00:00<00:00, 48080.52it/s]
100%|██████████| 65/65 [00:00<00:00, 30736.16it/s]
100%|██████████| 144/144 [00:00<00:00, 67483.77it/s]
100%|██████████| 30/30 [00:00<00:00, 16456.86it/s]
100%|██████████| 130/130 [00:00<00:00, 59299.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85637.49it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 131.25it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 61265.18it/s]
100%|██████████| 287/287 [00:00<00:00, 77812.88it/s]
100%|██████████| 771/771 [00:00<00:00, 79644.57it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79628.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 98363.17it/s]
100%|██████████| 3000/3000 [00:00<00:00, 103124.25it/s]
100%|██████████| 353/353 [00:00<00:00, 76559.77it/s]
100%|██████████| 252/252 [00:00<00:00, 76786.39it/s]
100%|██████████| 203/203 [00:00<00:00, 62795.47it/s]
100%|██████████| 153/153 [00:00<00:00, 78050.17it/s]
100%|██████████| 200/200 [00:00<00:00, 78026.30it/s]
100%|██████████| 65/65 [00:00<00:00, 56062.05it/s]
100%|██████████| 144/144 [00:00<00:00, 72306.93it/s]
100%|██████████| 30/30 [00:00<00:00, 69136.88it/s]
100%|██████████| 130/130 [00:00<00:00, 77639.12it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84035.90it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 133.38it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 83211.39it/s]
100%|██████████| 287/287 [00:00<00:00, 72472.32it/s]
100%|██████████| 771/771 [00:00<00:00, 83001.16it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79997.41it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79119.90it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88587.10it/s]
100%|██████████| 353/353 [00:00<00:00, 77860.19it/s]
100%|██████████| 252/252 [00:00<00:00, 76419.97it/s]
100%|██████████| 203/203 [00:00<00:00, 74038.58it/s]
100%|██████████| 153/153 [00:00<00:00, 78662.48it/s]
100%|██████████| 200/200 [00:00<00:00, 79982.91it/s]
100%|██████████| 65/65 [00:00<00:00, 70776.16it/s]
100%|██████████| 144/144 [00:00<00:00, 75206.05it/s]
100%|██████████| 30/30 [00:00<00:00, 63421.94it/s]
100%|██████████| 130/130 [00:00<00:00, 53331.33it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77922.97it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [01:03<00:00, 91.50it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 89411.90it/s]
100%|██████████| 287/287 [00:00<00:00, 80384.99it/s]
100%|██████████| 771/771 [00:00<00:00, 86211.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83116.42it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85557.88it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74616.70it/s]
100%|██████████| 353/353 [00:00<00:00, 79443.54it/s]
100%|██████████| 252/252 [00:00<00:00, 73217.28it/s]
100%|██████████| 203/203 [00:00<00:00, 50396.19it/s]
100%|██████████| 153/153 [00:00<00:00, 67893.41it/s]
100%|██████████| 200/200 [00:00<00:00, 65108.72it/s]
100%|██████████| 65/65 [00:00<00:00, 64405.80it/s]
100%|██████████| 144/144 [00:00<00:00, 42277.74it/s]
100%|██████████| 30/30 [00:00<00:00, 24174.66it/s]
100%|██████████| 130/130 [00:00<00:00, 60557.48it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76788.62it/s]
100%|██████████| 2034

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 156.18it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 85021.40it/s]
100%|██████████| 287/287 [00:00<00:00, 65475.40it/s]
100%|██████████| 771/771 [00:00<00:00, 61703.30it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85884.61it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89627.63it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90831.02it/s]
100%|██████████| 353/353 [00:00<00:00, 74133.25it/s]
100%|██████████| 252/252 [00:00<00:00, 70899.16it/s]
100%|██████████| 203/203 [00:00<00:00, 78604.48it/s]
100%|██████████| 153/153 [00:00<00:00, 75926.23it/s]
100%|██████████| 200/200 [00:00<00:00, 87281.32it/s]
100%|██████████| 65/65 [00:00<00:00, 65725.59it/s]
100%|██████████| 144/144 [00:00<00:00, 66701.25it/s]
100%|██████████| 30/30 [00:00<00:00, 55800.05it/s]
100%|██████████| 130/130 [00:00<00:00, 68396.83it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88768.88it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 147.53it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 60480.80it/s]
100%|██████████| 287/287 [00:00<00:00, 68140.23it/s]
100%|██████████| 771/771 [00:00<00:00, 73312.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87210.55it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77701.07it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85748.54it/s]
100%|██████████| 353/353 [00:00<00:00, 85071.78it/s]
100%|██████████| 252/252 [00:00<00:00, 72868.98it/s]
100%|██████████| 203/203 [00:00<00:00, 76534.27it/s]
100%|██████████| 153/153 [00:00<00:00, 70357.25it/s]
100%|██████████| 200/200 [00:00<00:00, 61853.77it/s]
100%|██████████| 65/65 [00:00<00:00, 72009.97it/s]
100%|██████████| 144/144 [00:00<00:00, 74198.99it/s]
100%|██████████| 30/30 [00:00<00:00, 68759.08it/s]
100%|██████████| 130/130 [00:00<00:00, 57233.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87470.89it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.09it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79700.79it/s]
100%|██████████| 287/287 [00:00<00:00, 78421.19it/s]
100%|██████████| 771/771 [00:00<00:00, 68605.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80907.08it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78587.70it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84146.37it/s]
100%|██████████| 353/353 [00:00<00:00, 72734.79it/s]
100%|██████████| 252/252 [00:00<00:00, 73789.77it/s]
100%|██████████| 203/203 [00:00<00:00, 77871.20it/s]
100%|██████████| 153/153 [00:00<00:00, 80934.36it/s]
100%|██████████| 200/200 [00:00<00:00, 78004.54it/s]
100%|██████████| 65/65 [00:00<00:00, 67117.12it/s]
100%|██████████| 144/144 [00:00<00:00, 75905.46it/s]
100%|██████████| 30/30 [00:00<00:00, 58200.33it/s]
100%|██████████| 130/130 [00:00<00:00, 77683.36it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71493.59it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [01:00<00:00, 97.11it/s] 
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 68103.07it/s]
100%|██████████| 287/287 [00:00<00:00, 70751.45it/s]
100%|██████████| 771/771 [00:00<00:00, 73651.32it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87124.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74392.15it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76320.67it/s]
100%|██████████| 353/353 [00:00<00:00, 72280.28it/s]
100%|██████████| 252/252 [00:00<00:00, 72295.80it/s]
100%|██████████| 203/203 [00:00<00:00, 69721.89it/s]
100%|██████████| 153/153 [00:00<00:00, 70318.71it/s]
100%|██████████| 200/200 [00:00<00:00, 71660.76it/s]
100%|██████████| 65/65 [00:00<00:00, 66560.00it/s]
100%|██████████| 144/144 [00:00<00:00, 70476.05it/s]
100%|██████████| 30/30 [00:00<00:00, 45442.08it/s]
100%|██████████| 130/130 [00:00<00:00, 64201.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91240.03it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:52<00:00, 112.32it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 77072.25it/s]
100%|██████████| 287/287 [00:00<00:00, 79693.16it/s]
100%|██████████| 771/771 [00:00<00:00, 78737.03it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84271.20it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85284.75it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82004.35it/s]
100%|██████████| 353/353 [00:00<00:00, 75259.97it/s]
100%|██████████| 252/252 [00:00<00:00, 70643.27it/s]
100%|██████████| 203/203 [00:00<00:00, 79277.81it/s]
100%|██████████| 153/153 [00:00<00:00, 72015.32it/s]
100%|██████████| 200/200 [00:00<00:00, 77621.99it/s]
100%|██████████| 65/65 [00:00<00:00, 62045.92it/s]
100%|██████████| 144/144 [00:00<00:00, 74482.65it/s]
100%|██████████| 30/30 [00:00<00:00, 53294.84it/s]
100%|██████████| 130/130 [00:00<00:00, 77772.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 69342.08it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:48<00:00, 119.68it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 64873.43it/s]
100%|██████████| 287/287 [00:00<00:00, 72906.86it/s]
100%|██████████| 771/771 [00:00<00:00, 75383.66it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79969.95it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81035.26it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79966.14it/s]
100%|██████████| 353/353 [00:00<00:00, 72642.00it/s]
100%|██████████| 252/252 [00:00<00:00, 78334.29it/s]
100%|██████████| 203/203 [00:00<00:00, 76212.29it/s]
100%|██████████| 153/153 [00:00<00:00, 75872.37it/s]
100%|██████████| 200/200 [00:00<00:00, 77179.21it/s]
100%|██████████| 65/65 [00:00<00:00, 69708.45it/s]
100%|██████████| 144/144 [00:00<00:00, 74153.44it/s]
100%|██████████| 30/30 [00:00<00:00, 55973.81it/s]
100%|██████████| 130/130 [00:00<00:00, 74560.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 70539.93it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:48<00:00, 120.96it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77662.22it/s]
100%|██████████| 287/287 [00:00<00:00, 73048.44it/s]
100%|██████████| 771/771 [00:00<00:00, 76666.87it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95508.51it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81531.45it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93844.90it/s]
100%|██████████| 353/353 [00:00<00:00, 83141.81it/s]
100%|██████████| 252/252 [00:00<00:00, 82164.54it/s]
100%|██████████| 203/203 [00:00<00:00, 78214.56it/s]
100%|██████████| 153/153 [00:00<00:00, 76798.53it/s]
100%|██████████| 200/200 [00:00<00:00, 78832.89it/s]
100%|██████████| 65/65 [00:00<00:00, 72353.97it/s]
100%|██████████| 144/144 [00:00<00:00, 75876.86it/s]
100%|██████████| 30/30 [00:00<00:00, 60147.76it/s]
100%|██████████| 130/130 [00:00<00:00, 69265.69it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91179.39it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 157.68it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 91928.69it/s]
100%|██████████| 287/287 [00:00<00:00, 86038.54it/s]
100%|██████████| 771/771 [00:00<00:00, 85160.73it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92094.46it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91119.12it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84828.81it/s]
100%|██████████| 353/353 [00:00<00:00, 81083.75it/s]
100%|██████████| 252/252 [00:00<00:00, 72290.86it/s]
100%|██████████| 203/203 [00:00<00:00, 70989.14it/s]
100%|██████████| 153/153 [00:00<00:00, 71208.22it/s]
100%|██████████| 200/200 [00:00<00:00, 81736.41it/s]
100%|██████████| 65/65 [00:00<00:00, 62443.83it/s]
100%|██████████| 144/144 [00:00<00:00, 72289.62it/s]
100%|██████████| 30/30 [00:00<00:00, 65061.59it/s]
100%|██████████| 130/130 [00:00<00:00, 62251.34it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87447.96it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 163.99it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 93460.39it/s]
100%|██████████| 287/287 [00:00<00:00, 87578.41it/s]
100%|██████████| 771/771 [00:00<00:00, 92789.54it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95775.67it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90574.07it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89183.58it/s]
100%|██████████| 353/353 [00:00<00:00, 78884.83it/s]
100%|██████████| 252/252 [00:00<00:00, 72504.09it/s]
100%|██████████| 203/203 [00:00<00:00, 73980.69it/s]
100%|██████████| 153/153 [00:00<00:00, 73787.34it/s]
100%|██████████| 200/200 [00:00<00:00, 74281.48it/s]
100%|██████████| 65/65 [00:00<00:00, 70283.52it/s]
100%|██████████| 144/144 [00:00<00:00, 68393.14it/s]
100%|██████████| 30/30 [00:00<00:00, 50758.02it/s]
100%|██████████| 130/130 [00:00<00:00, 82577.54it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89218.27it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.72it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 88186.84it/s]
100%|██████████| 287/287 [00:00<00:00, 77918.65it/s]
100%|██████████| 771/771 [00:00<00:00, 80549.19it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80072.24it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86829.60it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87439.02it/s]
100%|██████████| 353/353 [00:00<00:00, 81489.86it/s]
100%|██████████| 252/252 [00:00<00:00, 77975.99it/s]
100%|██████████| 203/203 [00:00<00:00, 79499.88it/s]
100%|██████████| 153/153 [00:00<00:00, 74636.95it/s]
100%|██████████| 200/200 [00:00<00:00, 78552.37it/s]
100%|██████████| 65/65 [00:00<00:00, 68932.94it/s]
100%|██████████| 144/144 [00:00<00:00, 73881.32it/s]
100%|██████████| 30/30 [00:00<00:00, 68947.46it/s]
100%|██████████| 130/130 [00:00<00:00, 79588.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 99296.97it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 164.88it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79507.21it/s]
100%|██████████| 287/287 [00:00<00:00, 77139.71it/s]
100%|██████████| 771/771 [00:00<00:00, 76819.85it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80490.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80882.12it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77388.06it/s]
100%|██████████| 353/353 [00:00<00:00, 80274.85it/s]
100%|██████████| 252/252 [00:00<00:00, 84651.98it/s]
100%|██████████| 203/203 [00:00<00:00, 76893.68it/s]
100%|██████████| 153/153 [00:00<00:00, 80761.20it/s]
100%|██████████| 200/200 [00:00<00:00, 76727.41it/s]
100%|██████████| 65/65 [00:00<00:00, 64543.03it/s]
100%|██████████| 144/144 [00:00<00:00, 76202.34it/s]
100%|██████████| 30/30 [00:00<00:00, 54213.32it/s]
100%|██████████| 130/130 [00:00<00:00, 73149.92it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86235.12it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.82it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 89265.23it/s]
100%|██████████| 287/287 [00:00<00:00, 74633.59it/s]
100%|██████████| 771/771 [00:00<00:00, 88921.51it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92647.78it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74823.46it/s]
100%|██████████| 3000/3000 [00:00<00:00, 94082.07it/s]
100%|██████████| 353/353 [00:00<00:00, 74660.35it/s]
100%|██████████| 252/252 [00:00<00:00, 94837.56it/s]
100%|██████████| 203/203 [00:00<00:00, 74616.05it/s]
100%|██████████| 153/153 [00:00<00:00, 73897.80it/s]
100%|██████████| 200/200 [00:00<00:00, 71453.22it/s]
100%|██████████| 65/65 [00:00<00:00, 60503.72it/s]
100%|██████████| 144/144 [00:00<00:00, 71570.06it/s]
100%|██████████| 30/30 [00:00<00:00, 48321.47it/s]
100%|██████████| 130/130 [00:00<00:00, 71697.50it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71933.59it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 160.60it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 74182.24it/s]
100%|██████████| 287/287 [00:00<00:00, 89359.75it/s]
100%|██████████| 771/771 [00:00<00:00, 93733.58it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92007.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93560.21it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91294.31it/s]
100%|██████████| 353/353 [00:00<00:00, 82857.98it/s]
100%|██████████| 252/252 [00:00<00:00, 86430.99it/s]
100%|██████████| 203/203 [00:00<00:00, 78947.03it/s]
100%|██████████| 153/153 [00:00<00:00, 85598.04it/s]
100%|██████████| 200/200 [00:00<00:00, 86856.57it/s]
100%|██████████| 65/65 [00:00<00:00, 61513.94it/s]
100%|██████████| 144/144 [00:00<00:00, 84543.64it/s]
100%|██████████| 30/30 [00:00<00:00, 63678.70it/s]
100%|██████████| 130/130 [00:00<00:00, 68474.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89442.23it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 157.25it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76328.14it/s]
100%|██████████| 287/287 [00:00<00:00, 77105.13it/s]
100%|██████████| 771/771 [00:00<00:00, 88990.02it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87778.16it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76629.29it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92042.92it/s]
100%|██████████| 353/353 [00:00<00:00, 70957.03it/s]
100%|██████████| 252/252 [00:00<00:00, 77569.69it/s]
100%|██████████| 203/203 [00:00<00:00, 74885.11it/s]
100%|██████████| 153/153 [00:00<00:00, 68854.99it/s]
100%|██████████| 200/200 [00:00<00:00, 74651.67it/s]
100%|██████████| 65/65 [00:00<00:00, 72740.06it/s]
100%|██████████| 144/144 [00:00<00:00, 77413.46it/s]
100%|██████████| 30/30 [00:00<00:00, 62446.21it/s]
100%|██████████| 130/130 [00:00<00:00, 71716.36it/s]
100%|██████████| 3500/3500 [00:00<00:00, 94205.03it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 156.59it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76457.67it/s]
100%|██████████| 287/287 [00:00<00:00, 83874.39it/s]
100%|██████████| 771/771 [00:00<00:00, 78919.57it/s]
100%|██████████| 2000/2000 [00:00<00:00, 64822.95it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79695.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87609.48it/s]
100%|██████████| 353/353 [00:00<00:00, 79294.63it/s]
100%|██████████| 252/252 [00:00<00:00, 79560.75it/s]
100%|██████████| 203/203 [00:00<00:00, 79962.78it/s]
100%|██████████| 153/153 [00:00<00:00, 79926.33it/s]
100%|██████████| 200/200 [00:00<00:00, 77708.27it/s]
100%|██████████| 65/65 [00:00<00:00, 76495.44it/s]
100%|██████████| 144/144 [00:00<00:00, 75981.86it/s]
100%|██████████| 30/30 [00:00<00:00, 63326.18it/s]
100%|██████████| 130/130 [00:00<00:00, 74939.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 100029.05it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [01:07<00:00, 86.12it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 68516.22it/s]
100%|██████████| 287/287 [00:00<00:00, 62840.12it/s]
100%|██████████| 771/771 [00:00<00:00, 72294.57it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92018.69it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87842.51it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92127.16it/s]
100%|██████████| 353/353 [00:00<00:00, 71841.88it/s]
100%|██████████| 252/252 [00:00<00:00, 72904.17it/s]
100%|██████████| 203/203 [00:00<00:00, 70396.34it/s]
100%|██████████| 153/153 [00:00<00:00, 71042.68it/s]
100%|██████████| 200/200 [00:00<00:00, 70623.07it/s]
100%|██████████| 65/65 [00:00<00:00, 69195.37it/s]
100%|██████████| 144/144 [00:00<00:00, 66167.81it/s]
100%|██████████| 30/30 [00:00<00:00, 47357.59it/s]
100%|██████████| 130/130 [00:00<00:00, 73022.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 53699.76it/s]
100%|██████████| 2034

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:31<00:00, 187.67it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 86490.31it/s]
100%|██████████| 287/287 [00:00<00:00, 75423.89it/s]
100%|██████████| 771/771 [00:00<00:00, 87706.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93120.88it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86434.16it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91598.02it/s]
100%|██████████| 353/353 [00:00<00:00, 71636.80it/s]
100%|██████████| 252/252 [00:00<00:00, 67875.97it/s]
100%|██████████| 203/203 [00:00<00:00, 69516.96it/s]
100%|██████████| 153/153 [00:00<00:00, 73474.76it/s]
100%|██████████| 200/200 [00:00<00:00, 66140.57it/s]
100%|██████████| 65/65 [00:00<00:00, 63639.07it/s]
100%|██████████| 144/144 [00:00<00:00, 69105.24it/s]
100%|██████████| 30/30 [00:00<00:00, 63970.07it/s]
100%|██████████| 130/130 [00:00<00:00, 73366.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91646.72it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:39<00:00, 146.26it/s]
INFO:root:The new embedding has 5832 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 87861.39it/s]
100%|██████████| 287/287 [00:00<00:00, 68751.23it/s]
100%|██████████| 771/771 [00:00<00:00, 80161.83it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85044.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79777.54it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83453.24it/s]
100%|██████████| 353/353 [00:00<00:00, 80681.67it/s]
100%|██████████| 252/252 [00:00<00:00, 78672.47it/s]
100%|██████████| 203/203 [00:00<00:00, 73635.19it/s]
100%|██████████| 153/153 [00:00<00:00, 55235.71it/s]
100%|██████████| 200/200 [00:00<00:00, 68261.11it/s]
100%|██████████| 65/65 [00:00<00:00, 52590.62it/s]
100%|██████████| 144/144 [00:00<00:00, 83227.20it/s]
100%|██████████| 30/30 [00:00<00:00, 37117.73it/s]
100%|██████████| 130/130 [00:00<00:00, 65012.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84954.57it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:32<00:00, 177.41it/s]
INFO:root:The new embedding has 5832 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 91309.68it/s]
100%|██████████| 287/287 [00:00<00:00, 86241.96it/s]
100%|██████████| 771/771 [00:00<00:00, 90712.46it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94127.11it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86660.96it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90983.39it/s]
100%|██████████| 353/353 [00:00<00:00, 81584.16it/s]
100%|██████████| 252/252 [00:00<00:00, 70150.97it/s]
100%|██████████| 203/203 [00:00<00:00, 69533.99it/s]
100%|██████████| 153/153 [00:00<00:00, 69647.11it/s]
100%|██████████| 200/200 [00:00<00:00, 73243.76it/s]
100%|██████████| 65/65 [00:00<00:00, 62003.58it/s]
100%|██████████| 144/144 [00:00<00:00, 67303.30it/s]
100%|██████████| 30/30 [00:00<00:00, 58173.43it/s]
100%|██████████| 130/130 [00:00<00:00, 66568.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86500.88it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:33<00:00, 173.00it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 59801.47it/s]
100%|██████████| 287/287 [00:00<00:00, 75127.33it/s]
100%|██████████| 771/771 [00:00<00:00, 79888.54it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83689.41it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79607.95it/s]
100%|██████████| 3000/3000 [00:00<00:00, 97843.07it/s]
100%|██████████| 353/353 [00:00<00:00, 77198.46it/s]
100%|██████████| 252/252 [00:00<00:00, 78731.07it/s]
100%|██████████| 203/203 [00:00<00:00, 79865.28it/s]
100%|██████████| 153/153 [00:00<00:00, 71854.05it/s]
100%|██████████| 200/200 [00:00<00:00, 78707.15it/s]
100%|██████████| 65/65 [00:00<00:00, 65964.13it/s]
100%|██████████| 144/144 [00:00<00:00, 75450.32it/s]
100%|██████████| 30/30 [00:00<00:00, 56705.33it/s]
100%|██████████| 130/130 [00:00<00:00, 74509.36it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74044.88it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:32<00:00, 177.48it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78834.07it/s]
100%|██████████| 287/287 [00:00<00:00, 77933.79it/s]
100%|██████████| 771/771 [00:00<00:00, 77894.94it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81233.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82279.97it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87142.30it/s]
100%|██████████| 353/353 [00:00<00:00, 74014.66it/s]
100%|██████████| 252/252 [00:00<00:00, 77999.01it/s]
100%|██████████| 203/203 [00:00<00:00, 81275.65it/s]
100%|██████████| 153/153 [00:00<00:00, 76587.72it/s]
100%|██████████| 200/200 [00:00<00:00, 73623.03it/s]
100%|██████████| 65/65 [00:00<00:00, 70483.39it/s]
100%|██████████| 144/144 [00:00<00:00, 55390.66it/s]
100%|██████████| 30/30 [00:00<00:00, 25768.81it/s]
100%|██████████| 130/130 [00:00<00:00, 59487.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90848.16it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:31<00:00, 184.33it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 94542.19it/s]
100%|██████████| 287/287 [00:00<00:00, 85306.87it/s]
100%|██████████| 771/771 [00:00<00:00, 77369.39it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92966.08it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74373.69it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73560.19it/s]
100%|██████████| 353/353 [00:00<00:00, 70514.33it/s]
100%|██████████| 252/252 [00:00<00:00, 73252.80it/s]
100%|██████████| 203/203 [00:00<00:00, 73884.39it/s]
100%|██████████| 153/153 [00:00<00:00, 74291.33it/s]
100%|██████████| 200/200 [00:00<00:00, 72079.46it/s]
100%|██████████| 65/65 [00:00<00:00, 62948.46it/s]
100%|██████████| 144/144 [00:00<00:00, 74482.65it/s]
100%|██████████| 30/30 [00:00<00:00, 55406.92it/s]
100%|██████████| 130/130 [00:00<00:00, 66665.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79611.62it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:30<00:00, 191.62it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 56317.16it/s]
100%|██████████| 287/287 [00:00<00:00, 54021.69it/s]
100%|██████████| 771/771 [00:00<00:00, 88553.82it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93283.46it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83909.57it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83859.25it/s]
100%|██████████| 353/353 [00:00<00:00, 74047.98it/s]
100%|██████████| 252/252 [00:00<00:00, 74287.64it/s]
100%|██████████| 203/203 [00:00<00:00, 72748.10it/s]
100%|██████████| 153/153 [00:00<00:00, 70264.81it/s]
100%|██████████| 200/200 [00:00<00:00, 71783.40it/s]
100%|██████████| 65/65 [00:00<00:00, 64269.16it/s]
100%|██████████| 144/144 [00:00<00:00, 65543.11it/s]
100%|██████████| 30/30 [00:00<00:00, 64231.30it/s]
100%|██████████| 130/130 [00:00<00:00, 72565.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89366.55it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:43<00:00, 134.73it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 88975.21it/s]
100%|██████████| 287/287 [00:00<00:00, 73226.18it/s]
100%|██████████| 771/771 [00:00<00:00, 86881.29it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87575.64it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89598.91it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87561.32it/s]
100%|██████████| 353/353 [00:00<00:00, 85154.96it/s]
100%|██████████| 252/252 [00:00<00:00, 69145.92it/s]
100%|██████████| 203/203 [00:00<00:00, 70175.86it/s]
100%|██████████| 153/153 [00:00<00:00, 64723.00it/s]
100%|██████████| 200/200 [00:00<00:00, 65536.00it/s]
100%|██████████| 65/65 [00:00<00:00, 53331.33it/s]
100%|██████████| 144/144 [00:00<00:00, 53648.94it/s]
100%|██████████| 30/30 [00:00<00:00, 50111.16it/s]
100%|██████████| 130/130 [00:00<00:00, 59177.29it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85921.69it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 138.88it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 93256.54it/s]
100%|██████████| 287/287 [00:00<00:00, 78492.78it/s]
100%|██████████| 771/771 [00:00<00:00, 87056.71it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85455.03it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81963.22it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84386.77it/s]
100%|██████████| 353/353 [00:00<00:00, 87879.23it/s]
100%|██████████| 252/252 [00:00<00:00, 73645.81it/s]
100%|██████████| 203/203 [00:00<00:00, 60134.45it/s]
100%|██████████| 153/153 [00:00<00:00, 68298.05it/s]
100%|██████████| 200/200 [00:00<00:00, 64319.95it/s]
100%|██████████| 65/65 [00:00<00:00, 68880.69it/s]
100%|██████████| 144/144 [00:00<00:00, 49397.22it/s]
100%|██████████| 30/30 [00:00<00:00, 55750.61it/s]
100%|██████████| 130/130 [00:00<00:00, 73803.40it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87048.17it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 135.34it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 63068.92it/s]
100%|██████████| 287/287 [00:00<00:00, 76361.66it/s]
100%|██████████| 771/771 [00:00<00:00, 79046.89it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79663.89it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77975.53it/s]
100%|██████████| 3000/3000 [00:00<00:00, 77788.02it/s]
100%|██████████| 353/353 [00:00<00:00, 76813.97it/s]
100%|██████████| 252/252 [00:00<00:00, 75228.80it/s]
100%|██████████| 203/203 [00:00<00:00, 77144.49it/s]
100%|██████████| 153/153 [00:00<00:00, 74437.83it/s]
100%|██████████| 200/200 [00:00<00:00, 70250.46it/s]
100%|██████████| 65/65 [00:00<00:00, 63050.36it/s]
100%|██████████| 144/144 [00:00<00:00, 75103.18it/s]
100%|██████████| 30/30 [00:00<00:00, 67108.86it/s]
100%|██████████| 130/130 [00:00<00:00, 73022.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76544.38it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.57it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78722.99it/s]
100%|██████████| 287/287 [00:00<00:00, 78925.08it/s]
100%|██████████| 771/771 [00:00<00:00, 89499.84it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85009.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84786.51it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93494.16it/s]
100%|██████████| 353/353 [00:00<00:00, 78094.27it/s]
100%|██████████| 252/252 [00:00<00:00, 77399.28it/s]
100%|██████████| 203/203 [00:00<00:00, 77509.67it/s]
100%|██████████| 153/153 [00:00<00:00, 80477.62it/s]
100%|██████████| 200/200 [00:00<00:00, 76211.57it/s]
100%|██████████| 65/65 [00:00<00:00, 51333.04it/s]
100%|██████████| 144/144 [00:00<00:00, 65536.00it/s]
100%|██████████| 30/30 [00:00<00:00, 49325.41it/s]
100%|██████████| 130/130 [00:00<00:00, 71754.12it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87960.41it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:48<00:00, 121.73it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 68700.46it/s]
100%|██████████| 287/287 [00:00<00:00, 67196.90it/s]
100%|██████████| 771/771 [00:00<00:00, 78834.92it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86134.18it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83266.58it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82067.46it/s]
100%|██████████| 353/353 [00:00<00:00, 73911.21it/s]
100%|██████████| 252/252 [00:00<00:00, 77297.40it/s]
100%|██████████| 203/203 [00:00<00:00, 66848.06it/s]
100%|██████████| 153/153 [00:00<00:00, 67714.31it/s]
100%|██████████| 200/200 [00:00<00:00, 66518.18it/s]
100%|██████████| 65/65 [00:00<00:00, 64757.66it/s]
100%|██████████| 144/144 [00:00<00:00, 56685.10it/s]
100%|██████████| 30/30 [00:00<00:00, 46603.38it/s]
100%|██████████| 130/130 [00:00<00:00, 67574.61it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82289.66it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:47<00:00, 124.31it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 89507.40it/s]
100%|██████████| 287/287 [00:00<00:00, 73746.57it/s]
100%|██████████| 771/771 [00:00<00:00, 76310.46it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92852.88it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93310.43it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89027.73it/s]
100%|██████████| 353/353 [00:00<00:00, 75779.98it/s]
100%|██████████| 252/252 [00:00<00:00, 69546.30it/s]
100%|██████████| 203/203 [00:00<00:00, 81113.05it/s]
100%|██████████| 153/153 [00:00<00:00, 70745.07it/s]
100%|██████████| 200/200 [00:00<00:00, 69534.22it/s]
100%|██████████| 65/65 [00:00<00:00, 64466.72it/s]
100%|██████████| 144/144 [00:00<00:00, 67710.74it/s]
100%|██████████| 30/30 [00:00<00:00, 53204.70it/s]
100%|██████████| 130/130 [00:00<00:00, 79103.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88631.67it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.42it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79699.28it/s]
100%|██████████| 287/287 [00:00<00:00, 77742.52it/s]
100%|██████████| 771/771 [00:00<00:00, 80267.29it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79539.26it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80659.69it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81998.48it/s]
100%|██████████| 353/353 [00:00<00:00, 76409.63it/s]
100%|██████████| 252/252 [00:00<00:00, 78218.35it/s]
100%|██████████| 203/203 [00:00<00:00, 72119.58it/s]
100%|██████████| 153/153 [00:00<00:00, 77917.50it/s]
100%|██████████| 200/200 [00:00<00:00, 57252.31it/s]
100%|██████████| 65/65 [00:00<00:00, 69548.41it/s]
100%|██████████| 144/144 [00:00<00:00, 61361.35it/s]
100%|██████████| 30/30 [00:00<00:00, 60349.70it/s]
100%|██████████| 130/130 [00:00<00:00, 75135.66it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78005.78it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 136.40it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 85755.71it/s]
100%|██████████| 287/287 [00:00<00:00, 80800.46it/s]
100%|██████████| 771/771 [00:00<00:00, 79300.83it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85860.88it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80469.35it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92304.90it/s]
100%|██████████| 353/353 [00:00<00:00, 78304.91it/s]
100%|██████████| 252/252 [00:00<00:00, 81279.96it/s]
100%|██████████| 203/203 [00:00<00:00, 78466.84it/s]
100%|██████████| 153/153 [00:00<00:00, 75899.29it/s]
100%|██████████| 200/200 [00:00<00:00, 78766.27it/s]
100%|██████████| 65/65 [00:00<00:00, 76366.88it/s]
100%|██████████| 144/144 [00:00<00:00, 75554.14it/s]
100%|██████████| 30/30 [00:00<00:00, 69595.75it/s]
100%|██████████| 130/130 [00:00<00:00, 75541.63it/s]
100%|██████████| 3500/3500 [00:00<00:00, 70252.65it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 136.07it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 74270.34it/s]
100%|██████████| 287/287 [00:00<00:00, 86347.12it/s]
100%|██████████| 771/771 [00:00<00:00, 91451.27it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91083.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89879.23it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91140.90it/s]
100%|██████████| 353/353 [00:00<00:00, 75923.76it/s]
100%|██████████| 252/252 [00:00<00:00, 71204.84it/s]
100%|██████████| 203/203 [00:00<00:00, 68998.68it/s]
100%|██████████| 153/153 [00:00<00:00, 69768.27it/s]
100%|██████████| 200/200 [00:00<00:00, 70700.45it/s]
100%|██████████| 65/65 [00:00<00:00, 60010.95it/s]
100%|██████████| 144/144 [00:00<00:00, 48133.55it/s]
100%|██████████| 30/30 [00:00<00:00, 62291.64it/s]
100%|██████████| 130/130 [00:00<00:00, 65678.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 69881.77it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:56<00:00, 104.04it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 83581.54it/s]
100%|██████████| 287/287 [00:00<00:00, 80016.30it/s]
100%|██████████| 771/771 [00:00<00:00, 85270.76it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85250.95it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88565.90it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88207.05it/s]
100%|██████████| 353/353 [00:00<00:00, 77521.82it/s]
100%|██████████| 252/252 [00:00<00:00, 54367.81it/s]
100%|██████████| 203/203 [00:00<00:00, 79115.75it/s]
100%|██████████| 153/153 [00:00<00:00, 58928.24it/s]
100%|██████████| 200/200 [00:00<00:00, 79085.58it/s]
100%|██████████| 65/65 [00:00<00:00, 50712.38it/s]
100%|██████████| 144/144 [00:00<00:00, 48426.86it/s]
100%|██████████| 30/30 [00:00<00:00, 39174.69it/s]
100%|██████████| 130/130 [00:00<00:00, 61890.98it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82480.15it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:57<00:00, 100.80it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 48966.47it/s]
100%|██████████| 287/287 [00:00<00:00, 77888.40it/s]
100%|██████████| 771/771 [00:00<00:00, 79674.00it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80490.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81848.06it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80051.61it/s]
100%|██████████| 353/353 [00:00<00:00, 83611.32it/s]
100%|██████████| 252/252 [00:00<00:00, 77564.00it/s]
100%|██████████| 203/203 [00:00<00:00, 76431.21it/s]
100%|██████████| 153/153 [00:00<00:00, 75038.41it/s]
100%|██████████| 200/200 [00:00<00:00, 80520.33it/s]
100%|██████████| 65/65 [00:00<00:00, 75270.50it/s]
100%|██████████| 144/144 [00:00<00:00, 74008.06it/s]
100%|██████████| 30/30 [00:00<00:00, 41623.92it/s]
100%|██████████| 130/130 [00:00<00:00, 77961.04it/s]
100%|██████████| 3500/3500 [00:00<00:00, 95377.11it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:53<00:00, 109.66it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 75165.66it/s]
100%|██████████| 287/287 [00:00<00:00, 77702.38it/s]
100%|██████████| 771/771 [00:00<00:00, 73693.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77397.82it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77719.79it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79371.43it/s]
100%|██████████| 353/353 [00:00<00:00, 76913.73it/s]
100%|██████████| 252/252 [00:00<00:00, 77999.01it/s]
100%|██████████| 203/203 [00:00<00:00, 80966.50it/s]
100%|██████████| 153/153 [00:00<00:00, 79245.31it/s]
100%|██████████| 200/200 [00:00<00:00, 81135.58it/s]
100%|██████████| 65/65 [00:00<00:00, 67970.52it/s]
100%|██████████| 144/144 [00:00<00:00, 76279.34it/s]
100%|██████████| 30/30 [00:00<00:00, 56249.05it/s]
100%|██████████| 130/130 [00:00<00:00, 71565.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89904.55it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:50<00:00, 115.96it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 92580.70it/s]
100%|██████████| 287/287 [00:00<00:00, 71237.14it/s]
100%|██████████| 771/771 [00:00<00:00, 92592.94it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94439.72it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75714.93it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91238.70it/s]
100%|██████████| 353/353 [00:00<00:00, 74110.99it/s]
100%|██████████| 252/252 [00:00<00:00, 73635.54it/s]
100%|██████████| 203/203 [00:00<00:00, 73667.05it/s]
100%|██████████| 153/153 [00:00<00:00, 75586.40it/s]
100%|██████████| 200/200 [00:00<00:00, 70724.29it/s]
100%|██████████| 65/65 [00:00<00:00, 71443.86it/s]
100%|██████████| 144/144 [00:00<00:00, 70156.79it/s]
100%|██████████| 30/30 [00:00<00:00, 66191.02it/s]
100%|██████████| 130/130 [00:00<00:00, 60807.35it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89503.31it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 154.46it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 88803.61it/s]
100%|██████████| 287/287 [00:00<00:00, 47437.16it/s]
100%|██████████| 771/771 [00:00<00:00, 91162.53it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93472.63it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88567.77it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91236.06it/s]
100%|██████████| 353/353 [00:00<00:00, 87515.62it/s]
100%|██████████| 252/252 [00:00<00:00, 71228.83it/s]
100%|██████████| 203/203 [00:00<00:00, 71048.37it/s]
100%|██████████| 153/153 [00:00<00:00, 70126.60it/s]
100%|██████████| 200/200 [00:00<00:00, 88394.18it/s]
100%|██████████| 65/65 [00:00<00:00, 63728.32it/s]
100%|██████████| 144/144 [00:00<00:00, 86208.93it/s]
100%|██████████| 30/30 [00:00<00:00, 64893.82it/s]
100%|██████████| 130/130 [00:00<00:00, 69530.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90096.56it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 151.12it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78912.76it/s]
100%|██████████| 287/287 [00:00<00:00, 77557.20it/s]
100%|██████████| 771/771 [00:00<00:00, 79699.53it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84583.04it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92948.57it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89632.09it/s]
100%|██████████| 353/353 [00:00<00:00, 80396.90it/s]
100%|██████████| 252/252 [00:00<00:00, 78666.61it/s]
100%|██████████| 203/203 [00:00<00:00, 79723.19it/s]
100%|██████████| 153/153 [00:00<00:00, 77917.50it/s]
100%|██████████| 200/200 [00:00<00:00, 77243.17it/s]
100%|██████████| 65/65 [00:00<00:00, 72740.06it/s]
100%|██████████| 144/144 [00:00<00:00, 72830.07it/s]
100%|██████████| 30/30 [00:00<00:00, 69251.03it/s]
100%|██████████| 130/130 [00:00<00:00, 76624.44it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73924.44it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 156.19it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 88451.19it/s]
100%|██████████| 287/287 [00:00<00:00, 77522.23it/s]
100%|██████████| 771/771 [00:00<00:00, 75364.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 101697.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80085.23it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93993.52it/s]
100%|██████████| 353/353 [00:00<00:00, 78612.58it/s]
100%|██████████| 252/252 [00:00<00:00, 78148.95it/s]
100%|██████████| 203/203 [00:00<00:00, 75974.28it/s]
100%|██████████| 153/153 [00:00<00:00, 75953.19it/s]
100%|██████████| 200/200 [00:00<00:00, 34496.89it/s]
100%|██████████| 65/65 [00:00<00:00, 53847.47it/s]
100%|██████████| 144/144 [00:00<00:00, 56877.27it/s]
100%|██████████| 30/30 [00:00<00:00, 47934.90it/s]
100%|██████████| 130/130 [00:00<00:00, 62251.34it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78166.52it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.70it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 88750.95it/s]
100%|██████████| 287/287 [00:00<00:00, 80936.28it/s]
100%|██████████| 771/771 [00:00<00:00, 90249.17it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94346.25it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73963.18it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91872.23it/s]
100%|██████████| 353/353 [00:00<00:00, 74815.02it/s]
100%|██████████| 252/252 [00:00<00:00, 79680.71it/s]
100%|██████████| 203/203 [00:00<00:00, 86484.89it/s]
100%|██████████| 153/153 [00:00<00:00, 63771.09it/s]
100%|██████████| 200/200 [00:00<00:00, 72540.71it/s]
100%|██████████| 65/65 [00:00<00:00, 59905.46it/s]
100%|██████████| 144/144 [00:00<00:00, 71417.73it/s]
100%|██████████| 30/30 [00:00<00:00, 61111.76it/s]
100%|██████████| 130/130 [00:00<00:00, 70129.84it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85732.01it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:38<00:00, 153.79it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 82105.89it/s]
100%|██████████| 287/287 [00:00<00:00, 78651.76it/s]
100%|██████████| 771/771 [00:00<00:00, 92013.33it/s]
100%|██████████| 2000/2000 [00:00<00:00, 72348.64it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80415.35it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92365.88it/s]
100%|██████████| 353/353 [00:00<00:00, 80902.10it/s]
100%|██████████| 252/252 [00:00<00:00, 88760.88it/s]
100%|██████████| 203/203 [00:00<00:00, 76314.75it/s]
100%|██████████| 153/153 [00:00<00:00, 68109.59it/s]
100%|██████████| 200/200 [00:00<00:00, 85746.79it/s]
100%|██████████| 65/65 [00:00<00:00, 63211.17it/s]
100%|██████████| 144/144 [00:00<00:00, 84331.16it/s]
100%|██████████| 30/30 [00:00<00:00, 48601.44it/s]
100%|██████████| 130/130 [00:00<00:00, 78184.62it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89923.82it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:42<00:00, 137.58it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 68119.68it/s]
100%|██████████| 287/287 [00:00<00:00, 82653.48it/s]
100%|██████████| 771/771 [00:00<00:00, 82848.06it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89546.30it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88522.91it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87251.06it/s]
100%|██████████| 353/353 [00:00<00:00, 83639.66it/s]
100%|██████████| 252/252 [00:00<00:00, 72603.70it/s]
100%|██████████| 203/203 [00:00<00:00, 72186.83it/s]
100%|██████████| 153/153 [00:00<00:00, 70620.50it/s]
100%|██████████| 200/200 [00:00<00:00, 72459.26it/s]
100%|██████████| 65/65 [00:00<00:00, 62803.45it/s]
100%|██████████| 144/144 [00:00<00:00, 73602.21it/s]
100%|██████████| 30/30 [00:00<00:00, 64329.82it/s]
100%|██████████| 130/130 [00:00<00:00, 85678.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86688.34it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 145.67it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 84643.55it/s]
100%|██████████| 287/287 [00:00<00:00, 86958.41it/s]
100%|██████████| 771/771 [00:00<00:00, 88418.23it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93964.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84126.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78842.77it/s]
100%|██████████| 353/353 [00:00<00:00, 76025.13it/s]
100%|██████████| 252/252 [00:00<00:00, 75556.84it/s]
100%|██████████| 203/203 [00:00<00:00, 88719.78it/s]
100%|██████████| 153/153 [00:00<00:00, 71501.78it/s]
100%|██████████| 200/200 [00:00<00:00, 85808.18it/s]
100%|██████████| 65/65 [00:00<00:00, 64911.85it/s]
100%|██████████| 144/144 [00:00<00:00, 82930.08it/s]
100%|██████████| 30/30 [00:00<00:00, 46776.62it/s]
100%|██████████| 130/130 [00:00<00:00, 70611.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84243.75it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:49<00:00, 118.85it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 74946.51it/s]
100%|██████████| 287/287 [00:00<00:00, 64882.51it/s]
100%|██████████| 771/771 [00:00<00:00, 90211.41it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80934.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83541.89it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86863.17it/s]
100%|██████████| 353/353 [00:00<00:00, 82820.90it/s]
100%|██████████| 252/252 [00:00<00:00, 66862.64it/s]
100%|██████████| 203/203 [00:00<00:00, 59758.82it/s]
100%|██████████| 153/153 [00:00<00:00, 78269.12it/s]
100%|██████████| 200/200 [00:00<00:00, 70191.68it/s]
100%|██████████| 65/65 [00:00<00:00, 67282.76it/s]
100%|██████████| 144/144 [00:00<00:00, 65344.56it/s]
100%|██████████| 30/30 [00:00<00:00, 61052.46it/s]
100%|██████████| 130/130 [00:00<00:00, 76206.78it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81358.84it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:48<00:00, 120.90it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 73894.43it/s]
100%|██████████| 287/287 [00:00<00:00, 77642.24it/s]
100%|██████████| 771/771 [00:00<00:00, 77098.24it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88471.56it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76368.38it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90630.17it/s]
100%|██████████| 353/353 [00:00<00:00, 72453.60it/s]
100%|██████████| 252/252 [00:00<00:00, 75486.69it/s]
100%|██████████| 203/203 [00:00<00:00, 50963.29it/s]
100%|██████████| 153/153 [00:00<00:00, 56739.92it/s]
100%|██████████| 200/200 [00:00<00:00, 54560.05it/s]
100%|██████████| 65/65 [00:00<00:00, 55390.04it/s]
100%|██████████| 144/144 [00:00<00:00, 68618.47it/s]
100%|██████████| 30/30 [00:00<00:00, 32564.47it/s]
100%|██████████| 130/130 [00:00<00:00, 40745.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85754.55it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 152.83it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 88384.02it/s]
100%|██████████| 287/287 [00:00<00:00, 88000.97it/s]
100%|██████████| 771/771 [00:00<00:00, 92505.53it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94604.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94904.49it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84376.59it/s]
100%|██████████| 353/353 [00:00<00:00, 81003.90it/s]
100%|██████████| 252/252 [00:00<00:00, 69445.77it/s]
100%|██████████| 203/203 [00:00<00:00, 68797.97it/s]
100%|██████████| 153/153 [00:00<00:00, 69616.89it/s]
100%|██████████| 200/200 [00:00<00:00, 83493.66it/s]
100%|██████████| 65/65 [00:00<00:00, 61919.09it/s]
100%|██████████| 144/144 [00:00<00:00, 82129.42it/s]
100%|██████████| 30/30 [00:00<00:00, 58743.75it/s]
100%|██████████| 130/130 [00:00<00:00, 85383.58it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89780.28it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 153.25it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 80273.38it/s]
100%|██████████| 287/287 [00:00<00:00, 76038.48it/s]
100%|██████████| 771/771 [00:00<00:00, 72393.29it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86579.57it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83520.26it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83570.74it/s]
100%|██████████| 353/353 [00:00<00:00, 70601.75it/s]
100%|██████████| 252/252 [00:00<00:00, 66555.29it/s]
100%|██████████| 203/203 [00:00<00:00, 69876.38it/s]
100%|██████████| 153/153 [00:00<00:00, 53009.13it/s]
100%|██████████| 200/200 [00:00<00:00, 79543.03it/s]
100%|██████████| 65/65 [00:00<00:00, 66935.86it/s]
100%|██████████| 144/144 [00:00<00:00, 67650.06it/s]
100%|██████████| 30/30 [00:00<00:00, 34267.19it/s]
100%|██████████| 130/130 [00:00<00:00, 63513.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83883.68it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 146.35it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 74334.90it/s]
100%|██████████| 287/287 [00:00<00:00, 76927.74it/s]
100%|██████████| 771/771 [00:00<00:00, 72233.21it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74562.75it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77603.32it/s]
100%|██████████| 3000/3000 [00:00<00:00, 74280.61it/s]
100%|██████████| 353/353 [00:00<00:00, 78429.35it/s]
100%|██████████| 252/252 [00:00<00:00, 75573.05it/s]
100%|██████████| 203/203 [00:00<00:00, 75724.27it/s]
100%|██████████| 153/153 [00:00<00:00, 77167.93it/s]
100%|██████████| 200/200 [00:00<00:00, 72559.54it/s]
100%|██████████| 65/65 [00:00<00:00, 73248.19it/s]
100%|██████████| 144/144 [00:00<00:00, 72751.12it/s]
100%|██████████| 30/30 [00:00<00:00, 55529.18it/s]
100%|██████████| 130/130 [00:00<00:00, 73277.72it/s]
100%|██████████| 3500/3500 [00:00<00:00, 56012.39it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.48it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 92291.13it/s]
100%|██████████| 287/287 [00:00<00:00, 78050.01it/s]
100%|██████████| 771/771 [00:00<00:00, 72938.66it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79214.04it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75890.28it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85176.79it/s]
100%|██████████| 353/353 [00:00<00:00, 80449.32it/s]
100%|██████████| 252/252 [00:00<00:00, 79584.72it/s]
100%|██████████| 203/203 [00:00<00:00, 60245.08it/s]
100%|██████████| 153/153 [00:00<00:00, 71303.17it/s]
100%|██████████| 200/200 [00:00<00:00, 79302.40it/s]
100%|██████████| 65/65 [00:00<00:00, 67067.59it/s]
100%|██████████| 144/144 [00:00<00:00, 52139.14it/s]
100%|██████████| 30/30 [00:00<00:00, 30923.84it/s]
100%|██████████| 130/130 [00:00<00:00, 73753.49it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85109.22it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 140.46it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 85508.95it/s]
100%|██████████| 287/287 [00:00<00:00, 64854.55it/s]
100%|██████████| 771/771 [00:00<00:00, 94247.16it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82986.51it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83986.86it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86466.23it/s]
100%|██████████| 353/353 [00:00<00:00, 75004.52it/s]
100%|██████████| 252/252 [00:00<00:00, 72904.17it/s]
100%|██████████| 203/203 [00:00<00:00, 80324.88it/s]
100%|██████████| 153/153 [00:00<00:00, 75012.10it/s]
100%|██████████| 200/200 [00:00<00:00, 83551.87it/s]
100%|██████████| 65/65 [00:00<00:00, 61736.81it/s]
100%|██████████| 144/144 [00:00<00:00, 70939.60it/s]
100%|██████████| 30/30 [00:00<00:00, 48118.21it/s]
100%|██████████| 130/130 [00:00<00:00, 70084.77it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87070.37it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.09it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 94199.99it/s]
100%|██████████| 287/287 [00:00<00:00, 90802.24it/s]
100%|██████████| 771/771 [00:00<00:00, 94233.42it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95965.22it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87454.21it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88559.67it/s]
100%|██████████| 353/353 [00:00<00:00, 90917.37it/s]
100%|██████████| 252/252 [00:00<00:00, 71397.23it/s]
100%|██████████| 203/203 [00:00<00:00, 73775.56it/s]
100%|██████████| 153/153 [00:00<00:00, 69271.21it/s]
100%|██████████| 200/200 [00:00<00:00, 69643.90it/s]
100%|██████████| 65/65 [00:00<00:00, 61820.81it/s]
100%|██████████| 144/144 [00:00<00:00, 68254.01it/s]
100%|██████████| 30/30 [00:00<00:00, 61954.27it/s]
100%|██████████| 130/130 [00:00<00:00, 72536.85it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74335.84it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 130.73it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81908.47it/s]
100%|██████████| 287/287 [00:00<00:00, 79593.05it/s]
100%|██████████| 771/771 [00:00<00:00, 81947.40it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82448.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83473.72it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81764.03it/s]
100%|██████████| 353/353 [00:00<00:00, 80620.16it/s]
100%|██████████| 252/252 [00:00<00:00, 77575.38it/s]
100%|██████████| 203/203 [00:00<00:00, 81501.26it/s]
100%|██████████| 153/153 [00:00<00:00, 75470.84it/s]
100%|██████████| 200/200 [00:00<00:00, 79093.04it/s]
100%|██████████| 65/65 [00:00<00:00, 68776.43it/s]
100%|██████████| 144/144 [00:00<00:00, 76989.14it/s]
100%|██████████| 30/30 [00:00<00:00, 54732.11it/s]
100%|██████████| 130/130 [00:00<00:00, 75384.97it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81325.04it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 138.87it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82924.85it/s]
100%|██████████| 287/287 [00:00<00:00, 76751.16it/s]
100%|██████████| 771/771 [00:00<00:00, 82729.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 107048.07it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82231.58it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81046.22it/s]
100%|██████████| 353/353 [00:00<00:00, 80392.53it/s]
100%|██████████| 252/252 [00:00<00:00, 80622.78it/s]
100%|██████████| 203/203 [00:00<00:00, 82400.44it/s]
100%|██████████| 153/153 [00:00<00:00, 75845.47it/s]
100%|██████████| 200/200 [00:00<00:00, 76818.75it/s]
100%|██████████| 65/65 [00:00<00:00, 77057.59it/s]
100%|██████████| 144/144 [00:00<00:00, 80573.61it/s]
100%|██████████| 30/30 [00:00<00:00, 68834.31it/s]
100%|██████████| 130/130 [00:00<00:00, 76905.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91233.22it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 150.90it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 79236.58it/s]
100%|██████████| 287/287 [00:00<00:00, 73230.64it/s]
100%|██████████| 771/771 [00:00<00:00, 72265.49it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77652.88it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86203.22it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82268.14it/s]
100%|██████████| 353/353 [00:00<00:00, 78061.33it/s]
100%|██████████| 252/252 [00:00<00:00, 62486.82it/s]
100%|██████████| 203/203 [00:00<00:00, 69324.52it/s]
100%|██████████| 153/153 [00:00<00:00, 66459.04it/s]
100%|██████████| 200/200 [00:00<00:00, 70825.80it/s]
100%|██████████| 65/65 [00:00<00:00, 39511.56it/s]
100%|██████████| 144/144 [00:00<00:00, 60452.38it/s]
100%|██████████| 30/30 [00:00<00:00, 31363.19it/s]
100%|██████████| 130/130 [00:00<00:00, 63086.84it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79191.17it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 130.80it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 81332.93it/s]
100%|██████████| 287/287 [00:00<00:00, 80925.39it/s]
100%|██████████| 771/771 [00:00<00:00, 82195.27it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85136.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82794.84it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81108.39it/s]
100%|██████████| 353/353 [00:00<00:00, 91842.27it/s]
100%|██████████| 252/252 [00:00<00:00, 80721.29it/s]
100%|██████████| 203/203 [00:00<00:00, 60245.08it/s]
100%|██████████| 153/153 [00:00<00:00, 62976.30it/s]
100%|██████████| 200/200 [00:00<00:00, 87940.12it/s]
100%|██████████| 65/65 [00:00<00:00, 59708.66it/s]
100%|██████████| 144/144 [00:00<00:00, 55727.97it/s]
100%|██████████| 30/30 [00:00<00:00, 33662.15it/s]
100%|██████████| 130/130 [00:00<00:00, 67809.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79872.81it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 133.48it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 74632.81it/s]
100%|██████████| 287/287 [00:00<00:00, 77772.66it/s]
100%|██████████| 771/771 [00:00<00:00, 80829.04it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92078.29it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93905.83it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93942.29it/s]
100%|██████████| 353/353 [00:00<00:00, 74491.31it/s]
100%|██████████| 252/252 [00:00<00:00, 71887.68it/s]
100%|██████████| 203/203 [00:00<00:00, 80105.72it/s]
100%|██████████| 153/153 [00:00<00:00, 81989.08it/s]
100%|██████████| 200/200 [00:00<00:00, 59062.23it/s]
100%|██████████| 65/65 [00:00<00:00, 76559.89it/s]
100%|██████████| 144/144 [00:00<00:00, 74262.85it/s]
100%|██████████| 30/30 [00:00<00:00, 63167.23it/s]
100%|██████████| 130/130 [00:00<00:00, 74296.16it/s]
100%|██████████| 3500/3500 [00:00<00:00, 95766.61it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 136.37it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80985.52it/s]
100%|██████████| 287/287 [00:00<00:00, 81319.01it/s]
100%|██████████| 771/771 [00:00<00:00, 81785.75it/s]
100%|██████████| 2000/2000 [00:00<00:00, 101045.65it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83304.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80110.73it/s]
100%|██████████| 353/353 [00:00<00:00, 82751.47it/s]
100%|██████████| 252/252 [00:00<00:00, 79728.79it/s]
100%|██████████| 203/203 [00:00<00:00, 81932.61it/s]
100%|██████████| 153/153 [00:00<00:00, 77625.32it/s]
100%|██████████| 200/200 [00:00<00:00, 78456.86it/s]
100%|██████████| 65/65 [00:00<00:00, 66462.64it/s]
100%|██████████| 144/144 [00:00<00:00, 75677.21it/s]
100%|██████████| 30/30 [00:00<00:00, 49833.31it/s]
100%|██████████| 130/130 [00:00<00:00, 74428.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80006.02it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 162.93it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 93350.04it/s]
100%|██████████| 287/287 [00:00<00:00, 92122.54it/s]
100%|██████████| 771/771 [00:00<00:00, 93368.22it/s]
100%|██████████| 2000/2000 [00:00<00:00, 97244.57it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94213.80it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88430.21it/s]
100%|██████████| 353/353 [00:00<00:00, 76917.73it/s]
100%|██████████| 252/252 [00:00<00:00, 74723.55it/s]
100%|██████████| 203/203 [00:00<00:00, 72395.52it/s]
100%|██████████| 153/153 [00:00<00:00, 75099.88it/s]
100%|██████████| 200/200 [00:00<00:00, 69794.56it/s]
100%|██████████| 65/65 [00:00<00:00, 70138.86it/s]
100%|██████████| 144/144 [00:00<00:00, 68486.20it/s]
100%|██████████| 30/30 [00:00<00:00, 60004.35it/s]
100%|██████████| 130/130 [00:00<00:00, 60476.88it/s]
100%|██████████| 3500/3500 [00:00<00:00, 94343.07it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 152.54it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 72107.76it/s]
100%|██████████| 287/287 [00:00<00:00, 72289.53it/s]
100%|██████████| 771/771 [00:00<00:00, 91557.43it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93598.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93765.18it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91516.75it/s]
100%|██████████| 353/353 [00:00<00:00, 71974.59it/s]
100%|██████████| 252/252 [00:00<00:00, 71089.90it/s]
100%|██████████| 203/203 [00:00<00:00, 75282.38it/s]
100%|██████████| 153/153 [00:00<00:00, 69099.66it/s]
100%|██████████| 200/200 [00:00<00:00, 65377.66it/s]
100%|██████████| 65/65 [00:00<00:00, 69459.81it/s]
100%|██████████| 144/144 [00:00<00:00, 71876.68it/s]
100%|██████████| 30/30 [00:00<00:00, 36749.16it/s]
100%|██████████| 130/130 [00:00<00:00, 57438.06it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89393.76it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 153.42it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82527.96it/s]
100%|██████████| 287/287 [00:00<00:00, 76702.26it/s]
100%|██████████| 771/771 [00:00<00:00, 76490.96it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80314.49it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81299.14it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78142.11it/s]
100%|██████████| 353/353 [00:00<00:00, 76185.52it/s]
100%|██████████| 252/252 [00:00<00:00, 77581.08it/s]
100%|██████████| 203/203 [00:00<00:00, 77025.85it/s]
100%|██████████| 153/153 [00:00<00:00, 63180.91it/s]
100%|██████████| 200/200 [00:00<00:00, 77044.53it/s]
100%|██████████| 65/65 [00:00<00:00, 61653.04it/s]
100%|██████████| 144/144 [00:00<00:00, 78205.33it/s]
100%|██████████| 30/30 [00:00<00:00, 55382.54it/s]
100%|██████████| 130/130 [00:00<00:00, 70446.97it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77394.25it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 157.67it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80955.79it/s]
100%|██████████| 287/287 [00:00<00:00, 79299.42it/s]
100%|██████████| 771/771 [00:00<00:00, 79856.98it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79634.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94932.42it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90493.30it/s]
100%|██████████| 353/353 [00:00<00:00, 79954.06it/s]
100%|██████████| 252/252 [00:00<00:00, 78549.69it/s]
100%|██████████| 203/203 [00:00<00:00, 77878.32it/s]
100%|██████████| 153/153 [00:00<00:00, 80306.41it/s]
100%|██████████| 200/200 [00:00<00:00, 80651.94it/s]
100%|██████████| 65/65 [00:00<00:00, 76948.85it/s]
100%|██████████| 144/144 [00:00<00:00, 75159.26it/s]
100%|██████████| 30/30 [00:00<00:00, 63970.07it/s]
100%|██████████| 130/130 [00:00<00:00, 76377.58it/s]
100%|██████████| 3500/3500 [00:00<00:00, 103322.52it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 154.20it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 93076.32it/s]
100%|██████████| 287/287 [00:00<00:00, 73973.16it/s]
100%|██████████| 771/771 [00:00<00:00, 85203.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88343.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85545.67it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86333.93it/s]
100%|██████████| 353/353 [00:00<00:00, 75328.89it/s]
100%|██████████| 252/252 [00:00<00:00, 69368.29it/s]
100%|██████████| 203/203 [00:00<00:00, 83156.92it/s]
100%|██████████| 153/153 [00:00<00:00, 85279.54it/s]
100%|██████████| 200/200 [00:00<00:00, 62341.02it/s]
100%|██████████| 65/65 [00:00<00:00, 64027.66it/s]
100%|██████████| 144/144 [00:00<00:00, 74400.07it/s]
100%|██████████| 30/30 [00:00<00:00, 52958.38it/s]
100%|██████████| 130/130 [00:00<00:00, 70229.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84465.27it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 176.29it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 88316.96it/s]
100%|██████████| 287/287 [00:00<00:00, 75235.33it/s]
100%|██████████| 771/771 [00:00<00:00, 80873.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94578.14it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90339.97it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92516.65it/s]
100%|██████████| 353/353 [00:00<00:00, 71702.71it/s]
100%|██████████| 252/252 [00:00<00:00, 68389.82it/s]
100%|██████████| 203/203 [00:00<00:00, 66706.65it/s]
100%|██████████| 153/153 [00:00<00:00, 59723.45it/s]
100%|██████████| 200/200 [00:00<00:00, 66719.22it/s]
100%|██████████| 65/65 [00:00<00:00, 41788.74it/s]
100%|██████████| 144/144 [00:00<00:00, 58553.54it/s]
100%|██████████| 30/30 [00:00<00:00, 38362.54it/s]
100%|██████████| 130/130 [00:00<00:00, 59454.75it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88327.70it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:36<00:00, 160.25it/s]
INFO:root:The new embedding has 5832 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 88009.03it/s]
100%|██████████| 287/287 [00:00<00:00, 71372.30it/s]
100%|██████████| 771/771 [00:00<00:00, 56475.87it/s]
100%|██████████| 2000/2000 [00:00<00:00, 55244.18it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77434.26it/s]
100%|██████████| 3000/3000 [00:00<00:00, 65571.52it/s]
100%|██████████| 353/353 [00:00<00:00, 75563.40it/s]
100%|██████████| 252/252 [00:00<00:00, 65309.23it/s]
100%|██████████| 203/203 [00:00<00:00, 72107.36it/s]
100%|██████████| 153/153 [00:00<00:00, 60432.10it/s]
100%|██████████| 200/200 [00:00<00:00, 69287.26it/s]
100%|██████████| 65/65 [00:00<00:00, 54701.00it/s]
100%|██████████| 144/144 [00:00<00:00, 74044.35it/s]
100%|██████████| 30/30 [00:00<00:00, 55899.21it/s]
100%|██████████| 130/130 [00:00<00:00, 54580.53it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81821.83it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 164.73it/s]
INFO:root:The new embedding has 5832 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 93068.05it/s]
100%|██████████| 287/287 [00:00<00:00, 89485.97it/s]
100%|██████████| 771/771 [00:00<00:00, 91409.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95103.54it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89715.81it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92582.00it/s]
100%|██████████| 353/353 [00:00<00:00, 78197.39it/s]
100%|██████████| 252/252 [00:00<00:00, 72753.62it/s]
100%|██████████| 203/203 [00:00<00:00, 71634.17it/s]
100%|██████████| 153/153 [00:00<00:00, 73164.81it/s]
100%|██████████| 200/200 [00:00<00:00, 71017.68it/s]
100%|██████████| 65/65 [00:00<00:00, 65191.24it/s]
100%|██████████| 144/144 [00:00<00:00, 69136.88it/s]
100%|██████████| 30/30 [00:00<00:00, 66295.64it/s]
100%|██████████| 130/130 [00:00<00:00, 70274.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86711.38it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:35<00:00, 164.30it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80195.02it/s]
100%|██████████| 287/287 [00:00<00:00, 78136.13it/s]
100%|██████████| 771/771 [00:00<00:00, 81509.51it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81495.02it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80524.97it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80289.64it/s]
100%|██████████| 353/353 [00:00<00:00, 80677.27it/s]
100%|██████████| 252/252 [00:00<00:00, 78206.78it/s]
100%|██████████| 203/203 [00:00<00:00, 78264.89it/s]
100%|██████████| 153/153 [00:00<00:00, 79421.85it/s]
100%|██████████| 200/200 [00:00<00:00, 81143.43it/s]
100%|██████████| 65/65 [00:00<00:00, 68880.69it/s]
100%|██████████| 144/144 [00:00<00:00, 76288.97it/s]
100%|██████████| 30/30 [00:00<00:00, 52626.15it/s]
100%|██████████| 130/130 [00:00<00:00, 78251.94it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78534.93it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:34<00:00, 167.62it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79735.67it/s]
100%|██████████| 287/287 [00:00<00:00, 76981.85it/s]
100%|██████████| 771/771 [00:00<00:00, 81302.54it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82211.43it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81409.60it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80691.76it/s]
100%|██████████| 353/353 [00:00<00:00, 78914.26it/s]
100%|██████████| 252/252 [00:00<00:00, 79060.86it/s]
100%|██████████| 203/203 [00:00<00:00, 77764.52it/s]
100%|██████████| 153/153 [00:00<00:00, 75702.31it/s]
100%|██████████| 200/200 [00:00<00:00, 78405.53it/s]
100%|██████████| 65/65 [00:00<00:00, 66952.30it/s]
100%|██████████| 144/144 [00:00<00:00, 75686.69it/s]
100%|██████████| 30/30 [00:00<00:00, 53911.36it/s]
100%|██████████| 130/130 [00:00<00:00, 68294.03it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92143.74it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:33<00:00, 174.67it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 86191.42it/s]
100%|██████████| 287/287 [00:00<00:00, 75310.64it/s]
100%|██████████| 771/771 [00:00<00:00, 90527.08it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90880.22it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89026.47it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91838.70it/s]
100%|██████████| 353/353 [00:00<00:00, 71137.72it/s]
100%|██████████| 252/252 [00:00<00:00, 75330.67it/s]
100%|██████████| 203/203 [00:00<00:00, 72537.38it/s]
100%|██████████| 153/153 [00:00<00:00, 71837.96it/s]
100%|██████████| 200/200 [00:00<00:00, 75709.46it/s]
100%|██████████| 65/65 [00:00<00:00, 72219.80it/s]
100%|██████████| 144/144 [00:00<00:00, 74926.16it/s]
100%|██████████| 30/30 [00:00<00:00, 65672.82it/s]
100%|██████████| 130/130 [00:00<00:00, 58223.12it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79894.55it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:34<00:00, 168.11it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 88369.11it/s]
100%|██████████| 287/287 [00:00<00:00, 48347.87it/s]
100%|██████████| 771/771 [00:00<00:00, 60629.74it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91225.14it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84474.02it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86626.36it/s]
100%|██████████| 353/353 [00:00<00:00, 71419.10it/s]
100%|██████████| 252/252 [00:00<00:00, 75063.18it/s]
100%|██████████| 203/203 [00:00<00:00, 70083.44it/s]
100%|██████████| 153/153 [00:00<00:00, 50930.83it/s]
100%|██████████| 200/200 [00:00<00:00, 66782.96it/s]
100%|██████████| 65/65 [00:00<00:00, 67117.12it/s]
100%|██████████| 144/144 [00:00<00:00, 67544.15it/s]
100%|██████████| 30/30 [00:00<00:00, 59975.75it/s]
100%|██████████| 130/130 [00:00<00:00, 60611.33it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89532.78it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:42<00:00, 138.39it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 87613.38it/s]
100%|██████████| 287/287 [00:00<00:00, 76125.04it/s]
100%|██████████| 771/771 [00:00<00:00, 89765.67it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94193.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74251.24it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87093.44it/s]
100%|██████████| 353/353 [00:00<00:00, 90945.29it/s]
100%|██████████| 252/252 [00:00<00:00, 71595.52it/s]
100%|██████████| 203/203 [00:00<00:00, 70647.50it/s]
100%|██████████| 153/153 [00:00<00:00, 70768.47it/s]
100%|██████████| 200/200 [00:00<00:00, 70539.93it/s]
100%|██████████| 65/65 [00:00<00:00, 68985.26it/s]
100%|██████████| 144/144 [00:00<00:00, 71224.03it/s]
100%|██████████| 30/30 [00:00<00:00, 61954.27it/s]
100%|██████████| 130/130 [00:00<00:00, 65717.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88072.81it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 139.39it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 93487.50it/s]
100%|██████████| 287/287 [00:00<00:00, 89759.54it/s]
100%|██████████| 771/771 [00:00<00:00, 82476.18it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95120.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73978.83it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86995.89it/s]
100%|██████████| 353/353 [00:00<00:00, 86655.12it/s]
100%|██████████| 252/252 [00:00<00:00, 82899.18it/s]
100%|██████████| 203/203 [00:00<00:00, 66895.33it/s]
100%|██████████| 153/153 [00:00<00:00, 86790.44it/s]
100%|██████████| 200/200 [00:00<00:00, 88263.97it/s]
100%|██████████| 65/65 [00:00<00:00, 63832.77it/s]
100%|██████████| 144/144 [00:00<00:00, 70492.50it/s]
100%|██████████| 30/30 [00:00<00:00, 58039.26it/s]
100%|██████████| 130/130 [00:00<00:00, 62601.55it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89929.33it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 136.34it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79146.78it/s]
100%|██████████| 287/287 [00:00<00:00, 77228.80it/s]
100%|██████████| 771/771 [00:00<00:00, 81286.19it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87571.07it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81945.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92507.81it/s]
100%|██████████| 353/353 [00:00<00:00, 78541.69it/s]
100%|██████████| 252/252 [00:00<00:00, 80127.71it/s]
100%|██████████| 203/203 [00:00<00:00, 74505.05it/s]
100%|██████████| 153/153 [00:00<00:00, 87179.53it/s]
100%|██████████| 200/200 [00:00<00:00, 78818.08it/s]
100%|██████████| 65/65 [00:00<00:00, 68759.08it/s]
100%|██████████| 144/144 [00:00<00:00, 80252.43it/s]
100%|██████████| 30/30 [00:00<00:00, 71534.46it/s]
100%|██████████| 130/130 [00:00<00:00, 70766.97it/s]
100%|██████████| 3500/3500 [00:00<00:00, 100408.77it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 141.80it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80344.18it/s]
100%|██████████| 287/287 [00:00<00:00, 80540.96it/s]
100%|██████████| 771/771 [00:00<00:00, 81070.18it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80634.88it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82651.27it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80510.03it/s]
100%|██████████| 353/353 [00:00<00:00, 79023.77it/s]
100%|██████████| 252/252 [00:00<00:00, 78701.76it/s]
100%|██████████| 203/203 [00:00<00:00, 77899.70it/s]
100%|██████████| 153/153 [00:00<00:00, 80145.94it/s]
100%|██████████| 200/200 [00:00<00:00, 80605.44it/s]
100%|██████████| 65/65 [00:00<00:00, 75395.40it/s]
100%|██████████| 144/144 [00:00<00:00, 72698.58it/s]
100%|██████████| 30/30 [00:00<00:00, 64133.09it/s]
100%|██████████| 130/130 [00:00<00:00, 75228.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 69618.31it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 145.00it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 88326.27it/s]
100%|██████████| 287/287 [00:00<00:00, 68857.41it/s]
100%|██████████| 771/771 [00:00<00:00, 88899.50it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88306.71it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90705.30it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89547.89it/s]
100%|██████████| 353/353 [00:00<00:00, 69280.30it/s]
100%|██████████| 252/252 [00:00<00:00, 66313.11it/s]
100%|██████████| 203/203 [00:00<00:00, 76328.44it/s]
100%|██████████| 153/153 [00:00<00:00, 75012.10it/s]
100%|██████████| 200/200 [00:00<00:00, 68657.78it/s]
100%|██████████| 65/65 [00:00<00:00, 46779.30it/s]
100%|██████████| 144/144 [00:00<00:00, 81267.46it/s]
100%|██████████| 30/30 [00:00<00:00, 56962.03it/s]
100%|██████████| 130/130 [00:00<00:00, 65757.30it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79365.85it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 140.94it/s]
INFO:root:The new embedding has 5837 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 95041.84it/s]
100%|██████████| 287/287 [00:00<00:00, 89639.23it/s]
100%|██████████| 771/771 [00:00<00:00, 93690.13it/s]
100%|██████████| 2000/2000 [00:00<00:00, 96130.18it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91672.76it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85919.51it/s]
100%|██████████| 353/353 [00:00<00:00, 77680.45it/s]
100%|██████████| 252/252 [00:00<00:00, 72894.11it/s]
100%|██████████| 203/203 [00:00<00:00, 71107.71it/s]
100%|██████████| 153/153 [00:00<00:00, 69760.68it/s]
100%|██████████| 200/200 [00:00<00:00, 88217.56it/s]
100%|██████████| 65/65 [00:00<00:00, 65457.33it/s]
100%|██████████| 144/144 [00:00<00:00, 70997.98it/s]
100%|██████████| 30/30 [00:00<00:00, 47038.92it/s]
100%|██████████| 130/130 [00:00<00:00, 81067.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91325.17it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.04it/s]
INFO:root:The new embedding has 5837 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78712.63it/s]
100%|██████████| 287/287 [00:00<00:00, 76756.06it/s]
100%|██████████| 771/771 [00:00<00:00, 80722.11it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86587.61it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79588.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79937.18it/s]
100%|██████████| 353/353 [00:00<00:00, 76790.07it/s]
100%|██████████| 252/252 [00:00<00:00, 79632.68it/s]
100%|██████████| 203/203 [00:00<00:00, 59255.60it/s]
100%|██████████| 153/153 [00:00<00:00, 76441.75it/s]
100%|██████████| 200/200 [00:00<00:00, 76559.35it/s]
100%|██████████| 65/65 [00:00<00:00, 70337.92it/s]
100%|██████████| 144/144 [00:00<00:00, 77116.93it/s]
100%|██████████| 30/30 [00:00<00:00, 53204.70it/s]
100%|██████████| 130/130 [00:00<00:00, 74114.38it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75365.86it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 143.23it/s]
INFO:root:The new embedding has 5837 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81317.14it/s]
100%|██████████| 287/287 [00:00<00:00, 77337.95it/s]
100%|██████████| 771/771 [00:00<00:00, 80385.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81694.22it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81707.75it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92322.51it/s]
100%|██████████| 353/353 [00:00<00:00, 79358.38it/s]
100%|██████████| 252/252 [00:00<00:00, 80925.24it/s]
100%|██████████| 203/203 [00:00<00:00, 78510.25it/s]
100%|██████████| 153/153 [00:00<00:00, 80366.75it/s]
100%|██████████| 200/200 [00:00<00:00, 76917.37it/s]
100%|██████████| 65/65 [00:00<00:00, 68259.83it/s]
100%|██████████| 144/144 [00:00<00:00, 79944.38it/s]
100%|██████████| 30/30 [00:00<00:00, 60845.80it/s]
100%|██████████| 130/130 [00:00<00:00, 77794.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78662.44it/s]
100%|██████████| 203

['summonings' 'page']
['summonings' 'demand']
['hypertexts' 'database']
['amazings' 'surprise']
['amazings' 'stump']
['monsignori' 'priest']
['cosigns' 'validate']
['cosigns' 'endorse']
['independences' 'independent']
['independences' 'victory']
['importances' 'standing']
['importances' 'deal']
['liverpools' 'england']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 161.72it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 93826.63it/s]
100%|██████████| 287/287 [00:00<00:00, 71136.11it/s]
100%|██████████| 771/771 [00:00<00:00, 90811.81it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94924.90it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94999.07it/s]
100%|██████████| 3000/3000 [00:00<00:00, 76384.14it/s]
100%|██████████| 353/353 [00:00<00:00, 80031.85it/s]
100%|██████████| 252/252 [00:00<00:00, 71416.53it/s]
100%|██████████| 203/203 [00:00<00:00, 71664.31it/s]
100%|██████████| 153/153 [00:00<00:00, 73660.30it/s]
100%|██████████| 200/200 [00:00<00:00, 73830.38it/s]
100%|██████████| 65/65 [00:00<00:00, 64072.80it/s]
100%|██████████| 144/144 [00:00<00:00, 70500.73it/s]
100%|██████████| 30/30 [00:00<00:00, 56987.83it/s]
100%|██████████| 130/130 [00:00<00:00, 73614.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90040.75it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 131.26it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 71750.91it/s]
100%|██████████| 287/287 [00:00<00:00, 71423.12it/s]
100%|██████████| 771/771 [00:00<00:00, 83407.92it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87392.26it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81843.27it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85404.57it/s]
100%|██████████| 353/353 [00:00<00:00, 75760.60it/s]
100%|██████████| 252/252 [00:00<00:00, 73666.34it/s]
100%|██████████| 203/203 [00:00<00:00, 72254.22it/s]
100%|██████████| 153/153 [00:00<00:00, 55159.75it/s]
100%|██████████| 200/200 [00:00<00:00, 68843.73it/s]
100%|██████████| 65/65 [00:00<00:00, 51712.78it/s]
100%|██████████| 144/144 [00:00<00:00, 67205.94it/s]
100%|██████████| 30/30 [00:00<00:00, 26732.34it/s]
100%|██████████| 130/130 [00:00<00:00, 64307.06it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83418.93it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 129.13it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82571.87it/s]
100%|██████████| 287/287 [00:00<00:00, 80181.53it/s]
100%|██████████| 771/771 [00:00<00:00, 81756.80it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82846.36it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81400.12it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93519.18it/s]
100%|██████████| 353/353 [00:00<00:00, 80023.20it/s]
100%|██████████| 252/252 [00:00<00:00, 77723.70it/s]
100%|██████████| 203/203 [00:00<00:00, 82249.20it/s]
100%|██████████| 153/153 [00:00<00:00, 77391.28it/s]
100%|██████████| 200/200 [00:00<00:00, 77773.11it/s]
100%|██████████| 65/65 [00:00<00:00, 72143.36it/s]
100%|██████████| 144/144 [00:00<00:00, 80455.54it/s]
100%|██████████| 30/30 [00:00<00:00, 56859.07it/s]
100%|██████████| 130/130 [00:00<00:00, 74939.46it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79967.23it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 133.69it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82176.74it/s]
100%|██████████| 287/287 [00:00<00:00, 77129.83it/s]
100%|██████████| 771/771 [00:00<00:00, 82026.39it/s]
100%|██████████| 2000/2000 [00:00<00:00, 100614.20it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90519.34it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96307.87it/s]
100%|██████████| 353/353 [00:00<00:00, 82328.14it/s]
100%|██████████| 252/252 [00:00<00:00, 79049.03it/s]
100%|██████████| 203/203 [00:00<00:00, 76963.18it/s]
100%|██████████| 153/153 [00:00<00:00, 81180.08it/s]
100%|██████████| 200/200 [00:00<00:00, 79868.69it/s]
100%|██████████| 65/65 [00:00<00:00, 71933.97it/s]
100%|██████████| 144/144 [00:00<00:00, 80071.56it/s]
100%|██████████| 30/30 [00:00<00:00, 61290.37it/s]
100%|██████████| 130/130 [00:00<00:00, 66381.73it/s]
100%|██████████| 3500/3500 [00:00<00:00, 98694.15it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 143.23it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 73851.45it/s]
100%|██████████| 287/287 [00:00<00:00, 68535.94it/s]
100%|██████████| 771/771 [00:00<00:00, 85210.10it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87466.98it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84959.97it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85188.90it/s]
100%|██████████| 353/353 [00:00<00:00, 90213.83it/s]
100%|██████████| 252/252 [00:00<00:00, 76342.69it/s]
100%|██████████| 203/203 [00:00<00:00, 62445.45it/s]
100%|██████████| 153/153 [00:00<00:00, 67302.41it/s]
100%|██████████| 200/200 [00:00<00:00, 81434.89it/s]
100%|██████████| 65/65 [00:00<00:00, 63137.97it/s]
100%|██████████| 144/144 [00:00<00:00, 65245.74it/s]
100%|██████████| 30/30 [00:00<00:00, 45035.48it/s]
100%|██████████| 130/130 [00:00<00:00, 48736.10it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88223.66it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 151.78it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 95279.57it/s]
100%|██████████| 287/287 [00:00<00:00, 76531.58it/s]
100%|██████████| 771/771 [00:00<00:00, 88011.55it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92811.79it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92697.95it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91257.89it/s]
100%|██████████| 353/353 [00:00<00:00, 79708.71it/s]
100%|██████████| 252/252 [00:00<00:00, 71907.25it/s]
100%|██████████| 203/203 [00:00<00:00, 71507.83it/s]
100%|██████████| 153/153 [00:00<00:00, 70095.96it/s]
100%|██████████| 200/200 [00:00<00:00, 69870.13it/s]
100%|██████████| 65/65 [00:00<00:00, 59721.74it/s]
100%|██████████| 144/144 [00:00<00:00, 68509.50it/s]
100%|██████████| 30/30 [00:00<00:00, 64793.57it/s]
100%|██████████| 130/130 [00:00<00:00, 74990.99it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73890.21it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 151.59it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80644.17it/s]
100%|██████████| 287/287 [00:00<00:00, 76033.68it/s]
100%|██████████| 771/771 [00:00<00:00, 72262.26it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94319.73it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79342.91it/s]
100%|██████████| 3000/3000 [00:00<00:00, 102688.31it/s]
100%|██████████| 353/353 [00:00<00:00, 79601.58it/s]
100%|██████████| 252/252 [00:00<00:00, 78073.91it/s]
100%|██████████| 203/203 [00:00<00:00, 76144.13it/s]
100%|██████████| 153/153 [00:00<00:00, 73719.53it/s]
100%|██████████| 200/200 [00:00<00:00, 80978.94it/s]
100%|██████████| 65/65 [00:00<00:00, 76174.84it/s]
100%|██████████| 144/144 [00:00<00:00, 80092.80it/s]
100%|██████████| 30/30 [00:00<00:00, 69711.42it/s]
100%|██████████| 130/130 [00:00<00:00, 76764.68it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91561.55it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 148.34it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79281.56it/s]
100%|██████████| 287/287 [00:00<00:00, 63199.73it/s]
100%|██████████| 771/771 [00:00<00:00, 74393.44it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80342.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88212.00it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84374.33it/s]
100%|██████████| 353/353 [00:00<00:00, 78712.88it/s]
100%|██████████| 252/252 [00:00<00:00, 77958.74it/s]
100%|██████████| 203/203 [00:00<00:00, 69750.45it/s]
100%|██████████| 153/153 [00:00<00:00, 70027.12it/s]
100%|██████████| 200/200 [00:00<00:00, 70957.60it/s]
100%|██████████| 65/65 [00:00<00:00, 75187.47it/s]
100%|██████████| 144/144 [00:00<00:00, 79065.29it/s]
100%|██████████| 30/30 [00:00<00:00, 66930.38it/s]
100%|██████████| 130/130 [00:00<00:00, 62522.59it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93680.81it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 153.57it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 87266.68it/s]
100%|██████████| 287/287 [00:00<00:00, 71043.75it/s]
100%|██████████| 771/771 [00:00<00:00, 76224.12it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95223.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86614.43it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91526.07it/s]
100%|██████████| 353/353 [00:00<00:00, 73234.87it/s]
100%|██████████| 252/252 [00:00<00:00, 71248.04it/s]
100%|██████████| 203/203 [00:00<00:00, 74951.03it/s]
100%|██████████| 153/153 [00:00<00:00, 70604.96it/s]
100%|██████████| 200/200 [00:00<00:00, 69661.25it/s]
100%|██████████| 65/65 [00:00<00:00, 70283.52it/s]
100%|██████████| 144/144 [00:00<00:00, 66642.37it/s]
100%|██████████| 30/30 [00:00<00:00, 65948.18it/s]
100%|██████████| 130/130 [00:00<00:00, 65709.75it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73259.30it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 173.15it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 94195.75it/s]
100%|██████████| 287/287 [00:00<00:00, 72770.24it/s]
100%|██████████| 771/771 [00:00<00:00, 89616.42it/s]
100%|██████████| 2000/2000 [00:00<00:00, 98360.86it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74886.25it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95564.00it/s]
100%|██████████| 353/353 [00:00<00:00, 86065.76it/s]
100%|██████████| 252/252 [00:00<00:00, 74402.69it/s]
100%|██████████| 203/203 [00:00<00:00, 74871.94it/s]
100%|██████████| 153/153 [00:00<00:00, 71113.53it/s]
100%|██████████| 200/200 [00:00<00:00, 72868.38it/s]
100%|██████████| 65/65 [00:00<00:00, 69530.67it/s]
100%|██████████| 144/144 [00:00<00:00, 87800.52it/s]
100%|██████████| 30/30 [00:00<00:00, 66191.02it/s]
100%|██████████| 130/130 [00:00<00:00, 70895.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85873.94it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:44<00:00, 132.25it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 88918.57it/s]
100%|██████████| 287/287 [00:00<00:00, 78421.19it/s]
100%|██████████| 771/771 [00:00<00:00, 89120.00it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92995.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93687.69it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91492.79it/s]
100%|██████████| 353/353 [00:00<00:00, 82145.43it/s]
100%|██████████| 252/252 [00:00<00:00, 86593.86it/s]
100%|██████████| 203/203 [00:00<00:00, 82760.86it/s]
100%|██████████| 153/153 [00:00<00:00, 74205.42it/s]
100%|██████████| 200/200 [00:00<00:00, 68945.57it/s]
100%|██████████| 65/65 [00:00<00:00, 61933.16it/s]
100%|██████████| 144/144 [00:00<00:00, 69921.25it/s]
100%|██████████| 30/30 [00:00<00:00, 56048.61it/s]
100%|██████████| 130/130 [00:00<00:00, 72440.48it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86017.85it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.75it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 80136.74it/s]
100%|██████████| 287/287 [00:00<00:00, 60020.21it/s]
100%|██████████| 771/771 [00:00<00:00, 87732.19it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83289.73it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86398.55it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84457.58it/s]
100%|██████████| 353/353 [00:00<00:00, 88753.71it/s]
100%|██████████| 252/252 [00:00<00:00, 73980.86it/s]
100%|██████████| 203/203 [00:00<00:00, 68898.18it/s]
100%|██████████| 153/153 [00:00<00:00, 78556.56it/s]
100%|██████████| 200/200 [00:00<00:00, 83245.09it/s]
100%|██████████| 65/65 [00:00<00:00, 64773.05it/s]
100%|██████████| 144/144 [00:00<00:00, 79722.78it/s]
100%|██████████| 30/30 [00:00<00:00, 43965.45it/s]
100%|██████████| 130/130 [00:00<00:00, 51914.65it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72452.64it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 132.91it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77323.99it/s]
100%|██████████| 287/287 [00:00<00:00, 54191.93it/s]
100%|██████████| 771/771 [00:00<00:00, 73383.90it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75695.79it/s]
100%|██████████| 1000/1000 [00:00<00:00, 100761.64it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90621.69it/s]
100%|██████████| 353/353 [00:00<00:00, 65186.87it/s]
100%|██████████| 252/252 [00:00<00:00, 79788.98it/s]
100%|██████████| 203/203 [00:00<00:00, 50087.87it/s]
100%|██████████| 153/153 [00:00<00:00, 61385.93it/s]
100%|██████████| 200/200 [00:00<00:00, 70368.32it/s]
100%|██████████| 65/65 [00:00<00:00, 72392.40it/s]
100%|██████████| 144/144 [00:00<00:00, 69800.04it/s]
100%|██████████| 30/30 [00:00<00:00, 38409.38it/s]
100%|██████████| 130/130 [00:00<00:00, 52743.23it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81699.79it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.84it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 61823.82it/s]
100%|██████████| 287/287 [00:00<00:00, 95453.59it/s]
100%|██████████| 771/771 [00:00<00:00, 86467.78it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76335.71it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75970.01it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86450.79it/s]
100%|██████████| 353/353 [00:00<00:00, 64617.87it/s]
100%|██████████| 252/252 [00:00<00:00, 53625.80it/s]
100%|██████████| 203/203 [00:00<00:00, 55898.35it/s]
100%|██████████| 153/153 [00:00<00:00, 58519.84it/s]
100%|██████████| 200/200 [00:00<00:00, 52718.75it/s]
100%|██████████| 65/65 [00:00<00:00, 48867.14it/s]
100%|██████████| 144/144 [00:00<00:00, 33424.45it/s]
100%|██████████| 30/30 [00:00<00:00, 61230.72it/s]
100%|██████████| 130/130 [00:00<00:00, 25721.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93202.02it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 129.23it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 69365.79it/s]
100%|██████████| 287/287 [00:00<00:00, 76303.58it/s]
100%|██████████| 771/771 [00:00<00:00, 88799.42it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93872.21it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88612.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92081.32it/s]
100%|██████████| 353/353 [00:00<00:00, 75382.58it/s]
100%|██████████| 252/252 [00:00<00:00, 69019.50it/s]
100%|██████████| 203/203 [00:00<00:00, 69426.26it/s]
100%|██████████| 153/153 [00:00<00:00, 70341.83it/s]
100%|██████████| 200/200 [00:00<00:00, 70468.82it/s]
100%|██████████| 65/65 [00:00<00:00, 69495.22it/s]
100%|██████████| 144/144 [00:00<00:00, 71791.25it/s]
100%|██████████| 30/30 [00:00<00:00, 58552.41it/s]
100%|██████████| 130/130 [00:00<00:00, 64118.01it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87272.24it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 135.41it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 93654.66it/s]
100%|██████████| 287/287 [00:00<00:00, 76478.10it/s]
100%|██████████| 771/771 [00:00<00:00, 89088.08it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90791.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82672.45it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82362.38it/s]
100%|██████████| 353/353 [00:00<00:00, 93383.12it/s]
100%|██████████| 252/252 [00:00<00:00, 74313.76it/s]
100%|██████████| 203/203 [00:00<00:00, 71718.64it/s]
100%|██████████| 153/153 [00:00<00:00, 75729.11it/s]
100%|██████████| 200/200 [00:00<00:00, 74565.40it/s]
100%|██████████| 65/65 [00:00<00:00, 66414.07it/s]
100%|██████████| 144/144 [00:00<00:00, 71680.49it/s]
100%|██████████| 30/30 [00:00<00:00, 67288.30it/s]
100%|██████████| 130/130 [00:00<00:00, 59093.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84923.60it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.46it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 58085.44it/s]
100%|██████████| 287/287 [00:00<00:00, 59301.70it/s]
100%|██████████| 771/771 [00:00<00:00, 59743.73it/s]
100%|██████████| 2000/2000 [00:00<00:00, 62790.86it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80386.07it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80351.68it/s]
100%|██████████| 353/353 [00:00<00:00, 74600.16it/s]
100%|██████████| 252/252 [00:00<00:00, 79019.48it/s]
100%|██████████| 203/203 [00:00<00:00, 76314.75it/s]
100%|██████████| 153/153 [00:00<00:00, 82220.18it/s]
100%|██████████| 200/200 [00:00<00:00, 81577.44it/s]
100%|██████████| 65/65 [00:00<00:00, 68465.53it/s]
100%|██████████| 144/144 [00:00<00:00, 81962.24it/s]
100%|██████████| 30/30 [00:00<00:00, 55948.92it/s]
100%|██████████| 130/130 [00:00<00:00, 76927.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78210.67it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 141.40it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80176.61it/s]
100%|██████████| 287/287 [00:00<00:00, 78842.37it/s]
100%|██████████| 771/771 [00:00<00:00, 79318.33it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80046.26it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79735.07it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81231.44it/s]
100%|██████████| 353/353 [00:00<00:00, 78612.58it/s]
100%|██████████| 252/252 [00:00<00:00, 82698.12it/s]
100%|██████████| 203/203 [00:00<00:00, 81548.10it/s]
100%|██████████| 153/153 [00:00<00:00, 76945.86it/s]
100%|██████████| 200/200 [00:00<00:00, 78186.30it/s]
100%|██████████| 65/65 [00:00<00:00, 77805.30it/s]
100%|██████████| 144/144 [00:00<00:00, 77294.57it/s]
100%|██████████| 30/30 [00:00<00:00, 61470.01it/s]
100%|██████████| 130/130 [00:00<00:00, 66927.64it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89710.06it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 144.23it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 82549.10it/s]
100%|██████████| 287/287 [00:00<00:00, 91049.49it/s]
100%|██████████| 771/771 [00:00<00:00, 77302.81it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83579.34it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79788.16it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73181.14it/s]
100%|██████████| 353/353 [00:00<00:00, 72266.17it/s]
100%|██████████| 252/252 [00:00<00:00, 75800.67it/s]
100%|██████████| 203/203 [00:00<00:00, 73154.37it/s]
100%|██████████| 153/153 [00:00<00:00, 70893.56it/s]
100%|██████████| 200/200 [00:00<00:00, 64532.72it/s]
100%|██████████| 65/65 [00:00<00:00, 64436.25it/s]
100%|██████████| 144/144 [00:00<00:00, 70320.15it/s]
100%|██████████| 30/30 [00:00<00:00, 66365.57it/s]
100%|██████████| 130/130 [00:00<00:00, 44752.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85974.02it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:48<00:00, 119.51it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 92944.18it/s]
100%|██████████| 287/287 [00:00<00:00, 88479.62it/s]
100%|██████████| 771/771 [00:00<00:00, 92715.05it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94346.25it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90925.53it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91000.50it/s]
100%|██████████| 353/353 [00:00<00:00, 80170.53it/s]
100%|██████████| 252/252 [00:00<00:00, 72753.62it/s]
100%|██████████| 203/203 [00:00<00:00, 70712.04it/s]
100%|██████████| 153/153 [00:00<00:00, 68225.44it/s]
100%|██████████| 200/200 [00:00<00:00, 76580.32it/s]
100%|██████████| 65/65 [00:00<00:00, 64329.82it/s]
100%|██████████| 144/144 [00:00<00:00, 31359.28it/s]
100%|██████████| 30/30 [00:00<00:00, 64893.82it/s]
100%|██████████| 130/130 [00:00<00:00, 71369.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90317.73it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:50<00:00, 116.49it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 66694.94it/s]
100%|██████████| 287/287 [00:00<00:00, 78090.51it/s]
100%|██████████| 771/771 [00:00<00:00, 76779.72it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81782.63it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77763.02it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79178.65it/s]
100%|██████████| 353/353 [00:00<00:00, 80818.19it/s]
100%|██████████| 252/252 [00:00<00:00, 79167.45it/s]
100%|██████████| 203/203 [00:00<00:00, 76603.12it/s]
100%|██████████| 153/153 [00:00<00:00, 80095.92it/s]
100%|██████████| 200/200 [00:00<00:00, 76720.40it/s]
100%|██████████| 65/65 [00:00<00:00, 55570.68it/s]
100%|██████████| 144/144 [00:00<00:00, 68400.88it/s]
100%|██████████| 30/30 [00:00<00:00, 49853.06it/s]
100%|██████████| 130/130 [00:00<00:00, 72057.56it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77554.53it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:49<00:00, 118.50it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79112.41it/s]
100%|██████████| 287/287 [00:00<00:00, 44992.16it/s]
100%|██████████| 771/771 [00:00<00:00, 77765.69it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94962.51it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78120.77it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96335.89it/s]
100%|██████████| 353/353 [00:00<00:00, 76468.82it/s]
100%|██████████| 252/252 [00:00<00:00, 76486.33it/s]
100%|██████████| 203/203 [00:00<00:00, 53345.26it/s]
100%|██████████| 153/153 [00:00<00:00, 80629.29it/s]
100%|██████████| 200/200 [00:00<00:00, 79769.95it/s]
100%|██████████| 65/65 [00:00<00:00, 72392.40it/s]
100%|██████████| 144/144 [00:00<00:00, 60811.50it/s]
100%|██████████| 30/30 [00:00<00:00, 55750.61it/s]
100%|██████████| 130/130 [00:00<00:00, 79137.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81115.19it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:49<00:00, 117.45it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 93654.66it/s]
100%|██████████| 287/287 [00:00<00:00, 91890.48it/s]
100%|██████████| 771/771 [00:00<00:00, 93171.84it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95980.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88396.05it/s]
100%|██████████| 3000/3000 [00:00<00:00, 60881.42it/s]
100%|██████████| 353/353 [00:00<00:00, 54802.14it/s]
100%|██████████| 252/252 [00:00<00:00, 54510.81it/s]
100%|██████████| 203/203 [00:00<00:00, 54871.67it/s]
100%|██████████| 153/153 [00:00<00:00, 53428.40it/s]
100%|██████████| 200/200 [00:00<00:00, 53444.24it/s]
100%|██████████| 65/65 [00:00<00:00, 51391.10it/s]
100%|██████████| 144/144 [00:00<00:00, 54144.31it/s]
100%|██████████| 30/30 [00:00<00:00, 43950.09it/s]
100%|██████████| 130/130 [00:00<00:00, 50046.77it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83256.19it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 157.85it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 90469.82it/s]
100%|██████████| 287/287 [00:00<00:00, 84380.01it/s]
100%|██████████| 771/771 [00:00<00:00, 91799.14it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90212.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90492.00it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88247.26it/s]
100%|██████████| 353/353 [00:00<00:00, 89787.10it/s]
100%|██████████| 252/252 [00:00<00:00, 72019.94it/s]
100%|██████████| 203/203 [00:00<00:00, 71369.97it/s]
100%|██████████| 153/153 [00:00<00:00, 66979.28it/s]
100%|██████████| 200/200 [00:00<00:00, 82727.89it/s]
100%|██████████| 65/65 [00:00<00:00, 61694.90it/s]
100%|██████████| 144/144 [00:00<00:00, 69783.91it/s]
100%|██████████| 30/30 [00:00<00:00, 64860.37it/s]
100%|██████████| 130/130 [00:00<00:00, 80911.04it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87820.96it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 153.72it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 57180.22it/s]
100%|██████████| 287/287 [00:00<00:00, 76269.74it/s]
100%|██████████| 771/771 [00:00<00:00, 79429.38it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84171.42it/s]
100%|██████████| 1000/1000 [00:00<00:00, 72225.93it/s]
100%|██████████| 3000/3000 [00:00<00:00, 97020.75it/s]
100%|██████████| 353/353 [00:00<00:00, 77299.22it/s]
100%|██████████| 252/252 [00:00<00:00, 80073.08it/s]
100%|██████████| 203/203 [00:00<00:00, 78873.90it/s]
100%|██████████| 153/153 [00:00<00:00, 74299.93it/s]
100%|██████████| 200/200 [00:00<00:00, 78339.63it/s]
100%|██████████| 65/65 [00:00<00:00, 68724.42it/s]
100%|██████████| 144/144 [00:00<00:00, 78817.67it/s]
100%|██████████| 30/30 [00:00<00:00, 65741.44it/s]
100%|██████████| 130/130 [00:00<00:00, 76388.28it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78967.53it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 150.93it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80259.54it/s]
100%|██████████| 287/287 [00:00<00:00, 87438.46it/s]
100%|██████████| 771/771 [00:00<00:00, 75685.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 101415.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80875.88it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79500.31it/s]
100%|██████████| 353/353 [00:00<00:00, 79790.33it/s]
100%|██████████| 252/252 [00:00<00:00, 79137.81it/s]
100%|██████████| 203/203 [00:00<00:00, 77700.65it/s]
100%|██████████| 153/153 [00:00<00:00, 75755.93it/s]
100%|██████████| 200/200 [00:00<00:00, 70068.56it/s]
100%|██████████| 65/65 [00:00<00:00, 71650.40it/s]
100%|██████████| 144/144 [00:00<00:00, 78408.38it/s]
100%|██████████| 30/30 [00:00<00:00, 56910.50it/s]
100%|██████████| 130/130 [00:00<00:00, 49519.53it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77960.63it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 160.82it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 68554.34it/s]
100%|██████████| 287/287 [00:00<00:00, 76677.83it/s]
100%|██████████| 771/771 [00:00<00:00, 81231.06it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91649.73it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73132.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88476.85it/s]
100%|██████████| 353/353 [00:00<00:00, 65935.84it/s]
100%|██████████| 252/252 [00:00<00:00, 68700.98it/s]
100%|██████████| 203/203 [00:00<00:00, 65065.24it/s]
100%|██████████| 153/153 [00:00<00:00, 55710.44it/s]
100%|██████████| 200/200 [00:00<00:00, 88552.81it/s]
100%|██████████| 65/65 [00:00<00:00, 64497.22it/s]
100%|██████████| 144/144 [00:00<00:00, 68688.70it/s]
100%|██████████| 30/30 [00:00<00:00, 65707.11it/s]
100%|██████████| 130/130 [00:00<00:00, 85024.09it/s]
100%|██████████| 3500/3500 [00:00<00:00, 92797.27it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:33<00:00, 172.96it/s]
INFO:root:The new embedding has 5845 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 88084.88it/s]
100%|██████████| 287/287 [00:00<00:00, 67821.58it/s]
100%|██████████| 771/771 [00:00<00:00, 89351.47it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94028.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 73371.89it/s]
100%|██████████| 3000/3000 [00:00<00:00, 72779.03it/s]
100%|██████████| 353/353 [00:00<00:00, 77627.50it/s]
100%|██████████| 252/252 [00:00<00:00, 73436.02it/s]
100%|██████████| 203/203 [00:00<00:00, 72015.88it/s]
100%|██████████| 153/153 [00:00<00:00, 72291.15it/s]
100%|██████████| 200/200 [00:00<00:00, 74871.55it/s]
100%|██████████| 65/65 [00:00<00:00, 71877.08it/s]
100%|██████████| 144/144 [00:00<00:00, 71988.05it/s]
100%|██████████| 30/30 [00:00<00:00, 65879.12it/s]
100%|██████████| 130/130 [00:00<00:00, 70256.35it/s]
100%|██████████| 3500/3500 [00:00<00:00, 55702.94it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:44<00:00, 130.89it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 89041.39it/s]
100%|██████████| 287/287 [00:00<00:00, 81110.79it/s]
100%|██████████| 771/771 [00:00<00:00, 86453.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 73881.75it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74184.26it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78202.82it/s]
100%|██████████| 353/353 [00:00<00:00, 85415.33it/s]
100%|██████████| 252/252 [00:00<00:00, 71985.60it/s]
100%|██████████| 203/203 [00:00<00:00, 72395.52it/s]
100%|██████████| 153/153 [00:00<00:00, 74732.56it/s]
100%|██████████| 200/200 [00:00<00:00, 71992.86it/s]
100%|██████████| 65/65 [00:00<00:00, 65035.73it/s]
100%|██████████| 144/144 [00:00<00:00, 73827.13it/s]
100%|██████████| 30/30 [00:00<00:00, 66541.05it/s]
100%|██████████| 130/130 [00:00<00:00, 68225.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91017.71it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 135.44it/s]
INFO:root:The new embedding has 5844 word and vectors have 1200 dimensions
100%|██████████| 999/999 [00:00<00:00, 88567.10it/s]
100%|██████████| 287/287 [00:00<00:00, 82410.16it/s]
100%|██████████| 771/771 [00:00<00:00, 91903.50it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93407.06it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94220.15it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90260.26it/s]
100%|██████████| 353/353 [00:00<00:00, 75896.52it/s]
100%|██████████| 252/252 [00:00<00:00, 87780.47it/s]
100%|██████████| 203/203 [00:00<00:00, 68164.58it/s]
100%|██████████| 153/153 [00:00<00:00, 83373.85it/s]
100%|██████████| 200/200 [00:00<00:00, 69957.53it/s]
100%|██████████| 65/65 [00:00<00:00, 63211.17it/s]
100%|██████████| 144/144 [00:00<00:00, 66124.35it/s]
100%|██████████| 30/30 [00:00<00:00, 53385.29it/s]
100%|██████████| 130/130 [00:00<00:00, 81686.82it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88334.61it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 136.02it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76590.44it/s]
100%|██████████| 287/287 [00:00<00:00, 76648.54it/s]
100%|██████████| 771/771 [00:00<00:00, 80422.99it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80457.00it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81929.60it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79580.26it/s]
100%|██████████| 353/353 [00:00<00:00, 77688.60it/s]
100%|██████████| 252/252 [00:00<00:00, 80340.88it/s]
100%|██████████| 203/203 [00:00<00:00, 77615.65it/s]
100%|██████████| 153/153 [00:00<00:00, 72816.13it/s]
100%|██████████| 200/200 [00:00<00:00, 77564.57it/s]
100%|██████████| 65/65 [00:00<00:00, 65820.80it/s]
100%|██████████| 144/144 [00:00<00:00, 75639.30it/s]
100%|██████████| 30/30 [00:00<00:00, 67577.40it/s]
100%|██████████| 130/130 [00:00<00:00, 52999.56it/s]
100%|██████████| 3500/3500 [00:00<00:00, 99774.11it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.53it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 101203.05it/s]
100%|██████████| 287/287 [00:00<00:00, 77050.84it/s]
100%|██████████| 771/771 [00:00<00:00, 94120.97it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81121.46it/s]
100%|██████████| 1000/1000 [00:00<00:00, 102073.54it/s]
100%|██████████| 3000/3000 [00:00<00:00, 100021.56it/s]
100%|██████████| 353/353 [00:00<00:00, 80322.75it/s]
100%|██████████| 252/252 [00:00<00:00, 87482.59it/s]
100%|██████████| 203/203 [00:00<00:00, 76956.23it/s]
100%|██████████| 153/153 [00:00<00:00, 74776.10it/s]
100%|██████████| 200/200 [00:00<00:00, 77030.38it/s]
100%|██████████| 65/65 [00:00<00:00, 68225.67it/s]
100%|██████████| 144/144 [00:00<00:00, 75962.74it/s]
100%|██████████| 30/30 [00:00<00:00, 69711.42it/s]
100%|██████████| 130/130 [00:00<00:00, 77330.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 99118.63it/s]
100%|██████████| 

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 149.83it/s]
INFO:root:The new embedding has 5846 word and vectors have 1000 dimensions
100%|██████████| 999/999 [00:00<00:00, 90624.40it/s]
100%|██████████| 287/287 [00:00<00:00, 83490.45it/s]
100%|██████████| 771/771 [00:00<00:00, 86701.92it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92786.13it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94413.15it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92823.09it/s]
100%|██████████| 353/353 [00:00<00:00, 74495.06it/s]
100%|██████████| 252/252 [00:00<00:00, 72583.75it/s]
100%|██████████| 203/203 [00:00<00:00, 84451.87it/s]
100%|██████████| 153/153 [00:00<00:00, 51465.92it/s]
100%|██████████| 200/200 [00:00<00:00, 60923.87it/s]
100%|██████████| 65/65 [00:00<00:00, 56480.17it/s]
100%|██████████| 144/144 [00:00<00:00, 55676.60it/s]
100%|██████████| 30/30 [00:00<00:00, 41775.94it/s]
100%|██████████| 130/130 [00:00<00:00, 51202.88it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77000.48it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 139.85it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 90655.77it/s]
100%|██████████| 287/287 [00:00<00:00, 87955.96it/s]
100%|██████████| 771/771 [00:00<00:00, 89581.66it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91938.01it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90031.64it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89028.36it/s]
100%|██████████| 353/353 [00:00<00:00, 88908.26it/s]
100%|██████████| 252/252 [00:00<00:00, 66367.24it/s]
100%|██████████| 203/203 [00:00<00:00, 67074.50it/s]
100%|██████████| 153/153 [00:00<00:00, 69256.26it/s]
100%|██████████| 200/200 [00:00<00:00, 79025.98it/s]
100%|██████████| 65/65 [00:00<00:00, 64027.66it/s]
100%|██████████| 144/144 [00:00<00:00, 69375.12it/s]
100%|██████████| 30/30 [00:00<00:00, 54096.78it/s]
100%|██████████| 130/130 [00:00<00:00, 80043.97it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84358.97it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 135.84it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 60175.06it/s]
100%|██████████| 287/287 [00:00<00:00, 78436.52it/s]
100%|██████████| 771/771 [00:00<00:00, 78538.15it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87701.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79079.62it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80636.43it/s]
100%|██████████| 353/353 [00:00<00:00, 81342.12it/s]
100%|██████████| 252/252 [00:00<00:00, 82286.07it/s]
100%|██████████| 203/203 [00:00<00:00, 81626.28it/s]
100%|██████████| 153/153 [00:00<00:00, 80710.42it/s]
100%|██████████| 200/200 [00:00<00:00, 79107.96it/s]
100%|██████████| 65/65 [00:00<00:00, 67835.22it/s]
100%|██████████| 144/144 [00:00<00:00, 77314.36it/s]
100%|██████████| 30/30 [00:00<00:00, 54542.31it/s]
100%|██████████| 130/130 [00:00<00:00, 84628.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89598.36it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 139.67it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79311.57it/s]
100%|██████████| 287/287 [00:00<00:00, 74050.52it/s]
100%|██████████| 771/771 [00:00<00:00, 78507.64it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79231.24it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81798.58it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82831.91it/s]
100%|██████████| 353/353 [00:00<00:00, 78859.62it/s]
100%|██████████| 252/252 [00:00<00:00, 79801.03it/s]
100%|██████████| 203/203 [00:00<00:00, 77636.88it/s]
100%|██████████| 153/153 [00:00<00:00, 95823.28it/s]
100%|██████████| 200/200 [00:00<00:00, 77378.54it/s]
100%|██████████| 65/65 [00:00<00:00, 68055.36it/s]
100%|██████████| 144/144 [00:00<00:00, 80082.18it/s]
100%|██████████| 30/30 [00:00<00:00, 55750.61it/s]
100%|██████████| 130/130 [00:00<00:00, 75730.49it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77663.26it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 143.18it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 89918.45it/s]
100%|██████████| 287/287 [00:00<00:00, 85591.95it/s]
100%|██████████| 771/771 [00:00<00:00, 74395.15it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89963.09it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92275.80it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89639.76it/s]
100%|██████████| 353/353 [00:00<00:00, 88314.30it/s]
100%|██████████| 252/252 [00:00<00:00, 81631.50it/s]
100%|██████████| 203/203 [00:00<00:00, 85349.21it/s]
100%|██████████| 153/153 [00:00<00:00, 68803.31it/s]
100%|██████████| 200/200 [00:00<00:00, 88050.89it/s]
100%|██████████| 65/65 [00:00<00:00, 65175.65it/s]
100%|██████████| 144/144 [00:00<00:00, 72637.38it/s]
100%|██████████| 30/30 [00:00<00:00, 52276.33it/s]
100%|██████████| 130/130 [00:00<00:00, 80947.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85831.76it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 152.99it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 85943.92it/s]
100%|██████████| 287/287 [00:00<00:00, 77462.37it/s]
100%|██████████| 771/771 [00:00<00:00, 83345.58it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89807.06it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90050.97it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89442.87it/s]
100%|██████████| 353/353 [00:00<00:00, 78151.98it/s]
100%|██████████| 252/252 [00:00<00:00, 73738.29it/s]
100%|██████████| 203/203 [00:00<00:00, 77736.12it/s]
100%|██████████| 153/153 [00:00<00:00, 60948.67it/s]
100%|██████████| 200/200 [00:00<00:00, 80458.55it/s]
100%|██████████| 65/65 [00:00<00:00, 66108.09it/s]
100%|██████████| 144/144 [00:00<00:00, 84662.15it/s]
100%|██████████| 30/30 [00:00<00:00, 51909.70it/s]
100%|██████████| 130/130 [00:00<00:00, 48445.98it/s]
100%|██████████| 3500/3500 [00:00<00:00, 65477.83it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 149.67it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80052.53it/s]
100%|██████████| 287/287 [00:00<00:00, 76629.02it/s]
100%|██████████| 771/771 [00:00<00:00, 81025.49it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80062.30it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80135.73it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79859.05it/s]
100%|██████████| 353/353 [00:00<00:00, 80598.22it/s]
100%|██████████| 252/252 [00:00<00:00, 79155.59it/s]
100%|██████████| 203/203 [00:00<00:00, 75529.47it/s]
100%|██████████| 153/153 [00:00<00:00, 77559.65it/s]
100%|██████████| 200/200 [00:00<00:00, 78091.68it/s]
100%|██████████| 65/65 [00:00<00:00, 69318.53it/s]
100%|██████████| 144/144 [00:00<00:00, 74879.71it/s]
100%|██████████| 30/30 [00:00<00:00, 69212.94it/s]
100%|██████████| 130/130 [00:00<00:00, 77694.43it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79009.18it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 154.20it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79840.51it/s]
100%|██████████| 287/287 [00:00<00:00, 76216.62it/s]
100%|██████████| 771/771 [00:00<00:00, 80541.17it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79482.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80582.21it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80016.48it/s]
100%|██████████| 353/353 [00:00<00:00, 79910.91it/s]
100%|██████████| 252/252 [00:00<00:00, 76519.55it/s]
100%|██████████| 203/203 [00:00<00:00, 78286.48it/s]
100%|██████████| 153/153 [00:00<00:00, 76359.89it/s]
100%|██████████| 200/200 [00:00<00:00, 78004.54it/s]
100%|██████████| 65/65 [00:00<00:00, 69744.12it/s]
100%|██████████| 144/144 [00:00<00:00, 75422.05it/s]
100%|██████████| 30/30 [00:00<00:00, 70295.60it/s]
100%|██████████| 130/130 [00:00<00:00, 75458.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79024.92it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 160.30it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 87736.29it/s]
100%|██████████| 287/287 [00:00<00:00, 74842.41it/s]
100%|██████████| 771/771 [00:00<00:00, 85505.25it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89879.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87644.27it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89899.13it/s]
100%|██████████| 353/353 [00:00<00:00, 81665.16it/s]
100%|██████████| 252/252 [00:00<00:00, 73831.00it/s]
100%|██████████| 203/203 [00:00<00:00, 69211.81it/s]
100%|██████████| 153/153 [00:00<00:00, 69715.21it/s]
100%|██████████| 200/200 [00:00<00:00, 72919.05it/s]
100%|██████████| 65/65 [00:00<00:00, 66188.34it/s]
100%|██████████| 144/144 [00:00<00:00, 67408.46it/s]
100%|██████████| 30/30 [00:00<00:00, 50922.35it/s]
100%|██████████| 130/130 [00:00<00:00, 69833.44it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77281.80it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 129.26it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 89297.57it/s]
100%|██████████| 287/287 [00:00<00:00, 84050.08it/s]
100%|██████████| 771/771 [00:00<00:00, 90669.22it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91195.39it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89946.69it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89346.97it/s]
100%|██████████| 353/353 [00:00<00:00, 89052.65it/s]
100%|██████████| 252/252 [00:00<00:00, 74787.00it/s]
100%|██████████| 203/203 [00:00<00:00, 48637.25it/s]
100%|██████████| 153/153 [00:00<00:00, 59524.02it/s]
100%|██████████| 200/200 [00:00<00:00, 85189.48it/s]
100%|██████████| 65/65 [00:00<00:00, 49389.45it/s]
100%|██████████| 144/144 [00:00<00:00, 48617.87it/s]
100%|██████████| 30/30 [00:00<00:00, 36813.67it/s]
100%|██████████| 130/130 [00:00<00:00, 83590.30it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73487.03it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:46<00:00, 126.85it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80776.31it/s]
100%|██████████| 287/287 [00:00<00:00, 81017.99it/s]
100%|██████████| 771/771 [00:00<00:00, 81031.58it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80514.15it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81980.85it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91388.46it/s]
100%|██████████| 353/353 [00:00<00:00, 81814.07it/s]
100%|██████████| 252/252 [00:00<00:00, 78866.18it/s]
100%|██████████| 203/203 [00:00<00:00, 81563.72it/s]
100%|██████████| 153/153 [00:00<00:00, 73382.33it/s]
100%|██████████| 200/200 [00:00<00:00, 75065.84it/s]
100%|██████████| 65/65 [00:00<00:00, 68276.92it/s]
100%|██████████| 144/144 [00:00<00:00, 75065.84it/s]
100%|██████████| 30/30 [00:00<00:00, 57535.03it/s]
100%|██████████| 130/130 [00:00<00:00, 76324.12it/s]
100%|██████████| 3500/3500 [00:00<00:00, 98168.80it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 129.29it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80191.95it/s]
100%|██████████| 287/287 [00:00<00:00, 78636.35it/s]
100%|██████████| 771/771 [00:00<00:00, 81043.77it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81155.99it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82321.96it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80251.75it/s]
100%|██████████| 353/353 [00:00<00:00, 77448.83it/s]
100%|██████████| 252/252 [00:00<00:00, 79310.02it/s]
100%|██████████| 203/203 [00:00<00:00, 78157.12it/s]
100%|██████████| 153/153 [00:00<00:00, 76908.98it/s]
100%|██████████| 200/200 [00:00<00:00, 78149.88it/s]
100%|██████████| 65/65 [00:00<00:00, 77760.91it/s]
100%|██████████| 144/144 [00:00<00:00, 71637.98it/s]
100%|██████████| 30/30 [00:00<00:00, 66191.02it/s]
100%|██████████| 130/130 [00:00<00:00, 73435.63it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85769.58it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 152.00it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 91339.53it/s]
100%|██████████| 287/287 [00:00<00:00, 79414.52it/s]
100%|██████████| 771/771 [00:00<00:00, 88285.47it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90473.45it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88110.08it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89658.92it/s]
100%|██████████| 353/353 [00:00<00:00, 84532.65it/s]
100%|██████████| 252/252 [00:00<00:00, 80420.35it/s]
100%|██████████| 203/203 [00:00<00:00, 77389.90it/s]
100%|██████████| 153/153 [00:00<00:00, 69737.94it/s]
100%|██████████| 200/200 [00:00<00:00, 84383.95it/s]
100%|██████████| 65/65 [00:00<00:00, 62372.40it/s]
100%|██████████| 144/144 [00:00<00:00, 82308.50it/s]
100%|██████████| 30/30 [00:00<00:00, 51909.70it/s]
100%|██████████| 130/130 [00:00<00:00, 72778.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88724.35it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 156.09it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 91347.50it/s]
100%|██████████| 287/287 [00:00<00:00, 86075.46it/s]
100%|██████████| 771/771 [00:00<00:00, 91731.44it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92237.24it/s]
100%|██████████| 1000/1000 [00:00<00:00, 94188.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91142.88it/s]
100%|██████████| 353/353 [00:00<00:00, 86792.27it/s]
100%|██████████| 252/252 [00:00<00:00, 72182.24it/s]
100%|██████████| 203/203 [00:00<00:00, 70876.86it/s]
100%|██████████| 153/153 [00:00<00:00, 74025.67it/s]
100%|██████████| 200/200 [00:00<00:00, 67076.67it/s]
100%|██████████| 65/65 [00:00<00:00, 60854.86it/s]
100%|██████████| 144/144 [00:00<00:00, 75309.20it/s]
100%|██████████| 30/30 [00:00<00:00, 54120.05it/s]
100%|██████████| 130/130 [00:00<00:00, 81589.03it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86415.84it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 152.09it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81664.22it/s]
100%|██████████| 287/287 [00:00<00:00, 79979.09it/s]
100%|██████████| 771/771 [00:00<00:00, 81092.54it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92790.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81687.06it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80569.31it/s]
100%|██████████| 353/353 [00:00<00:00, 92173.90it/s]
100%|██████████| 252/252 [00:00<00:00, 78154.73it/s]
100%|██████████| 203/203 [00:00<00:00, 76623.80it/s]
100%|██████████| 153/153 [00:00<00:00, 79599.17it/s]
100%|██████████| 200/200 [00:00<00:00, 78427.52it/s]
100%|██████████| 65/65 [00:00<00:00, 65457.33it/s]
100%|██████████| 144/144 [00:00<00:00, 78306.73it/s]
100%|██████████| 30/30 [00:00<00:00, 58826.14it/s]
100%|██████████| 130/130 [00:00<00:00, 76100.42it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76867.83it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 156.41it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80164.34it/s]
100%|██████████| 287/287 [00:00<00:00, 78176.73it/s]
100%|██████████| 771/771 [00:00<00:00, 81480.76it/s]
100%|██████████| 2000/2000 [00:00<00:00, 99929.81it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80610.09it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78631.90it/s]
100%|██████████| 353/353 [00:00<00:00, 80096.80it/s]
100%|██████████| 252/252 [00:00<00:00, 80267.66it/s]
100%|██████████| 203/203 [00:00<00:00, 78416.26it/s]
100%|██████████| 153/153 [00:00<00:00, 75711.24it/s]
100%|██████████| 200/200 [00:00<00:00, 77278.75it/s]
100%|██████████| 65/65 [00:00<00:00, 68967.81it/s]
100%|██████████| 144/144 [00:00<00:00, 76588.86it/s]
100%|██████████| 30/30 [00:00<00:00, 53544.31it/s]
100%|██████████| 130/130 [00:00<00:00, 74296.16it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71357.71it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 158.40it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 93458.31it/s]
100%|██████████| 287/287 [00:00<00:00, 75428.61it/s]
100%|██████████| 771/771 [00:00<00:00, 91866.95it/s]
100%|██████████| 2000/2000 [00:00<00:00, 74585.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90742.59it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93355.43it/s]
100%|██████████| 353/353 [00:00<00:00, 81186.01it/s]
100%|██████████| 252/252 [00:00<00:00, 63957.68it/s]
100%|██████████| 203/203 [00:00<00:00, 86979.64it/s]
100%|██████████| 153/153 [00:00<00:00, 71773.68it/s]
100%|██████████| 200/200 [00:00<00:00, 73980.14it/s]
100%|██████████| 65/65 [00:00<00:00, 58921.50it/s]
100%|██████████| 144/144 [00:00<00:00, 84108.03it/s]
100%|██████████| 30/30 [00:00<00:00, 63421.94it/s]
100%|██████████| 130/130 [00:00<00:00, 72827.50it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90457.42it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 150.70it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 91553.08it/s]
100%|██████████| 287/287 [00:00<00:00, 86272.86it/s]
100%|██████████| 771/771 [00:00<00:00, 89743.25it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93006.28it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93813.42it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91177.88it/s]
100%|██████████| 353/353 [00:00<00:00, 86080.77it/s]
100%|██████████| 252/252 [00:00<00:00, 81018.29it/s]
100%|██████████| 203/203 [00:00<00:00, 85891.63it/s]
100%|██████████| 153/153 [00:00<00:00, 81128.76it/s]
100%|██████████| 200/200 [00:00<00:00, 82973.37it/s]
100%|██████████| 65/65 [00:00<00:00, 76538.39it/s]
100%|██████████| 144/144 [00:00<00:00, 82252.45it/s]
100%|██████████| 30/30 [00:00<00:00, 60291.86it/s]
100%|██████████| 130/130 [00:00<00:00, 84183.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89298.05it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 146.85it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 65008.30it/s]
100%|██████████| 287/287 [00:00<00:00, 76629.02it/s]
100%|██████████| 771/771 [00:00<00:00, 81078.31it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80397.63it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81968.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81017.00it/s]
100%|██████████| 353/353 [00:00<00:00, 78662.70it/s]
100%|██████████| 252/252 [00:00<00:00, 66438.16it/s]
100%|██████████| 203/203 [00:00<00:00, 57143.87it/s]
100%|██████████| 153/153 [00:00<00:00, 54259.62it/s]
100%|██████████| 200/200 [00:00<00:00, 58436.84it/s]
100%|██████████| 65/65 [00:00<00:00, 53890.05it/s]
100%|██████████| 144/144 [00:00<00:00, 56589.50it/s]
100%|██████████| 30/30 [00:00<00:00, 46898.67it/s]
100%|██████████| 130/130 [00:00<00:00, 56845.24it/s]
100%|██████████| 3500/3500 [00:00<00:00, 59902.49it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 151.09it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 75541.03it/s]
100%|██████████| 287/287 [00:00<00:00, 77969.12it/s]
100%|██████████| 771/771 [00:00<00:00, 93279.35it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91133.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 103453.22it/s]
100%|██████████| 3000/3000 [00:00<00:00, 101446.46it/s]
100%|██████████| 353/353 [00:00<00:00, 79631.54it/s]
100%|██████████| 252/252 [00:00<00:00, 75169.95it/s]
100%|██████████| 203/203 [00:00<00:00, 75063.36it/s]
100%|██████████| 153/153 [00:00<00:00, 78710.72it/s]
100%|██████████| 200/200 [00:00<00:00, 106117.75it/s]
100%|██████████| 65/65 [00:00<00:00, 66156.21it/s]
100%|██████████| 144/144 [00:00<00:00, 76773.84it/s]
100%|██████████| 30/30 [00:00<00:00, 69327.34it/s]
100%|██████████| 130/130 [00:00<00:00, 69504.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 96950.59it/s]
100%|██████████| 

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 145.60it/s]
INFO:root:The new embedding has 5845 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 92695.39it/s]
100%|██████████| 287/287 [00:00<00:00, 79730.11it/s]
100%|██████████| 771/771 [00:00<00:00, 89850.47it/s]
100%|██████████| 2000/2000 [00:00<00:00, 95495.46it/s]
100%|██████████| 1000/1000 [00:00<00:00, 95232.02it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92518.69it/s]
100%|██████████| 353/353 [00:00<00:00, 89015.17it/s]
100%|██████████| 252/252 [00:00<00:00, 84604.55it/s]
100%|██████████| 203/203 [00:00<00:00, 69516.96it/s]
100%|██████████| 153/153 [00:00<00:00, 71757.63it/s]
100%|██████████| 200/200 [00:00<00:00, 84904.94it/s]
100%|██████████| 65/65 [00:00<00:00, 52712.64it/s]
100%|██████████| 144/144 [00:00<00:00, 64700.57it/s]
100%|██████████| 30/30 [00:00<00:00, 57403.80it/s]
100%|██████████| 130/130 [00:00<00:00, 84497.06it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90877.41it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:35<00:00, 165.53it/s]
INFO:root:The new embedding has 5845 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 91353.47it/s]
100%|██████████| 287/287 [00:00<00:00, 88310.85it/s]
100%|██████████| 771/771 [00:00<00:00, 90274.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92336.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91859.48it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91150.14it/s]
100%|██████████| 353/353 [00:00<00:00, 85150.06it/s]
100%|██████████| 252/252 [00:00<00:00, 73543.32it/s]
100%|██████████| 203/203 [00:00<00:00, 85161.40it/s]
100%|██████████| 153/153 [00:00<00:00, 70034.76it/s]
100%|██████████| 200/200 [00:00<00:00, 77852.51it/s]
100%|██████████| 65/65 [00:00<00:00, 63123.35it/s]
100%|██████████| 144/144 [00:00<00:00, 82174.12it/s]
100%|██████████| 30/30 [00:00<00:00, 50151.10it/s]
100%|██████████| 130/130 [00:00<00:00, 80091.00it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89058.60it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:42<00:00, 138.37it/s]
INFO:root:The new embedding has 5832 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 92547.98it/s]
100%|██████████| 287/287 [00:00<00:00, 85494.69it/s]
100%|██████████| 771/771 [00:00<00:00, 88987.57it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90820.20it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89927.40it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91759.00it/s]
100%|██████████| 353/353 [00:00<00:00, 88705.85it/s]
100%|██████████| 252/252 [00:00<00:00, 76965.31it/s]
100%|██████████| 203/203 [00:00<00:00, 85632.48it/s]
100%|██████████| 153/153 [00:00<00:00, 77260.84it/s]
100%|██████████| 200/200 [00:00<00:00, 83394.06it/s]
100%|██████████| 65/65 [00:00<00:00, 74652.18it/s]
100%|██████████| 144/144 [00:00<00:00, 83851.14it/s]
100%|██████████| 30/30 [00:00<00:00, 53092.46it/s]
100%|██████████| 130/130 [00:00<00:00, 81467.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87759.54it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 158.42it/s]
INFO:root:The new embedding has 5832 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 91693.32it/s]
100%|██████████| 287/287 [00:00<00:00, 85787.15it/s]
100%|██████████| 771/771 [00:00<00:00, 90783.76it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93037.22it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92365.21it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91771.72it/s]
100%|██████████| 353/353 [00:00<00:00, 89515.68it/s]
100%|██████████| 252/252 [00:00<00:00, 74022.31it/s]
100%|██████████| 203/203 [00:00<00:00, 83466.69it/s]
100%|██████████| 153/153 [00:00<00:00, 67550.37it/s]
100%|██████████| 200/200 [00:00<00:00, 85310.77it/s]
100%|██████████| 65/65 [00:00<00:00, 72837.23it/s]
100%|██████████| 144/144 [00:00<00:00, 85235.64it/s]
100%|██████████| 30/30 [00:00<00:00, 51931.13it/s]
100%|██████████| 130/130 [00:00<00:00, 83169.54it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85622.50it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 154.69it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79834.42it/s]
100%|██████████| 287/287 [00:00<00:00, 79304.65it/s]
100%|██████████| 771/771 [00:00<00:00, 76986.27it/s]
100%|██████████| 2000/2000 [00:00<00:00, 97204.00it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78437.79it/s]
100%|██████████| 3000/3000 [00:00<00:00, 95075.16it/s]
100%|██████████| 353/353 [00:00<00:00, 78650.16it/s]
100%|██████████| 252/252 [00:00<00:00, 78195.21it/s]
100%|██████████| 203/203 [00:00<00:00, 77992.46it/s]
100%|██████████| 153/153 [00:00<00:00, 76955.09it/s]
100%|██████████| 200/200 [00:00<00:00, 77292.99it/s]
100%|██████████| 65/65 [00:00<00:00, 69160.26it/s]
100%|██████████| 144/144 [00:00<00:00, 75876.86it/s]
100%|██████████| 30/30 [00:00<00:00, 56198.80it/s]
100%|██████████| 130/130 [00:00<00:00, 80611.99it/s]
100%|██████████| 3500/3500 [00:00<00:00, 95782.86it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 158.65it/s]
INFO:root:The new embedding has 5832 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80706.30it/s]
100%|██████████| 287/287 [00:00<00:00, 77006.48it/s]
100%|██████████| 771/771 [00:00<00:00, 79351.42it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92502.71it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91506.76it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98076.43it/s]
100%|██████████| 353/353 [00:00<00:00, 79307.37it/s]
100%|██████████| 252/252 [00:00<00:00, 81267.46it/s]
100%|██████████| 203/203 [00:00<00:00, 75269.07it/s]
100%|██████████| 153/153 [00:00<00:00, 72601.94it/s]
100%|██████████| 200/200 [00:00<00:00, 75593.48it/s]
100%|██████████| 65/65 [00:00<00:00, 41712.02it/s]
100%|██████████| 144/144 [00:00<00:00, 55233.63it/s]
100%|██████████| 30/30 [00:00<00:00, 61230.72it/s]
100%|██████████| 130/130 [00:00<00:00, 69949.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77544.29it/s]
100%|██████████| 203

['preliterate' 'noncivilized']
['extravert' 'extroversive']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['impossibilities' 'unattainableness']
['newness' 'brand-newness']
['monotony' 'unvariedness']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['caesarism' 'autocracy']
['interpenetrate' 'spiritize']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 158.67it/s]
INFO:root:The new embedding has 5845 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 88290.90it/s]
100%|██████████| 287/287 [00:00<00:00, 77782.71it/s]
100%|██████████| 771/771 [00:00<00:00, 84270.82it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91771.05it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85435.89it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90270.62it/s]
100%|██████████| 353/353 [00:00<00:00, 79962.70it/s]
100%|██████████| 252/252 [00:00<00:00, 75508.26it/s]
100%|██████████| 203/203 [00:00<00:00, 69206.19it/s]
100%|██████████| 153/153 [00:00<00:00, 66307.97it/s]
100%|██████████| 200/200 [00:00<00:00, 70504.35it/s]
100%|██████████| 65/65 [00:00<00:00, 44409.47it/s]
100%|██████████| 144/144 [00:00<00:00, 63224.09it/s]
100%|██████████| 30/30 [00:00<00:00, 57985.77it/s]
100%|██████████| 130/130 [00:00<00:00, 63446.53it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86951.24it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:35<00:00, 163.33it/s]
INFO:root:The new embedding has 5845 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 91878.30it/s]
100%|██████████| 287/287 [00:00<00:00, 86651.69it/s]
100%|██████████| 771/771 [00:00<00:00, 90415.71it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93156.04it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92438.49it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91183.16it/s]
100%|██████████| 353/353 [00:00<00:00, 81602.14it/s]
100%|██████████| 252/252 [00:00<00:00, 68776.98it/s]
100%|██████████| 203/203 [00:00<00:00, 69262.48it/s]
100%|██████████| 153/153 [00:00<00:00, 71263.58it/s]
100%|██████████| 200/200 [00:00<00:00, 82152.66it/s]
100%|██████████| 65/65 [00:00<00:00, 59164.44it/s]
100%|██████████| 144/144 [00:00<00:00, 69247.85it/s]
100%|██████████| 30/30 [00:00<00:00, 50171.10it/s]
100%|██████████| 130/130 [00:00<00:00, 78578.98it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87399.02it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:42<00:00, 137.05it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 91337.54it/s]
100%|██████████| 287/287 [00:00<00:00, 86415.31it/s]
100%|██████████| 771/771 [00:00<00:00, 92141.79it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93528.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93612.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90823.15it/s]
100%|██████████| 353/353 [00:00<00:00, 91796.72it/s]
100%|██████████| 252/252 [00:00<00:00, 83919.38it/s]
100%|██████████| 203/203 [00:00<00:00, 87229.15it/s]
100%|██████████| 153/153 [00:00<00:00, 86451.37it/s]
100%|██████████| 200/200 [00:00<00:00, 87838.83it/s]
100%|██████████| 65/65 [00:00<00:00, 64057.74it/s]
100%|██████████| 144/144 [00:00<00:00, 84852.46it/s]
100%|██████████| 30/30 [00:00<00:00, 55358.17it/s]
100%|██████████| 130/130 [00:00<00:00, 78988.78it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82728.82it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 140.64it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 90960.81it/s]
100%|██████████| 287/287 [00:00<00:00, 83461.50it/s]
100%|██████████| 771/771 [00:00<00:00, 89995.50it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92478.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92550.67it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89902.34it/s]
100%|██████████| 353/353 [00:00<00:00, 89857.94it/s]
100%|██████████| 252/252 [00:00<00:00, 81947.95it/s]
100%|██████████| 203/203 [00:00<00:00, 67779.31it/s]
100%|██████████| 153/153 [00:00<00:00, 63218.26it/s]
100%|██████████| 200/200 [00:00<00:00, 68411.42it/s]
100%|██████████| 65/65 [00:00<00:00, 57969.33it/s]
100%|██████████| 144/144 [00:00<00:00, 64610.59it/s]
100%|██████████| 30/30 [00:00<00:00, 63550.06it/s]
100%|██████████| 130/130 [00:00<00:00, 58523.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83923.01it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.20it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 58815.99it/s]
100%|██████████| 287/287 [00:00<00:00, 45459.41it/s]
100%|██████████| 771/771 [00:00<00:00, 79242.53it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80628.68it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81739.60it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81000.31it/s]
100%|██████████| 353/353 [00:00<00:00, 79648.68it/s]
100%|██████████| 252/252 [00:00<00:00, 76414.45it/s]
100%|██████████| 203/203 [00:00<00:00, 74433.40it/s]
100%|██████████| 153/153 [00:00<00:00, 76052.21it/s]
100%|██████████| 200/200 [00:00<00:00, 77250.28it/s]
100%|██████████| 65/65 [00:00<00:00, 68724.42it/s]
100%|██████████| 144/144 [00:00<00:00, 77166.19it/s]
100%|██████████| 30/30 [00:00<00:00, 64893.82it/s]
100%|██████████| 130/130 [00:00<00:00, 76174.84it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86609.58it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 139.95it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79124.36it/s]
100%|██████████| 287/287 [00:00<00:00, 76912.99it/s]
100%|██████████| 771/771 [00:00<00:00, 77534.49it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90714.13it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87686.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96383.11it/s]
100%|██████████| 353/353 [00:00<00:00, 80401.27it/s]
100%|██████████| 252/252 [00:00<00:00, 78789.76it/s]
100%|██████████| 203/203 [00:00<00:00, 80294.58it/s]
100%|██████████| 153/153 [00:00<00:00, 57507.71it/s]
100%|██████████| 200/200 [00:00<00:00, 75274.66it/s]
100%|██████████| 65/65 [00:00<00:00, 68106.36it/s]
100%|██████████| 144/144 [00:00<00:00, 69200.25it/s]
100%|██████████| 30/30 [00:00<00:00, 56274.20it/s]
100%|██████████| 130/130 [00:00<00:00, 75867.47it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76239.48it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 142.07it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 91681.28it/s]
100%|██████████| 287/287 [00:00<00:00, 88577.28it/s]
100%|██████████| 771/771 [00:00<00:00, 90580.33it/s]
100%|██████████| 2000/2000 [00:00<00:00, 93423.71it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92693.85it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90823.15it/s]
100%|██████████| 353/353 [00:00<00:00, 89972.61it/s]
100%|██████████| 252/252 [00:00<00:00, 82286.07it/s]
100%|██████████| 203/203 [00:00<00:00, 87006.31it/s]
100%|██████████| 153/153 [00:00<00:00, 66951.33it/s]
100%|██████████| 200/200 [00:00<00:00, 69224.36it/s]
100%|██████████| 65/65 [00:00<00:00, 62644.71it/s]
100%|██████████| 144/144 [00:00<00:00, 83665.30it/s]
100%|██████████| 30/30 [00:00<00:00, 54027.10it/s]
100%|██████████| 130/130 [00:00<00:00, 84483.97it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88212.00it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.37it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 90115.70it/s]
100%|██████████| 287/287 [00:00<00:00, 83757.67it/s]
100%|██████████| 771/771 [00:00<00:00, 88355.42it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92401.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91448.90it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91992.46it/s]
100%|██████████| 353/353 [00:00<00:00, 85756.69it/s]
100%|██████████| 252/252 [00:00<00:00, 87100.50it/s]
100%|██████████| 203/203 [00:00<00:00, 87202.35it/s]
100%|██████████| 153/153 [00:00<00:00, 64353.04it/s]
100%|██████████| 200/200 [00:00<00:00, 85172.18it/s]
100%|██████████| 65/65 [00:00<00:00, 68603.36it/s]
100%|██████████| 144/144 [00:00<00:00, 82918.70it/s]
100%|██████████| 30/30 [00:00<00:00, 58119.69it/s]
100%|██████████| 130/130 [00:00<00:00, 79264.36it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87286.25it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 133.77it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 75137.35it/s]
100%|██████████| 287/287 [00:00<00:00, 77727.46it/s]
100%|██████████| 771/771 [00:00<00:00, 80022.97it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85157.48it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78800.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79124.38it/s]
100%|██████████| 353/353 [00:00<00:00, 81235.01it/s]
100%|██████████| 252/252 [00:00<00:00, 80987.25it/s]
100%|██████████| 203/203 [00:00<00:00, 75229.17it/s]
100%|██████████| 153/153 [00:00<00:00, 75971.17it/s]
100%|██████████| 200/200 [00:00<00:00, 77990.03it/s]
100%|██████████| 65/65 [00:00<00:00, 60249.67it/s]
100%|██████████| 144/144 [00:00<00:00, 77166.19it/s]
100%|██████████| 30/30 [00:00<00:00, 59213.70it/s]
100%|██████████| 130/130 [00:00<00:00, 71791.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 77992.11it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.03it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 58777.21it/s]
100%|██████████| 287/287 [00:00<00:00, 58302.19it/s]
100%|██████████| 771/771 [00:00<00:00, 59270.68it/s]
100%|██████████| 2000/2000 [00:00<00:00, 58787.80it/s]
100%|██████████| 1000/1000 [00:00<00:00, 59298.54it/s]
100%|██████████| 3000/3000 [00:00<00:00, 64240.48it/s]
100%|██████████| 353/353 [00:00<00:00, 79065.97it/s]
100%|██████████| 252/252 [00:00<00:00, 78608.11it/s]
100%|██████████| 203/203 [00:00<00:00, 79314.74it/s]
100%|██████████| 153/153 [00:00<00:00, 81510.04it/s]
100%|██████████| 200/200 [00:00<00:00, 74572.03it/s]
100%|██████████| 65/65 [00:00<00:00, 71201.30it/s]
100%|██████████| 144/144 [00:00<00:00, 77087.40it/s]
100%|██████████| 30/30 [00:00<00:00, 41134.07it/s]
100%|██████████| 130/130 [00:00<00:00, 57299.23it/s]
100%|██████████| 3500/3500 [00:00<00:00, 96332.20it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:36<00:00, 159.58it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 89255.72it/s]
100%|██████████| 287/287 [00:00<00:00, 87866.08it/s]
100%|██████████| 771/771 [00:00<00:00, 92105.05it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91990.44it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89854.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88316.63it/s]
100%|██████████| 353/353 [00:00<00:00, 88483.20it/s]
100%|██████████| 252/252 [00:00<00:00, 74178.16it/s]
100%|██████████| 203/203 [00:00<00:00, 87390.30it/s]
100%|██████████| 153/153 [00:00<00:00, 85849.97it/s]
100%|██████████| 200/200 [00:00<00:00, 86883.56it/s]
100%|██████████| 65/65 [00:00<00:00, 63937.56it/s]
100%|██████████| 144/144 [00:00<00:00, 85939.07it/s]
100%|██████████| 30/30 [00:00<00:00, 56859.07it/s]
100%|██████████| 130/130 [00:00<00:00, 84812.49it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89253.53it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:47<00:00, 124.30it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 59838.19it/s]
100%|██████████| 287/287 [00:00<00:00, 63153.31it/s]
100%|██████████| 771/771 [00:00<00:00, 66312.77it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86991.68it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89246.21it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89191.17it/s]
100%|██████████| 353/353 [00:00<00:00, 56279.05it/s]
100%|██████████| 252/252 [00:00<00:00, 79698.73it/s]
100%|██████████| 203/203 [00:00<00:00, 82201.56it/s]
100%|██████████| 153/153 [00:00<00:00, 68766.45it/s]
100%|██████████| 200/200 [00:00<00:00, 84939.33it/s]
100%|██████████| 65/65 [00:00<00:00, 65789.03it/s]
100%|██████████| 144/144 [00:00<00:00, 71215.63it/s]
100%|██████████| 30/30 [00:00<00:00, 52189.60it/s]
100%|██████████| 130/130 [00:00<00:00, 64757.66it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71986.15it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:54<00:00, 107.31it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 86297.93it/s]
100%|██████████| 287/287 [00:00<00:00, 78405.87it/s]
100%|██████████| 771/771 [00:00<00:00, 78279.60it/s]
100%|██████████| 2000/2000 [00:00<00:00, 98387.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76171.44it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86542.35it/s]
100%|██████████| 353/353 [00:00<00:00, 75853.75it/s]
100%|██████████| 252/252 [00:00<00:00, 74914.21it/s]
100%|██████████| 203/203 [00:00<00:00, 77651.05it/s]
100%|██████████| 153/153 [00:00<00:00, 75613.12it/s]
100%|██████████| 200/200 [00:00<00:00, 76776.57it/s]
100%|██████████| 65/65 [00:00<00:00, 66968.74it/s]
100%|██████████| 144/144 [00:00<00:00, 74008.06it/s]
100%|██████████| 30/30 [00:00<00:00, 66052.03it/s]
100%|██████████| 130/130 [00:00<00:00, 74539.92it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73292.58it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:46<00:00, 125.37it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80829.29it/s]
100%|██████████| 287/287 [00:00<00:00, 73377.95it/s]
100%|██████████| 771/771 [00:00<00:00, 81635.03it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81301.51it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80860.29it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80589.43it/s]
100%|██████████| 353/353 [00:00<00:00, 77009.74it/s]
100%|██████████| 252/252 [00:00<00:00, 77382.28it/s]
100%|██████████| 203/203 [00:00<00:00, 77523.78it/s]
100%|██████████| 153/153 [00:00<00:00, 78681.77it/s]
100%|██████████| 200/200 [00:00<00:00, 76741.45it/s]
100%|██████████| 65/65 [00:00<00:00, 67499.32it/s]
100%|██████████| 144/144 [00:00<00:00, 77225.39it/s]
100%|██████████| 30/30 [00:00<00:00, 69480.46it/s]
100%|██████████| 130/130 [00:00<00:00, 77133.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 95045.51it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:48<00:00, 120.04it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 91345.51it/s]
100%|██████████| 287/287 [00:00<00:00, 83769.33it/s]
100%|██████████| 771/771 [00:00<00:00, 55648.82it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85177.37it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90913.71it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89061.13it/s]
100%|██████████| 353/353 [00:00<00:00, 80699.26it/s]
100%|██████████| 252/252 [00:00<00:00, 72848.89it/s]
100%|██████████| 203/203 [00:00<00:00, 75109.71it/s]
100%|██████████| 153/153 [00:00<00:00, 67281.24it/s]
100%|██████████| 200/200 [00:00<00:00, 70474.74it/s]
100%|██████████| 65/65 [00:00<00:00, 61403.10it/s]
100%|██████████| 144/144 [00:00<00:00, 81740.39it/s]
100%|██████████| 30/30 [00:00<00:00, 55504.68it/s]
100%|██████████| 130/130 [00:00<00:00, 83628.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79181.35it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 146.62it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 89175.94it/s]
100%|██████████| 287/287 [00:00<00:00, 78375.24it/s]
100%|██████████| 771/771 [00:00<00:00, 76719.61it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87922.61it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89343.16it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89836.23it/s]
100%|██████████| 353/353 [00:00<00:00, 83862.32it/s]
100%|██████████| 252/252 [00:00<00:00, 82879.68it/s]
100%|██████████| 203/203 [00:00<00:00, 67526.66it/s]
100%|██████████| 153/153 [00:00<00:00, 79966.17it/s]
100%|██████████| 200/200 [00:00<00:00, 83369.19it/s]
100%|██████████| 65/65 [00:00<00:00, 60895.64it/s]
100%|██████████| 144/144 [00:00<00:00, 83816.23it/s]
100%|██████████| 30/30 [00:00<00:00, 61771.78it/s]
100%|██████████| 130/130 [00:00<00:00, 69994.80it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85671.47it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 133.11it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 65631.47it/s]
100%|██████████| 287/287 [00:00<00:00, 63941.64it/s]
100%|██████████| 771/771 [00:00<00:00, 80651.65it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88173.05it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91855.46it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90529.11it/s]
100%|██████████| 353/353 [00:00<00:00, 67864.02it/s]
100%|██████████| 252/252 [00:00<00:00, 59483.63it/s]
100%|██████████| 203/203 [00:00<00:00, 74602.97it/s]
100%|██████████| 153/153 [00:00<00:00, 62748.46it/s]
100%|██████████| 200/200 [00:00<00:00, 53539.75it/s]
100%|██████████| 65/65 [00:00<00:00, 73346.72it/s]
100%|██████████| 144/144 [00:00<00:00, 77473.03it/s]
100%|██████████| 30/30 [00:00<00:00, 61771.78it/s]
100%|██████████| 130/130 [00:00<00:00, 59656.40it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80366.49it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 140.00it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 98440.26it/s]
100%|██████████| 287/287 [00:00<00:00, 77288.30it/s]
100%|██████████| 771/771 [00:00<00:00, 73001.23it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94642.16it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85636.49it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80565.70it/s]
100%|██████████| 353/353 [00:00<00:00, 71796.59it/s]
100%|██████████| 252/252 [00:00<00:00, 45615.84it/s]
100%|██████████| 203/203 [00:00<00:00, 48818.51it/s]
100%|██████████| 153/153 [00:00<00:00, 52695.72it/s]
100%|██████████| 200/200 [00:00<00:00, 63748.07it/s]
100%|██████████| 65/65 [00:00<00:00, 69195.37it/s]
100%|██████████| 144/144 [00:00<00:00, 73334.12it/s]
100%|██████████| 30/30 [00:00<00:00, 36889.22it/s]
100%|██████████| 130/130 [00:00<00:00, 60611.33it/s]
100%|██████████| 3500/3500 [00:00<00:00, 59171.62it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 145.21it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 90528.46it/s]
100%|██████████| 287/287 [00:00<00:00, 66286.63it/s]
100%|██████████| 771/771 [00:00<00:00, 84812.31it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81968.03it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86509.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87905.72it/s]
100%|██████████| 353/353 [00:00<00:00, 78098.39it/s]
100%|██████████| 252/252 [00:00<00:00, 52028.78it/s]
100%|██████████| 203/203 [00:00<00:00, 76191.83it/s]
100%|██████████| 153/153 [00:00<00:00, 69836.60it/s]
100%|██████████| 200/200 [00:00<00:00, 71703.63it/s]
100%|██████████| 65/65 [00:00<00:00, 66430.25it/s]
100%|██████████| 144/144 [00:00<00:00, 68369.91it/s]
100%|██████████| 30/30 [00:00<00:00, 44104.14it/s]
100%|██████████| 130/130 [00:00<00:00, 63587.12it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85868.92it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:42<00:00, 139.15it/s]
INFO:root:The new embedding has 5845 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 88816.79it/s]
100%|██████████| 287/287 [00:00<00:00, 66499.02it/s]
100%|██████████| 771/771 [00:00<00:00, 72249.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88449.17it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88819.09it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81692.90it/s]
100%|██████████| 353/353 [00:00<00:00, 89553.58it/s]
100%|██████████| 252/252 [00:00<00:00, 85081.27it/s]
100%|██████████| 203/203 [00:00<00:00, 81798.80it/s]
100%|██████████| 153/153 [00:00<00:00, 49912.77it/s]
100%|██████████| 200/200 [00:00<00:00, 60946.00it/s]
100%|██████████| 65/65 [00:00<00:00, 63773.04it/s]
100%|██████████| 144/144 [00:00<00:00, 68161.58it/s]
100%|██████████| 30/30 [00:00<00:00, 57456.22it/s]
100%|██████████| 130/130 [00:00<00:00, 65214.63it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74202.82it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:48<00:00, 119.35it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 86046.28it/s]
100%|██████████| 287/287 [00:00<00:00, 76260.07it/s]
100%|██████████| 771/771 [00:00<00:00, 83881.73it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88400.70it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87756.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85927.72it/s]
100%|██████████| 353/353 [00:00<00:00, 79652.96it/s]
100%|██████████| 252/252 [00:00<00:00, 73748.58it/s]
100%|██████████| 203/203 [00:00<00:00, 69189.32it/s]
100%|██████████| 153/153 [00:00<00:00, 64958.85it/s]
100%|██████████| 200/200 [00:00<00:00, 74274.91it/s]
100%|██████████| 65/65 [00:00<00:00, 41949.49it/s]
100%|██████████| 144/144 [00:00<00:00, 66989.77it/s]
100%|██████████| 30/30 [00:00<00:00, 37752.51it/s]
100%|██████████| 130/130 [00:00<00:00, 62258.45it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85768.58it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.55it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 89843.25it/s]
100%|██████████| 287/287 [00:00<00:00, 85458.27it/s]
100%|██████████| 771/771 [00:00<00:00, 76964.29it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87425.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89507.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88935.23it/s]
100%|██████████| 353/353 [00:00<00:00, 83857.57it/s]
100%|██████████| 252/252 [00:00<00:00, 68125.34it/s]
100%|██████████| 203/203 [00:00<00:00, 67291.84it/s]
100%|██████████| 153/153 [00:00<00:00, 65522.62it/s]
100%|██████████| 200/200 [00:00<00:00, 66932.16it/s]
100%|██████████| 65/65 [00:00<00:00, 60116.82it/s]
100%|██████████| 144/144 [00:00<00:00, 57065.36it/s]
100%|██████████| 30/30 [00:00<00:00, 44509.77it/s]
100%|██████████| 130/130 [00:00<00:00, 62265.56it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85105.27it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 127.37it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79799.45it/s]
100%|██████████| 287/287 [00:00<00:00, 58136.06it/s]
100%|██████████| 771/771 [00:00<00:00, 77814.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80895.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75385.60it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84026.68it/s]
100%|██████████| 353/353 [00:00<00:00, 76224.74it/s]
100%|██████████| 252/252 [00:00<00:00, 75784.37it/s]
100%|██████████| 203/203 [00:00<00:00, 69693.35it/s]
100%|██████████| 153/153 [00:00<00:00, 68612.05it/s]
100%|██████████| 200/200 [00:00<00:00, 64384.13it/s]
100%|██████████| 65/65 [00:00<00:00, 72105.20it/s]
100%|██████████| 144/144 [00:00<00:00, 72891.60it/s]
100%|██████████| 30/30 [00:00<00:00, 63807.87it/s]
100%|██████████| 130/130 [00:00<00:00, 58991.62it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78061.78it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:48<00:00, 120.76it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77813.66it/s]
100%|██████████| 287/287 [00:00<00:00, 74642.85it/s]
100%|██████████| 771/771 [00:00<00:00, 80889.70it/s]
100%|██████████| 2000/2000 [00:00<00:00, 99731.41it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80728.00it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91596.02it/s]
100%|██████████| 353/353 [00:00<00:00, 80493.06it/s]
100%|██████████| 252/252 [00:00<00:00, 78264.69it/s]
100%|██████████| 203/203 [00:00<00:00, 80000.35it/s]
100%|██████████| 153/153 [00:00<00:00, 79255.10it/s]
100%|██████████| 200/200 [00:00<00:00, 81057.18it/s]
100%|██████████| 65/65 [00:00<00:00, 77166.65it/s]
100%|██████████| 144/144 [00:00<00:00, 78245.86it/s]
100%|██████████| 30/30 [00:00<00:00, 70099.79it/s]
100%|██████████| 130/130 [00:00<00:00, 76366.88it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90930.89it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:49<00:00, 117.30it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78976.72it/s]
100%|██████████| 287/287 [00:00<00:00, 72524.72it/s]
100%|██████████| 771/771 [00:00<00:00, 85033.09it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87326.75it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87246.83it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88725.78it/s]
100%|██████████| 353/353 [00:00<00:00, 84129.17it/s]
100%|██████████| 252/252 [00:00<00:00, 61383.62it/s]
100%|██████████| 203/203 [00:00<00:00, 67779.31it/s]
100%|██████████| 153/153 [00:00<00:00, 67014.26it/s]
100%|██████████| 200/200 [00:00<00:00, 78244.64it/s]
100%|██████████| 65/65 [00:00<00:00, 64543.03it/s]
100%|██████████| 144/144 [00:00<00:00, 67190.99it/s]
100%|██████████| 30/30 [00:00<00:00, 50594.74it/s]
100%|██████████| 130/130 [00:00<00:00, 80863.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76476.59it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.68it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 90403.45it/s]
100%|██████████| 287/287 [00:00<00:00, 81023.44it/s]
100%|██████████| 771/771 [00:00<00:00, 86783.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90931.45it/s]
100%|██████████| 1000/1000 [00:00<00:00, 93084.71it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90569.51it/s]
100%|██████████| 353/353 [00:00<00:00, 88790.96it/s]
100%|██████████| 252/252 [00:00<00:00, 80499.97it/s]
100%|██████████| 203/203 [00:00<00:00, 85598.04it/s]
100%|██████████| 153/153 [00:00<00:00, 74784.82it/s]
100%|██████████| 200/200 [00:00<00:00, 66724.53it/s]
100%|██████████| 65/65 [00:00<00:00, 72817.78it/s]
100%|██████████| 144/144 [00:00<00:00, 83886.08it/s]
100%|██████████| 30/30 [00:00<00:00, 46534.44it/s]
100%|██████████| 130/130 [00:00<00:00, 83131.50it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88351.62it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:46<00:00, 125.61it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 57095.30it/s]
100%|██████████| 287/287 [00:00<00:00, 43458.80it/s]
100%|██████████| 771/771 [00:00<00:00, 65447.13it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86337.19it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87080.18it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87932.13it/s]
100%|██████████| 353/353 [00:00<00:00, 52056.44it/s]
100%|██████████| 252/252 [00:00<00:00, 46349.97it/s]
100%|██████████| 203/203 [00:00<00:00, 55152.46it/s]
100%|██████████| 153/153 [00:00<00:00, 59535.07it/s]
100%|██████████| 200/200 [00:00<00:00, 61513.59it/s]
100%|██████████| 65/65 [00:00<00:00, 50674.68it/s]
100%|██████████| 144/144 [00:00<00:00, 41092.65it/s]
100%|██████████| 30/30 [00:00<00:00, 64100.42it/s]
100%|██████████| 130/130 [00:00<00:00, 67340.93it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84336.68it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:48<00:00, 121.09it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79921.22it/s]
100%|██████████| 287/287 [00:00<00:00, 78656.90it/s]
100%|██████████| 771/771 [00:00<00:00, 78746.61it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80278.37it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79672.97it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87522.34it/s]
100%|██████████| 353/353 [00:00<00:00, 70233.35it/s]
100%|██████████| 252/252 [00:00<00:00, 77263.49it/s]
100%|██████████| 203/203 [00:00<00:00, 74720.82it/s]
100%|██████████| 153/153 [00:00<00:00, 74042.75it/s]
100%|██████████| 200/200 [00:00<00:00, 75335.50it/s]
100%|██████████| 65/65 [00:00<00:00, 65916.29it/s]
100%|██████████| 144/144 [00:00<00:00, 56262.67it/s]
100%|██████████| 30/30 [00:00<00:00, 59130.23it/s]
100%|██████████| 130/130 [00:00<00:00, 72837.23it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90326.07it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:57<00:00, 101.96it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78372.54it/s]
100%|██████████| 287/287 [00:00<00:00, 85701.64it/s]
100%|██████████| 771/771 [00:00<00:00, 87251.66it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90772.05it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90764.19it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89941.54it/s]
100%|██████████| 353/353 [00:00<00:00, 84842.66it/s]
100%|██████████| 252/252 [00:00<00:00, 73650.94it/s]
100%|██████████| 203/203 [00:00<00:00, 82809.15it/s]
100%|██████████| 153/153 [00:00<00:00, 84515.81it/s]
100%|██████████| 200/200 [00:00<00:00, 83802.28it/s]
100%|██████████| 65/65 [00:00<00:00, 69940.93it/s]
100%|██████████| 144/144 [00:00<00:00, 66495.63it/s]
100%|██████████| 30/30 [00:00<00:00, 52714.34it/s]
100%|██████████| 130/130 [00:00<00:00, 81321.33it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87311.69it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:55<00:00, 106.19it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 88077.47it/s]
100%|██████████| 287/287 [00:00<00:00, 72189.82it/s]
100%|██████████| 771/771 [00:00<00:00, 89191.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90191.36it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89447.95it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89568.29it/s]
100%|██████████| 353/353 [00:00<00:00, 87037.17it/s]
100%|██████████| 252/252 [00:00<00:00, 82931.71it/s]
100%|██████████| 203/203 [00:00<00:00, 80828.15it/s]
100%|██████████| 153/153 [00:00<00:00, 61122.82it/s]
100%|██████████| 200/200 [00:00<00:00, 72704.18it/s]
100%|██████████| 65/65 [00:00<00:00, 51178.85it/s]
100%|██████████| 144/144 [00:00<00:00, 64909.16it/s]
100%|██████████| 30/30 [00:00<00:00, 28820.23it/s]
100%|██████████| 130/130 [00:00<00:00, 78771.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85264.94it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:57<00:00, 101.08it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 58651.33it/s]
100%|██████████| 287/287 [00:00<00:00, 50970.29it/s]
100%|██████████| 771/771 [00:00<00:00, 73907.17it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89600.82it/s]
100%|██████████| 1000/1000 [00:00<00:00, 85918.92it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87130.83it/s]
100%|██████████| 353/353 [00:00<00:00, 65929.97it/s]
100%|██████████| 252/252 [00:00<00:00, 79161.52it/s]
100%|██████████| 203/203 [00:00<00:00, 79902.75it/s]
100%|██████████| 153/153 [00:00<00:00, 65522.62it/s]
100%|██████████| 200/200 [00:00<00:00, 65582.11it/s]
100%|██████████| 65/65 [00:00<00:00, 72546.50it/s]
100%|██████████| 144/144 [00:00<00:00, 68806.08it/s]
100%|██████████| 30/30 [00:00<00:00, 48922.67it/s]
100%|██████████| 130/130 [00:00<00:00, 61004.65it/s]
100%|██████████| 3500/3500 [00:00<00:00, 60489.20it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:54<00:00, 107.83it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 67166.42it/s]
100%|██████████| 287/287 [00:00<00:00, 12682.43it/s]
100%|██████████| 771/771 [00:00<00:00, 35153.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 70855.12it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82661.04it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80711.95it/s]
100%|██████████| 353/353 [00:00<00:00, 78333.91it/s]
100%|██████████| 252/252 [00:00<00:00, 78555.53it/s]
100%|██████████| 203/203 [00:00<00:00, 80560.48it/s]
100%|██████████| 153/153 [00:00<00:00, 77270.14it/s]
100%|██████████| 200/200 [00:00<00:00, 77650.73it/s]
100%|██████████| 65/65 [00:00<00:00, 68915.51it/s]
100%|██████████| 144/144 [00:00<00:00, 77403.53it/s]
100%|██████████| 30/30 [00:00<00:00, 57985.77it/s]
100%|██████████| 130/130 [00:00<00:00, 103484.44it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85383.46it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:49<00:00, 119.02it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 92839.16it/s]
100%|██████████| 287/287 [00:00<00:00, 88858.44it/s]
100%|██████████| 771/771 [00:00<00:00, 86322.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92478.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89488.03it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91165.99it/s]
100%|██████████| 353/353 [00:00<00:00, 89808.89it/s]
100%|██████████| 252/252 [00:00<00:00, 74776.41it/s]
100%|██████████| 203/203 [00:00<00:00, 76103.30it/s]
100%|██████████| 153/153 [00:00<00:00, 69647.11it/s]
100%|██████████| 200/200 [00:00<00:00, 65953.36it/s]
100%|██████████| 65/65 [00:00<00:00, 65551.76it/s]
100%|██████████| 144/144 [00:00<00:00, 58787.21it/s]
100%|██████████| 30/30 [00:00<00:00, 45132.40it/s]
100%|██████████| 130/130 [00:00<00:00, 56445.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 68802.91it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 156.41it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 87944.37it/s]
100%|██████████| 287/287 [00:00<00:00, 84522.21it/s]
100%|██████████| 771/771 [00:00<00:00, 87331.78it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90540.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92971.23it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91234.07it/s]
100%|██████████| 353/353 [00:00<00:00, 89068.72it/s]
100%|██████████| 252/252 [00:00<00:00, 74360.81it/s]
100%|██████████| 203/203 [00:00<00:00, 78895.82it/s]
100%|██████████| 153/153 [00:00<00:00, 70597.20it/s]
100%|██████████| 200/200 [00:00<00:00, 68327.83it/s]
100%|██████████| 65/65 [00:00<00:00, 61444.62it/s]
100%|██████████| 144/144 [00:00<00:00, 81962.24it/s]
100%|██████████| 30/30 [00:00<00:00, 51760.23it/s]
100%|██████████| 130/130 [00:00<00:00, 81564.63it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88176.50it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 152.76it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78883.05it/s]
100%|██████████| 287/287 [00:00<00:00, 75875.53it/s]
100%|██████████| 771/771 [00:00<00:00, 79713.28it/s]
100%|██████████| 2000/2000 [00:00<00:00, 107515.93it/s]
100%|██████████| 1000/1000 [00:00<00:00, 101448.92it/s]
100%|██████████| 3000/3000 [00:00<00:00, 105736.09it/s]
100%|██████████| 353/353 [00:00<00:00, 81972.61it/s]
100%|██████████| 252/252 [00:00<00:00, 79399.38it/s]
100%|██████████| 203/203 [00:00<00:00, 74845.61it/s]
100%|██████████| 153/153 [00:00<00:00, 75684.46it/s]
100%|██████████| 200/200 [00:00<00:00, 77679.49it/s]
100%|██████████| 65/65 [00:00<00:00, 70941.91it/s]
100%|██████████| 144/144 [00:00<00:00, 76067.98it/s]
100%|██████████| 30/30 [00:00<00:00, 59804.71it/s]
100%|██████████| 130/130 [00:00<00:00, 79068.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80868.08it/s]
100%|██████████| 

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:39<00:00, 148.75it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82593.03it/s]
100%|██████████| 287/287 [00:00<00:00, 76726.70it/s]
100%|██████████| 771/771 [00:00<00:00, 82695.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86870.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79960.04it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75833.11it/s]
100%|██████████| 353/353 [00:00<00:00, 78696.15it/s]
100%|██████████| 252/252 [00:00<00:00, 67451.47it/s]
100%|██████████| 203/203 [00:00<00:00, 76548.03it/s]
100%|██████████| 153/153 [00:00<00:00, 74584.90it/s]
100%|██████████| 200/200 [00:00<00:00, 80389.15it/s]
100%|██████████| 65/65 [00:00<00:00, 69779.82it/s]
100%|██████████| 144/144 [00:00<00:00, 76010.54it/s]
100%|██████████| 30/30 [00:00<00:00, 49228.92it/s]
100%|██████████| 130/130 [00:00<00:00, 61764.78it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91624.42it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:38<00:00, 153.32it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 91946.85it/s]
100%|██████████| 287/287 [00:00<00:00, 78785.60it/s]
100%|██████████| 771/771 [00:00<00:00, 88948.41it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78353.54it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83101.60it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86337.49it/s]
100%|██████████| 353/353 [00:00<00:00, 70974.03it/s]
100%|██████████| 252/252 [00:00<00:00, 68411.95it/s]
100%|██████████| 203/203 [00:00<00:00, 70806.13it/s]
100%|██████████| 153/153 [00:00<00:00, 71216.13it/s]
100%|██████████| 200/200 [00:00<00:00, 60271.65it/s]
100%|██████████| 65/65 [00:00<00:00, 40923.11it/s]
100%|██████████| 144/144 [00:00<00:00, 64232.67it/s]
100%|██████████| 30/30 [00:00<00:00, 57169.07it/s]
100%|██████████| 130/130 [00:00<00:00, 68750.41it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80747.98it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:36<00:00, 159.90it/s]
INFO:root:The new embedding has 5845 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 92814.48it/s]
100%|██████████| 287/287 [00:00<00:00, 75665.68it/s]
100%|██████████| 771/771 [00:00<00:00, 83992.84it/s]
100%|██████████| 2000/2000 [00:00<00:00, 86062.60it/s]
100%|██████████| 1000/1000 [00:00<00:00, 86368.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78337.68it/s]
100%|██████████| 353/353 [00:00<00:00, 86553.80it/s]
100%|██████████| 252/252 [00:00<00:00, 73789.77it/s]
100%|██████████| 203/203 [00:00<00:00, 84493.77it/s]
100%|██████████| 153/153 [00:00<00:00, 86265.43it/s]
100%|██████████| 200/200 [00:00<00:00, 85051.28it/s]
100%|██████████| 65/65 [00:00<00:00, 61334.03it/s]
100%|██████████| 144/144 [00:00<00:00, 85344.04it/s]
100%|██████████| 30/30 [00:00<00:00, 61802.12it/s]
100%|██████████| 130/130 [00:00<00:00, 70374.23it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89514.22it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:43<00:00, 135.84it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 92278.94it/s]
100%|██████████| 287/287 [00:00<00:00, 87153.58it/s]
100%|██████████| 771/771 [00:00<00:00, 89990.49it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91575.69it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87616.80it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89164.63it/s]
100%|██████████| 353/353 [00:00<00:00, 84311.22it/s]
100%|██████████| 252/252 [00:00<00:00, 71455.15it/s]
100%|██████████| 203/203 [00:00<00:00, 71815.43it/s]
100%|██████████| 153/153 [00:00<00:00, 68044.59it/s]
100%|██████████| 200/200 [00:00<00:00, 71428.88it/s]
100%|██████████| 65/65 [00:00<00:00, 62230.03it/s]
100%|██████████| 144/144 [00:00<00:00, 83009.86it/s]
100%|██████████| 30/30 [00:00<00:00, 60176.53it/s]
100%|██████████| 130/130 [00:00<00:00, 83449.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89407.91it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 135.99it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 90753.95it/s]
100%|██████████| 287/287 [00:00<00:00, 86676.65it/s]
100%|██████████| 771/771 [00:00<00:00, 78557.23it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83543.55it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82881.56it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75141.15it/s]
100%|██████████| 353/353 [00:00<00:00, 83786.39it/s]
100%|██████████| 252/252 [00:00<00:00, 75492.08it/s]
100%|██████████| 203/203 [00:00<00:00, 51652.74it/s]
100%|██████████| 153/153 [00:00<00:00, 72816.13it/s]
100%|██████████| 200/200 [00:00<00:00, 84146.94it/s]
100%|██████████| 65/65 [00:00<00:00, 67784.62it/s]
100%|██████████| 144/144 [00:00<00:00, 75112.52it/s]
100%|██████████| 30/30 [00:00<00:00, 53544.31it/s]
100%|██████████| 130/130 [00:00<00:00, 80983.15it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80702.70it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 131.62it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80675.22it/s]
100%|██████████| 287/287 [00:00<00:00, 75880.31it/s]
100%|██████████| 771/771 [00:00<00:00, 99664.33it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81693.43it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77041.70it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92110.30it/s]
100%|██████████| 353/353 [00:00<00:00, 80401.27it/s]
100%|██████████| 252/252 [00:00<00:00, 78520.51it/s]
100%|██████████| 203/203 [00:00<00:00, 77228.45it/s]
100%|██████████| 153/153 [00:00<00:00, 75488.59it/s]
100%|██████████| 200/200 [00:00<00:00, 74911.66it/s]
100%|██████████| 65/65 [00:00<00:00, 70483.39it/s]
100%|██████████| 144/144 [00:00<00:00, 80071.56it/s]
100%|██████████| 30/30 [00:00<00:00, 66330.59it/s]
100%|██████████| 130/130 [00:00<00:00, 74539.92it/s]
100%|██████████| 3500/3500 [00:00<00:00, 82821.24it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 135.36it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79922.74it/s]
100%|██████████| 287/287 [00:00<00:00, 79049.46it/s]
100%|██████████| 771/771 [00:00<00:00, 81493.08it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80384.53it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81487.10it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78638.78it/s]
100%|██████████| 353/353 [00:00<00:00, 79743.06it/s]
100%|██████████| 252/252 [00:00<00:00, 79692.72it/s]
100%|██████████| 203/203 [00:00<00:00, 78531.98it/s]
100%|██████████| 153/153 [00:00<00:00, 77353.97it/s]
100%|██████████| 200/200 [00:00<00:00, 79960.04it/s]
100%|██████████| 65/65 [00:00<00:00, 75709.46it/s]
100%|██████████| 144/144 [00:00<00:00, 78561.37it/s]
100%|██████████| 30/30 [00:00<00:00, 62199.27it/s]
100%|██████████| 130/130 [00:00<00:00, 71062.10it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76228.79it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.76it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 84203.00it/s]
100%|██████████| 287/287 [00:00<00:00, 84403.68it/s]
100%|██████████| 771/771 [00:00<00:00, 88439.99it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92484.35it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84390.74it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89855.48it/s]
100%|██████████| 353/353 [00:00<00:00, 88456.76it/s]
100%|██████████| 252/252 [00:00<00:00, 82581.81it/s]
100%|██████████| 203/203 [00:00<00:00, 63683.15it/s]
100%|██████████| 153/153 [00:00<00:00, 69624.45it/s]
100%|██████████| 200/200 [00:00<00:00, 55235.45it/s]
100%|██████████| 65/65 [00:00<00:00, 60868.44it/s]
100%|██████████| 144/144 [00:00<00:00, 84662.15it/s]
100%|██████████| 30/30 [00:00<00:00, 58881.20it/s]
100%|██████████| 130/130 [00:00<00:00, 66944.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89335.55it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 135.04it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 89107.66it/s]
100%|██████████| 287/287 [00:00<00:00, 86334.74it/s]
100%|██████████| 771/771 [00:00<00:00, 90256.73it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78194.32it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90646.50it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88886.85it/s]
100%|██████████| 353/353 [00:00<00:00, 82442.75it/s]
100%|██████████| 252/252 [00:00<00:00, 83554.51it/s]
100%|██████████| 203/203 [00:00<00:00, 85615.26it/s]
100%|██████████| 153/153 [00:00<00:00, 70815.33it/s]
100%|██████████| 200/200 [00:00<00:00, 76924.42it/s]
100%|██████████| 65/65 [00:00<00:00, 53815.59it/s]
100%|██████████| 144/144 [00:00<00:00, 83101.24it/s]
100%|██████████| 30/30 [00:00<00:00, 64067.78it/s]
100%|██████████| 130/130 [00:00<00:00, 81212.32it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83566.14it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 131.11it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78265.68it/s]
100%|██████████| 287/287 [00:00<00:00, 81264.11it/s]
100%|██████████| 771/771 [00:00<00:00, 80999.11it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88089.72it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80511.06it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81559.99it/s]
100%|██████████| 353/353 [00:00<00:00, 79332.87it/s]
100%|██████████| 252/252 [00:00<00:00, 78039.32it/s]
100%|██████████| 203/203 [00:00<00:00, 78372.95it/s]
100%|██████████| 153/153 [00:00<00:00, 78040.68it/s]
100%|██████████| 200/200 [00:00<00:00, 75437.12it/s]
100%|██████████| 65/65 [00:00<00:00, 65567.52it/s]
100%|██████████| 144/144 [00:00<00:00, 73764.02it/s]
100%|██████████| 30/30 [00:00<00:00, 57143.11it/s]
100%|██████████| 130/130 [00:00<00:00, 74601.11it/s]
100%|██████████| 3500/3500 [00:00<00:00, 91458.87it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 129.16it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 79493.64it/s]
100%|██████████| 287/287 [00:00<00:00, 75272.96it/s]
100%|██████████| 771/771 [00:00<00:00, 81343.44it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81475.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84779.66it/s]
100%|██████████| 3000/3000 [00:00<00:00, 93422.67it/s]
100%|██████████| 353/353 [00:00<00:00, 73896.45it/s]
100%|██████████| 252/252 [00:00<00:00, 75740.92it/s]
100%|██████████| 203/203 [00:00<00:00, 77949.62it/s]
100%|██████████| 153/153 [00:00<00:00, 75827.54it/s]
100%|██████████| 200/200 [00:00<00:00, 76853.94it/s]
100%|██████████| 65/65 [00:00<00:00, 67953.58it/s]
100%|██████████| 144/144 [00:00<00:00, 72350.24it/s]
100%|██████████| 30/30 [00:00<00:00, 59213.70it/s]
100%|██████████| 130/130 [00:00<00:00, 72954.18it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89142.97it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 133.25it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 90818.86it/s]
100%|██████████| 287/287 [00:00<00:00, 88162.10it/s]
100%|██████████| 771/771 [00:00<00:00, 75916.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90975.83it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80487.88it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90070.95it/s]
100%|██████████| 353/353 [00:00<00:00, 79087.08it/s]
100%|██████████| 252/252 [00:00<00:00, 67958.89it/s]
100%|██████████| 203/203 [00:00<00:00, 71393.91it/s]
100%|██████████| 153/153 [00:00<00:00, 63162.26it/s]
100%|██████████| 200/200 [00:00<00:00, 62991.72it/s]
100%|██████████| 65/65 [00:00<00:00, 62861.37it/s]
100%|██████████| 144/144 [00:00<00:00, 65621.44it/s]
100%|██████████| 30/30 [00:00<00:00, 50881.16it/s]
100%|██████████| 130/130 [00:00<00:00, 56503.58it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87911.42it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 137.28it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 90640.08it/s]
100%|██████████| 287/287 [00:00<00:00, 86229.60it/s]
100%|██████████| 771/771 [00:00<00:00, 88782.35it/s]
100%|██████████| 2000/2000 [00:00<00:00, 92589.49it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89295.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87602.77it/s]
100%|██████████| 353/353 [00:00<00:00, 87340.10it/s]
100%|██████████| 252/252 [00:00<00:00, 71368.31it/s]
100%|██████████| 203/203 [00:00<00:00, 67666.19it/s]
100%|██████████| 153/153 [00:00<00:00, 64057.55it/s]
100%|██████████| 200/200 [00:00<00:00, 76959.71it/s]
100%|██████████| 65/65 [00:00<00:00, 73051.92it/s]
100%|██████████| 144/144 [00:00<00:00, 85235.64it/s]
100%|██████████| 30/30 [00:00<00:00, 64002.60it/s]
100%|██████████| 130/130 [00:00<00:00, 71952.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 88552.01it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:47<00:00, 123.69it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 102958.69it/s]
100%|██████████| 287/287 [00:00<00:00, 79215.93it/s]
100%|██████████| 771/771 [00:00<00:00, 78938.84it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91224.15it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81192.13it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79782.60it/s]
100%|██████████| 353/353 [00:00<00:00, 78654.34it/s]
100%|██████████| 252/252 [00:00<00:00, 77269.14it/s]
100%|██████████| 203/203 [00:00<00:00, 51809.89it/s]
100%|██████████| 153/153 [00:00<00:00, 75881.34it/s]
100%|██████████| 200/200 [00:00<00:00, 74202.64it/s]
100%|██████████| 65/65 [00:00<00:00, 67734.10it/s]
100%|██████████| 144/144 [00:00<00:00, 76686.11it/s]
100%|██████████| 30/30 [00:00<00:00, 28728.11it/s]
100%|██████████| 130/130 [00:00<00:00, 70693.57it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74108.05it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.25it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81575.19it/s]
100%|██████████| 287/287 [00:00<00:00, 81983.60it/s]
100%|██████████| 771/771 [00:00<00:00, 80972.74it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82720.55it/s]
100%|██████████| 1000/1000 [00:00<00:00, 83631.84it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81856.05it/s]
100%|██████████| 353/353 [00:00<00:00, 96342.36it/s]
100%|██████████| 252/252 [00:00<00:00, 80567.47it/s]
100%|██████████| 203/203 [00:00<00:00, 79093.70it/s]
100%|██████████| 153/153 [00:00<00:00, 76214.79it/s]
100%|██████████| 200/200 [00:00<00:00, 80135.73it/s]
100%|██████████| 65/65 [00:00<00:00, 69566.15it/s]
100%|██████████| 144/144 [00:00<00:00, 78073.91it/s]
100%|██████████| 30/30 [00:00<00:00, 60552.99it/s]
100%|██████████| 130/130 [00:00<00:00, 74580.70it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79048.75it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:37<00:00, 154.64it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 88025.67it/s]
100%|██████████| 287/287 [00:00<00:00, 82772.83it/s]
100%|██████████| 771/771 [00:00<00:00, 79732.94it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89676.49it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90238.90it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85335.07it/s]
100%|██████████| 353/353 [00:00<00:00, 80831.43it/s]
100%|██████████| 252/252 [00:00<00:00, 69505.14it/s]
100%|██████████| 203/203 [00:00<00:00, 69178.07it/s]
100%|██████████| 153/153 [00:00<00:00, 67351.86it/s]
100%|██████████| 200/200 [00:00<00:00, 67677.35it/s]
100%|██████████| 65/65 [00:00<00:00, 64193.49it/s]
100%|██████████| 144/144 [00:00<00:00, 65807.34it/s]
100%|██████████| 30/30 [00:00<00:00, 65399.75it/s]
100%|██████████| 130/130 [00:00<00:00, 66422.16it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81539.60it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:47<00:00, 123.70it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 81589.49it/s]
100%|██████████| 287/287 [00:00<00:00, 78212.28it/s]
100%|██████████| 771/771 [00:00<00:00, 80042.78it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85550.90it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76601.30it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85556.72it/s]
100%|██████████| 353/353 [00:00<00:00, 74226.16it/s]
100%|██████████| 252/252 [00:00<00:00, 78889.73it/s]
100%|██████████| 203/203 [00:00<00:00, 82169.82it/s]
100%|██████████| 153/153 [00:00<00:00, 70496.38it/s]
100%|██████████| 200/200 [00:00<00:00, 64562.52it/s]
100%|██████████| 65/65 [00:00<00:00, 69601.67it/s]
100%|██████████| 144/144 [00:00<00:00, 80897.37it/s]
100%|██████████| 30/30 [00:00<00:00, 51760.23it/s]
100%|██████████| 130/130 [00:00<00:00, 80126.31it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78112.04it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:48<00:00, 121.59it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80706.30it/s]
100%|██████████| 287/287 [00:00<00:00, 78610.67it/s]
100%|██████████| 771/771 [00:00<00:00, 80831.06it/s]
100%|██████████| 2000/2000 [00:00<00:00, 83899.50it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74617.14it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83282.56it/s]
100%|██████████| 353/353 [00:00<00:00, 81687.69it/s]
100%|██████████| 252/252 [00:00<00:00, 75271.66it/s]
100%|██████████| 203/203 [00:00<00:00, 76355.82it/s]
100%|██████████| 153/153 [00:00<00:00, 75003.33it/s]
100%|██████████| 200/200 [00:00<00:00, 74691.55it/s]
100%|██████████| 65/65 [00:00<00:00, 48074.37it/s]
100%|██████████| 144/144 [00:00<00:00, 72628.64it/s]
100%|██████████| 30/30 [00:00<00:00, 57614.07it/s]
100%|██████████| 130/130 [00:00<00:00, 72219.80it/s]
100%|██████████| 3500/3500 [00:00<00:00, 79954.60it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:47<00:00, 122.20it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 99563.02it/s]
100%|██████████| 287/287 [00:00<00:00, 56114.36it/s]
100%|██████████| 771/771 [00:00<00:00, 81918.34it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94470.56it/s]
100%|██████████| 1000/1000 [00:00<00:00, 75578.49it/s]
100%|██████████| 3000/3000 [00:00<00:00, 100116.26it/s]
100%|██████████| 353/353 [00:00<00:00, 77660.07it/s]
100%|██████████| 252/252 [00:00<00:00, 78508.85it/s]
100%|██████████| 203/203 [00:00<00:00, 58426.11it/s]
100%|██████████| 153/153 [00:00<00:00, 71533.67it/s]
100%|██████████| 200/200 [00:00<00:00, 75743.64it/s]
100%|██████████| 65/65 [00:00<00:00, 63668.79it/s]
100%|██████████| 144/144 [00:00<00:00, 78215.46it/s]
100%|██████████| 30/30 [00:00<00:00, 25170.86it/s]
100%|██████████| 130/130 [00:00<00:00, 56427.56it/s]
100%|██████████| 3500/3500 [00:00<00:00, 67496.72it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 127.87it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 89255.72it/s]
100%|██████████| 287/287 [00:00<00:00, 77953.97it/s]
100%|██████████| 771/771 [00:00<00:00, 86120.06it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91825.30it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90570.16it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81621.89it/s]
100%|██████████| 353/353 [00:00<00:00, 79439.28it/s]
100%|██████████| 252/252 [00:00<00:00, 73257.87it/s]
100%|██████████| 203/203 [00:00<00:00, 61788.37it/s]
100%|██████████| 153/153 [00:00<00:00, 70519.62it/s]
100%|██████████| 200/200 [00:00<00:00, 74711.51it/s]
100%|██████████| 65/65 [00:00<00:00, 60678.78it/s]
100%|██████████| 144/144 [00:00<00:00, 68704.33it/s]
100%|██████████| 30/30 [00:00<00:00, 44274.85it/s]
100%|██████████| 130/130 [00:00<00:00, 75952.02it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89088.87it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 139.89it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 90838.55it/s]
100%|██████████| 287/287 [00:00<00:00, 83536.80it/s]
100%|██████████| 771/771 [00:00<00:00, 90276.89it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90709.23it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89430.79it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90275.80it/s]
100%|██████████| 353/353 [00:00<00:00, 83319.60it/s]
100%|██████████| 252/252 [00:00<00:00, 83926.04it/s]
100%|██████████| 203/203 [00:00<00:00, 84293.01it/s]
100%|██████████| 153/153 [00:00<00:00, 84649.59it/s]
100%|██████████| 200/200 [00:00<00:00, 84639.37it/s]
100%|██████████| 65/65 [00:00<00:00, 72392.40it/s]
100%|██████████| 144/144 [00:00<00:00, 84026.12it/s]
100%|██████████| 30/30 [00:00<00:00, 54660.78it/s]
100%|██████████| 130/130 [00:00<00:00, 79634.81it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84618.64it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 141.99it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 65751.96it/s]
100%|██████████| 287/287 [00:00<00:00, 77817.91it/s]
100%|██████████| 771/771 [00:00<00:00, 81216.78it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80959.40it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82260.61it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80088.80it/s]
100%|██████████| 353/353 [00:00<00:00, 72044.64it/s]
100%|██████████| 252/252 [00:00<00:00, 77981.75it/s]
100%|██████████| 203/203 [00:00<00:00, 60532.04it/s]
100%|██████████| 153/153 [00:00<00:00, 75881.34it/s]
100%|██████████| 200/200 [00:00<00:00, 77442.84it/s]
100%|██████████| 65/65 [00:00<00:00, 75042.60it/s]
100%|██████████| 144/144 [00:00<00:00, 65401.17it/s]
100%|██████████| 30/30 [00:00<00:00, 68089.35it/s]
100%|██████████| 130/130 [00:00<00:00, 73258.03it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78938.23it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 145.65it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81241.46it/s]
100%|██████████| 287/287 [00:00<00:00, 81994.77it/s]
100%|██████████| 771/771 [00:00<00:00, 83416.52it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82387.45it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82755.64it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87853.55it/s]
100%|██████████| 353/353 [00:00<00:00, 79481.93it/s]
100%|██████████| 252/252 [00:00<00:00, 64264.89it/s]
100%|██████████| 203/203 [00:00<00:00, 66602.29it/s]
100%|██████████| 153/153 [00:00<00:00, 77167.93it/s]
100%|██████████| 200/200 [00:00<00:00, 78729.31it/s]
100%|██████████| 65/65 [00:00<00:00, 78184.62it/s]
100%|██████████| 144/144 [00:00<00:00, 75696.17it/s]
100%|██████████| 30/30 [00:00<00:00, 69136.88it/s]
100%|██████████| 130/130 [00:00<00:00, 76602.91it/s]
100%|██████████| 3500/3500 [00:00<00:00, 102654.20it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 141.13it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 89773.96it/s]
100%|██████████| 287/287 [00:00<00:00, 92087.30it/s]
100%|██████████| 771/771 [00:00<00:00, 87777.43it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91291.66it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88595.83it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91185.81it/s]
100%|██████████| 353/353 [00:00<00:00, 76635.06it/s]
100%|██████████| 252/252 [00:00<00:00, 77473.03it/s]
100%|██████████| 203/203 [00:00<00:00, 83165.04it/s]
100%|██████████| 153/153 [00:00<00:00, 67857.51it/s]
100%|██████████| 200/200 [00:00<00:00, 70097.84it/s]
100%|██████████| 65/65 [00:00<00:00, 58985.24it/s]
100%|██████████| 144/144 [00:00<00:00, 63926.73it/s]
100%|██████████| 30/30 [00:00<00:00, 59158.03it/s]
100%|██████████| 130/130 [00:00<00:00, 78375.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89372.53it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:38<00:00, 151.81it/s]
INFO:root:The new embedding has 5845 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 86956.99it/s]
100%|██████████| 287/287 [00:00<00:00, 84173.50it/s]
100%|██████████| 771/771 [00:00<00:00, 88078.67it/s]
100%|██████████| 2000/2000 [00:00<00:00, 94109.16it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91546.71it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83491.44it/s]
100%|██████████| 353/353 [00:00<00:00, 77615.29it/s]
100%|██████████| 252/252 [00:00<00:00, 73986.04it/s]
100%|██████████| 203/203 [00:00<00:00, 70759.06it/s]
100%|██████████| 153/153 [00:00<00:00, 70126.60it/s]
100%|██████████| 200/200 [00:00<00:00, 81096.37it/s]
100%|██████████| 65/65 [00:00<00:00, 66317.14it/s]
100%|██████████| 144/144 [00:00<00:00, 86270.50it/s]
100%|██████████| 30/30 [00:00<00:00, 64994.38it/s]
100%|██████████| 130/130 [00:00<00:00, 71556.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84679.65it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:44<00:00, 130.90it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 92466.28it/s]
100%|██████████| 287/287 [00:00<00:00, 87642.17it/s]
100%|██████████| 771/771 [00:00<00:00, 84389.57it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89398.38it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91220.18it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86840.99it/s]
100%|██████████| 353/353 [00:00<00:00, 75880.96it/s]
100%|██████████| 252/252 [00:00<00:00, 71580.97it/s]
100%|██████████| 203/203 [00:00<00:00, 70402.16it/s]
100%|██████████| 153/153 [00:00<00:00, 69791.03it/s]
100%|██████████| 200/200 [00:00<00:00, 72685.28it/s]
100%|██████████| 65/65 [00:00<00:00, 70265.40it/s]
100%|██████████| 144/144 [00:00<00:00, 69566.89it/s]
100%|██████████| 30/30 [00:00<00:00, 52913.84it/s]
100%|██████████| 130/130 [00:00<00:00, 81601.25it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76002.65it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 133.28it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 91206.32it/s]
100%|██████████| 287/287 [00:00<00:00, 84338.63it/s]
100%|██████████| 771/771 [00:00<00:00, 91296.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91145.85it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92513.93it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75803.87it/s]
100%|██████████| 353/353 [00:00<00:00, 88812.27it/s]
100%|██████████| 252/252 [00:00<00:00, 84227.00it/s]
100%|██████████| 203/203 [00:00<00:00, 84729.20it/s]
100%|██████████| 153/153 [00:00<00:00, 84526.94it/s]
100%|██████████| 200/200 [00:00<00:00, 86418.13it/s]
100%|██████████| 65/65 [00:00<00:00, 78386.94it/s]
100%|██████████| 144/144 [00:00<00:00, 82918.70it/s]
100%|██████████| 30/30 [00:00<00:00, 58119.69it/s]
100%|██████████| 130/130 [00:00<00:00, 81503.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90279.41it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 130.07it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 64381.02it/s]
100%|██████████| 287/287 [00:00<00:00, 79153.42it/s]
100%|██████████| 771/771 [00:00<00:00, 81153.59it/s]
100%|██████████| 2000/2000 [00:00<00:00, 81341.71it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91936.00it/s]
100%|██████████| 3000/3000 [00:00<00:00, 85719.33it/s]
100%|██████████| 353/353 [00:00<00:00, 81868.36it/s]
100%|██████████| 252/252 [00:00<00:00, 78062.38it/s]
100%|██████████| 203/203 [00:00<00:00, 76991.02it/s]
100%|██████████| 153/153 [00:00<00:00, 74907.03it/s]
100%|██████████| 200/200 [00:00<00:00, 77179.21it/s]
100%|██████████| 65/65 [00:00<00:00, 65425.91it/s]
100%|██████████| 144/144 [00:00<00:00, 76029.68it/s]
100%|██████████| 30/30 [00:00<00:00, 70021.77it/s]
100%|██████████| 130/130 [00:00<00:00, 64223.74it/s]
100%|██████████| 3500/3500 [00:00<00:00, 97474.60it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 135.92it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 84717.14it/s]
100%|██████████| 287/287 [00:00<00:00, 71900.92it/s]
100%|██████████| 771/771 [00:00<00:00, 94591.76it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90609.29it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76192.19it/s]
100%|██████████| 3000/3000 [00:00<00:00, 90651.72it/s]
100%|██████████| 353/353 [00:00<00:00, 60764.56it/s]
100%|██████████| 252/252 [00:00<00:00, 45324.38it/s]
100%|██████████| 203/203 [00:00<00:00, 49356.19it/s]
100%|██████████| 153/153 [00:00<00:00, 74767.39it/s]
100%|██████████| 200/200 [00:00<00:00, 68172.35it/s]
100%|██████████| 65/65 [00:00<00:00, 68089.35it/s]
100%|██████████| 144/144 [00:00<00:00, 75403.22it/s]
100%|██████████| 30/30 [00:00<00:00, 59776.30it/s]
100%|██████████| 130/130 [00:00<00:00, 71877.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81035.93it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 132.48it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 92672.84it/s]
100%|██████████| 287/287 [00:00<00:00, 87610.28it/s]
100%|██████████| 771/771 [00:00<00:00, 87414.40it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90172.94it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89360.29it/s]
100%|██████████| 3000/3000 [00:00<00:00, 91753.65it/s]
100%|██████████| 353/353 [00:00<00:00, 70366.87it/s]
100%|██████████| 252/252 [00:00<00:00, 71585.82it/s]
100%|██████████| 203/203 [00:00<00:00, 84326.41it/s]
100%|██████████| 153/153 [00:00<00:00, 84873.50it/s]
100%|██████████| 200/200 [00:00<00:00, 84810.51it/s]
100%|██████████| 65/65 [00:00<00:00, 74980.68it/s]
100%|██████████| 144/144 [00:00<00:00, 74981.97it/s]
100%|██████████| 30/30 [00:00<00:00, 56501.63it/s]
100%|██████████| 130/130 [00:00<00:00, 77705.50it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85819.72it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 135.19it/s]
INFO:root:The new embedding has 5844 word and vectors have 1500 dimensions
100%|██████████| 999/999 [00:00<00:00, 70021.89it/s]
100%|██████████| 287/287 [00:00<00:00, 83467.29it/s]
100%|██████████| 771/771 [00:00<00:00, 86592.81it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90202.03it/s]
100%|██████████| 1000/1000 [00:00<00:00, 92014.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89761.89it/s]
100%|██████████| 353/353 [00:00<00:00, 88483.20it/s]
100%|██████████| 252/252 [00:00<00:00, 83846.15it/s]
100%|██████████| 203/203 [00:00<00:00, 85512.07it/s]
100%|██████████| 153/153 [00:00<00:00, 86277.03it/s]
100%|██████████| 200/200 [00:00<00:00, 83961.65it/s]
100%|██████████| 65/65 [00:00<00:00, 73485.11it/s]
100%|██████████| 144/144 [00:00<00:00, 82241.25it/s]
100%|██████████| 30/30 [00:00<00:00, 55309.50it/s]
100%|██████████| 130/130 [00:00<00:00, 73012.79it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87589.36it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 130.63it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 103643.75it/s]
100%|██████████| 287/287 [00:00<00:00, 76096.17it/s]
100%|██████████| 771/771 [00:00<00:00, 80418.99it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90921.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81351.18it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80139.81it/s]
100%|██████████| 353/353 [00:00<00:00, 77839.72it/s]
100%|██████████| 252/252 [00:00<00:00, 77212.70it/s]
100%|██████████| 203/203 [00:00<00:00, 81275.65it/s]
100%|██████████| 153/153 [00:00<00:00, 80276.27it/s]
100%|██████████| 200/200 [00:00<00:00, 80097.47it/s]
100%|██████████| 65/65 [00:00<00:00, 67767.78it/s]
100%|██████████| 144/144 [00:00<00:00, 78479.70it/s]
100%|██████████| 30/30 [00:00<00:00, 54565.97it/s]
100%|██████████| 130/130 [00:00<00:00, 78083.85it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80351.09it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 134.67it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81500.62it/s]
100%|██████████| 287/287 [00:00<00:00, 75751.38it/s]
100%|██████████| 771/771 [00:00<00:00, 81147.48it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78071.33it/s]
100%|██████████| 1000/1000 [00:00<00:00, 67705.76it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89531.97it/s]
100%|██████████| 353/353 [00:00<00:00, 79002.68it/s]
100%|██████████| 252/252 [00:00<00:00, 77235.27it/s]
100%|██████████| 203/203 [00:00<00:00, 76561.79it/s]
100%|██████████| 153/153 [00:00<00:00, 79147.57it/s]
100%|██████████| 200/200 [00:00<00:00, 72678.98it/s]
100%|██████████| 65/65 [00:00<00:00, 67666.86it/s]
100%|██████████| 144/144 [00:00<00:00, 74208.11it/s]
100%|██████████| 30/30 [00:00<00:00, 64793.57it/s]
100%|██████████| 130/130 [00:00<00:00, 51668.67it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93913.94it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 136.07it/s]
INFO:root:The new embedding has 5846 word and vectors have 1300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80185.81it/s]
100%|██████████| 287/287 [00:00<00:00, 80557.13it/s]
100%|██████████| 771/771 [00:00<00:00, 79858.95it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82028.14it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89248.11it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80788.12it/s]
100%|██████████| 353/353 [00:00<00:00, 83743.74it/s]
100%|██████████| 252/252 [00:00<00:00, 80097.35it/s]
100%|██████████| 203/203 [00:00<00:00, 78546.47it/s]
100%|██████████| 153/153 [00:00<00:00, 68818.07it/s]
100%|██████████| 200/200 [00:00<00:00, 82225.13it/s]
100%|██████████| 65/65 [00:00<00:00, 41769.54it/s]
100%|██████████| 144/144 [00:00<00:00, 78023.48it/s]
100%|██████████| 30/30 [00:00<00:00, 31053.58it/s]
100%|██████████| 130/130 [00:00<00:00, 57791.15it/s]
100%|██████████| 3500/3500 [00:00<00:00, 61308.71it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 135.81it/s]
INFO:root:The new embedding has 5844 word and vectors have 1800 dimensions
100%|██████████| 999/999 [00:00<00:00, 85543.87it/s]
100%|██████████| 287/287 [00:00<00:00, 73841.57it/s]
100%|██████████| 771/771 [00:00<00:00, 85861.68it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89809.94it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88284.41it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88035.49it/s]
100%|██████████| 353/353 [00:00<00:00, 80668.48it/s]
100%|██████████| 252/252 [00:00<00:00, 70558.39it/s]
100%|██████████| 203/203 [00:00<00:00, 72903.82it/s]
100%|██████████| 153/153 [00:00<00:00, 68965.99it/s]
100%|██████████| 200/200 [00:00<00:00, 69759.73it/s]
100%|██████████| 65/65 [00:00<00:00, 49506.04it/s]
100%|██████████| 144/144 [00:00<00:00, 68517.27it/s]
100%|██████████| 30/30 [00:00<00:00, 52146.34it/s]
100%|██████████| 130/130 [00:00<00:00, 65457.33it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85972.01it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:46<00:00, 125.03it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76289.23it/s]
100%|██████████| 287/287 [00:00<00:00, 57878.89it/s]
100%|██████████| 771/771 [00:00<00:00, 57252.77it/s]
100%|██████████| 2000/2000 [00:00<00:00, 58200.06it/s]
100%|██████████| 1000/1000 [00:00<00:00, 57199.21it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89105.90it/s]
100%|██████████| 353/353 [00:00<00:00, 77979.11it/s]
100%|██████████| 252/252 [00:00<00:00, 77433.30it/s]
100%|██████████| 203/203 [00:00<00:00, 79263.05it/s]
100%|██████████| 153/153 [00:00<00:00, 66219.02it/s]
100%|██████████| 200/200 [00:00<00:00, 77236.06it/s]
100%|██████████| 65/65 [00:00<00:00, 69107.67it/s]
100%|██████████| 144/144 [00:00<00:00, 73236.30it/s]
100%|██████████| 30/30 [00:00<00:00, 61052.46it/s]
100%|██████████| 130/130 [00:00<00:00, 68302.58it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78778.53it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 128.65it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78259.83it/s]
100%|██████████| 287/287 [00:00<00:00, 79404.04it/s]
100%|██████████| 771/771 [00:00<00:00, 77834.94it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80836.91it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79000.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 79080.61it/s]
100%|██████████| 353/353 [00:00<00:00, 71584.84it/s]
100%|██████████| 252/252 [00:00<00:00, 67083.31it/s]
100%|██████████| 203/203 [00:00<00:00, 73412.98it/s]
100%|██████████| 153/153 [00:00<00:00, 76955.09it/s]
100%|██████████| 200/200 [00:00<00:00, 76412.90it/s]
100%|██████████| 65/65 [00:00<00:00, 71313.04it/s]
100%|██████████| 144/144 [00:00<00:00, 76705.58it/s]
100%|██████████| 30/30 [00:00<00:00, 29433.71it/s]
100%|██████████| 130/130 [00:00<00:00, 65956.15it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81675.70it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 127.16it/s]
INFO:root:The new embedding has 5846 word and vectors have 1600 dimensions
100%|██████████| 999/999 [00:00<00:00, 89543.74it/s]
100%|██████████| 287/287 [00:00<00:00, 85409.77it/s]
100%|██████████| 771/771 [00:00<00:00, 89178.99it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90544.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90546.69it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81463.89it/s]
100%|██████████| 353/353 [00:00<00:00, 67715.04it/s]
100%|██████████| 252/252 [00:00<00:00, 80912.85it/s]
100%|██████████| 203/203 [00:00<00:00, 82249.20it/s]
100%|██████████| 153/153 [00:00<00:00, 79020.87it/s]
100%|██████████| 200/200 [00:00<00:00, 79257.45it/s]
100%|██████████| 65/65 [00:00<00:00, 70997.33it/s]
100%|██████████| 144/144 [00:00<00:00, 81663.03it/s]
100%|██████████| 30/30 [00:00<00:00, 55067.45it/s]
100%|██████████| 130/130 [00:00<00:00, 75909.72it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78602.21it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 133.62it/s]
INFO:root:The new embedding has 5844 word and vectors have 1800 dimensions
100%|██████████| 999/999 [00:00<00:00, 87670.20it/s]
100%|██████████| 287/287 [00:00<00:00, 83455.72it/s]
100%|██████████| 771/771 [00:00<00:00, 80355.04it/s]
100%|██████████| 2000/2000 [00:00<00:00, 84408.57it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84711.17it/s]
100%|██████████| 3000/3000 [00:00<00:00, 83149.93it/s]
100%|██████████| 353/353 [00:00<00:00, 78914.26it/s]
100%|██████████| 252/252 [00:00<00:00, 85848.33it/s]
100%|██████████| 203/203 [00:00<00:00, 50336.61it/s]
100%|██████████| 153/153 [00:00<00:00, 60041.96it/s]
100%|██████████| 200/200 [00:00<00:00, 65098.62it/s]
100%|██████████| 65/65 [00:00<00:00, 47167.78it/s]
100%|██████████| 144/144 [00:00<00:00, 62504.38it/s]
100%|██████████| 30/30 [00:00<00:00, 31536.12it/s]
100%|██████████| 130/130 [00:00<00:00, 46627.29it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83133.13it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:46<00:00, 126.23it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 84175.94it/s]
100%|██████████| 287/287 [00:00<00:00, 79148.22it/s]
100%|██████████| 771/771 [00:00<00:00, 81812.64it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82324.39it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82878.28it/s]
100%|██████████| 3000/3000 [00:00<00:00, 92371.31it/s]
100%|██████████| 353/353 [00:00<00:00, 78028.42it/s]
100%|██████████| 252/252 [00:00<00:00, 82075.21it/s]
100%|██████████| 203/203 [00:00<00:00, 81213.63it/s]
100%|██████████| 153/153 [00:00<00:00, 81603.32it/s]
100%|██████████| 200/200 [00:00<00:00, 81720.49it/s]
100%|██████████| 65/65 [00:00<00:00, 76431.11it/s]
100%|██████████| 144/144 [00:00<00:00, 81289.34it/s]
100%|██████████| 30/30 [00:00<00:00, 69289.16it/s]
100%|██████████| 130/130 [00:00<00:00, 74094.24it/s]
100%|██████████| 3500/3500 [00:00<00:00, 100001.80it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:43<00:00, 133.27it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82347.93it/s]
100%|██████████| 287/287 [00:00<00:00, 81445.55it/s]
100%|██████████| 771/771 [00:00<00:00, 81800.23it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82988.97it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82545.54it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82105.49it/s]
100%|██████████| 353/353 [00:00<00:00, 81088.19it/s]
100%|██████████| 252/252 [00:00<00:00, 78433.11it/s]
100%|██████████| 203/203 [00:00<00:00, 76431.21it/s]
100%|██████████| 153/153 [00:00<00:00, 75082.31it/s]
100%|██████████| 200/200 [00:00<00:00, 81080.69it/s]
100%|██████████| 65/65 [00:00<00:00, 72507.91it/s]
100%|██████████| 144/144 [00:00<00:00, 30502.49it/s]
100%|██████████| 30/30 [00:00<00:00, 67759.35it/s]
100%|██████████| 130/130 [00:00<00:00, 75468.45it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78477.42it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:41<00:00, 142.51it/s]
INFO:root:The new embedding has 5846 word and vectors have 1600 dimensions
100%|██████████| 999/999 [00:00<00:00, 89748.96it/s]
100%|██████████| 287/287 [00:00<00:00, 85707.74it/s]
100%|██████████| 771/771 [00:00<00:00, 88789.66it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90631.81it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90980.76it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89726.69it/s]
100%|██████████| 353/353 [00:00<00:00, 87381.33it/s]
100%|██████████| 252/252 [00:00<00:00, 86494.65it/s]
100%|██████████| 203/203 [00:00<00:00, 85753.22it/s]
100%|██████████| 153/153 [00:00<00:00, 76670.07it/s]
100%|██████████| 200/200 [00:00<00:00, 85397.62it/s]
100%|██████████| 65/65 [00:00<00:00, 65868.51it/s]
100%|██████████| 144/144 [00:00<00:00, 80423.41it/s]
100%|██████████| 30/30 [00:00<00:00, 51275.11it/s]
100%|██████████| 130/130 [00:00<00:00, 82377.93it/s]
100%|██████████| 3500/3500 [00:00<00:00, 87027.53it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:48<00:00, 120.01it/s]
INFO:root:The new embedding has 5844 word and vectors have 1800 dimensions
100%|██████████| 999/999 [00:00<00:00, 81740.69it/s]
100%|██████████| 287/287 [00:00<00:00, 69481.40it/s]
100%|██████████| 771/771 [00:00<00:00, 79997.24it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85933.00it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84910.10it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86105.89it/s]
100%|██████████| 353/353 [00:00<00:00, 81039.37it/s]
100%|██████████| 252/252 [00:00<00:00, 83055.52it/s]
100%|██████████| 203/203 [00:00<00:00, 82536.23it/s]
100%|██████████| 153/153 [00:00<00:00, 60769.75it/s]
100%|██████████| 200/200 [00:00<00:00, 72284.43it/s]
100%|██████████| 65/65 [00:00<00:00, 49886.51it/s]
100%|██████████| 144/144 [00:00<00:00, 62221.05it/s]
100%|██████████| 30/30 [00:00<00:00, 30992.39it/s]
100%|██████████| 130/130 [00:00<00:00, 63394.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84762.77it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:56<00:00, 102.99it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 77877.29it/s]
100%|██████████| 287/287 [00:00<00:00, 77352.86it/s]
100%|██████████| 771/771 [00:00<00:00, 79277.50it/s]
100%|██████████| 2000/2000 [00:00<00:00, 51660.67it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81166.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89107.17it/s]
100%|██████████| 353/353 [00:00<00:00, 80375.08it/s]
100%|██████████| 252/252 [00:00<00:00, 56847.45it/s]
100%|██████████| 203/203 [00:00<00:00, 81028.14it/s]
100%|██████████| 153/153 [00:00<00:00, 81365.35it/s]
100%|██████████| 200/200 [00:00<00:00, 80659.69it/s]
100%|██████████| 65/65 [00:00<00:00, 77035.82it/s]
100%|██████████| 144/144 [00:00<00:00, 80799.97it/s]
100%|██████████| 30/30 [00:00<00:00, 70099.79it/s]
100%|██████████| 130/130 [00:00<00:00, 65433.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 68843.89it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:50<00:00, 114.67it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 74569.05it/s]
100%|██████████| 287/287 [00:00<00:00, 76269.74it/s]
100%|██████████| 771/771 [00:00<00:00, 78404.86it/s]
100%|██████████| 2000/2000 [00:00<00:00, 98275.59it/s]
100%|██████████| 1000/1000 [00:00<00:00, 79671.46it/s]
100%|██████████| 3000/3000 [00:00<00:00, 99571.20it/s]
100%|██████████| 353/353 [00:00<00:00, 74750.81it/s]
100%|██████████| 252/252 [00:00<00:00, 79776.93it/s]
100%|██████████| 203/203 [00:00<00:00, 80128.34it/s]
100%|██████████| 153/153 [00:00<00:00, 74872.07it/s]
100%|██████████| 200/200 [00:00<00:00, 78655.49it/s]
100%|██████████| 65/65 [00:00<00:00, 67183.28it/s]
100%|██████████| 144/144 [00:00<00:00, 80188.50it/s]
100%|██████████| 30/30 [00:00<00:00, 70453.03it/s]
100%|██████████| 130/130 [00:00<00:00, 65160.08it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71247.23it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:49<00:00, 117.37it/s]
INFO:root:The new embedding has 5846 word and vectors have 1600 dimensions
100%|██████████| 999/999 [00:00<00:00, 89568.62it/s]
100%|██████████| 287/287 [00:00<00:00, 87166.20it/s]
100%|██████████| 771/771 [00:00<00:00, 79855.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89235.76it/s]
100%|██████████| 1000/1000 [00:00<00:00, 90701.38it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88944.03it/s]
100%|██████████| 353/353 [00:00<00:00, 86894.14it/s]
100%|██████████| 252/252 [00:00<00:00, 86671.96it/s]
100%|██████████| 203/203 [00:00<00:00, 85813.72it/s]
100%|██████████| 153/153 [00:00<00:00, 81046.79it/s]
100%|██████████| 200/200 [00:00<00:00, 82128.53it/s]
100%|██████████| 65/65 [00:00<00:00, 61100.35it/s]
100%|██████████| 144/144 [00:00<00:00, 84166.64it/s]
100%|██████████| 30/30 [00:00<00:00, 62757.67it/s]
100%|██████████| 130/130 [00:00<00:00, 70093.78it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81596.26it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 145.28it/s]
INFO:root:The new embedding has 5844 word and vectors have 1800 dimensions
100%|██████████| 999/999 [00:00<00:00, 71098.34it/s]
100%|██████████| 287/287 [00:00<00:00, 79367.39it/s]
100%|██████████| 771/771 [00:00<00:00, 85604.84it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89111.58it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88952.83it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88039.18it/s]
100%|██████████| 353/353 [00:00<00:00, 84301.62it/s]
100%|██████████| 252/252 [00:00<00:00, 82944.72it/s]
100%|██████████| 203/203 [00:00<00:00, 83197.55it/s]
100%|██████████| 153/153 [00:00<00:00, 75020.87it/s]
100%|██████████| 200/200 [00:00<00:00, 77917.59it/s]
100%|██████████| 65/65 [00:00<00:00, 66028.04it/s]
100%|██████████| 144/144 [00:00<00:00, 65422.42it/s]
100%|██████████| 30/30 [00:00<00:00, 51675.20it/s]
100%|██████████| 130/130 [00:00<00:00, 51934.42it/s]
100%|██████████| 3500/3500 [00:00<00:00, 85748.04it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:42<00:00, 138.96it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 56311.11it/s]
100%|██████████| 287/287 [00:00<00:00, 78641.49it/s]
100%|██████████| 771/771 [00:00<00:00, 81872.71it/s]
100%|██████████| 2000/2000 [00:00<00:00, 101703.52it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82607.32it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80501.27it/s]
100%|██████████| 353/353 [00:00<00:00, 86392.19it/s]
100%|██████████| 252/252 [00:00<00:00, 77924.26it/s]
100%|██████████| 203/203 [00:00<00:00, 76928.42it/s]
100%|██████████| 153/153 [00:00<00:00, 74411.93it/s]
100%|██████████| 200/200 [00:00<00:00, 78921.89it/s]
100%|██████████| 65/65 [00:00<00:00, 72585.13it/s]
100%|██████████| 144/144 [00:00<00:00, 78643.20it/s]
100%|██████████| 30/30 [00:00<00:00, 61200.93it/s]
100%|██████████| 130/130 [00:00<00:00, 67962.05it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76600.70it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 146.04it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 76566.65it/s]
100%|██████████| 287/287 [00:00<00:00, 74214.87it/s]
100%|██████████| 771/771 [00:00<00:00, 76384.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82341.36it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77726.99it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80212.35it/s]
100%|██████████| 353/353 [00:00<00:00, 78704.51it/s]
100%|██████████| 252/252 [00:00<00:00, 78172.07it/s]
100%|██████████| 203/203 [00:00<00:00, 78655.31it/s]
100%|██████████| 153/153 [00:00<00:00, 75622.03it/s]
100%|██████████| 200/200 [00:00<00:00, 78091.68it/s]
100%|██████████| 65/65 [00:00<00:00, 68465.53it/s]
100%|██████████| 144/144 [00:00<00:00, 72786.19it/s]
100%|██████████| 30/30 [00:00<00:00, 56425.61it/s]
100%|██████████| 130/130 [00:00<00:00, 70565.49it/s]
100%|██████████| 3500/3500 [00:00<00:00, 78839.88it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:40<00:00, 143.34it/s]
INFO:root:The new embedding has 5846 word and vectors have 1600 dimensions
100%|██████████| 999/999 [00:00<00:00, 82242.87it/s]
100%|██████████| 287/287 [00:00<00:00, 84730.43it/s]
100%|██████████| 771/771 [00:00<00:00, 88616.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 89423.16it/s]
100%|██████████| 1000/1000 [00:00<00:00, 87993.62it/s]
100%|██████████| 3000/3000 [00:00<00:00, 82414.70it/s]
100%|██████████| 353/353 [00:00<00:00, 84498.88it/s]
100%|██████████| 252/252 [00:00<00:00, 82905.69it/s]
100%|██████████| 203/203 [00:00<00:00, 85770.50it/s]
100%|██████████| 153/153 [00:00<00:00, 80477.62it/s]
100%|██████████| 200/200 [00:00<00:00, 83236.83it/s]
100%|██████████| 65/65 [00:00<00:00, 73326.99it/s]
100%|██████████| 144/144 [00:00<00:00, 74390.91it/s]
100%|██████████| 30/30 [00:00<00:00, 33244.15it/s]
100%|██████████| 130/130 [00:00<00:00, 66780.10it/s]
100%|██████████| 3500/3500 [00:00<00:00, 76643.09it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:43<00:00, 132.95it/s]
INFO:root:The new embedding has 5845 word and vectors have 1600 dimensions
100%|██████████| 999/999 [00:00<00:00, 63584.78it/s]
100%|██████████| 287/287 [00:00<00:00, 80876.46it/s]
100%|██████████| 771/771 [00:00<00:00, 58374.10it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77976.98it/s]
100%|██████████| 1000/1000 [00:00<00:00, 78148.42it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81707.75it/s]
100%|██████████| 353/353 [00:00<00:00, 85366.08it/s]
100%|██████████| 252/252 [00:00<00:00, 59333.37it/s]
100%|██████████| 203/203 [00:00<00:00, 82043.14it/s]
100%|██████████| 153/153 [00:00<00:00, 79157.33it/s]
100%|██████████| 200/200 [00:00<00:00, 74904.97it/s]
100%|██████████| 65/65 [00:00<00:00, 40978.47it/s]
100%|██████████| 144/144 [00:00<00:00, 83192.81it/s]
100%|██████████| 30/30 [00:00<00:00, 56048.61it/s]
100%|██████████| 130/130 [00:00<00:00, 82402.83it/s]
100%|██████████| 3500/3500 [00:00<00:00, 72505.24it/s]
100%|██████████| 203

['monotony' 'unvariedness']


100%|██████████| 5846/5846 [00:52<00:00, 112.28it/s]
INFO:root:The new embedding has 5846 word and vectors have 1600 dimensions
100%|██████████| 999/999 [00:00<00:00, 89722.06it/s]
100%|██████████| 287/287 [00:00<00:00, 71068.91it/s]
100%|██████████| 771/771 [00:00<00:00, 87625.21it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85588.43it/s]
100%|██████████| 1000/1000 [00:00<00:00, 84248.35it/s]
100%|██████████| 3000/3000 [00:00<00:00, 84597.83it/s]
100%|██████████| 353/353 [00:00<00:00, 88711.16it/s]
100%|██████████| 252/252 [00:00<00:00, 77433.30it/s]
100%|██████████| 203/203 [00:00<00:00, 81838.11it/s]
100%|██████████| 153/153 [00:00<00:00, 82484.38it/s]
100%|██████████| 200/200 [00:00<00:00, 84222.97it/s]
100%|██████████| 65/65 [00:00<00:00, 69300.90it/s]
100%|██████████| 144/144 [00:00<00:00, 65323.36it/s]
100%|██████████| 30/30 [00:00<00:00, 54424.36it/s]
100%|██████████| 130/130 [00:00<00:00, 87395.34it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83216.54it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:47<00:00, 122.00it/s]
INFO:root:The new embedding has 5844 word and vectors have 1800 dimensions
100%|██████████| 999/999 [00:00<00:00, 58221.04it/s]
100%|██████████| 287/287 [00:00<00:00, 70668.38it/s]
100%|██████████| 771/771 [00:00<00:00, 64907.24it/s]
100%|██████████| 2000/2000 [00:00<00:00, 79235.73it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88932.09it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87241.99it/s]
100%|██████████| 353/353 [00:00<00:00, 83469.91it/s]
100%|██████████| 252/252 [00:00<00:00, 83186.26it/s]
100%|██████████| 203/203 [00:00<00:00, 39841.08it/s]
100%|██████████| 153/153 [00:00<00:00, 56654.76it/s]
100%|██████████| 200/200 [00:00<00:00, 58686.22it/s]
100%|██████████| 65/65 [00:00<00:00, 38594.25it/s]
100%|██████████| 144/144 [00:00<00:00, 70533.67it/s]
100%|██████████| 30/30 [00:00<00:00, 55067.45it/s]
100%|██████████| 130/130 [00:00<00:00, 76851.24it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84668.42it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 127.66it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 82330.13it/s]
100%|██████████| 287/287 [00:00<00:00, 79793.53it/s]
100%|██████████| 771/771 [00:00<00:00, 81924.57it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82349.44it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82130.14it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80243.05it/s]
100%|██████████| 353/353 [00:00<00:00, 80880.00it/s]
100%|██████████| 252/252 [00:00<00:00, 80956.24it/s]
100%|██████████| 203/203 [00:00<00:00, 77018.88it/s]
100%|██████████| 153/153 [00:00<00:00, 75953.19it/s]
100%|██████████| 200/200 [00:00<00:00, 77765.90it/s]
100%|██████████| 65/65 [00:00<00:00, 47488.20it/s]
100%|██████████| 144/144 [00:00<00:00, 69977.96it/s]
100%|██████████| 30/30 [00:00<00:00, 64627.18it/s]
100%|██████████| 130/130 [00:00<00:00, 73703.64it/s]
100%|██████████| 3500/3500 [00:00<00:00, 98972.28it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 128.45it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 81136.06it/s]
100%|██████████| 287/287 [00:00<00:00, 69961.95it/s]
100%|██████████| 771/771 [00:00<00:00, 84148.02it/s]
100%|██████████| 2000/2000 [00:00<00:00, 103049.09it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81572.68it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98584.35it/s]
100%|██████████| 353/353 [00:00<00:00, 81039.37it/s]
100%|██████████| 252/252 [00:00<00:00, 79072.69it/s]
100%|██████████| 203/203 [00:00<00:00, 76486.14it/s]
100%|██████████| 153/153 [00:00<00:00, 75055.97it/s]
100%|██████████| 200/200 [00:00<00:00, 61712.71it/s]
100%|██████████| 65/65 [00:00<00:00, 42866.31it/s]
100%|██████████| 144/144 [00:00<00:00, 74390.91it/s]
100%|██████████| 30/30 [00:00<00:00, 62015.34it/s]
100%|██████████| 130/130 [00:00<00:00, 73277.72it/s]
100%|██████████| 3500/3500 [00:00<00:00, 90731.37it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 131.79it/s]
INFO:root:The new embedding has 5846 word and vectors have 1600 dimensions
100%|██████████| 999/999 [00:00<00:00, 85111.20it/s]
100%|██████████| 287/287 [00:00<00:00, 81805.32it/s]
100%|██████████| 771/771 [00:00<00:00, 88743.37it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91530.73it/s]
100%|██████████| 1000/1000 [00:00<00:00, 91045.93it/s]
100%|██████████| 3000/3000 [00:00<00:00, 88238.60it/s]
100%|██████████| 353/353 [00:00<00:00, 87525.97it/s]
100%|██████████| 252/252 [00:00<00:00, 80782.99it/s]
100%|██████████| 203/203 [00:00<00:00, 82946.29it/s]
100%|██████████| 153/153 [00:00<00:00, 70134.26it/s]
100%|██████████| 200/200 [00:00<00:00, 82932.36it/s]
100%|██████████| 65/65 [00:00<00:00, 73326.99it/s]
100%|██████████| 144/144 [00:00<00:00, 81906.67it/s]
100%|██████████| 30/30 [00:00<00:00, 52582.16it/s]
100%|██████████| 130/130 [00:00<00:00, 75021.95it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84290.68it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 131.28it/s]
INFO:root:The new embedding has 5844 word and vectors have 1800 dimensions
100%|██████████| 999/999 [00:00<00:00, 86769.72it/s]
100%|██████████| 287/287 [00:00<00:00, 82410.16it/s]
100%|██████████| 771/771 [00:00<00:00, 85142.79it/s]
100%|██████████| 2000/2000 [00:00<00:00, 87783.68it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89052.93it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86791.27it/s]
100%|██████████| 353/353 [00:00<00:00, 85707.05it/s]
100%|██████████| 252/252 [00:00<00:00, 81217.50it/s]
100%|██████████| 203/203 [00:00<00:00, 84359.82it/s]
100%|██████████| 153/153 [00:00<00:00, 78412.57it/s]
100%|██████████| 200/200 [00:00<00:00, 82241.25it/s]
100%|██████████| 65/65 [00:00<00:00, 70868.15it/s]
100%|██████████| 144/144 [00:00<00:00, 80745.96it/s]
100%|██████████| 30/30 [00:00<00:00, 57799.32it/s]
100%|██████████| 130/130 [00:00<00:00, 80161.65it/s]
100%|██████████| 3500/3500 [00:00<00:00, 84176.61it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 130.51it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78770.34it/s]
100%|██████████| 287/287 [00:00<00:00, 76648.54it/s]
100%|██████████| 771/771 [00:00<00:00, 81021.43it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82295.31it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82046.60it/s]
100%|██████████| 3000/3000 [00:00<00:00, 96941.52it/s]
100%|██████████| 353/353 [00:00<00:00, 79252.18it/s]
100%|██████████| 252/252 [00:00<00:00, 79788.98it/s]
100%|██████████| 203/203 [00:00<00:00, 60334.73it/s]
100%|██████████| 153/153 [00:00<00:00, 64670.82it/s]
100%|██████████| 200/200 [00:00<00:00, 76343.36it/s]
100%|██████████| 65/65 [00:00<00:00, 65191.24it/s]
100%|██████████| 144/144 [00:00<00:00, 80573.61it/s]
100%|██████████| 30/30 [00:00<00:00, 70453.03it/s]
100%|██████████| 130/130 [00:00<00:00, 77639.12it/s]
100%|██████████| 3500/3500 [00:00<00:00, 73800.32it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 130.70it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80415.11it/s]
100%|██████████| 287/287 [00:00<00:00, 77802.82it/s]
100%|██████████| 771/771 [00:00<00:00, 80199.60it/s]
100%|██████████| 2000/2000 [00:00<00:00, 80988.32it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81008.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80594.08it/s]
100%|██████████| 353/353 [00:00<00:00, 78834.42it/s]
100%|██████████| 252/252 [00:00<00:00, 79614.69it/s]
100%|██████████| 203/203 [00:00<00:00, 77587.36it/s]
100%|██████████| 153/153 [00:00<00:00, 59957.82it/s]
100%|██████████| 200/200 [00:00<00:00, 77200.52it/s]
100%|██████████| 65/65 [00:00<00:00, 76927.13it/s]
100%|██████████| 144/144 [00:00<00:00, 70981.29it/s]
100%|██████████| 30/30 [00:00<00:00, 57772.78it/s]
100%|██████████| 130/130 [00:00<00:00, 77286.96it/s]
100%|██████████| 3500/3500 [00:00<00:00, 81139.40it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 129.82it/s]
INFO:root:The new embedding has 5846 word and vectors have 1600 dimensions
100%|██████████| 999/999 [00:00<00:00, 70901.04it/s]
100%|██████████| 287/287 [00:00<00:00, 69722.86it/s]
100%|██████████| 771/771 [00:00<00:00, 82950.07it/s]
100%|██████████| 2000/2000 [00:00<00:00, 70400.21it/s]
100%|██████████| 1000/1000 [00:00<00:00, 74958.52it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75159.55it/s]
100%|██████████| 353/353 [00:00<00:00, 79893.66it/s]
100%|██████████| 252/252 [00:00<00:00, 84550.40it/s]
100%|██████████| 203/203 [00:00<00:00, 69043.44it/s]
100%|██████████| 153/153 [00:00<00:00, 67408.46it/s]
100%|██████████| 200/200 [00:00<00:00, 79093.04it/s]
100%|██████████| 65/65 [00:00<00:00, 54976.76it/s]
100%|██████████| 144/144 [00:00<00:00, 72402.27it/s]
100%|██████████| 30/30 [00:00<00:00, 36878.41it/s]
100%|██████████| 130/130 [00:00<00:00, 44075.62it/s]
100%|██████████| 3500/3500 [00:00<00:00, 71036.23it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 128.58it/s]
INFO:root:The new embedding has 5844 word and vectors have 1800 dimensions
100%|██████████| 999/999 [00:00<00:00, 86310.37it/s]
100%|██████████| 287/287 [00:00<00:00, 83150.19it/s]
100%|██████████| 771/771 [00:00<00:00, 86081.09it/s]
100%|██████████| 2000/2000 [00:00<00:00, 88524.78it/s]
100%|██████████| 1000/1000 [00:00<00:00, 89486.12it/s]
100%|██████████| 3000/3000 [00:00<00:00, 87695.58it/s]
100%|██████████| 353/353 [00:00<00:00, 86175.97it/s]
100%|██████████| 252/252 [00:00<00:00, 80261.57it/s]
100%|██████████| 203/203 [00:00<00:00, 87759.61it/s]
100%|██████████| 153/153 [00:00<00:00, 50088.08it/s]
100%|██████████| 200/200 [00:00<00:00, 82305.81it/s]
100%|██████████| 65/65 [00:00<00:00, 71257.12it/s]
100%|██████████| 144/144 [00:00<00:00, 81016.74it/s]
100%|██████████| 30/30 [00:00<00:00, 48922.67it/s]
100%|██████████| 130/130 [00:00<00:00, 82043.26it/s]
100%|██████████| 3500/3500 [00:00<00:00, 74625.29it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:46<00:00, 126.22it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80245.70it/s]
100%|██████████| 287/287 [00:00<00:00, 74402.95it/s]
100%|██████████| 771/771 [00:00<00:00, 80377.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 91993.46it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81892.81it/s]
100%|██████████| 3000/3000 [00:00<00:00, 98370.86it/s]
100%|██████████| 353/353 [00:00<00:00, 82557.67it/s]
100%|██████████| 252/252 [00:00<00:00, 76458.67it/s]
100%|██████████| 203/203 [00:00<00:00, 79137.81it/s]
100%|██████████| 153/153 [00:00<00:00, 77279.45it/s]
100%|██████████| 200/200 [00:00<00:00, 74918.35it/s]
100%|██████████| 65/65 [00:00<00:00, 65820.80it/s]
100%|██████████| 144/144 [00:00<00:00, 75819.71it/s]
100%|██████████| 30/30 [00:00<00:00, 70334.89it/s]
100%|██████████| 130/130 [00:00<00:00, 66212.45it/s]
100%|██████████| 3500/3500 [00:00<00:00, 102307.94it/s]
100%|██████████| 20

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:44<00:00, 130.68it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 66265.65it/s]
100%|██████████| 287/287 [00:00<00:00, 78055.07it/s]
100%|██████████| 771/771 [00:00<00:00, 82147.24it/s]
100%|██████████| 2000/2000 [00:00<00:00, 82444.13it/s]
100%|██████████| 1000/1000 [00:00<00:00, 82960.24it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81144.48it/s]
100%|██████████| 353/353 [00:00<00:00, 79794.63it/s]
100%|██████████| 252/252 [00:00<00:00, 73227.42it/s]
100%|██████████| 203/203 [00:00<00:00, 78851.98it/s]
100%|██████████| 153/153 [00:00<00:00, 77038.24it/s]
100%|██████████| 200/200 [00:00<00:00, 67308.10it/s]
100%|██████████| 65/65 [00:00<00:00, 60719.32it/s]
100%|██████████| 144/144 [00:00<00:00, 68665.28it/s]
100%|██████████| 30/30 [00:00<00:00, 48099.82it/s]
100%|██████████| 130/130 [00:00<00:00, 63394.90it/s]
100%|██████████| 3500/3500 [00:00<00:00, 89236.17it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:45<00:00, 128.53it/s]
INFO:root:The new embedding has 5846 word and vectors have 1600 dimensions
100%|██████████| 999/999 [00:00<00:00, 68726.38it/s]
100%|██████████| 287/287 [00:00<00:00, 82704.59it/s]
100%|██████████| 771/771 [00:00<00:00, 87258.73it/s]
100%|██████████| 2000/2000 [00:00<00:00, 90566.25it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88476.23it/s]
100%|██████████| 3000/3000 [00:00<00:00, 89037.18it/s]
100%|██████████| 353/353 [00:00<00:00, 86422.44it/s]
100%|██████████| 252/252 [00:00<00:00, 80684.32it/s]
100%|██████████| 203/203 [00:00<00:00, 84762.94it/s]
100%|██████████| 153/153 [00:00<00:00, 68516.82it/s]
100%|██████████| 200/200 [00:00<00:00, 85475.93it/s]
100%|██████████| 65/65 [00:00<00:00, 70446.97it/s]
100%|██████████| 144/144 [00:00<00:00, 82297.29it/s]
100%|██████████| 30/30 [00:00<00:00, 49306.08it/s]
100%|██████████| 130/130 [00:00<00:00, 82527.55it/s]
100%|██████████| 3500/3500 [00:00<00:00, 80702.70it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:46<00:00, 125.27it/s]
INFO:root:The new embedding has 5844 word and vectors have 2100 dimensions
100%|██████████| 999/999 [00:00<00:00, 82126.81it/s]
100%|██████████| 287/287 [00:00<00:00, 44826.29it/s]
100%|██████████| 771/771 [00:00<00:00, 82879.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 85001.30it/s]
100%|██████████| 1000/1000 [00:00<00:00, 88468.76it/s]
100%|██████████| 3000/3000 [00:00<00:00, 81442.27it/s]
100%|██████████| 353/353 [00:00<00:00, 81123.74it/s]
100%|██████████| 252/252 [00:00<00:00, 82254.06it/s]
100%|██████████| 203/203 [00:00<00:00, 66753.72it/s]
100%|██████████| 153/153 [00:00<00:00, 74810.97it/s]
100%|██████████| 200/200 [00:00<00:00, 76566.34it/s]
100%|██████████| 65/65 [00:00<00:00, 59125.95it/s]
100%|██████████| 144/144 [00:00<00:00, 75724.65it/s]
100%|██████████| 30/30 [00:00<00:00, 43018.50it/s]
100%|██████████| 130/130 [00:00<00:00, 71471.95it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83551.87it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:52<00:00, 111.28it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 78009.23it/s]
100%|██████████| 287/287 [00:00<00:00, 77692.35it/s]
100%|██████████| 771/771 [00:00<00:00, 82442.53it/s]
100%|██████████| 2000/2000 [00:00<00:00, 78626.74it/s]
100%|██████████| 1000/1000 [00:00<00:00, 80446.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 86143.62it/s]
100%|██████████| 353/353 [00:00<00:00, 79078.64it/s]
100%|██████████| 252/252 [00:00<00:00, 79007.67it/s]
100%|██████████| 203/203 [00:00<00:00, 79730.66it/s]
100%|██████████| 153/153 [00:00<00:00, 80639.42it/s]
100%|██████████| 200/200 [00:00<00:00, 81072.85it/s]
100%|██████████| 65/65 [00:00<00:00, 72048.03it/s]
100%|██████████| 144/144 [00:00<00:00, 75488.04it/s]
100%|██████████| 30/30 [00:00<00:00, 30511.43it/s]
100%|██████████| 130/130 [00:00<00:00, 71071.37it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93231.62it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:48<00:00, 120.14it/s]
INFO:root:The new embedding has 5844 words and vectors have 300 dimensions
100%|██████████| 999/999 [00:00<00:00, 80264.15it/s]
100%|██████████| 287/287 [00:00<00:00, 79283.75it/s]
100%|██████████| 771/771 [00:00<00:00, 61476.91it/s]
100%|██████████| 2000/2000 [00:00<00:00, 98870.96it/s]
100%|██████████| 1000/1000 [00:00<00:00, 66097.83it/s]
100%|██████████| 3000/3000 [00:00<00:00, 59318.38it/s]
100%|██████████| 353/353 [00:00<00:00, 79708.71it/s]
100%|██████████| 252/252 [00:00<00:00, 78398.21it/s]
100%|██████████| 203/203 [00:00<00:00, 77828.49it/s]
100%|██████████| 153/153 [00:00<00:00, 77316.69it/s]
100%|██████████| 200/200 [00:00<00:00, 77442.84it/s]
100%|██████████| 65/65 [00:00<00:00, 76153.56it/s]
100%|██████████| 144/144 [00:00<00:00, 76861.77it/s]
100%|██████████| 30/30 [00:00<00:00, 69905.07it/s]
100%|██████████| 130/130 [00:00<00:00, 72527.20it/s]
100%|██████████| 3500/3500 [00:00<00:00, 86900.79it/s]
100%|██████████| 203

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']


100%|██████████| 5846/5846 [00:47<00:00, 122.19it/s]
INFO:root:The new embedding has 5846 word and vectors have 1900 dimensions
100%|██████████| 999/999 [00:00<00:00, 85287.91it/s]
100%|██████████| 287/287 [00:00<00:00, 78288.58it/s]
100%|██████████| 771/771 [00:00<00:00, 81653.58it/s]
100%|██████████| 2000/2000 [00:00<00:00, 51988.20it/s]
100%|██████████| 1000/1000 [00:00<00:00, 81039.96it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80601.82it/s]
100%|██████████| 353/353 [00:00<00:00, 82825.54it/s]
100%|██████████| 252/252 [00:00<00:00, 84092.98it/s]
100%|██████████| 203/203 [00:00<00:00, 83002.90it/s]
100%|██████████| 153/153 [00:00<00:00, 81324.10it/s]
100%|██████████| 200/200 [00:00<00:00, 82809.56it/s]
100%|██████████| 65/65 [00:00<00:00, 70960.37it/s]
100%|██████████| 144/144 [00:00<00:00, 81795.74it/s]
100%|██████████| 30/30 [00:00<00:00, 50271.32it/s]
100%|██████████| 130/130 [00:00<00:00, 73317.13it/s]
100%|██████████| 3500/3500 [00:00<00:00, 83799.41it/s]
100%|██████████| 203

In [29]:
# Load the embedding stored in avg.vec into `Top`. No vocabulary is supplied,
# both normalization flags are off, duplicate removal is requested and
# dims_restriction is 300 (presumably the expected vector size -- confirm
# against load_embedding).
Top = load_embedding(
    '/home/iker/Escritorio/Meta/avg.vec',
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)


In [31]:
# The return value is discarded, so this presumably L1-normalizes `Top`
# dimension by dimension in place -- TODO confirm against the Embedding class.
Top.L1_dimensionwwise()

In [32]:
# Evaluate `Top` with evaluate_on_all (lowercase_dataset=True) and pass the
# result to results_to_csv, which prints the scores as comma-separated rows.
results_to_csv(evaluate_on_all(Top,lowercase_dataset=True))

100%|██████████| 999/999 [00:00<00:00, 72481.96it/s]
100%|██████████| 287/287 [00:00<00:00, 74242.34it/s]
100%|██████████| 771/771 [00:00<00:00, 75593.36it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76853.94it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76982.31it/s]
100%|██████████| 3000/3000 [00:00<00:00, 73733.47it/s]
100%|██████████| 353/353 [00:00<00:00, 72535.24it/s]
100%|██████████| 252/252 [00:00<00:00, 73887.77it/s]
100%|██████████| 203/203 [00:00<00:00, 69727.60it/s]
100%|██████████| 153/153 [00:00<00:00, 69988.93it/s]
100%|██████████| 200/200 [00:00<00:00, 74065.05it/s]
100%|██████████| 65/65 [00:00<00:00, 65457.33it/s]
100%|██████████| 144/144 [00:00<00:00, 72988.49it/s]
100%|██████████| 30/30 [00:00<00:00, 66752.85it/s]
100%|██████████| 130/130 [00:00<00:00, 68976.54it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75869.10it/s]
100%|██████████| 2034/2034 [00:00<00:00, 72429.78it/s]

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']
0.6434964962286586,0.7728845388014604,0.8101669335623386,0.8593612431654819,0.8668068255841362,0.8619611306739761,0.8179271022075507,0.7688437098585119,0.8754778889455215,0.8044480045798984,0.7607321108693915,0.8846368238956354,0.5682822572288425,0.8741516009467072,0.8088846157604197,0.5764077323320247,0.6247643009627538,
1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.9985250737463127,





In [22]:
# Evaluate `Top` with evaluate_on_all; kept as a bare final expression so the
# notebook displays the returned array of per-dataset records
# (dataset, coverage, pearson, spearman).
evaluate_on_all(Top,lowercase_dataset=True)

100%|██████████| 999/999 [00:00<00:00, 70233.15it/s]
100%|██████████| 287/287 [00:00<00:00, 74587.35it/s]
100%|██████████| 771/771 [00:00<00:00, 75838.01it/s]
100%|██████████| 2000/2000 [00:00<00:00, 77650.01it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76952.65it/s]
100%|██████████| 3000/3000 [00:00<00:00, 78744.58it/s]
100%|██████████| 353/353 [00:00<00:00, 73811.72it/s]
100%|██████████| 252/252 [00:00<00:00, 71455.15it/s]
100%|██████████| 203/203 [00:00<00:00, 75576.40it/s]
100%|██████████| 153/153 [00:00<00:00, 74793.53it/s]
100%|██████████| 200/200 [00:00<00:00, 72346.77it/s]
100%|██████████| 65/65 [00:00<00:00, 65852.60it/s]
100%|██████████| 144/144 [00:00<00:00, 72786.19it/s]
100%|██████████| 30/30 [00:00<00:00, 59241.58it/s]
100%|██████████| 130/130 [00:00<00:00, 75583.52it/s]
100%|██████████| 3500/3500 [00:00<00:00, 93347.81it/s]
100%|██████████| 2034/2034 [00:00<00:00, 75223.21it/s]

['monsignori' 'priest']
['internationalisms' 'scope']
['internationalisms' 'doctrine']





array([{'dataset': 'SimLex999', 'coverage': 1.0, 'pearson': 0.6662235410501283, 'spearman': 0.6404598488060838},
       {'dataset': 'MTurk-287', 'coverage': 1.0, 'pearson': 0.781966937140428, 'spearman': 0.7724961807592994},
       {'dataset': 'MTurk-771', 'coverage': 1.0, 'pearson': 0.7951002669089963, 'spearman': 0.80985608582461},
       {'dataset': 'MEN_DEV', 'coverage': 1.0, 'pearson': 0.8396025740468014, 'spearman': 0.8589625980494974},
       {'dataset': 'MEN_TEST', 'coverage': 1.0, 'pearson': 0.8531647520309281, 'spearman': 0.8654431268412633},
       {'dataset': 'MEN_ALL', 'coverage': 1.0, 'pearson': 0.8439572260816524, 'spearman': 0.8612290440145963},
       {'dataset': 'WS353_all', 'coverage': 1.0, 'pearson': 0.7797596549985749, 'spearman': 0.8167489511597438},
       {'dataset': 'WS353_relatedness', 'coverage': 1.0, 'pearson': 0.7545473118269888, 'spearman': 0.7671759499110585},
       {'dataset': 'WS353_similarity', 'coverage': 1.0, 'pearson': 0.8669118089252843, 'spearman

In [33]:
# Export `Top` to the given .vec path (presumably one line per word in a
# word2vec-style text format -- confirm against Embedding.export).
Top.export('/home/iker/Escritorio/Meta/FTr+UKBr-RotEmbeddings.vec')

100%|██████████| 2083053/2083053 [03:14<00:00, 10723.35it/s]


In [16]:
# Directory (network share mounted through gvfs) that holds both input files.
path = '/run/user/1000/gvfs/afp-volume:host=MyCloudEX2Ultra.local,user=iker,volume=My_Book_25EE-1/TFG/vecmap_results/vecmap-master/joint(Orto)/'

# Load the two embeddings with identical options: no vocabulary supplied,
# both normalization flags off, duplicate removal requested and
# dims_restriction=300.
FT = load_embedding(
    path + 'FT.Jointc-FT.Orto.TXT',
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)
UKB = load_embedding(
    path + 'UKB.Jointc-UKB.Orto.TXT',
    vocabulary=None,
    length_normalize=False,
    normalize_dimensionwise=False,
    delete_duplicates=True,
    dims_restriction=300,
)
  



In [18]:
# Evaluate the `FT` embedding with evaluate_on_all (lowercase_dataset=True)
# and pass the result to results_to_csv.
results_to_csv(evaluate_on_all(FT,lowercase_dataset=True))

100%|██████████| 999/999 [00:00<00:00, 49629.38it/s]
100%|██████████| 287/287 [00:00<00:00, 73190.57it/s]
100%|██████████| 771/771 [00:00<00:00, 75201.35it/s]
100%|██████████| 2000/2000 [00:00<00:00, 76387.85it/s]
100%|██████████| 1000/1000 [00:00<00:00, 76232.35it/s]
100%|██████████| 3000/3000 [00:00<00:00, 75093.17it/s]
100%|██████████| 353/353 [00:00<00:00, 74921.03it/s]
100%|██████████| 252/252 [00:00<00:00, 57086.94it/s]
100%|██████████| 203/203 [00:00<00:00, 70390.52it/s]
100%|██████████| 153/153 [00:00<00:00, 65831.81it/s]
100%|██████████| 200/200 [00:00<00:00, 70861.70it/s]
100%|██████████| 65/65 [00:00<00:00, 68517.16it/s]
100%|██████████| 144/144 [00:00<00:00, 72918.00it/s]
100%|██████████| 30/30 [00:00<00:00, 47608.44it/s]
100%|██████████| 130/130 [00:00<00:00, 73673.76it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75023.07it/s]
100%|██████████| 2034/2034 [00:00<00:00, 61776.52it/s]

['preliterate' 'noncivilized']
['ruralist' 'rustic']
['ruralist' 'advocate']
['hypercoaster' 'roller']
['extravert' 'extroversive']
['deviationism' 'desertion']
['antedating' 'chronologize']
['adventism' 'christianity']
['uncertainty' 'speculativeness']
['monsignori' 'priest']
['rotational' 'circumvolution']
['impossibilities' 'unattainableness']
['winners' 'walloper']
['commandership' 'position']
['newness' 'brand-newness']
['heraldist' 'applaud']
['heraldist' 'tell']
['monotony' 'unvariedness']
['sublieutenant' 'lieutenant']
['americanize' 'change']
['incensing' 'odorize']
['embroiderers' 'embroideress']
['inconvertible' 'incommutable']
['diffidence' 'unassertiveness']
['monogenesis' 'reproduction']
['caesarism' 'autocracy']
['christianise' 'convert']
['kazakhstani' 'asian']
['nobelist' 'laureate']
['interpenetrate' 'spiritize']
['microphallus' 'penis']
['insecurities' 'insecureness']
['aerialist' 'ropewalker']
['postdates' 'chronologize']
['internationalisms' 'scope']
['internationa




In [19]:
# Evaluate the `UKB` embedding with evaluate_on_all (lowercase_dataset=True)
# and pass the result to results_to_csv.
results_to_csv(evaluate_on_all(UKB,lowercase_dataset=True))

100%|██████████| 999/999 [00:00<00:00, 76189.35it/s]
100%|██████████| 287/287 [00:00<00:00, 31335.81it/s]
100%|██████████| 771/771 [00:00<00:00, 73831.24it/s]
100%|██████████| 2000/2000 [00:00<00:00, 75208.52it/s]
100%|██████████| 1000/1000 [00:00<00:00, 77698.20it/s]
100%|██████████| 3000/3000 [00:00<00:00, 80752.87it/s]
100%|██████████| 353/353 [00:00<00:00, 69550.42it/s]
100%|██████████| 252/252 [00:00<00:00, 70398.60it/s]
100%|██████████| 203/203 [00:00<00:00, 64279.31it/s]
100%|██████████| 153/153 [00:00<00:00, 69973.67it/s]
100%|██████████| 200/200 [00:00<00:00, 69252.93it/s]
100%|██████████| 65/65 [00:00<00:00, 68620.63it/s]
100%|██████████| 144/144 [00:00<00:00, 33813.67it/s]
100%|██████████| 30/30 [00:00<00:00, 55406.92it/s]
100%|██████████| 130/130 [00:00<00:00, 68499.94it/s]
100%|██████████| 3500/3500 [00:00<00:00, 75384.83it/s]
  0%|          | 0/2034 [00:00<?, ?it/s]

['plays' 'losses']
['ship' 'ballots']
['saints' 'observatory']
['republicans' 'challenge']
['scottish' 'commuters']
['singapore' 'sanctions']
['rich' 'privileges']
['battle' 'prisoners']
['crime' 'assaulted']
['slaves' 'insured']
['cheers' 'musician']
['session' 'surprises']
['bulgarian' 'nurses']
['citizenship' 'casey']
['intelligence' 'troubles']
['salute' 'patterns']
['reichstag' 'germany']
['radiation' 'costumes']
['photography' 'proving']
['assassination' 'forbes']
['catholics' 'protestant']
['battle' 'warships']
['alcohol' 'fleeing']
['coil' 'ashes']
['explosive' 'builders']
['colonies' 'depression']
['diamond' 'killed']
['saints' 'repeal']
['operator' 'extracts']
['assassination' 'killed']
['birds' 'disturbances']
['palestinians' 'turks']
['chile' 'plates']
['exile' 'pledges']
['exile' 'threats']
['seizure' 'bishops']
['trade' 'farley']
['radical' 'bishops']
['crystal' 'oldest']
['patent' 'professionals']
['goverment' 'immunity']
['cardinals' 'villages']
['artillery' 'sanctions'

100%|██████████| 2034/2034 [00:00<00:00, 41879.83it/s]


['anticyclones' 'high']
['repositions' 'move']
['repositions' 'reduce']
['bounced' 'skip']
['bounced' 'bounce']
['kindergarteners' 'child']
['angrier' 'huffy']
['angrier' 'stormy']
['defiles' 'mar']
['defiles' 'spot']
['companionships' 'friendship']
['postboxes' 'maildrop']
['antedating' 'chronologize']
['benefited' 'help']
['benefited' 'get']
['interned' 'work']
['interned' 'confine']
['serenaded' 'perform']
['snookered' 'play']
['snookered' 'flim-flam']
['encroachments' 'inroad']
['encroachments' 'entrance']
['sentenced' 'declare']
['shrieks' 'shout']
['shrieks' 'cry']
['papered' 'cover']
['territorials' 'soldier']
['territorials' 'guard']
['transmigrating' 'immigrate']
['transmigrating' 'born']
['associations' 'southern']
['associations' 'sociable']
['planners' 'schemer']
['planners' 'notebook']
['combusts' 'blow']
['combusts' 'ablaze']
['producing' 'together']
['baggers' 'machine']
['baggers' 'workman']
['replications' 'reproduction']
['replications' 'procedure']
['retrials' 'tria


