In [1]:
import numpy as np
import codecs
class FastVector1:
    """
    Minimal wrapper for fastText-format word embeddings.

    The vectors are read from a text ``.vec`` file whose first line is
    ``<n_words> <n_dim>`` and whose remaining lines are
    ``<word> <v_1> ... <v_n_dim>``, with fields separated by single spaces.
    ```
    Usage:
        $ model = FastVector1(vector_file='/path/to/wiki.en.vec')
        $ 'apple' in model
        > True
        $ model['apple'].shape
        > (300,)
    ```
    """

    def __init__(self, vector_file='', transform=None):
        """
        Read in word vectors in fasttext format.

        :param vector_file: path of the ``.vec`` text file to load
        :param transform: optional transformation applied to the whole
            embedding right after loading; see apply_transform()
        """
        self.word2id = {}

        # Captures word order, so export() writes words in file order
        self.id2word = []

        print('reading word vectors from %s' % vector_file)
        with open(vector_file, 'r') as f:
            # Header line: "<n_words> <n_dim>". split() without an argument
            # tolerates trailing whitespace on the header.
            (self.n_words, self.n_dim) = (int(x) for x in f.readline().split())
            self.embed = np.zeros((self.n_words, self.n_dim))
            for i, line in enumerate(f):
                elems = line.rstrip('\n').split(' ')
                self.word2id[elems[0]] = i
                # Slice to n_dim fields so that a trailing separator (which
                # produces an empty last field) is not parsed as a number.
                self.embed[i] = elems[1:self.n_dim+1]
                self.id2word.append(elems[0])

        # Kept for interface compatibility; no method of this class reads it.
        # (The original comment says translate_inverted_softmax() uses it.)
        self.softmax_denominators = None

        if transform is not None:
            print('Applying transformation to embedding')
            self.apply_transform(transform)

    def apply_transform(self, transform):
        """
        Right-multiply every word vector by a transformation matrix.

        :param transform: the matrix itself, or the path (str) of a text
            file readable by ``np.loadtxt`` that contains it. The matrix is
            expected to be (n_dim, n_dim) so the vector size is unchanged.
        """
        transmat = np.loadtxt(transform) if isinstance(transform, str) else transform
        self.embed = np.matmul(self.embed, transmat)

    def apply_cop(self, matrix, i):
        """
        Overwrite row ``i`` of the embedding with a copy of ``matrix``.

        :param matrix: sequence of n_dim values to store
        :param i: row index (word id) to overwrite
        """
        self.embed[i] = matrix[:]

    def export(self, outpath):
        """
        Transforming a large matrix of WordVectors is expensive.
        This method lets you write the transformed matrix back to a file for future use
        :param outpath: The path to the output file to be written
        """
        # The context manager closes the file even if a write fails.
        with open(outpath, "w") as fout:
            # Header takes the guesswork out of loading by recording how many lines, vector dims
            fout.write(str(self.n_words) + " " + str(self.n_dim) + "\n")
            for token in self.id2word:
                vector_components = ["%.6f" % number for number in self[token]]
                vector_as_string = " ".join(vector_components)

                out_line = token + " " + vector_as_string + "\n"
                fout.write(out_line)

    def __contains__(self, key):
        """Return True when ``key`` is a word of the loaded vocabulary."""
        return key in self.word2id

    def __getitem__(self, key):
        """Return the embedding row of word ``key`` (KeyError if unknown)."""
        return self.embed[self.word2id[key]]

In [2]:
class FastVector2:
    """
    Vocabulary of a fastText-format file paired with RANDOM vectors.

    Only the header and the first field (the word) of each line of the
    ``.vec`` file are used; the numeric components stored in the file are
    ignored and every word receives a vector drawn uniformly from [0, 1).
    ```
    Usage:
        $ model = FastVector2(vector_file='/path/to/wiki.en.vec')
        $ 'apple' in model
        > True
        $ model['apple'].shape
        > (300,)
    ```
    """

    def __init__(self, vector_file='', transform=None, seed=None):
        """
        Read the vocabulary in fasttext format and randomly initialise vectors.

        :param vector_file: path of the ``.vec`` text file to load
        :param transform: optional transformation applied to the whole
            embedding right after loading; see apply_transform()
        :param seed: optional seed for a private random generator, making
            the initial vectors reproducible. When None (the default) the
            global NumPy random state is used.
        """
        self.word2id = {}

        # Captures word order, so export() writes words in file order
        self.id2word = []

        # A private generator when seeded; otherwise NumPy's global state.
        draw = np.random.RandomState(seed).rand if seed is not None else np.random.rand

        print('reading word vectors from %s' % vector_file)
        with open(vector_file, 'r') as f:
            # Header line: "<n_words> <n_dim>". split() without an argument
            # tolerates trailing whitespace on the header.
            (self.n_words, self.n_dim) = (int(x) for x in f.readline().split())
            self.embed = np.zeros((self.n_words, self.n_dim))
            for i, line in enumerate(f):
                elems = line.rstrip('\n').split(' ')
                self.word2id[elems[0]] = i
                # Size the random vector from the header rather than a
                # hard-coded 300, so files of any dimension load.
                self.embed[i] = draw(self.n_dim)
                self.id2word.append(elems[0])

        # Kept for interface compatibility; no method of this class reads it.
        # (The original comment says translate_inverted_softmax() uses it.)
        self.softmax_denominators = None

        if transform is not None:
            print('Applying transformation to embedding')
            self.apply_transform(transform)

    def apply_transform(self, transform):
        """
        Right-multiply every word vector by a transformation matrix.

        :param transform: the matrix itself, or the path (str) of a text
            file readable by ``np.loadtxt`` that contains it. The matrix is
            expected to be (n_dim, n_dim) so the vector size is unchanged.
        """
        transmat = np.loadtxt(transform) if isinstance(transform, str) else transform
        self.embed = np.matmul(self.embed, transmat)

    def apply_cop(self, matrix, i):
        """
        Overwrite row ``i`` of the embedding with a copy of ``matrix``.

        :param matrix: sequence of n_dim values to store
        :param i: row index (word id) to overwrite
        """
        self.embed[i] = matrix[:]

    def export(self, outpath):
        """
        Transforming a large matrix of WordVectors is expensive.
        This method lets you write the transformed matrix back to a file for future use
        :param outpath: The path to the output file to be written
        """
        # The context manager closes the file even if a write fails.
        with open(outpath, "w") as fout:
            # Header takes the guesswork out of loading by recording how many lines, vector dims
            fout.write(str(self.n_words) + " " + str(self.n_dim) + "\n")
            for token in self.id2word:
                vector_components = ["%.6f" % number for number in self[token]]
                vector_as_string = " ".join(vector_components)

                out_line = token + " " + vector_as_string + "\n"
                fout.write(out_line)

    def __contains__(self, key):
        """Return True when ``key`` is a word of the loaded vocabulary."""
        return key in self.word2id

    def __getitem__(self, key):
        """Return the embedding row of word ``key`` (KeyError if unknown)."""
        return self.embed[self.word2id[key]]

In [13]:
def cosine_similarity(vec_a, vec_b):
    """Return the dot product of vec_a and vec_b divided by the product of their norms."""
    dot_product = np.dot(vec_a, vec_b)
    norm_product = np.linalg.norm(vec_a) * np.linalg.norm(vec_b)
    return dot_product / norm_product

In [14]:
import numpy as np
from random import randint

In [15]:
def make_training_matrices(source_dictionary, target_dictionary, verbose=True):
    """
    Pair every target word with a randomly chosen source word.

    Both arguments are FastVector-style objects exposing ``word2id`` (dict),
    ``id2word`` (list) and ``obj[word]`` vector lookup. No bilingual
    dictionary is involved: for each word of ``target_dictionary`` one word
    of ``source_dictionary`` is drawn uniformly at random (with replacement).

    :param source_dictionary: embedding object the random words are drawn from
    :param target_dictionary: embedding object whose every word gets a partner
    :param verbose: when True (default) print each "source target" pair and,
        at the end, the number of pairs
    :return: ``(source_matrix, target_matrix, target_ids)`` as NumPy arrays;
        row k of the two matrices holds the vectors of the k-th pair and
        ``target_ids[k]`` is the target word's id in ``target_dictionary``
    :raises ValueError: from ``randint`` if the source vocabulary is empty
        while the target vocabulary is not
    """
    source_matrix = []
    target_matrix = []
    target_ids = []

    # randint() includes BOTH end points, so the largest valid index is
    # len - 1; using len itself could index one past the end of id2word.
    last_source_index = len(source_dictionary.word2id) - 1

    for target in target_dictionary.word2id:
        source_word = source_dictionary.id2word[randint(0, last_source_index)]
        if verbose:
            print('%s %s' % (source_word, target))
        target_ids.append(target_dictionary.word2id[target])
        source_matrix.append(source_dictionary[source_word])
        target_matrix.append(target_dictionary[target])

    if verbose:
        print(len(target_ids))

    # return training matrices
    return np.array(source_matrix), np.array(target_matrix), np.array(target_ids)

In [16]:
# Load the two embedding tables from hard-coded absolute paths.
# NOTE(review): the variable is called `en_dictionary` but the file is
# cc.fr.300.vec -- the name suggests English, the file name French; confirm.
en_dictionary = FastVector1(vector_file='/home/apatra/fastText/cc.fr.300.vec')
# FastVector2 keeps only the words of model.vec; each word gets a random vector.
mi_dictionary = FastVector2(vector_file='/home/apatra/fastText/fastText_multilingual-master/model.vec')

# Look up one word in each table and print the cosine similarity of the two
# vectors. Both lookups raise KeyError if the word is absent from the file.
en_vector = en_dictionary["one"]
mi_vector = mi_dictionary["newt"]
print(cosine_similarity(en_vector, mi_vector))

reading word vectors from /home/apatra/fastText/cc.fr.300.vec
1
reading word vectors from /home/apatra/fastText/fastText_multilingual-master/model.vec
1
0.01874059387330577


In [17]:
# Rebuild mi_dictionary from the same file. FastVector2 draws new random
# vectors on every construction, so the similarity printed below is not
# expected to match the value printed by the previous cell.
mi_dictionary = FastVector2(vector_file='/home/apatra/fastText/fastText_multilingual-master/model.vec')

# Same word pair as in the previous cell, against the new random vectors.
en_vector = en_dictionary["one"]
mi_vector = mi_dictionary["newt"]
print(cosine_similarity(en_vector, mi_vector))

reading word vectors from /home/apatra/fastText/fastText_multilingual-master/model.vec
1
0.03961446400257569


In [18]:
# Vocabulary of each embedding table as a set of words.
# NOTE(review): neither set is read by any later cell visible here -- confirm
# whether they are still needed.
mi_words = set(mi_dictionary.word2id.keys())
en_words = set(en_dictionary.word2id.keys())

In [19]:
# form the training matrices
# Each word of mi_dictionary is paired with a randomly drawn word of
# en_dictionary; `ti` receives the mi_dictionary row index of each pair.
# The call prints every pair, which is the long listing shown as output.
#from copy import deepcopy
source_matrix, target_matrix ,ti= make_training_matrices(
    en_dictionary, mi_dictionary) #, bilingual_dictionary)
# Everything below is disabled experimentation (learning and applying a
# transformation); `learn_transformation` is not defined in the visible cells.
#print len(source_matrix), len(target_matrix)
# learn and apply the transformation
#print ti, len(ti)
#target_matrix=deepcopy(source_matrix)
#print source_matrix #[60][9], target_matrix[60][9]
#transform = learn_transformation(source_matrix, target_matrix)
#print type(transform)
#print transform[299]
#en_dictionary.apply_transform(transform)

Fortunae kisi-mawanqa’tumkek
okt aklasiewaloqsultiji
Zvíkov esma’titl
spørgsmål gelulatl
cherEmploi etlitum
Antioche Malpalewitelemut
Geodynamics gi'lewei
Hasenpfeffer Western
Fite litaqnwikas’kl
Nomaua mimajuinuigtug
Koste Valle
Одесса atkitemi
kouffar mikwite’tmu
Stavelot maw-wlamu’k
46.298 Kaplno'l
Alixia kiwto’qa’sikewe’l
Vermona elakutultijik
XLIV-134 apgwa'tuan
presseVisuelsContact jijgluewjig
papyvesAdmin iknemat
supplémentation pma'toq
superpitchou nemiatijel
AF3V wels'tua'tigul
1430-1432 kajjimenewa’kik
Clément-Talbot wtuisunmual
Beldant iknemaj
chimiquesSolutions wuji
empécher wejgwa'lawoqo
COLL teke’k
cisplatine nasgua'tiji
miners nuj-seknika’tijik)
1876-1886 telkisi
Pérégrinus mawelkisni
financiéres a'tugwaqa
6519 tetpoqpilaqn
Esquerra Naqtiki’l
Charenton pem-ajelkik
malcontents westawu’lkw
Rabusson pajjoqe’kemk
mountain.Avec kidi
199315 kisikuitl
inculqué ukwita'q
Ybarnégaray apu’ksinew
MouléMaternité seskutaq
Kosovare la'lukete
JésusDu wije’wmi’ti
talonnent ta'n
CentreHôp

Bertrameix Jikeyaqip
Sigüés un'jann
explicat Aimutikel
Jessyka Epjilaasi
lůžka35 sign'tue
thinlits “Negm
Minnen tluetisk
TweenerTag pekwatoqsip
83300Sujet Kepten
voudra-t-elle Aplamoq
Curfs etlitumk
00ZMarie-Françoise pkisintew
Nenny ketu’npit
curtage kismawlukutitesnen
42-300 kisa’toq
jbl pualg
75015Psychiatre ugtlue'uti
niveles nujo’tkisnek
virtuosoDate goqweigtug
Souscripteur kisapsɨnmuatek
CRADAT mnkimt
GRATUITEA pajjoqaq
Tjukurpa Na’
KitchenaidLes pestie’wa’laj
Saint-Vernier Pasik
6534Age kejitoq
Fégréac Mi'kmawe'l
percussionBoulonneuse pestie'uti
senenews pastek
de42 kisiku
JET7 apoqnmuasnik
Ajite sa’se’wultiekipnl
Boucly wtmtmo’taqney
auec Metue’ksip
Déclarent kisa’sinu
wrestler tel-maliaptmumk
Jiajia tone’l
Soussia ewi'gas'gsn
carte3,5 ntutma'tiji
raïons Peskewiku's
Atlantica-Séguier giguow
dynamiqueLes natgima'tiji
5016 ignmuataq
semaines.Je tons
toujours.- Ireland
53.2 aji-kina’masin
Donnybrook minua'lultoqs'p
Ammanford meskeyin
Camjac kaqi-ilikwenasi
affront mime’jue
Batteri

D203 Nuji-kina’masultitewk
1600- maliaptmi’tij
escamotablechambre apankitatim
Lonnberg Samaliaewa'gig
forum600XT mawa'matultine
lock-in maliaptmi’tis
ossification mkite’taqney
montpellierains iknemuetasinuk
1,005 Pekwatekemk
shikomori nuji-apoqnmua'tijik
Provencheres Maljewejk
apposa pa’sek
1BFonds pejo'tu'titl
Yeelight tekweywiekip
NomadeMeuble ut-utanmua
France-Maghreb ansama
I-Tunes 'gsalata
Saint-Aubin-de-Bonneval teljugu'e
Connaraceae wksitawi-ewanik
7376 metui
wassoulou ut-ektlamsetaqeneymuo
greco-romaine etl-lukwatmi’tij
Carlile Tua’luj
Zpar gsal
Shabondy ne’pataqatijikNenaqite’tmi’tij
bijū Peji-mittukwalkip
Kaulf l’nu’
Analisis ut-lukewaqen
--Bernard MacDonaldo’
magazinesImpression 'gji'nmu
Shrew putu
ParisIntera tlimastesk
Ouenzé ligutinew
Cydnidae wunaqo'tasik
LAROUI emeteskultio
french.xinhuanet.com nikwenawemk
Psychopompe Flor
.3em Guernse
Ulldemolins nklamuksi
BENHAIM 'gji'tutew
Voellerdingen Nike'alme'si
--Futures elti-anko’tasiksip
56Merci sikeniktukewaj
Goodreads ajijgo

Julià amskweseweyaqq
OcéanAccueilQui naqani’katmi’tis
David2017-03-19T00 Se'sukul
37,87 sk�te'kmujk
Elange getlams'tua'tit
Kiyohide alsutmi’ti
Plannification alasutuo’kuo’m
Kagge nulmikjijitunew
ratine nu’kwa’l
plastiqu ignmuinen
période.AdressePour 'gml'gigno'tim
Summerdale neggul
SportAntoine nu’kwa’q
Détermination emqatu'si'k
baindelumiere eltaji
Paquis etlite
Rehainviller moqopa'qigtug
anti-dépresseur amalkatew
Tadevosyan amalkates
Caylor maw-kina’musnik
TerritorialePlan pekisula’tiji
Hors-d amalkatem
lolil Poqji-wi’kik
Asnieres-sur-Seine mawi-ksala’tijik
Monceau-le-Neuf wel-pmiaqsipnl
Clioteux ika'tan
HonneurOrdre Wije’wut
BOUSSY ewi’kikemk
Cadettes wa’toq
35345 Pilue’l
EmmaMorgane Pilue’k
Milhy telui'tmi'tis
Hermaphroditus telui'tmi'tij
nyzwokTopanga kmtniktuk
Devenons jigs'tmutiwoqo
RabotRabot e’pite’ji’juek
Thua waieknap
rouergates emittukwemkewe
josas kesi’ene
arabo-andalouse ntelisqatulek
StoryAll A’newite
puissancesconsole pemlamutimi’tit
Frasne telwikasinuksip
talker wekett

microstructurée telueg
Ð Alberta
Offene ektapekiakn
artefacts pemwenaqa'toq
Benjen teplotaqen
CASERNE telawsultijik
auto-éliminer esgwiet
HorreurVeniseWestern etlikwenuj
Khalilzad wasiantejk
inrocks Jonesaq
chamoisSupportsHiverVêtementsHautsBasChaussettesChapeauxSous-vêtementsRaquettesHors-pisteCourseRandonnéeEnfantsRécréatifNouveaux melgatpa'tinewaq
rétablissementRemerciementSaint Our
repas.C' naqt'g
HommeVestesTee tel-piskwa’q
Coacoochee –na
HôtesLocation kamik
RennesCasa ketapekia'tij
LogicielPortail na’taqamto’kekisnl
Facebook22 Ika’tatimk
Comté355 Aji-wetqane’k
Paquetages ga'qana'tas'
Ciluba qaliput
Wrighton sitmug
Staniforth welkaqnik
Bourroches tuopiti
hoplà Mawi-amskwesewe’k
Saint-Anschaire teli-ktantekemk
DFASM litaqwi’kikemkewey
Breuzé elugowiji
vitrerie-miroiterie ala’liki
AIRFREE alamiaqney
Großtraktor eliwsis
Earthworms eliwsip
insociabilité wicuhketomuhtuwok
Schübel juji’j
SOFSILK taqewo
Consultoria mimajuinualsi
14Or pgisinap
Berlandier Sa’
Häupl tlamuksitaq
92I Whitney


Doodling pemiaq
38515 mawiwjit
Invité14 pemegegnu'tmuatl
VogelauLe ilsumgutaq
SCIPION epi
oujda the
Jugoslavija ketapikey
Line ekina’masipnik
HNEC apangitugsi
Wham ewi'gmi'ti
quadrillages mikemaq
Trololo kekna’mua’tit
Atmea kenuataqen
L551-1 kiso’tmek
Pulligny suliewe’l
ESCRIME weskunk
Kijowski Vice-Presiden
GrisCuir amasenug
fureteurs tegpaqpa'sit
Kéty eimu
ChainRessources Newel
lhumain paqalaiultitoqs'
barabans eimo
Laupa assuman
HyundaiFrance eima
30à eime
DGTRE meski'k
SPS (Bernie
enavec uggwitl
mariez-vous 'msntoqs'
Jae-wook nikanpukuip
Hutrel np'taq
cirés “bull
Zinaïda Brunswickewa’
hommes-chats etl-kwitame
Uthaug ntininkMijua'ji'jk
valois nalkwenasikl
TweetCommentaire tapusijik
Playe ketmaqseto’jik
laccueil oqwatnuke’
gratuite.Affichant gisa'lugsitoqs'p
86018 pisultijik
newsletterSouscrireDésabonnement1Après Lee
volSaut piskweta'ti'tij
promosFenaisonCourroies gisgug
Scarpellini peji-wije’wa’tijik
Wampserver telteg
dekbed teltek
Ludiver etl-mulqat
LibertinePromotions tel-mawa’luj

--TARN-ET-GARONNE ketu’
Mineralize wejkui'aqmit
expertiseCadre kepteta’sik
18399 keptin
MissFreegun wsitawu’lkwekSe’sus
Bretonne keptik
aliment-terre-barvalle ksamuksinKulamo’qualukun
leash saqatuetesinEtuk
8x60S telue
Biologiques Natami
Hamoutène Brook
trending Napikwanji’j
Gorbok Kisapniaq
feldspaths weloqataleki
SneakersNStuff espo'qwas'gl
2007Mercredi waltesta'
boulotCampus A'newim
TranquilleLangue siaw-nastektn
rase-mottes snawey
10273 nemu’jik
12328Date 'msnmnew
cheminais 'gtlue'utiwal
Nguyen-DihnLycées alsutmaqnn
vulvite waltestaq
Vudu gepmitelma'tigul
Yeavering Teli-pkijiaq
EXPERTES ugtwi'gatigng
Bruzzo wejgu
HAMBURG plamu’
sécuriséService malsano’kuo’
Egarr eskipetmi’tij
TabacSaveur mkumi’l
0539 iganigjitegewinu
21614 kispisuney-iktu
Escazú Jipji’jk
Menez-Hom HMS
Désencombrez telitpieyas
60673Date el'telmagupni
26bis Miquelon
demandeLogement piamasital
Okinczyc nuji-tewakitkis
Parsy kesek
Bagy nisiaq
Berthommier wasuekwikasijik
Theeuwes Jilaptoq
hierarchies gtlams'tmoq
15-16h 

199,00ComparerComparer wmumk
StrasbourgHeleninsel Elkima’tisnik
Crespadoro Cashek
sommons ke'kwa'l
sympa2 inaqnk
1883-1973 teluwitesk
37Préférence pikwekl
non-skieurs kikwajual
TTIP ewe’watl
--Trackstory Mimajuinu'g
Turowo A'newultijij
perverties a’tukwetew
256G nakuse
Molezon wenaqa’to
Floette nuji-kina’mues
rondelles- nuji-kina’muet
diminuer gistesguane
delli kwisl
Fransures jackhamme
MerignacKeep wise
forfaitAndroidiPhoneWindows wisu
Cisel Ansale'wijig
51347 petgimatl
euler 'ntulnaq
DiffusionsMessages tl-tesket�sk
pattes.La kaqamit
ventilateurPlaques qalanej
Danielssen out
Wautoma klu’si’pSape’winu’k
Arsan Egimaji
numér nkesalnine
CMardi kinu'tmasin
intégrésSystèmes 'gtlams'te'
orphisme …
PlastiqueTasse O’pla’tekemk
DS216se kinu'tmasit
sociation –
GF-Y tela'tegepnig
méchantes ’
avertissement-extrait ”
Uwins “
intérim kmu’ji’j-iktu
Excellent4Très tl-lukutitaq
Colección weskumu
AUBRYLe wsiskw
5755Localisation ignmuitl
Grâce-de-Dieu aji-kate’kemk
activitiés msnmi'tigw
LehningLes Painta

11528 Nike’Pie’l
Shâtibî Mimajuinu
Hockeyeurs Ejigliwsit
Teth breillonsl
Koneru eteq
clamsé wekisitaqanitEln
Buttes roun
Aérographe etek
TiraneHeure etel
engagiste pastumkewa'ki
Souza-Cardoso pejita'tij
nucléo-cytoplasmique mimajuaq
suivra-t-elle ns'tuo'ti
entretienL' wespekianuk
Gracq weji-eleke’skumi’tijSe’sus
Cairoli kitoqitaji
Merighi kiskaja’lajik
déstressante mimajuaqnminen
Inbel wejiwula’tekemk
Filippus Simonal
Hueneme pekisulu
bénéficieras nipispaqanigtug
1Patrick ‘'Nqaluloq
Roselló mi'soqo
Hedrick telimugsieg
ski.SociétéNous muskunamuksultiliji
profiterai plna’tijlJel
AuteurMessageLoup mena’si
1924-2000 ul'te'lmugsitoqs'
tower-defense patlia's
canicien ji’jkluewuapi
Macheco nu’kwa’qek
REFLECHIS ewlite’lsut
redécoréesSiteTrès katua
Bertelé pase’k
Bouguereau To’q
139,98 etli-alsusultiji
Iraj pipukwemk
fàp kenoq
XXXVI newtiska'q
Suessa unaqapemultio
Fleurier Pesqunatekewey
Padane majulwatijik
Trabzonspor qq
Blosne qs
bainPèse-bébéPoubelle keluwah
Preparatoria nuji-kina’mue
véra m

Federici mnuekeya
BREMA welitpita’q
Guezennec nakami
Tigerwing ta’puewe
Железник ika’tuaten
--Géo-Sites tela’taqatijikta’nik
Josephina ta’puewi
Procycle kiskatpukueta’sni
conspira lukwatasikt
Hydroxylation miawnipk
Sauveplantade wsisqunk
coucheOuverture Skijinu
63149 Nuji-kina’masite’w
WillcoxSuprême ugtejgewe't'p
Digit-photo.comPlus gugunatoqs'p
--Chelsea tel'te'tg'
labbé wlapettaq
ClO2 li’sm
CIMETIÈRE wesgutmuloqopn
Erbalunga pestie'wa'lu
8593 ewikasikes
老子 ewikasikel
dö ewlite’lkaqan
Amazon.Livraison papuaqn
Monsta wikianek
Liaquat kejituasnl
Meyer-Hetling etl-lukweyap
individuelleProtection lamikuo'mk
C04 wlpiskwa't
Thank' e’plewi-psaqi
Melaka samqwanigtu
exploitant pkwasaq
suluk smaqkitasi
Brentano nutaqik
KorandoIdéal wjijaqmije
YouliMessages ll
dextres loqte’kniketki’
BiblioML kaqamultijik
Guéra Amalintutitewjek
ARRQ Kisne’pe’j
tchatch emsenmenew
1867-1942 mesnme’k
Bootstrap Cove
Dziekanski telucioq
postpartum akenutemaqenminal
Cassez-vous napwikaqenjijel
bushido “Tatuji
Blagues

débarquai kisehtuhtit
huîtresLa piskwapa’q
Canut e’nikitjek
hier.26 jipkelmule
acticles mlkiknewa’l
Gharbeya we’jitunew
Compilateurs Mi'kma'ki
touquettoise kisi-amalsiktmat
crissent tl-lukwetaq
Gothiques miwatmuaten
Mitsumichi awsamelknuk
Genève-Annecy kekenutemuip
još iga'lulin
Edit. 'Ntjijgluewjmg
70.036 NUK
Guincho inaqenukel
ultraviolet kesikawi’pik
injectes kisi-kina’muey
Kąty Ta’nik
parenthèse psweso’q
Kamijo etl-lukwejek
Jinto wásó
crèvent ewlistui
children kna’taqne’
distribuées iganpugultijig
WJZ-TV Matntimk
Boher kelo’tk
instagramInstagram qwelmajitasimk
1954-58 alame’sikenew
tatan alasutma'ti'
environnementFormation weji-wisunmaq
âgéePersonne etl-wlqat
Scevolle nukmijinenaq
Mephiboscheth etl-kwitamtiek
ôteront makkelmulekWa'so'k
tomb tleyawik
Kenyatta Elnuey
pleasurable tleyawip
Marchand-Baylet Provident
échouera tleyawit
Mougeon Summink
BANGLADESH weji-kaqta’wjik
Verdeau “Kiskuk
Saint-Jean-Bonnefonds Klujjiewto’t
St-Germain aqqstawa’tew
1513-1521 jijgluewji'j
PsicheeSuper w

MINIMALISME migwite'tmi'tij
Koramic Kjijitaqney
Interrelation gtlams'tmug
ahahahahaha getlams'tuiji
RÉVISION alasutma'ti'k
incube tijuwaqa
Anushavan etekipní
commentairesVous Pkesikn
PAU05 G'pnno'l
FIABLES tli-ankaptasik
Ousted Pa'tlia'sk
A.S.B.L. pektaqteke
kmCité Pestiewataqetim
Oise- Gisa'lultoqs'p
guettez jukwita’new
pneumaticOutils gisa'tug
1875-1925 kwiluwasultiji
proliférait nastaqa’luksiekip
principaleContactSitemapRecherche e’wa’ij
67349 etoqtasit
Xanthocanace wnijanua
réitération emtoqwalaten
.Outre nipk
Decharge Nutjinen
cannois nipe
95H lami
CanonDépt. kisia’tijik
technologieCarteCarte pkwasaw
bâtimentAdresse tel-mil­lukutiek
SpaceXPartagez Gjinisgamewigtu
Solyte ala’tu’n
Nepos kmu’jinmeskilk
prairieL iga'qt'tew
Albert-Auguste wikis
0Illustration welgwitgl
sauritus wiaqteksipnl
décorativesVernis amalkaj
J.B.M. amalkam
toxiquesirritation amalkan
Bertazzo kualasoq
Brinkmatic Negro
Ugron gelu'lgl
vloer mikwimatl
MARONI lnui-mtmo’taqn
FilairesMicros amalkas
RD2-seed03 amalkat
n

1871-1920 Millville
SCHUMPETER tijik
Girolamini tijiw
951381 ut-elnu-oltimkewey
mosaïqueMENTIONS pite'mat
berf Joeal
DEMOISELLE minu’nsite
biokérosène ”Na
Week-end380 wutmo’taqnuo
droitSciences ta'sewi
cohabitons pantetekl
Remi' gigto'qopugua'sit
Mourzouk wunijanuaq
Billecul amgwes
Chaetodontoplus kisikuo'p
alcabala wejinu’kwalsit
Cruyt Kisa'knutma'ti'kw
Fuster mekenk
.Alors alasutmanej
Tchapalo ‘Apugjig
Stentors amaltu’amk
Terdav pleku-iktuk
KNIGHTS “Amgweseweieg
Gorutô etl-wutqutasijl
36,37 wenaqteskek
parure lukewinu’sk
Fauquembergue iknmasipnik
raffinent agnutg
BvlgariCartierChanelChopardCorumFranck i’paji
3169 Invernes
bureauPlafonnierLampe Greetings”
87.2 “Tel'ta'sultioq
stehe mekamuktenu
séjoursPowered Pugwelg'pnig
Mompart nekmowe'l
défection telawsultimkeweymel
9931 pmiet
71161 pmiej
Xiring pmien
19354 pastunkewaq
CKT keknue’ksip
المغتصبة ne'wtewin
34,01 kisi-l’kittew
Abb. ne'wtewij
substituerait ne'wtewit
parelli ‘toluhkewakonuwa
C3300 Ugji
curiosity nepga
Pointillisme Cre
cul

Vaporware na’talukwem
Epandeurs kestawite’taqan
Claire2017-03-12T00 nesuguna'q
phalanstérien Apsalkikwa’sit
Nabaoui mawikwaji
sujetsMass Gejig't
PARRAINER kepenol
malthusiennes saqpiku’ni’ewunSma’knisk
Anthocoridae “Apaita'nej
Roccella o
2016-10-28T00 piptukaqi
JujuTh unaqa'lataq
2016-05-07T00 pekijipnet
rumsteck wi’kiknapu
Trombadori pittoqsit
Geca nalkwenikemkewe’l
PARLANT Scotland
bâtimentSprays siawqatkis
POLLY sespo'tege
Eslövs l’kitte
re-lancer ami-kjijituap
Cencig sqana’sk
Tazaghart jiksitmui
1866-1955 kqama'tayanek
Laix Kesikewiku
Hsiao-Hsien pema’to
Scaglietti kapitanewip
Taroussa Hall”
tircis Etamul
Sextuple awintawa’qa’teket
tudier petkimut
voirLits wenmajita’sultijik
Tiverad Nasoqtesgmegewe'g
449Inscription o'pltesk
enceinteEn Sip
Stoic Siw
Vicariat pugjitew
Dratsang wetapeksini
PartenariatsChamp eluikenekel
SPF25 eluikenekek
Recalibreurs eykik
Hrusice elukwe
KnowledgeManagement telo’tk
aérienTransport elsaqasik
nandy matgwetuatl
Rigolus kasiwi’ku
Liebling Lauchie
vite-fait

cordelettesEtiquettes sikutesknuk
Cashstore sangewite'lmagwi
lingePanierSALE amgwesewaq
ActuComparateur lugowinu'
07450 mime’j
Géomètres Toq-kwitamti’tisnik
cadreLa Naqamasite’k
16Gala Alimati
LeoneGouvernanceGroupe Elmita'jik
Val-ès-Dunes Eltu’nl
AnneActivité opla’tekemkta’n
Mnichovice skitl
anteriore wetapeksultisnik
haq skite
Beauquel lukuti’tiji
σII tapsun
Emprunts wlaku
ligote smalkiewey
drageoir ut-ektlamsetaqenmua
Cistulli siawitatij
piques mulinn
Mackler mulink
Adrià “Etl
LOSS lita'sualitoqs'
GARCIALycées ntinin
Clubic.com etli-ankwo’tasikl
24301 ukjiksun
OccidentalLe ukjiksul
Twinlab ukjiksuk
2015Article kelusu’aq
DotEmu kise’nikeya
Lincke Me’nk
gaelledemuynck waltestaqnn
ElectriquePièces tapukl
Waagh waltestaqnk
Slizer ne'pa'io
Champeyroux Lpa
Aurelien “Etli
9ader kinua’tula
Sorraia elege'witewi
TAIJI kisitaqn
CalvadosSi kaqituek
ActivitésRandonnée Johnson
Hotelest nastuete
loisirsCircuits pem-we’w
6-22 'gmimajuinumg
--CO-VOITURAGE welasuwaqn
EcoRev taqwey
pro-recteur nutui
2

rez-de-chaussée13 tli-e’wasitew
--Cthulhu mekite’tasik
OcéaneFalbalaNombre klutjieweymkKekkam
20872 mawimtue’ke
produkt welkisitoq
Ga' putuwaqeney
Erazor tapuiskimtlnaqnipunqe
fluvialLe leskiken
RackEgaliseurs tahaluhp
2017Catégorie tel'ta'siteg
Degranges wiji-tkweywinPemawsiek
Vural tesipunke
1919-1937 lnua'lasn
Branly-Jacques asitemugsitoqs'p
EnoPlancha wenaqa'silisnHe
Rampan atikneta’ji
Yaping kisolutasi
Préaux DS
Heidnik Ne’wte’jit
1818-1901 Papewit
correctement.En kla’qij
Iti koqwajiaqewey
008800 De
ascot jipalutki'k
Montuïri np'te
fattore ekina’matnewe
candis qata’skw
di- astualuksinew
APV nanipunqekl
AutrePage usgumi
--TIPS mittukwalanen
diaphragmesFiltres newgtungt
helenesuze ntuisunminal
Metz-Campagne piptoqipska’tumk
hdp tel-lukuti’k
Yosan ut-eksinukowaqenmua
4kpar newgte'jin
19042 gun'tew
Manteca newgte'jie
running-back ama'tuip
TRUCK (Shubenacadi)
clésPortemanteaux katuaq
lançé newgte'jit
Duddle pajjoq-iktu
Christophorus asita'pugueji
notee pkisula’tij
Klebefolie10 Gillie
M

--Lushie ela’tu’tij
Dranses telimuloqop
Fumoir wunijanaq
sociauxAudit Welqatmumk
8,5J eltaqemiejik
Memar telue’jik
M-69 Dan
tetti MacMilla
T.V.A ankui’kaye’
Angaran welkwijalatiji
cuticulaire pingowi
750cm kitma
PHYSIQUE-CHIMIECollèges nemitutikwel
G.19 wapna'kiewaq
AudioLe toqtekl
Zico Rubha
100,1 elte'mi'tij
2012-10-15 sespite'tmi'ti
13264 we'jia'tisnik
11-01-2003Belgique yali
jiewos piteley
espagno petgimapn
Jamu Nikma'ji'j
--Charley telki'
Paquis oqa’t
Baecher Saqmaw
Caslino ministl
2016Projet Saqmaq
placozoaires soqitaq
2017Messages Saqmal
volleyeurs paqesapekalat
Calvais ka’qinuteli
faquin kiskina’masultisni’k
ultramarines Getmite'tg
Domu wsitawi'wen
Sauser waju’ejik
tidurBlois weskwa’tasik
57438 ewlite’lmin
recherchemes kisikuwi'skwaq
RicheuxLycées jigla'sites
LesCreches.fr kespiet
birrs Emset
Jacanidae apoqnmultew
sportsmondeMobilePlus We'gaw
desd. Jigs'tmuioq
RF-CLOUD ketla'msitasi
nucléase ika’qsip
SpeedCheckerLe te'sikl
fricadelles teligsug
0.05mm October
1829-1897 weci
acco

In [20]:
# Overwrite every mi_dictionary vector with the vector of the source word it
# was randomly paired with by make_training_matrices().
# NOTE(review): `copy` and `count_no` are not used by the active code of this
# cell -- confirm nothing else relies on them before removing.
import copy
count_no=0
#j=np.zeros(300)
for r in range(0,len(ti)):
    # The triple-quoted string below is a no-op expression holding a disabled
    # variant that averaged source vectors per target id; it references
    # `list_duplicates`, which is not defined in the visible cells.
    '''#print source_matrix[r], target_matrix[r]
    #print len(source_matrix[r]),len(target_matrix[r])
    #print ti[r]
    p=list_duplicates(ti,ti[r])
    #print p
    j=np.zeros(300)
    for l in p:
        #print l
        for x in l:
            j+=source_matrix[x]
            
        target_matrix[r]=j[:]/len(l)
    count_no+=1'''
    # Replace target row r with source row r (this mutates target_matrix).
    target_matrix[r]=source_matrix[r]
    #target_matrix[r]=source_matrix[r][:]
    # Store that row in mi_dictionary.embed at the word's own index ti[r].
    mi_dictionary.apply_cop(target_matrix[r],ti[r])
#print count_no

In [21]:
# Write the overwritten mi_dictionary vectors to disk in fastText text format
# (hard-coded absolute path; an existing file is overwritten).
mi_dictionary.export('/home/apatra/Desktop/work/lstm/data/3fr.vec')

In [22]:
# Write the same mi_dictionary vectors to a second hard-coded location,
# inside the fastText_multilingual-master directory.
mi_dictionary.export('/home/apatra/fastText/fastText_multilingual-master/3fr.vec')