In [1]:
import numpy as np
import codecs
class FastVector1:
    """
    Minimal wrapper for fastvector embeddings.
    ```
    Usage:
        $ model = FastVector(vector_file='/path/to/wiki.en.vec')
        $ 'apple' in model
        > TRUE
        $ model['apple'].shape
        > (300,)
    ```
    """

    def __init__(self, vector_file='', transform=None):
        """Read in word vectors in fasttext format"""
        self.word2id = {}

        # Captures word order, for export() and translate methods
        self.id2word = []

        print('reading word vectors from %s' % vector_file)
        with open(vector_file, 'r') as f:
	    print ('1') 
            (self.n_words, self.n_dim) = \
            (int(x) for x in f.readline().rstrip('\n').split(' '))
            self.embed = np.zeros((self.n_words, self.n_dim))
            for i, line in enumerate(f):
                elems = line.rstrip('\n').split(' ')
                self.word2id[elems[0]] = i
                #print (elems[0])
                self.embed[i] = elems[1:self.n_dim+1]
                self.id2word.append(elems[0])
        
        # Used in translate_inverted_softmax()
        self.softmax_denominators = None
        
        if transform is not None:
            print('Applying transformation to embedding')
            self.apply_transform(transform)
    
    def apply_cop(self, matrix,i):
        self.embed[i]=matrix[:]
    
    def export(self, outpath):
        """
        Transforming a large matrix of WordVectors is expensive. 
        This method lets you write the transformed matrix back to a file for future use
        :param The path to the output file to be written 
        """
        fout = open(outpath, "w")

        # Header takes the guesswork out of loading by recording how many lines, vector dims
        fout.write(str(self.n_words) + " " + str(self.n_dim) + "\n")
        for token in self.id2word:
            vector_components = ["%.6f" % number for number in self[token]]
            vector_as_string = " ".join(vector_components)

            out_line = token + " " + vector_as_string + "\n"
            fout.write(out_line)

        fout.close()
    
    
    @classmethod
    

    def __contains__(self, key):
        return key in self.word2id

    def __getitem__(self, key):
        return self.embed[self.word2id[key]]

In [2]:
class FastVector2:
    """
    Minimal wrapper for fastvector embeddings.
    ```
    Usage:
        $ model = FastVector(vector_file='/path/to/wiki.en.vec')
        $ 'apple' in model
        > TRUE
        $ model['apple'].shape
        > (300,)
    ```
    """

    def __init__(self, vector_file='', transform=None):
        """Read in word vectors in fasttext format"""
        self.word2id = {}

        # Captures word order, for export() and translate methods
        self.id2word = []

        print('reading word vectors from %s' % vector_file)
        with open(vector_file, 'r') as f:
	    print ('1') 
            (self.n_words, self.n_dim) = \
            (int(x) for x in f.readline().rstrip('\n').split(' '))
            self.embed = np.zeros((self.n_words, self.n_dim))
            for i, line in enumerate(f):
                elems = line.rstrip('\n').split(' ')
                self.word2id[elems[0]] = i
                #print (elems[0])
                ini=np.random.rand(300)
                self.embed[i] = ini[:]
                
                self.id2word.append(elems[0])
        
        # Used in translate_inverted_softmax()
        self.softmax_denominators = None
        
        if transform is not None:
            print('Applying transformation to embedding')
            self.apply_transform(transform)
    
    def apply_cop(self, matrix,i):
        self.embed[i]=matrix[:]
    
    def export(self, outpath):
        """
        Transforming a large matrix of WordVectors is expensive. 
        This method lets you write the transformed matrix back to a file for future use
        :param The path to the output file to be written 
        """
        fout = open(outpath, "w")

        # Header takes the guesswork out of loading by recording how many lines, vector dims
        fout.write(str(self.n_words) + " " + str(self.n_dim) + "\n")
        for token in self.id2word:
            vector_components = ["%.6f" % number for number in self[token]]
            vector_as_string = " ".join(vector_components)

            out_line = token + " " + vector_as_string + "\n"
            fout.write(out_line)

        fout.close()
    
    
    @classmethod
    

    def __contains__(self, key):
        return key in self.word2id

    def __getitem__(self, key):
        return self.embed[self.word2id[key]]

In [3]:
def cosine_similarity(vec_a, vec_b):
    """Compute cosine similarity between vec_a and vec_b"""
    return np.dot(vec_a, vec_b) / \
        (np.linalg.norm(vec_a) * np.linalg.norm(vec_b))

In [4]:
import numpy as np
from random import randint

In [22]:
def make_training_matrices(source_dictionary, target_dictionary):#, bilingual_dictionary):
    """
    Source and target dictionaries are the FastVector objects of
    source/target languages. bilingual_dictionary is a list of 
    translation pair tuples [(source_word, target_word), ...].
    """
    source_matrix = []
    target_matrix = []
    ti=[]
    count=0
    for  target in target_dictionary.word2id:
        
        count=count+1
        #print source, target
        #print source+1
        x=randint(0,len(source_dictionary.word2id))

        #print x
        source1= source_dictionary.id2word[x]
        print  source1,target
        ti.append(target_dictionary.word2id[target])
        source_matrix.append(source_dictionary[source1])
        target_matrix.append(target_dictionary[target])

    # return training matrices
    print count
    return np.array(source_matrix), np.array(target_matrix), np.array(ti)

In [6]:
en_dictionary = FastVector1(vector_file='/home/apatra/fastText/fastText_multilingual-master/eng.vec')
mi_dictionary = FastVector2(vector_file='/home/apatra/fastText/fastText_multilingual-master/model.vec')

en_vector = en_dictionary["one"]
mi_vector = mi_dictionary["newt"]
print(cosine_similarity(en_vector, mi_vector))

reading word vectors from /home/apatra/fastText/fastText_multilingual-master/eng.vec
1
reading word vectors from /home/apatra/fastText/fastText_multilingual-master/model.vec
1
0.04759287163908247


In [73]:
mi_dictionary = FastVector2(vector_file='/home/apatra/fastText/fastText_multilingual-master/model.vec')

en_vector = en_dictionary["one"]
mi_vector = mi_dictionary["newt"]
print(cosine_similarity(en_vector, mi_vector))

reading word vectors from /home/apatra/fastText/fastText_multilingual-master/model.vec
1
0.04839652896473183


In [74]:
mi_words = set(mi_dictionary.word2id.keys())
en_words = set(en_dictionary.word2id.keys())

In [75]:
# form the training matrices
#from copy import deepcopy
source_matrix, target_matrix ,ti= make_training_matrices(
    en_dictionary, mi_dictionary) #, bilingual_dictionary)
#print len(source_matrix), len(target_matrix)
# learn and apply the transformation
#print ti, len(ti)
#target_matrix=deepcopy(source_matrix)
#print source_matrix #[60][9], target_matrix[60][9]
#transform = learn_transformation(source_matrix, target_matrix)
#print type(transform)
#print transform[299]
#en_dictionary.apply_transform(transform)

Neida kisi-mawanqa’tumkek
Ramprasad aklasiewaloqsultiji
ofmaterial esma’titl
Debility gelulatl
alofa etlitum
JKC Malpalewitelemut
Kirghizia gi'lewei
900px Western
preachy litaqnwikas’kl
Munchie mimajuinuigtug
Sadir Valle
Godart atkitemi
ContactOur mikwite’tmu
59-71 maw-wlamu’k
weekto Kaplno'l
Bibliomaniac kiwto’qa’sikewe’l
Kovesi elakutultijik
technology.Why apgwa'tuan
Podéis jijgluewjig
liom iknemat
prefference pma'toq
ÐºÑ nemiatijel
40g wels'tua'tigul
Riegelsville kajjimenewa’kik
╔ wtuisunmual
Derivatization iknemaj
H.3 wuji
Fernelius wejgwa'lawoqo
wаlk teke’k
4ish nasgua'tiji
Tiree nuj-seknika’tijik)
VLY telkisi
tyna mawelkisni
azkals a'tugwaqa
últimamente tetpoqpilaqn
Nutella-stuffed Naqtiki’l
1910-1936 pem-ajelkik
240-seat westawu’lkw
increases.It pajjoqe’kemk
Kholodenko kidi
Stepdown kisikuitl
Kreisen ukwita'q
deber apu’ksinew
Breach seskutaq
KWIM la'lukete
sister.She wije’wmi’ti
spitted ta'n
areaContact un'jan
tosse gji'jiaqat
Bajaao nutaptukl
passability Vernon
HuggerZ28 (rattl

ingeniero saqmawel
aust Unama'ki
Felbridge Wikewiku's
e-drama wa’so’
1000gr pqwajuika
Firecrest tetemitisnn
Rettie elisulti’
Stagnancy tel-lukuti’tij
LBCF lnuekatik
andCharles lnuekatil
Bokura wikijik
tea-lover mil-taqne'wasijik
UKCA kelkawekl
18-64 wejita’ji
wsize ajawtik
650I Luce
under-five ut-kinapmua
NAACP kisi-milamkwa’lujik
serving.The ksnukwaqn
Adoring tla’ten
Pre-medical 'ntglusuaqanml
6243 maliamatisk
perfectly-fitting paqasaqali
A-549 tela’tekemk
Langowski -----------------------------------------------------------------------------------------------------------------------------------------------------Mes
LAICA wi'gas'g'p
1T0 pekije’kek
bymy pekijialutkek
animal-plant Aplamo'
stunning-looking Jikeyaqip
ANNOYING un'jann
pure-blooded Aimutikel
Keechelus Epjilaasi
Home-baked sign'tue
semi-modular “Negm
Coner tluetisk
LexLuthor pekwatoqsip
ronto Kepten
Unigenes Aplamoq
Gologorsky etlitumk
progerin pkisintew
1870 ketu’npit
Ermes kismawlukutitesnen
life-building kisa’toq
sacrum p

Upad ‘Lesui'paq
worra skwijinu'k
Freaksville tinink
Niedermann kisnateli-ketlamsitasij
SocialSafe mattaqte’kne’
Goosman pekisito’q
slugthrower Nipialasutmam
250000 Mekaqnji’j
Barkhordar Maw-wlkasipnek
Naturalists mknimi
Pasetta ilsutmuam'gl
Marchio wetekewaqeney
said.Ron maltikle'wim
Vesga jigs'tuite
whatnot. jigs'tuita
Thigpen tela'laji
three-ounce pekwatuie
Saalburg Kejikawe’l
X920 ika’tumkis
Dotrice ktalasumuli
knot-tying telamko’tasik
CFL.ca Ewlgwijuaqan
Burkas o’pla’lsɨk
Στοκ me’kiskuk
Meerapfel ekitasik
Boorgat Ma’natu
Sovietism pejo’tu’titl
Camera1 kejitu’n
Convegno Herman
prayerThat kinu'tmuatoqsip
anacetrapib Epmepikai
Dimos nasolatiji
wogs tlimulan
Mood-Boosting Goyetch
shold tukia’tita
nine-headed Ika’qsip
ReviewIf ewlgwija's'g
06.36 glululuoq
Mirlis tapunemikel
hestitation aklasiewi
kumaran ankamiw-kjitoq
seraglio pegisinugwe
halas getlams'tg
800MW pejiwsultimk
fasfa waltestamk
okara npitemenew
ADCIRC elui'tmasip
thatother p'ta'utigtu
RedThis 'Gtlams'tasultioq
delivery.It w

supertelephoto nmiates
topic-focused teleke’witemua
185 taqamoqtek
Rechid o’platekep
bornprettystore.com Etltoqo'ltimko'kuom/Newtsiniw
too-easily nekml
anything.Let nekmo
8.5cm. peputestoq
earn-in wjinapukwalanew
Veliyidai matenaqewaqeney
Ndonga Newtejit
Annebella wesua'tua'tij
broughl Maw-lukuti’
62.73 apoqnmatultinew
lossA wlqatmekip
man-days newipunqekl
20Nov nutua'titl
wimmenz weji-pqojitasijik
chasey kesaltimkeweyiktukNuja’tu’
Putting wkwisie
dosimetrists laten
04106 wetkolwatemin
Wooks pejiwsisnik
2010.What wkwisin
reinnoirea lnu’
2030-2050 Robinaq
pay-day ankita’suaqney
quality-improvement ktutqutaqanmiktukSe’sus
EFFAS gisipugutmne
MapShare Atgitemultitoqs'p
Briefing.com Kaqi-kina’masijek
SX60 Kate’kews
8,508 epultisnik
Handcarved weliaqsip
Imperiale pemtajika’simk
Medroxyprogesterone kesi
mobas kesk
Berghe anqunte’map
landrum kese
Keeshonden wtuisunm
MedjetAssist teluwituoltijik
Comentar ektlamsetasi
Logan. wenki’k
35765 amalintuwaqenn
data-input kisi-npasmita’ne
ruffle-y aniap

NFL- tla'taqatine
k20 na’twen
STALEMATE Mattaqte’kemk
Haqiqa nemitunew
nixie Kiwkta’w-
live-aboards tel-nenujik
Mihic Unama’kikewaq
JobWe Jipuktuk
Setuid wqayij
teatre alasutma'tiji
FLAVOUR Klujjiewey
wrongful-death poqji-kwilmmkek
47421 Guide
condition.Price Musga's'gtn
Shannie metue’nukip
Zotac mijua’ji’juije
Kahli 'gtlams'tuine
FBP ekina’mua’tiji
time-waster Etl
Ne3 nmitoql
Well-Founded Nujjewigtu
Pescia mijua’ji’j
Valeriya ag
Fächer Jol'ta
Aril al
xviii. an
2014-09-24 aq
challengeNext ap
preference. as
VSAs au
nonissue at
250l aw
Chaokoh pematutijel
Abebooks.de weskowasik
lingham metuite’tmuksip
urand Ta’ntelitekemk
Brella newtipunqe
Polaire mesna'tipnn
Guhan a'
7AAD ikatmuksin
vennen kejikawey
tribological Majulgwala'tit
Favre waiekapie’k
trilithon unaqa'laten
Gingerly a’tlaweknji’j
000002 sa’q
Pinckley telimuloq
spce Canada
incompatibly pipukwatk
harpist amal-aknutma’tijik
recips Kisiku
Alx ministli’skwaq
Counrty Mathesonewey
2006-05-27 na'gweg
Immie jigs'tuin
-Oklahoma nme’j
Sac

Cowtan te'pe'pni'l
exklusiv emittukwaltultijik
EMAILING mesnmi’tis
event.More tla'tegeia
adorbale telimulekip
1Blue jipatmunulsukuin
cocreators netawet
themes.A waltesta'tiji
19781 egsitpu'
griffiths gigji
LoadWarrior Zutphena
Co-Heads apoqnmuwa
farma Wesgumgig
dress-codes tepjikeyin
Wyandots kustawia
cuidar keytuek
Personality- iapjiw
boxThis nikana’toq
blogable toqankuajik
Rocka kmu'ji'
mySA.com. kina’matney
Mombear Calu
nanotechnologist Kelo’tmuinamitt
Mabank kwilmi’tij
Ästhetik Crawford
Rs25 attikna’timk
effi Nemitua'tipnn
53005 'pgisinug
WingsThe “Ango'tmui
Roads nentu'gwe
guidance. Wikma’jl
fraternal nekapikwejit
Sn1 teknewey
perras elnu-oltimkewey
Rede D’Escouss
Taxwise Mackie
sonoran “Wenin
22pt isku
Rinke tetpaqi-lukweta
TRAINOR weji-wlapesultijik
tomorrow.What nisikwi'sk
Nominalism skijinuk
KanadaQuiet Kji-eleke'wit
Modotti skijinul
Heeze tqamutatultinu
Jesus.When Kawskwi
CF41 musga'tugsitoqs'
Ellice qasqe'k
ligatured la’
GUIA jinemu
middle-game wi'kmin
SOUNDGARDEN 'mg'sng
dh

CloseLet wutqutaqne’kati
lahh a'suguatl
reUgious jigla'sia's
Chine etekel
parkingI Publishing
ffox nuta'
cabin. ignmugsitesnen
Mayordomo tl-lukwette
Triya ship
CodeShare eymi’tij
Transat Juku’e
Wisherd seioqwattaq
Etzkorn etlite'tmu
Thatguy Eltu’sipnl
Shanon kis-tliaq
sub-combinations pija’lusni
dialog-based etl-lukutimi
thinkthey nutaj
Zorbax etl-lukutimk
JacobA nutal
second-third etlkina’masij
3x22 nutaq
92.81 ewlite’lmi
Jewbacca weskuna’tij
nothinh telitumk
Ailis iulteskatultititek
fault-injection pualgig
1700th nikwektnukipn
REPLICA elugwe
9AM aji-ntui’skemki
CitySlicker kisapnia
osat kisi-tasik
Dethier skik
builiding iga'lip
TOURS Pastunkewa’ki
powerleveled klo’tmnow
Kassina wunaqapemua
Strongwoman elikuwa’nu
havnen Eymu’tisnik
BossHog eympiskiaq
Pional wlpiskwa’t
fishI mekawtik
2017-05-31 (Pas'g
macroinstructions kisimkunmn
Donal naqsunaq
SharingTwitter0Facebook0Google SYSC
Al-Rasyid menaqajewe’te’w
Jan-18 tumk
Unwerth pekwiksite’lmuksi
95817 etlewistuap
accommadating etatk
rebut

Gavignet wikikaqenn
luchadores tlikina'muksit
Lenswork Sko’siaewey
chuffin pipanimasnik
LEK Kmu’ji’kank
3,890 kelulkewey
Marchiori tepakwa’
Maqetta Gigjiw
pras pej-mittukwa’tiji
aidil Douce-al
Girl24 welkwija’lulkAsite-muiu’atmuanej
counter-space tetuji-wlipsetoql
unstiched pempiasi
95765 wte’pitema
Cresset gepmitelmatl
35-degree nit-op-olu
2012-01-24 temikewey
thornscrub jiksutuap
started.Please kis-wanta’sik
breakfast.Good waqama'tuaj
issi toqotesip
paralyze malige'
frontwoman ‘tplutaqn
half-wall kikjalukwej
Grener maliamk
silverware. litaqnwi’kikemkewey
TRUSTS o’plataqatijik
mxn mesnmayekpnl
DLK Ikenemuatij
Pflum newtuka’lukwet
0x7F WULITA’SULTINENEWKepmite’lmanej
Philaristai Unama’kik
34-1 lue'winu'g
FX006 wenaqietuajig
environmental-health pa’qalaywaqn
chhattisgarh ignmuagwi
Последняя Telima'titl
Jahreszeit ela’tim
think.How kluskap
Gampel nelij
radio.In telimuksin
teacher.A Dove
fabulouse Mekwayewakat
anti-Rabbit mawuktml’tij
Ratnayake Listukujk
Serviss panta’tu’tisnl
connaitre U

multi-occupant pejita'ji
bedroooms tali-pkija’tekemk
Hulusi 'n'tute
HYou ilanqo’teke
ANEMIA tipu’lewey
white-colored Ke’
cards.They square
S-15 megt'
two-transistor kepmitetasitew
munkar pneknmuin
Freisa pipanigesultioq
SILKYPIX Koqwajo’taqann
funicular apetimuaq
Rottmayer Tel-kina’maqik
Burniso2cd “Gjisaqamawminu
gorgoeous waji
dyktige Se’sus
KeyLargo “Ge'
Securis siku’skw
Webkins wisawo
portion telmilesik
Pauland samqwate
tweeter. wi'gas'g
summer.It ika'q
Soboro Nikantuk
Chf mima
6,297 mime
HARMER ika'n
Siegsdorf musgalsultioq
Çorlu lakka’p-iktuk
Somn nemi’tultijik
comments.If toqey
Coulgate atkitemulti’k
bullet-point mawi-nutqwe’te’w
selmer nutqwe'k
10-barrel elta’qik
ARPA-Internet pase’
.wbfs Royal
Compostella weja’tekemk
Putar kiskattek
LiFE nenmi
rnase mawikwamkewey
THEM.I nenmn
N-Type ukk
Vanderbeke pejiwsitek
Banghart nig
thenarrow gigtoqopugutua'tit
yard-waste sa’se’wa’lit
faster.That Nukmi’
Kokutou Nemitaq
Theory11 pu'tayji'jk
AgION assusultijig
YesFor wejku’aqamit
Hariett Le

temperature4 wikisenaq
buddhistic nasmisko’taqn-iktuk
Revodrive pa’sik
Lebensart kmu’ji’j
outsprints ewni'skopalikaqnji'
Tchefuncte Newgte'jit
InYou amalkewaqen
EarthDesk ewi'gig'p
much-demanded ala’suinu’k
behaviour.The panuijkatasik
AsiaInfo kloqowe
bluethooth Aknutmaqn
re-publishing wicuhkehkemici
D-Beat pkwatulkutowwlita’sultineno
Onepass ila’liji
bantuannya piluamugwiaq
lunching wetetaqeney
jhanas Eykipnik
BARRACKS awije’jk
Klinkhammer Poqjuikk
3,882 wamkik
Skärhamn petgimimg'
Fedder Mill
Taluk apajasitek
amasing Tal-kis-
AMME Perr
COld mjikey
PlayJune “Eskmatmi’tij
Threadspotting maliaptik
7,99 etli-mawta’sik
innert ktika'lin
card.Is wikuow
cardsYou Tla'tega's
Wol- Palasiaq
Newad ma’
China.On wikuom
Entrainement ‘Ula
Union. mkumie’jl
Fayiz Eltuek
5in mkumie’jk
USFIA Dingwall’
futo iknemuwetemkewey
Salubrious welmitu’n
super-freak negmeweg
percodan te'sipowji't
jobsSkilled Mikemewel
contohnya Mikemewey
contans natqapilawtik
style.Thanks Kwete
GMTIn wjietew
Underslung apajiwswatuti

10K. mimgwas'gtuaji
Info.plist. Heber
Alkaloids etlankuamkl
inveteracy nutalkienen
CAPI Siawqatmu'tioq
osse nkwisk
muxxu kinuwa’taqatijik
1,034.00 tán
capital-improvement sa’qewe’kl
revendications Carolyn
Goetzel pituimtlnaqn
mountainbiken sekki’sasijik
up.Many lugwatte
Emmitt piskweta'mk
ihese keleiwaj
Bo-Kaap kisa’tu’n
instep alankua
--flag kluljewtasimkewei
Saddar pite’mamkewe
power-laws koqwajo’taqnn
Raslan wukmi’eml
Alouds “Pipanim
employés oqwatnu
Kachadurian kinamaqen
33014 Southside
Yvonnes wenjui’simk
coursers panta’sitew
Cobalamin Westawu'lk
Ĺ ugjattesnu
Chaville tqamuewe'l
'atent Edward
Amazonis nasgwa'tatultipni
mathewi ango'tmlij
Zanzibaris espite’tasimkewey
🍅 toqa'maji
Portis ingute'jijig
bbms mikmaw
Gujan mikmaq
75ms tplutaqaniktuk
Michelsons maw-meskilkl
Mouth-feel nenua'tisn
Natufians ntini
GXL npisu
08731 na’msitewe’l
Huben piemkewe
Ifill tekweywa’tisnik
Kaustubha npisi
excusion Metua’lik
Mathewes etlqatekej
Coagulant wi’katiknji’j
Comancheria anquno’sun
handicap-frie

Ai-S Epitjik
H.D. mawita’tij
M--- saske'al
23440 l’tu’tij
Coasting 'gtlams'tmultoqs'
'Olmes wapniaq
16.71 pkwi'sik
Aslin mawita’snik
chairmans Ekitk
esport telui’tujik
biebs Pemi-aji-mtua’lik
i8i piskwetaji
JumpKing Skajmenaq
rule-based weskijinua’lie
and15 alo
grip-and-grin Jol'tan
tantra ali
Costarella ala
Khieu litaqnwi’kikemkeweyek
RECT alt
AM-7 nutuawoq
hammer- sape'wuti'l
Capclave Nasmisko’taqn
Dandelo tupkwanji'j
rea meski’kek
Inpaint telimapnn
cupy telimapni
nunciatures panta’tasikl
installations Sesusewmajukwejit
Restitution ugtelege'witemua
ACIC lia's
ever-present lia'n
macaca ekwitameje
Hammersteins enkasaiw
well6 ala’tuksip
Samcheongdong kmu'ji'j
Gumrah lsmi
Hendri kina’matnewe
counteroffer Sko’si
Disse Kualasoq
getai apaja’tinen
TeaEqualsBliss teluatijik
14,017 “Koqoey
illegal.I na’tuwen
winter.As Auld
verb1. sesaki’multijik
Herewith kast’plewuti’
OneSwitch.org.uk wo'qomal
Lindex nenk
thedeveloping kekmuwatk
U-turned wigili
Objective-C nena
Jarwa l’nua’kik
deForest etlewis

11-item aji-ila’muan
PM-8 teli-ktlamsitasultisni
GNU tela'tegelij
ChartThis wissuignemg'p
DelhiAbout wesua'toq
ΤΟΝ knua’taqa
etoo getlams'tuigw
Nebido ktuknitaq
Zacatón kistliaqesenke
important.It telki’k
95762 gepmite'lmugsi
much-hyped pla'kit
Lavigueur van
castle-like g'satalultio
фигура metuina’
Farofa g'satalultie
Battalia mawolutek
Counter-Cyclical lassup
FanProsAuthentic peskunatekiskaq
VladTheEmailer o’pla’luksin
Careerlink ektlataqsunem
2017.04.05 “Simon
epistasis elapekulti'titl
BCH ikana'to
Neech Sesgwalugsie
psychological elsutmultoqs'p
940XL Kanataewey
charges.Please nisoqamkiaql
Titanus elukowuksiekik
magiks liew
desperados waltesta’tijik
RENDERING etl-mulqa’tim
sanguine pemi-npi
dwdollar kina’muanen
Degenerations mawukwat
down-votes teliuj
wiTh kina’muanew
Chiam ne'kayiw
Half-Shell wett'g
most-honored kaqlamili
portfolioof 'gtlams'tuiwoq
count.What Ewi’kmi’tij
all.Enjoy Gnisgamemuo
Drive-In kwitniktuk
Alums ns'tasultioq
-saying nukwa’qsipnek
ARPE Mi'kamiq
Kiyo bolero-ewik

E-bow ujjuaqi'g
tets westatew
full-swing musga'toq
hyperconvergence kaskiktlnaqenipunekek
Marach awti
Wroclawski waltes
Berdnikov ankamatiji
Vergano mekenujik
Stac Retarded
sarafina nanijik
Amaterasu epketesenuk
Malefactor kitoqekuwatijl
89.27 pema’la’titl
well-categorized Gujjuaqi'g
BillKSmith wta’piml
INFORMATICA ugsua'tuigwig
Progressivist mtaweknninen
dot-shaped ulgwitt'tal
1780-1832 mijua'ji'
Gudauta paqtismk
NMFA eksitpukatali’tij
SQLDataSource gepmite'lmaw
descendre kjiniskam
Dntel wltesin
premarketing pemta’
MALY npu'ti'gw
Nisanyan melgimaj
DLRP Wenaqa’sijek
précisant Budge
Kirkus Ne'wewey
postageor mijua'jij
2008-04-08 tellukutie
Jember Algokian
B-54 tla’site
jobs.This L'nui
crazyBut ml'gigno'ti
56.01 akenutemaqenel
winnen awti’l
2009-09-27 gji'nmum
Brac “Telimulo
Naukri Ekina’maqik
bomp tluewn
JNBY metu’kaqnik
Horóscopo Gji'tutes
1L klusuwaqen
EonNAS sqna’qwey
Pompili gina'mui
whatwhat gina'mue
revoke gina'mug
sacerdotalism tla'taqatitoqs'p
6892 koqwaje’k
FACIL qaliputi’l
Ver

www.allrecipes.com ktlita’suaqnuow
Rooibus nujiegsuet
segítőkész Almantiewa’kik
planimetric tetaputenug
WPRT teleyapn
Rousteing Wjijaqmijl
16.5lbs tewijo’ltiji
Super-hot wenjikuo’ml
Tassilo pro’kra’miktuk
AMVAC a’tukwaqnn
fattys malsano’kuo’mek
ivonprefontaine wejo'tmi'tij
zerged Sqna’qewey
misstress Palapa
Rinella kepmite’lmule
2.d Maryland
51-54 dancing
distinctness ‘'Mgne'n
p.148 pekisuluksi’
Parissi ekina’maq
birth-month kisa’lultew
uaw Essisoqnikewaq
14,050 melkikenaqten
spare.I amaljikwej
1Hi newtejuwamuk
Fantastika westawu’lsketa
Crianlarich usgutmultoqs'p
Jaked poqtikimkit
 gina'muane
Frame3 ika’tu’tijl
Janskerk commerc
Curie-Sklodowska pun-kwitamemk
FamilyI pita'qal
Assyr ewi’ka’tisnik
Tenmon Potolek
Multics jijklue’wjuapi’
HopgoodGanim kwilut
lambchopsil Tqamuewey
faver ‘nisgameultijig’
réputé gisa'l'gig
DNRE Samaliaewa
Chemist ankweywan
century.With pata’suaqan
Rayyan amasgipnnugsitoqs'
Heartland lasutmaykipo'q
blackcurrent mimatui-l’mita’pni’
dangs Ne'wt
Glenbrittle malie’

Stebner apokjilu
BLOODWORTH nemi'gwig
Shamsky wi’katikne’kl
shomi nqano’pat
10-by-10-foot gistejuultinew
media-generated suwiskatoq
awardees Tim
Emmarentia ekweji
Bamiyan ika'tutl
Polarik angua'to
leater npuwinu
Martosko kisi-aji-winteskawenuk
15mths ignmuip
Paulins Wenjui’sit
Благодаря sa'se'wa'lat
MeelionDollerBogus kwetapa'lut
sequined sapo’nu
curiuos ignmuin
inlength npimn
male.The koquey
mattys4 weja’tumkis
month.The “Jugwita'gw
1,035.00 “Ga'qanma'titeg
Dussander Nopa
tooSee unaqapemg
dians waqatikalujik
FINGERPRINTING unaqapeml
projectively sikua’lut
Camb. ukumuljin
put-away eli’sawemk
rebreeding Ronal
jarang pejiwsultimkek
عبدالله pisqutqa’tasnik
Deliciousness kisnaqa’siwun
rs1800795 wenqatamu’
Sarles ugmimajuaqanmuaq
stifler Gypsumey
Coolhaus apoqtmu’tiji
better.the Jenrl
Staffers apisiktuksi
G-Faerie08 wlta'sualate
Noes staqa
borreliae geitu'tij
work.You te’sisjik
francesca ektek
ResourceRequest ktapekiaqney
quote-unquote megniwoqo
delicas wlpultite’wki’k
Shyma Channel
super-f

In [76]:
import copy
count_no=0
#j=np.zeros(300)
for r in range(0,len(ti)):
    '''#print source_matrix[r], target_matrix[r]
    #print len(source_matrix[r]),len(target_matrix[r])
    #print ti[r]
    p=list_duplicates(ti,ti[r])
    #print p
    j=np.zeros(300)
    for l in p:
        #print l
        for x in l:
            j+=source_matrix[x]
            
        target_matrix[r]=j[:]/len(l)
    count_no+=1'''
    target_matrix[r]=source_matrix[r]
    #target_matrix[r]=source_matrix[r][:]
    mi_dictionary.apply_cop(target_matrix[r],ti[r])
#print count_no

In [77]:
mi_dictionary.export('/home/apatra/Desktop/work/lstm/data/micmaq10.vec')

In [78]:
mi_dictionary.export('/home/apatra/fastText/fastText_multilingual-master/micmaq10.vec')