In [21]:
import os
import json
from gensim.utils import simple_preprocess
from gensim.models.phrases import Phrases, Phraser
from gensim import corpora
from gensim.similarities import Similarity


# Directory holding one JSON file per article. Every file is expected to
# provide string-valued 'title', 'snippet' and 'body' fields.
path = r"G:\work\aiddata_tuff\data\Pakistan-2019-json\Pakistan"

# os.listdir() returns entries in arbitrary order; sorting keeps the document
# ids (list positions) reproducible from run to run.
files = sorted(os.listdir(path))
documents=[]
file_names=[]

for file in files:
    # The context manager closes each handle as soon as it is parsed instead of
    # leaking one open file per article. JSON text is decoded as UTF-8 rather
    # than with the platform default encoding.
    with open(os.path.join(path, file), encoding="utf-8") as f:
        data = json.load(f)
    title = data['title']
    snippet = data['snippet']
    body = data['body']
    # Put a space between every field so the last word of the snippet is not
    # fused with the first word of the body into one bogus token.
    this_text = title + " " + snippet + " " + body
    documents.append(this_text)
    # file_names[i] is the source file of documents[i].
    file_names.append(file)


In [22]:
#Convert documents to collection of words (tokenized once and reused below)
texts = [simple_preprocess(doc, deacc=True) for doc in documents]

#Build a bigram model that learns which adjacent word pairs should be merged
#into a single phrase token; min_count=1 lets pairs seen only once qualify
bigram = Phrases(texts, min_count=1)
bigram_phraser = Phraser(bigram)

#Apply the phrase model to the tokens computed above rather than running
#simple_preprocess over every document a second time
texts_bigrams = [list(bigram_phraser[tokens]) for tokens in texts]

#Map every token (single word or merged phrase) to an integer id
dictionary = corpora.Dictionary(texts_bigrams)

#Create corpus: one bag-of-words vector per document
corpus = [dictionary.doc2bow(docString) for docString in texts_bigrams]

#Build similarity index; its shard files are written using the
#'on_disk_output' prefix, relative to the current working directory
index = Similarity(corpus=corpus, num_features=len(dictionary), output_prefix='on_disk_output')

In [23]:
# Walk the similarity index and store, for each item it yields, the list of
# (position, score) pairs, keyed by the item's position in the index.
similar_docs = {}
for doc_id, similarities in enumerate(index):
    similar_docs[doc_id] = [(other_id, score) for other_id, score in enumerate(similarities)]
# Leave doc_id equal to the number of items processed, as a running counter would.
doc_id = len(similar_docs)

In [28]:
# Minimum score for another document to be reported as similar;
# raise or lower it to fine-tune the results.
sim_threshold = 0.95

for doc_id, sim_doc_tuples in similar_docs.items():
    print("-------------------------------------")
    print("Analyzing doc #", doc_id)
    print("Filename", file_names[doc_id])
    # Keep the file names of all *other* documents whose score reaches the
    # threshold; the document itself is excluded by the id comparison.
    this_sim_docs = [
        file_names[sim_doc_id]
        for sim_doc_id, sim_score in sim_doc_tuples
        if sim_score >= sim_threshold and doc_id != sim_doc_id
    ]
    print("\nSimiliar Docs:", this_sim_docs)
    print("-------------------------------------\n")

-------------------------------------
Analyzing doc # 0
Filename pakis-1-text813733.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1
Filename pakis-10-text2908317.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 2
Filename pakis-100-text3397292.json

Similiar Docs: ['pakis-977-text3635658.json']
-------------------------------------

-------------------------------------
Analyzing doc # 3
Filename pakis-1000-text1901643.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 4
Filename pakis-1001-text1544554.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 5
Filename pakis-1002-text2401403.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 6
Filename pakis-10

Similiar Docs: ['pakis-1963-text1596003.json']
-------------------------------------

-------------------------------------
Analyzing doc # 66
Filename pakis-1058-text2443126.json

Similiar Docs: ['pakis-21-text2259552.json']
-------------------------------------

-------------------------------------
Analyzing doc # 67
Filename pakis-1059-text2176935.json

Similiar Docs: ['pakis-510-text1531958.json', 'pakis-998-text1298047.json']
-------------------------------------

-------------------------------------
Analyzing doc # 68
Filename pakis-106-text1641167.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 69
Filename pakis-1060-text1476480.json

Similiar Docs: ['pakis-2098-text2401716.json', 'pakis-525-text1993537.json']
-------------------------------------

-------------------------------------
Analyzing doc # 70
Filename pakis-1061-text1342980.json

Similiar Docs: ['pakis-1887-text2530181.json', 'pakis-561-text251362


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 129
Filename pakis-1114-text1782655.json

Similiar Docs: ['pakis-1186-text2189489.json']
-------------------------------------

-------------------------------------
Analyzing doc # 130
Filename pakis-1115-text111316.json

Similiar Docs: ['pakis-1109-text2250493.json', 'pakis-1866-text3687899.json']
-------------------------------------

-------------------------------------
Analyzing doc # 131
Filename pakis-1116-text256037.json

Similiar Docs: ['pakis-1378-text3550385.json', 'pakis-494-text3148661.json']
-------------------------------------

-------------------------------------
Analyzing doc # 132
Filename pakis-1117-text1662915.json

Similiar Docs: ['pakis-1220-text596844.json']
-------------------------------------

-------------------------------------
Analyzing doc # 133
Filename pakis-1118-text2875888.json

Similiar Docs: []
-------------------------------------

---


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 189
Filename pakis-1169-text1865672.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 190
Filename pakis-117-text2538054.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 191
Filename pakis-1170-text3401791.json

Similiar Docs: ['pakis-1502-text159846.json']
-------------------------------------

-------------------------------------
Analyzing doc # 192
Filename pakis-1171-text2524891.json

Similiar Docs: ['pakis-1037-text1024632.json', 'pakis-1575-text1957188.json', 'pakis-1683-text285930.json']
-------------------------------------

-------------------------------------
Analyzing doc # 193
Filename pakis-1172-text3098157.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 194
Fi

Filename pakis-1209-text3297998.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 235
Filename pakis-121-text810777.json

Similiar Docs: ['pakis-1173-text1194753.json']
-------------------------------------

-------------------------------------
Analyzing doc # 236
Filename pakis-1210-text3481415.json

Similiar Docs: ['pakis-2118-text103730.json']
-------------------------------------

-------------------------------------
Analyzing doc # 237
Filename pakis-1211-text3325952.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 238
Filename pakis-1212-text2804904.json

Similiar Docs: ['pakis-1904-text3414555.json']
-------------------------------------

-------------------------------------
Analyzing doc # 239
Filename pakis-1213-text889989.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 240

-------------------------------------

-------------------------------------
Analyzing doc # 295
Filename pakis-1264-text1471216.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 296
Filename pakis-1265-text3319581.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 297
Filename pakis-1266-text1102996.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 298
Filename pakis-1267-text3233256.json

Similiar Docs: ['pakis-1156-text1826245.json', 'pakis-143-text1649520.json', 'pakis-1609-text3039001.json', 'pakis-824-text1370954.json']
-------------------------------------

-------------------------------------
Analyzing doc # 299
Filename pakis-1268-text2782860.json

Similiar Docs: ['pakis-375-text1005494.json', 'pakis-599-text2405824.json']
-------------------------------------

------------------


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 357
Filename pakis-132-text2433622.json

Similiar Docs: ['pakis-614-text966283.json']
-------------------------------------

-------------------------------------
Analyzing doc # 358
Filename pakis-1320-text2749767.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 359
Filename pakis-1321-text328643.json

Similiar Docs: ['pakis-909-text979832.json']
-------------------------------------

-------------------------------------
Analyzing doc # 360
Filename pakis-1322-text3288935.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 361
Filename pakis-1323-text3595599.json

Similiar Docs: ['pakis-772-text3508910.json']
-------------------------------------

-------------------------------------
Analyzing doc # 362
Filename pakis-1324-text3107872.json

S

-------------------------------------

-------------------------------------
Analyzing doc # 420
Filename pakis-1377-text1650388.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 421
Filename pakis-1378-text3550385.json

Similiar Docs: ['pakis-1116-text256037.json', 'pakis-494-text3148661.json']
-------------------------------------

-------------------------------------
Analyzing doc # 422
Filename pakis-1379-text1079233.json

Similiar Docs: ['pakis-178-text506922.json']
-------------------------------------

-------------------------------------
Analyzing doc # 423
Filename pakis-138-text2573291.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 424
Filename pakis-1380-text1989472.json

Similiar Docs: ['pakis-1444-text2324241.json', 'pakis-1929-text1981515.json']
-------------------------------------

-------------------------------------
Analyzing doc 


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 486
Filename pakis-1436-text1726283.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 487
Filename pakis-1437-text252432.json

Similiar Docs: ['pakis-150-text1162539.json']
-------------------------------------

-------------------------------------
Analyzing doc # 488
Filename pakis-1438-text1388413.json

Similiar Docs: ['pakis-1251-text3719376.json', 'pakis-1565-text3151621.json', 'pakis-1745-text163202.json', 'pakis-56-text3369520.json', 'pakis-6-text1271816.json', 'pakis-850-text3465172.json']
-------------------------------------

-------------------------------------
Analyzing doc # 489
Filename pakis-1439-text254062.json

Similiar Docs: ['pakis-917-text1081007.json']
-------------------------------------

-------------------------------------
Analyzing doc # 490
Filename pakis-144-text1797665.json

Simi


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 557
Filename pakis-150-text1162539.json

Similiar Docs: ['pakis-1437-text252432.json']
-------------------------------------

-------------------------------------
Analyzing doc # 558
Filename pakis-1500-text304021.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 559
Filename pakis-1501-text892982.json

Similiar Docs: ['pakis-355-text214594.json']
-------------------------------------

-------------------------------------
Analyzing doc # 560
Filename pakis-1502-text159846.json

Similiar Docs: ['pakis-1170-text3401791.json']
-------------------------------------

-------------------------------------
Analyzing doc # 561
Filename pakis-1503-text841958.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 562
Filename pakis-1504-text3595200.json

Si


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 614
Filename pakis-1551-text3526606.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 615
Filename pakis-1552-text3501529.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 616
Filename pakis-1553-text359001.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 617
Filename pakis-1554-text3584772.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 618
Filename pakis-1555-text3733348.json

Similiar Docs: ['pakis-1980-text803938.json', 'pakis-230-text3009347.json']
-------------------------------------

-------------------------------------
Analyzing doc # 619
Filename pakis-1556-text723434.json

Similiar Docs: []
-------


Similiar Docs: ['pakis-1017-text3364113.json', 'pakis-1052-text2946189.json']
-------------------------------------

-------------------------------------
Analyzing doc # 660
Filename pakis-1593-text3192136.json

Similiar Docs: ['pakis-1587-text91699.json', 'pakis-1875-text3396958.json', 'pakis-240-text1179326.json', 'pakis-382-text1567028.json', 'pakis-44-text2304557.json', 'pakis-477-text2063700.json']
-------------------------------------

-------------------------------------
Analyzing doc # 661
Filename pakis-1594-text3250357.json

Similiar Docs: ['pakis-1333-text1443465.json', 'pakis-1845-text3177924.json', 'pakis-2110-text3727492.json', 'pakis-274-text2680119.json']
-------------------------------------

-------------------------------------
Analyzing doc # 662
Filename pakis-1595-text1530377.json

Similiar Docs: ['pakis-791-text732046.json']
-------------------------------------

-------------------------------------
Analyzing doc # 663
Filename pakis-1596-text1119192.json

Si


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 709
Filename pakis-1637-text2415503.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 710
Filename pakis-1638-text2036446.json

Similiar Docs: ['pakis-1462-text3423255.json', 'pakis-1598-text2025327.json', 'pakis-1703-text1648028.json', 'pakis-1746-text2313295.json']
-------------------------------------

-------------------------------------
Analyzing doc # 711
Filename pakis-1639-text2680059.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 712
Filename pakis-164-text2327388.json

Similiar Docs: ['pakis-1964-text2393628.json']
-------------------------------------

-------------------------------------
Analyzing doc # 713
Filename pakis-1640-text3023965.json

Similiar Docs: []
-------------------------------------

---------------------------


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 772
Filename pakis-1694-text1556657.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 773
Filename pakis-1695-text1758155.json

Similiar Docs: ['pakis-761-text3703673.json']
-------------------------------------

-------------------------------------
Analyzing doc # 774
Filename pakis-1696-text106247.json

Similiar Docs: ['pakis-1107-text681182.json', 'pakis-153-text2307740.json', 'pakis-17-text1736203.json', 'pakis-1932-text3433816.json', 'pakis-647-text694444.json']
-------------------------------------

-------------------------------------
Analyzing doc # 775
Filename pakis-1697-text2306388.json

Similiar Docs: ['pakis-1432-text610888.json', 'pakis-635-text659405.json']
-------------------------------------

-------------------------------------
Analyzing doc # 776
Filename pakis-1698-text1143865.json

Sim


Similiar Docs: ['pakis-1775-text1271560.json', 'pakis-38-text926357.json']
-------------------------------------

-------------------------------------
Analyzing doc # 836
Filename pakis-1751-text1289883.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 837
Filename pakis-1752-text2768005.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 838
Filename pakis-1753-text421269.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 839
Filename pakis-1754-text1228525.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 840
Filename pakis-1755-text3695625.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 841
Filename pakis-1756-text1413274.json

Similiar Docs: ['pakis-18


Similiar Docs: ['pakis-403-text537322.json', 'pakis-853-text1505712.json']
-------------------------------------

-------------------------------------
Analyzing doc # 884
Filename pakis-1795-text3527168.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 885
Filename pakis-1796-text242774.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 886
Filename pakis-1797-text2956085.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 887
Filename pakis-1798-text1178388.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 888
Filename pakis-1799-text1946033.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 889
Filename pakis-18-text1147975.json

Similiar Docs: ['pakis-1145

Analyzing doc # 946
Filename pakis-1850-text3057964.json

Similiar Docs: ['pakis-1244-text3040563.json', 'pakis-842-text1991550.json']
-------------------------------------

-------------------------------------
Analyzing doc # 947
Filename pakis-1851-text2152650.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 948
Filename pakis-1852-text728395.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 949
Filename pakis-1853-text1246054.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 950
Filename pakis-1854-text1078810.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 951
Filename pakis-1855-text3121535.json

Similiar Docs: ['pakis-596-text360044.json']
-------------------------------------

-----------------------------------


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 999
Filename pakis-1899-text1568876.json

Similiar Docs: ['pakis-841-text520415.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1000
Filename pakis-19-text3058022.json

Similiar Docs: ['pakis-1631-text1409346.json', 'pakis-426-text2818154.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1001
Filename pakis-190-text1973488.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1002
Filename pakis-1900-text2546729.json

Similiar Docs: ['pakis-1566-text2312810.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1003
Filename pakis-1901-text3280460.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1004
Fi

Filename pakis-1940-text475435.json

Similiar Docs: ['pakis-1042-text1362840.json', 'pakis-1130-text2745350.json', 'pakis-1606-text2040108.json', 'pakis-1673-text2121009.json', 'pakis-2031-text561532.json', 'pakis-2145-text2676717.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1047
Filename pakis-1941-text2332552.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1048
Filename pakis-1942-text3335122.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1049
Filename pakis-1943-text429297.json

Similiar Docs: ['pakis-1249-text291026.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1050
Filename pakis-1944-text3601939.json

Similiar Docs: ['pakis-876-text778256.json']
-------------------------------------

-------------------------------------
Analyzing doc #


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1094
Filename pakis-1984-text2489858.json

Similiar Docs: ['pakis-1081-text3656168.json', 'pakis-323-text1381019.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1095
Filename pakis-1985-text1562216.json

Similiar Docs: ['pakis-784-text2142686.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1096
Filename pakis-1986-text2949060.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1097
Filename pakis-1987-text2549100.json

Similiar Docs: ['pakis-1306-text901529.json', 'pakis-2014-text1268316.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1098
Filename pakis-1988-text3426337.json

Similiar Docs: ['pakis-1510-text1616806.json']
------------------------------------

-------------------------------------
Analyzing doc # 1156
Filename pakis-2039-text1144830.json

Similiar Docs: ['pakis-1080-text1731496.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1157
Filename pakis-204-text1635080.json

Similiar Docs: ['pakis-1540-text2557968.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1158
Filename pakis-2040-text1046178.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1159
Filename pakis-2041-text643869.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1160
Filename pakis-2042-text2787078.json

Similiar Docs: ['pakis-1864-text2207840.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1161
Filename pakis-2043-text742460.json

Similiar Docs: ['pakis-1030-text2951700.json']
--

Similiar Docs: ['pakis-2116-text2073456.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1214
Filename pakis-2091-text1410234.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1215
Filename pakis-2092-text1635660.json

Similiar Docs: ['pakis-231-text3117920.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1216
Filename pakis-2093-text848685.json

Similiar Docs: ['pakis-1135-text1822394.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1217
Filename pakis-2094-text2345174.json

Similiar Docs: ['pakis-812-text1772866.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1218
Filename pakis-2095-text1175029.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1219
F


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1277
Filename pakis-2148-text695241.json

Similiar Docs: ['pakis-335-text362571.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1278
Filename pakis-2149-text1425621.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1279
Filename pakis-215-text2362516.json

Similiar Docs: ['pakis-272-text3414401.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1280
Filename pakis-2150-text3599261.json

Similiar Docs: ['pakis-1137-text2453313.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1281
Filename pakis-2151-text2355716.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1282
Filename pakis-216-text1800476.


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1324
Filename pakis-254-text2620396.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1325
Filename pakis-255-text2505790.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1326
Filename pakis-256-text2523723.json

Similiar Docs: ['pakis-103-text3636505.json', 'pakis-464-text3265329.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1327
Filename pakis-257-text1437405.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1328
Filename pakis-258-text2937786.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1329
Filename pakis-259-text24007.json

Similiar Docs: []
-------


Similiar Docs: ['pakis-1532-text2543301.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1368
Filename pakis-294-text1255461.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1369
Filename pakis-295-text1364274.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1370
Filename pakis-296-text575920.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1371
Filename pakis-297-text1857601.json

Similiar Docs: ['pakis-1583-text403972.json', 'pakis-1906-text651958.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1372
Filename pakis-298-text1479126.json

Similiar Docs: ['pakis-104-text1156502.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1373
File


Similiar Docs: ['pakis-1281-text1564919.json', 'pakis-2130-text370457.json', 'pakis-265-text2158359.json', 'pakis-436-text3294428.json', 'pakis-951-text3558761.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1430
Filename pakis-35-text2999953.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1431
Filename pakis-350-text1133778.json

Similiar Docs: ['pakis-1646-text1781147.json', 'pakis-789-text2439263.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1432
Filename pakis-351-text1836016.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1433
Filename pakis-352-text902478.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1434
Filename pakis-353-text3123187.json

Similiar Docs: ['pakis-147-t


Similiar Docs: ['pakis-443-text2425338.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1487
Filename pakis-400-text3584976.json

Similiar Docs: ['pakis-795-text1419577.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1488
Filename pakis-401-text2164113.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1489
Filename pakis-402-text100111.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1490
Filename pakis-403-text537322.json

Similiar Docs: ['pakis-1794-text1817901.json', 'pakis-853-text1505712.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1491
Filename pakis-404-text531843.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1492
Filena


Similiar Docs: ['pakis-105-text2151856.json', 'pakis-2136-text3228577.json', 'pakis-375-text1005494.json', 'pakis-599-text2405824.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1533
Filename pakis-442-text1992690.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1534
Filename pakis-443-text2425338.json

Similiar Docs: ['pakis-40-text3043000.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1535
Filename pakis-444-text3735116.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1536
Filename pakis-445-text2508681.json

Similiar Docs: ['pakis-20-text2835524.json', 'pakis-961-text1932037.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1537
Filename pakis-446-text1310836.json

Similiar Docs: []
-------------


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1593
Filename pakis-497-text35569.json

Similiar Docs: ['pakis-1257-text2424607.json', 'pakis-1625-text3568965.json', 'pakis-754-text571507.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1594
Filename pakis-498-text1269910.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1595
Filename pakis-499-text1961602.json

Similiar Docs: ['pakis-729-text1326074.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1596
Filename pakis-5-text1278741.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1597
Filename pakis-50-text1119030.json

Similiar Docs: ['pakis-1371-text2279518.json', 'pakis-1469-text1060509.json']
-------------------------------------

-----

Analyzing doc # 1655
Filename pakis-552-text489391.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1656
Filename pakis-553-text441823.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1657
Filename pakis-554-text814859.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1658
Filename pakis-555-text14351.json

Similiar Docs: ['pakis-1954-text943255.json', 'pakis-2010-text1080967.json', 'pakis-386-text2322743.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1659
Filename pakis-556-text3140256.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1660
Filename pakis-557-text2964552.json

Similiar Docs: []
-------------------------------------

------------------------------------


Similiar Docs: ['pakis-209-text1684364.json', 'pakis-228-text161728.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1716
Filename pakis-607-text3467384.json

Similiar Docs: ['pakis-1933-text3551973.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1717
Filename pakis-608-text2071498.json

Similiar Docs: ['pakis-1318-text2456438.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1718
Filename pakis-609-text1466643.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1719
Filename pakis-61-text1123758.json

Similiar Docs: ['pakis-1248-text3179318.json', 'pakis-592-text2273975.json', 'pakis-759-text2589955.json', 'pakis-821-text2267835.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1720
Filename pakis-610-text1727555.json

S


Similiar Docs: ['pakis-1728-text2067068.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1764
Filename pakis-650-text3166511.json

Similiar Docs: ['pakis-2081-text1223567.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1765
Filename pakis-651-text1198537.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1766
Filename pakis-652-text2456009.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1767
Filename pakis-653-text3180738.json

Similiar Docs: ['pakis-309-text1801833.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1768
Filename pakis-654-text3563695.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1769
Filename pakis-655-text2270778.j

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1831
Filename pakis-710-text196964.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1832
Filename pakis-711-text3460369.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1833
Filename pakis-712-text3718626.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1834
Filename pakis-713-text3581297.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1835
Filename pakis-714-text2367563.json

Similiar Docs: ['pakis-1516-text2343989.json', 'pakis-469-text1371827.json', 'pakis-72-text137898.json', 'pakis-833-text1142681.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1836
Fil


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1883
Filename pakis-758-text2423760.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 1884
Filename pakis-759-text2589955.json

Similiar Docs: ['pakis-1248-text3179318.json', 'pakis-592-text2273975.json', 'pakis-61-text1123758.json', 'pakis-821-text2267835.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1885
Filename pakis-76-text1803998.json

Similiar Docs: ['pakis-460-text1494681.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1886
Filename pakis-760-text1742722.json

Similiar Docs: ['pakis-925-text1634552.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1887
Filename pakis-761-text3703673.json

Similiar Docs: ['pakis-1695-text1758155.json']
--------------

-------------------------------------
Analyzing doc # 1948
Filename pakis-816-text2457118.json

Similiar Docs: ['pakis-923-text667345.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1949
Filename pakis-817-text743983.json

Similiar Docs: ['pakis-337-text1233704.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1950
Filename pakis-818-text2952321.json

Similiar Docs: ['pakis-1100-text346337.json', 'pakis-1671-text2624585.json', 'pakis-782-text979827.json', 'pakis-900-text2090253.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1951
Filename pakis-819-text2939083.json

Similiar Docs: ['pakis-1392-text2858089.json', 'pakis-1534-text2983232.json', 'pakis-1548-text1950982.json']
-------------------------------------

-------------------------------------
Analyzing doc # 1952
Filename pakis-82-text327078.json

Similiar Docs: []
-------------

Filename pakis-868-text2362288.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 2006
Filename pakis-869-text599143.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 2007
Filename pakis-87-text3544709.json

Similiar Docs: ['pakis-105-text2151856.json', 'pakis-375-text1005494.json', 'pakis-599-text2405824.json']
-------------------------------------

-------------------------------------
Analyzing doc # 2008
Filename pakis-870-text1276494.json

Similiar Docs: ['pakis-1876-text2940977.json']
-------------------------------------

-------------------------------------
Analyzing doc # 2009
Filename pakis-871-text1783999.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 2010
Filename pakis-872-text1682331.json

Similiar Docs: ['pakis-334-text3536176.json']
-------------------------------------


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 2054
Filename pakis-911-text1408778.json

Similiar Docs: ['pakis-1177-text3626129.json', 'pakis-1247-text1318125.json', 'pakis-133-text1398682.json', 'pakis-1579-text2089750.json']
-------------------------------------

-------------------------------------
Analyzing doc # 2055
Filename pakis-912-text2085672.json

Similiar Docs: ['pakis-1126-text3386823.json', 'pakis-1359-text2306569.json', 'pakis-1959-text678910.json']
-------------------------------------

-------------------------------------
Analyzing doc # 2056
Filename pakis-913-text544140.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 2057
Filename pakis-914-text373788.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 2058
Filename pakis-915-text3241103.json

Similiar Docs: []
-------


Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 2100
Filename pakis-953-text214968.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 2101
Filename pakis-954-text1696883.json

Similiar Docs: []
-------------------------------------

-------------------------------------
Analyzing doc # 2102
Filename pakis-955-text3579961.json

Similiar Docs: ['pakis-1054-text1600800.json', 'pakis-1747-text484599.json', 'pakis-2099-text2425204.json', 'pakis-8-text301234.json']
-------------------------------------

-------------------------------------
Analyzing doc # 2103
Filename pakis-956-text3281148.json

Similiar Docs: ['pakis-200-text1729486.json', 'pakis-252-text3233144.json']
-------------------------------------

-------------------------------------
Analyzing doc # 2104
Filename pakis-957-text1807403.json

Similiar Docs: []
-------------------------------------

---