## Import Libraries

In [1]:
import numpy as np
import pandas as pd
import re
import math

import nltk
import string
from Sastrawi.Stemmer.StemmerFactory import StemmerFactory

## Read The Data

In [2]:
# Load the article corpus from the Excel workbook next to this notebook.
# Later cells read the 'Title' and 'Content' columns of this frame.
corpus_path = 'korpusMRT.xlsx'
data = pd.read_excel(corpus_path)
data

Unnamed: 0,Title,Content,Source
0,332.184 Orang Gunakan MRT Jakarta Pada Minggu ...,"Sejak beroperasi secara resmi pada Senin, 25 M...",https://www.jakartamrt.co.id/2019/03/29/332-18...
1,Ketua Wantimpres RI Apresiasi MRT Jakarta,Dalam kunjungannya ke Kantor Pusat PT MRT Jaka...,https://www.jakartamrt.co.id/2019/04/25/ketua-...
2,Masyarakat Mulai Gunakan MRT Jakarta ke Tempat...,"Dua hari setelah peresmiannya, masyarakat terl...",https://www.jakartamrt.co.id/2019/03/26/masyar...
3,Rata-rata 78 ribu orang Per Hari Gunakan MRT J...,Hal tersebut disampaikan oleh Direktur Utama P...,https://www.jakartamrt.co.id/2019/04/12/rata-r...
4,"Selama April 2019, Tarif MRT Jakarta Dipotong ...",Operasi komersial MRT Jakarta telah dimulai pa...,https://www.jakartamrt.co.id/2019/04/01/selama...
5,MRT Jakarta Terapkan Perda DKI Jakarta Nomor 1...,Sebagai bagian dari upaya menjaga kebersihan d...,https://www.jakartamrt.co.id/2019/04/03/mrt-ja...
6,Fasilitas MRT Jakarta Berstandar Internasional,Sistem transportasi yang memiliki fasilitas le...,https://kumparan.com/jakarta-smart-city/fasili...
7,PT MRT Jakarta dan Crossrail Internasional Ltd...,"Pada Kamis (2-5-2019) lalu, PT MRT Jakarta dan...",https://www.jakartamrt.co.id/2019/05/02/pt-mrt...
8,PT MRT Jakarta Jalin Kerjasama dengan Crossrai...,PT MRT Jakarta menandatangani kerja sama Penge...,https://ceknricek.com/a/pt-mrt-jakarta-jalin-k...
9,MRT Jakarta Gandeng Crossrail International,PT Mass Rapid Transit (MRT) Jakarta dan Crossr...,https://www.beritasatu.com/megapolitan/551940/...


## Preprocessing

1. Case Folding
2. Tokenization
3. Filtering
4. Stemming

In [3]:
def remove_stopwords(text, stopwords_path='stopwords.txt'):
    """Tokenize ``text`` and drop every token that is listed as a stopword.

    Parameters
    ----------
    text : str
        Text to tokenize with ``nltk.word_tokenize``.
    stopwords_path : str, optional
        Path of the stopword file, one stopword per line. Defaults to
        ``'stopwords.txt'`` in the current working directory.

    Returns
    -------
    list of str
        The tokens of ``text``, in order, without the stopwords.

    Notes
    -----
    The stopword file is read once per path and kept on the function object,
    so it is not re-opened for every document. Re-running the defining cell
    creates a new function object and therefore reloads the file.
    """
    # Per-path cache stored on the function itself (no extra imports needed).
    cache = remove_stopwords.__dict__.setdefault('_stopword_cache', {})
    if stopwords_path not in cache:
        with open(stopwords_path) as f:
            # frozenset gives constant-time membership tests instead of a list scan
            cache[stopwords_path] = frozenset(line.strip() for line in f)
    stopwords = cache[stopwords_path]

    tokens = nltk.word_tokenize(text)
    return [word for word in tokens if word not in stopwords]

In [4]:
def stemming(text):
    """Stem every token in ``text`` with the Sastrawi stemmer.

    Parameters
    ----------
    text : iterable of str
        Tokens to stem.

    Returns
    -------
    list of str
        One stemmed string per input token, in the same order.

    Notes
    -----
    The stemmer is created on the first call and reused afterwards, instead
    of building a new ``StemmerFactory`` for every document and query.
    """
    stemmer = getattr(stemming, '_stemmer', None)
    if stemmer is None:
        # Build once; kept on the function object for subsequent calls.
        stemmer = StemmerFactory().create_stemmer()
        stemming._stemmer = stemmer

    return [stemmer.stem(word) for word in text]

In [5]:
def preprocessing(text):
    """Turn raw text into a list of cleaned, stemmed terms.

    Steps, in order: case folding, URL removal, quote/hyphen normalisation,
    tokenization with stopword removal, punctuation stripping, stemming, and
    removal of tokens that ended up empty.

    Parameters
    ----------
    text : str
        Raw document or query text.

    Returns
    -------
    list of str
        The processed terms, in order of appearance (duplicates are kept).
    """
    # case folding
    text = text.lower()

    # remove urls -- raw string, because '\S' in a plain literal is an
    # invalid escape sequence and triggers a warning on modern Python
    text = re.sub(r'http\S+', '', text)

    # replace typographic quotes with ASCII quotes and split hyphenated words
    for old, new in (('“', '"'), ('”', '"'), ('-', ' ')):
        text = text.replace(old, new)

    # tokenization and stopword removal
    tokens = remove_stopwords(text)

    # remove punctuation characters from inside every token
    strip_punctuation = str.maketrans('', '', string.punctuation)
    tokens = [token.translate(strip_punctuation) for token in tokens]

    # stemming
    tokens = stemming(tokens)

    # drop tokens that became empty (e.g. tokens that were pure punctuation)
    return [token for token in tokens if token]

## Query:

In [6]:
# Search queries evaluated against the corpus, in the order they are reported.
query = [
    "Pembangunan MRT Jakarta",
    "Fasilitas MRT Jakarta",
    "Harga tiket MRT",
    "Rute MRT Jakarta",
    "Biaya Pembangunan MRT",
]
# Keep each query reachable under its own name as well.
q1, q2, q3, q4, q5 = query

In [7]:
# Term counts of every query: one column per query ("Query 1", "Query 2", ...),
# one row per term. The frames are built in a comprehension so that the
# `query` list is not overwritten (re-running this cell stays safe), and they
# are concatenated once instead of growing a frame inside the loop.
query_frames = [
    pd.DataFrame.from_dict(
        nltk.FreqDist(preprocessing(query_text)),
        orient='index',
        columns=["Query " + str(number)],
    )
    for number, query_text in enumerate(query, start=1)
]
# pd.concat rejects an empty list, so fall back to an empty frame.
queries = pd.concat(query_frames, axis=1, sort=False) if query_frames else pd.DataFrame()

## Term Weighting:
- Term Frequency
- Inverse Document Frequency
- TF-IDF Weighting

## 1. Term Frequency

In [8]:
# Raw term counts: one column per document (labelled with its title), one row
# per term. Titles and contents are paired positionally with zip(), and the
# per-document frames are concatenated once rather than inside the loop.
document_frames = [
    pd.DataFrame.from_dict(
        nltk.FreqDist(preprocessing(content)),
        orient='index',
        columns=[title],
    )
    for title, content in zip(data['Title'], data['Content'])
]
# pd.concat rejects an empty list, so fall back to an empty frame.
tf = pd.concat(document_frames, axis=1, sort=False) if document_frames else pd.DataFrame()

In [9]:
# Append the query columns to the document columns on a shared term index
# named 'Term'; a term missing from a document or query gets a count of 0.
tf = (
    pd.concat([tf.rename_axis('Term'), queries], axis=1, sort=False)
    .fillna(0)
)
tf

Unnamed: 0,332.184 Orang Gunakan MRT Jakarta Pada Minggu Pertama Operasi,Ketua Wantimpres RI Apresiasi MRT Jakarta,Masyarakat Mulai Gunakan MRT Jakarta ke Tempat Kerja,Rata-rata 78 ribu orang Per Hari Gunakan MRT Jakarta,"Selama April 2019, Tarif MRT Jakarta Dipotong 50 Persen",MRT Jakarta Terapkan Perda DKI Jakarta Nomor 13 Tahun 2013,Fasilitas MRT Jakarta Berstandar Internasional,PT MRT Jakarta dan Crossrail Internasional Ltd Sepakati Kerja Sama Pengembangan SDM,PT MRT Jakarta Jalin Kerjasama dengan Crossrail Internasional Ltd,MRT Jakarta Gandeng Crossrail International,...,MRT Jakarta Kerjasama dengan Kodam Jaya Amankan Pembangunan Fase 2,"PT MRT Jakarta Menyepakati Kerja Sama dengan PT Pembangunan Jaya Ancol, Tbk untuk Pengerjaan Fase Kedua Bundaran HI – An",MRT Jakarta dan GO-JEK Kerja Sama Pengembangan Sistem Pembayaran,PT MRT Jakarta dan PT Kereta Api Indonesia (Persero) Sepakati Kerja Sama Pengembangan SDM,Kerja Sama Indonesia- Jepang (JICA): Proyek Pembangunan MRT Jakarta,Query 1,Query 2,Query 3,Query 4,Query 5
operasi,8.0,3.0,3.0,1.0,2.0,0.0,0.0,0.0,0.0,0.0,...,0.0,3.0,0.0,4.0,2.0,0.0,0.0,0.0,0.0,0.0
resmi,2.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
senin,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
25,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
maret,2.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,2.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0
2019,4.0,1.0,0.0,5.0,2.0,0.0,0.0,1.0,0.0,0.0,...,0.0,3.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0
catat,2.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
kamis,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,...,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0
28,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
332184,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [10]:
# Logarithmic TF scaling: weight = 1 + log10(count) for count > 0, else 0.
# Zero counts are masked to NaN before taking the logarithm, so log10(0) is
# never evaluated (it yields -inf and a divide-by-zero RuntimeWarning).
# Note: this rebinds `tf`, so running the cell twice scales the values twice.
positive_counts = tf.where(tf > 0)
tf = (1 + np.log10(positive_counts)).fillna(0)
tf

  """Entry point for launching an IPython kernel.


Unnamed: 0,332.184 Orang Gunakan MRT Jakarta Pada Minggu Pertama Operasi,Ketua Wantimpres RI Apresiasi MRT Jakarta,Masyarakat Mulai Gunakan MRT Jakarta ke Tempat Kerja,Rata-rata 78 ribu orang Per Hari Gunakan MRT Jakarta,"Selama April 2019, Tarif MRT Jakarta Dipotong 50 Persen",MRT Jakarta Terapkan Perda DKI Jakarta Nomor 13 Tahun 2013,Fasilitas MRT Jakarta Berstandar Internasional,PT MRT Jakarta dan Crossrail Internasional Ltd Sepakati Kerja Sama Pengembangan SDM,PT MRT Jakarta Jalin Kerjasama dengan Crossrail Internasional Ltd,MRT Jakarta Gandeng Crossrail International,...,MRT Jakarta Kerjasama dengan Kodam Jaya Amankan Pembangunan Fase 2,"PT MRT Jakarta Menyepakati Kerja Sama dengan PT Pembangunan Jaya Ancol, Tbk untuk Pengerjaan Fase Kedua Bundaran HI – An",MRT Jakarta dan GO-JEK Kerja Sama Pengembangan Sistem Pembayaran,PT MRT Jakarta dan PT Kereta Api Indonesia (Persero) Sepakati Kerja Sama Pengembangan SDM,Kerja Sama Indonesia- Jepang (JICA): Proyek Pembangunan MRT Jakarta,Query 1,Query 2,Query 3,Query 4,Query 5
operasi,1.903090,1.477121,1.477121,1.000000,1.301030,0.000000,0.000000,0.000000,0.000000,0.00000,...,0.000000,1.477121,0.000000,1.60206,1.301030,0.0,0.0,0.0,0.0,0.0
resmi,1.301030,0.000000,1.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.00000,...,1.000000,0.000000,0.000000,0.00000,0.000000,0.0,0.0,0.0,0.0,0.0
senin,1.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.00000,...,0.000000,0.000000,0.000000,0.00000,0.000000,0.0,0.0,0.0,0.0,0.0
25,1.000000,1.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,1.000000,0.00000,...,0.000000,0.000000,0.000000,0.00000,0.000000,0.0,0.0,0.0,0.0,0.0
maret,1.301030,0.000000,0.000000,1.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.00000,...,0.000000,1.301030,0.000000,1.00000,1.000000,0.0,0.0,0.0,0.0,0.0
2019,1.602060,1.000000,0.000000,1.698970,1.301030,0.000000,0.000000,1.000000,0.000000,0.00000,...,0.000000,1.477121,0.000000,1.00000,1.000000,0.0,0.0,0.0,0.0,0.0
catat,1.301030,0.000000,0.000000,1.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.00000,...,0.000000,0.000000,1.000000,0.00000,0.000000,0.0,0.0,0.0,0.0,0.0
kamis,1.000000,1.000000,0.000000,0.000000,0.000000,0.000000,0.000000,1.000000,1.000000,1.00000,...,0.000000,0.000000,0.000000,0.00000,1.000000,0.0,0.0,0.0,0.0,0.0
28,1.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.00000,...,0.000000,0.000000,0.000000,0.00000,0.000000,0.0,0.0,0.0,0.0,0.0
332184,1.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.00000,...,0.000000,0.000000,0.000000,0.00000,0.000000,0.0,0.0,0.0,0.0,0.0


## 2. Inverse Document Frequency

In [11]:
# The first len(data) columns are the documents; the remaining ones are queries.
n_documents = len(data)
train, test = tf.iloc[:, :n_documents], tf.iloc[:, n_documents:]

In [12]:
cols = train.columns
n_documents = len(cols)

# Document frequency: number of document columns in which each term occurs.
document_frequency = train.gt(0).sum(axis=1)
df = document_frequency.to_frame('Document Frequency')

# idf = log10(N / df). A term with df == 0 occurs in no document column, so
# the ratio would be infinite; such terms get an IDF of 0 instead, which keeps
# later weights finite rather than propagating inf/NaN.
inverse_document_frequency = (
    np.log10(n_documents / document_frequency.where(document_frequency > 0))
    .fillna(0.0)
    .rename('Inverse Document Frequency')
)
idf = pd.concat([df, inverse_document_frequency], axis=1)

In [13]:
# Display each term's document frequency next to its inverse document frequency.
idf

Unnamed: 0,Document Frequency,Inverse Document Frequency
operasi,15,0.301030
resmi,4,0.875061
senin,2,1.176091
25,6,0.698970
maret,6,0.698970
2019,12,0.397940
catat,3,1.000000
kamis,11,0.435729
28,1,1.477121
332184,1,1.477121


## 3. TF-IDF Weighting

In [14]:
# Weight every row (term) of the TF matrix by that term's IDF value.
idf_weights = idf['Inverse Document Frequency']
tf_idf = tf.multiply(idf_weights, axis='index')
tf_idf.head()

Unnamed: 0,332.184 Orang Gunakan MRT Jakarta Pada Minggu Pertama Operasi,Ketua Wantimpres RI Apresiasi MRT Jakarta,Masyarakat Mulai Gunakan MRT Jakarta ke Tempat Kerja,Rata-rata 78 ribu orang Per Hari Gunakan MRT Jakarta,"Selama April 2019, Tarif MRT Jakarta Dipotong 50 Persen",MRT Jakarta Terapkan Perda DKI Jakarta Nomor 13 Tahun 2013,Fasilitas MRT Jakarta Berstandar Internasional,PT MRT Jakarta dan Crossrail Internasional Ltd Sepakati Kerja Sama Pengembangan SDM,PT MRT Jakarta Jalin Kerjasama dengan Crossrail Internasional Ltd,MRT Jakarta Gandeng Crossrail International,...,MRT Jakarta Kerjasama dengan Kodam Jaya Amankan Pembangunan Fase 2,"PT MRT Jakarta Menyepakati Kerja Sama dengan PT Pembangunan Jaya Ancol, Tbk untuk Pengerjaan Fase Kedua Bundaran HI – An",MRT Jakarta dan GO-JEK Kerja Sama Pengembangan Sistem Pembayaran,PT MRT Jakarta dan PT Kereta Api Indonesia (Persero) Sepakati Kerja Sama Pengembangan SDM,Kerja Sama Indonesia- Jepang (JICA): Proyek Pembangunan MRT Jakarta,Query 1,Query 2,Query 3,Query 4,Query 5
operasi,0.572887,0.444658,0.444658,0.30103,0.391649,0.0,0.0,0.0,0.0,0.0,...,0.0,0.444658,0.0,0.482268,0.391649,0.0,0.0,0.0,0.0,0.0
resmi,1.138481,0.0,0.875061,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.875061,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
senin,1.176091,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
25,0.69897,0.69897,0.0,0.0,0.0,0.0,0.0,0.0,0.69897,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
maret,0.909381,0.0,0.0,0.69897,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.909381,0.0,0.69897,0.69897,0.0,0.0,0.0,0.0,0.0


## Normalization

In [15]:
def normalization(x):
    """Scale every column of ``x`` to unit Euclidean (L2) length.

    Parameters
    ----------
    x : pandas.DataFrame
        Numeric matrix whose columns are the vectors to normalise.

    Returns
    -------
    pandas.DataFrame
        A new frame with the same index and columns as ``x``; the input is
        left unmodified. Columns whose norm is 0 are returned unchanged
        (all zeros) instead of becoming NaN through a division by zero.
    """
    # Column norms are computed from the argument itself, not from a global.
    norms = np.sqrt(np.square(x).sum(axis=0))
    # Replace zero norms by 1 so that all-zero columns stay all-zero.
    safe_norms = norms.where(norms > 0, 1.0)

    return x.div(safe_norms, axis='columns')

In [16]:
# Run normalization() over the TF-IDF matrix (document and query columns) and show the result.
tfidf_normalized = normalization(tf_idf)
tfidf_normalized

Unnamed: 0,332.184 Orang Gunakan MRT Jakarta Pada Minggu Pertama Operasi,Ketua Wantimpres RI Apresiasi MRT Jakarta,Masyarakat Mulai Gunakan MRT Jakarta ke Tempat Kerja,Rata-rata 78 ribu orang Per Hari Gunakan MRT Jakarta,"Selama April 2019, Tarif MRT Jakarta Dipotong 50 Persen",MRT Jakarta Terapkan Perda DKI Jakarta Nomor 13 Tahun 2013,Fasilitas MRT Jakarta Berstandar Internasional,PT MRT Jakarta dan Crossrail Internasional Ltd Sepakati Kerja Sama Pengembangan SDM,PT MRT Jakarta Jalin Kerjasama dengan Crossrail Internasional Ltd,MRT Jakarta Gandeng Crossrail International,...,MRT Jakarta Kerjasama dengan Kodam Jaya Amankan Pembangunan Fase 2,"PT MRT Jakarta Menyepakati Kerja Sama dengan PT Pembangunan Jaya Ancol, Tbk untuk Pengerjaan Fase Kedua Bundaran HI – An",MRT Jakarta dan GO-JEK Kerja Sama Pengembangan Sistem Pembayaran,PT MRT Jakarta dan PT Kereta Api Indonesia (Persero) Sepakati Kerja Sama Pengembangan SDM,Kerja Sama Indonesia- Jepang (JICA): Proyek Pembangunan MRT Jakarta,Query 1,Query 2,Query 3,Query 4,Query 5
operasi,0.034248,0.037652,0.029757,0.018969,0.032334,0.000000,0.000000,0.000000,0.000000,0.000000,...,0.000000,0.033024,0.000000,0.047369,0.033970,0.000000,0.000000,0.00000,0.000000,0.000000
resmi,0.068060,0.000000,0.058559,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,...,0.083660,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.00000,0.000000,0.000000
senin,0.070308,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,...,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.00000,0.000000,0.000000
25,0.041785,0.059186,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.128268,0.000000,...,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.00000,0.000000,0.000000
maret,0.054364,0.000000,0.000000,0.044044,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,...,0.000000,0.067538,0.000000,0.068653,0.060626,0.000000,0.000000,0.00000,0.000000,0.000000
2019,0.038112,0.033696,0.000000,0.042602,0.042743,0.000000,0.000000,0.052250,0.000000,0.000000,...,0.000000,0.043656,0.000000,0.039086,0.034516,0.000000,0.000000,0.00000,0.000000,0.000000
catat,0.077777,0.000000,0.000000,0.063013,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,...,0.000000,0.000000,0.082881,0.000000,0.000000,0.000000,0.000000,0.00000,0.000000,0.000000
kamis,0.026048,0.036896,0.000000,0.000000,0.000000,0.000000,0.000000,0.057212,0.079960,0.059634,...,0.000000,0.000000,0.000000,0.000000,0.037793,0.000000,0.000000,0.00000,0.000000,0.000000
28,0.088304,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,...,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.00000,0.000000,0.000000
332184,0.088304,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,...,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.00000,0.000000,0.000000


## Cosine Similarity

In [17]:
def cosine_similarity(a, b):
    """Return the dot product of ``a`` and ``b``.

    The value equals the cosine similarity only when both vectors already
    have unit length; no normalisation is performed here.
    """
    left = np.asarray(a)
    right = np.asarray(b)
    return np.dot(left, right)

In [18]:
# Split the normalized matrix: document columns first, query columns after them.
n_documents = len(data)
train, test = tfidf_normalized.iloc[:, :n_documents], tfidf_normalized.iloc[:, n_documents:]

In [19]:
# Similarity of every query (column of `test`) to every document (column of
# `train`). The table is built in one step -- one column per query, one row per
# document in `train` column order, default integer index -- instead of
# concatenating onto an initially empty frame inside the loop.
result = pd.DataFrame({
    query_name: [
        cosine_similarity(test[query_name], train[document_name])
        for document_name in train
    ]
    for query_name in test
})

Hasil cosine similarity dari tiap dokumen berdasarkan masing-masing query

In [20]:
# Label each row of the similarity table with its document title.
result = result.set_index(train.columns)
result

Unnamed: 0,Query 1,Query 2,Query 3,Query 4,Query 5
332.184 Orang Gunakan MRT Jakarta Pada Minggu Pertama Operasi,0.033971,0.0001,0.027791,0.049213,0.011794
Ketua Wantimpres RI Apresiasi MRT Jakarta,0.065711,0.000149,0.021349,0.000124,0.022822
Masyarakat Mulai Gunakan MRT Jakarta ke Tempat Kerja,0.000134,0.000112,0.016871,0.05509,2.3e-05
Rata-rata 78 ribu orang Per Hari Gunakan MRT Jakarta,0.044048,9.3e-05,0.066614,7.7e-05,0.0153
"Selama April 2019, Tarif MRT Jakarta Dipotong 50 Persen",0.000146,0.043255,0.148855,0.000101,2.5e-05
MRT Jakarta Terapkan Perda DKI Jakarta Nomor 13 Tahun 2013,0.000149,0.040772,2.6e-05,0.000103,2.7e-05
Fasilitas MRT Jakarta Berstandar Internasional,7.8e-05,0.05619,1.5e-05,0.039994,1.6e-05
PT MRT Jakarta dan Crossrail Internasional Ltd Sepakati Kerja Sama Pengembangan SDM,0.000231,0.068793,3.7e-05,0.00016,3.9e-05
PT MRT Jakarta Jalin Kerjasama dengan Crossrail Internasional Ltd,0.000308,0.000257,5.4e-05,0.000213,5.6e-05
MRT Jakarta Gandeng Crossrail International,0.000259,0.000216,4.3e-05,0.000179,4.5e-05


## Document Ranking

#### Query 1: Pembangunan MRT Jakarta

In [21]:
# Top 15 documents for Query 1, highest similarity first.
result['Query 1'].sort_values(ascending=False).head(15).to_frame()

Unnamed: 0,Query 1
"Kembangkan SDM, MRT Jakarta Gandeng Perusahaan Asal Inggris",0.075667
MRT Jakarta Dapat Tawaran Kredit dari Pemerintah Inggris,0.069835
Kerja Sama Indonesia- Jepang (JICA): Proyek Pembangunan MRT Jakarta,0.06731
MRT Jakarta Kerjasama dengan Kodam Jaya Amankan Pembangunan Fase 2,0.066856
Ketua Wantimpres RI Apresiasi MRT Jakarta,0.065711
"PT MRT Jakarta Menyepakati Kerja Sama dengan PT Pembangunan Jaya Ancol, Tbk untuk Pengerjaan Fase Kedua Bundaran HI – An",0.0598
PT MRT Jakarta Sepakati Kerja Sama dengan Sejumlah BUMD DKI Jakarta,0.05941
"Siapkan SDM, MRT Jakarta Gandeng MTR Academy Hong Kong",0.052734
Rata-rata 78 ribu orang Per Hari Gunakan MRT Jakarta,0.044048
332.184 Orang Gunakan MRT Jakarta Pada Minggu Pertama Operasi,0.033971


#### Query 2: Fasilitas MRT Jakarta

In [22]:
# Top 15 documents for Query 2, highest similarity first.
result['Query 2'].sort_values(ascending=False).head(15).to_frame()

Unnamed: 0,Query 2
PT MRT Jakarta dan Crossrail Internasional Ltd Sepakati Kerja Sama Pengembangan SDM,0.068793
Fasilitas MRT Jakarta Berstandar Internasional,0.05619
MRT Jakarta dan UI Kerjasama Kembangkan SDM dan Teknologi,0.054983
Kerja Sama Indonesia- Jepang (JICA): Proyek Pembangunan MRT Jakarta,0.04547
MRT Jakarta dan GO-JEK Kerja Sama Pengembangan Sistem Pembayaran,0.043441
"Selama April 2019, Tarif MRT Jakarta Dipotong 50 Persen",0.043255
MRT Jakarta Terapkan Perda DKI Jakarta Nomor 13 Tahun 2013,0.040772
PT MRT Jakarta Sepakati Kerja Sama dengan Sejumlah BUMD DKI Jakarta,0.040134
"PT MRT Jakarta Menyepakati Kerja Sama dengan PT Pembangunan Jaya Ancol, Tbk untuk Pengerjaan Fase Kedua Bundaran HI – An",0.038935
PT MRT Jakarta Jalin Kerjasama dengan Crossrail Internasional Ltd,0.000257


#### Query 3: Harga tiket MRT

In [23]:
# Top 15 documents for Query 3, highest similarity first.
result['Query 3'].sort_values(ascending=False).head(15).to_frame()

Unnamed: 0,Query 3
"Selama April 2019, Tarif MRT Jakarta Dipotong 50 Persen",0.148855
Rata-rata 78 ribu orang Per Hari Gunakan MRT Jakarta,0.066614
MRT Jakarta dan GO-JEK Kerja Sama Pengembangan Sistem Pembayaran,0.035481
MRT Jakarta Raih Pendapatan Besar dari Hak Penamaan Stasiun,0.030509
332.184 Orang Gunakan MRT Jakarta Pada Minggu Pertama Operasi,0.027791
"MRT Jakarta Kerja Sama dengan GoJek, Pengemudi Untung",0.027705
"Jaga Kenyamanan Penumpang, MRT Jakarta Mulai Gerakan Zero Waste",0.023317
Ketua Wantimpres RI Apresiasi MRT Jakarta,0.021349
Masyarakat Mulai Gunakan MRT Jakarta ke Tempat Kerja,0.016871
PT MRT Jakarta Jalin Kerjasama dengan Crossrail Internasional Ltd,5.4e-05


#### Query 4: Rute MRT Jakarta

In [24]:
# Top 15 documents for Query 4, highest similarity first.
result['Query 4'].sort_values(ascending=False).head(15).to_frame()

Unnamed: 0,Query 4
"Kembangkan SDM, MRT Jakarta Gandeng Perusahaan Asal Inggris",0.080286
"PT MRT Jakarta Menyepakati Kerja Sama dengan PT Pembangunan Jaya Ancol, Tbk untuk Pengerjaan Fase Kedua Bundaran HI – An",0.069407
"MRT Jakarta Kerja Sama dengan GoJek, Pengemudi Untung",0.061264
Masyarakat Mulai Gunakan MRT Jakarta ke Tempat Kerja,0.05509
Kerja Sama Indonesia- Jepang (JICA): Proyek Pembangunan MRT Jakarta,0.054916
332.184 Orang Gunakan MRT Jakarta Pada Minggu Pertama Operasi,0.049213
Fasilitas MRT Jakarta Berstandar Internasional,0.039994
PT MRT Jakarta Jalin Kerjasama dengan Crossrail Internasional Ltd,0.000213
PT MRT Jakarta Jalin Kerja Sama Pengembangan SDM,0.000211
MRT Jakarta Gandeng Crossrail International,0.000179


#### Query 5: Biaya Pembangunan MRT

In [25]:
# Top 15 documents for Query 5, highest similarity first.
result['Query 5'].sort_values(ascending=False).head(15).to_frame()

Unnamed: 0,Query 5
MRT Jakarta dan GO-JEK Kerja Sama Pengembangan Sistem Pembayaran,0.118942
"Siapkan SDM Kereta, MRT Jakarta Gandeng Monash University",0.089385
"Kembangkan SDM, MRT Jakarta Gandeng Perusahaan Asal Inggris",0.026287
MRT Jakarta Dapat Tawaran Kredit dari Pemerintah Inggris,0.024253
Kerja Sama Indonesia- Jepang (JICA): Proyek Pembangunan MRT Jakarta,0.023377
MRT Jakarta Kerjasama dengan Kodam Jaya Amankan Pembangunan Fase 2,0.023218
Ketua Wantimpres RI Apresiasi MRT Jakarta,0.022822
"PT MRT Jakarta Menyepakati Kerja Sama dengan PT Pembangunan Jaya Ancol, Tbk untuk Pengerjaan Fase Kedua Bundaran HI – An",0.020769
PT MRT Jakarta Sepakati Kerja Sama dengan Sejumlah BUMD DKI Jakarta,0.020631
"Siapkan SDM, MRT Jakarta Gandeng MTR Academy Hong Kong",0.018302
