# Content-Based Recommendation

In [1]:
import os
import pandas as pd
import numpy as np

In [3]:
from IPython.display import Markdown, display
from tqdm import tqdm
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import linear_kernel

## Data Preprocessing

In [4]:
# Root folder of the raw corpus, resolved to an absolute path.
DATA_DIR = os.path.abspath(os.path.join('.', 'datasets', '20_news'))
# Output location, kept as a path relative to the working directory.
OUTPUT_DIR = './datasets/output'

In [5]:
# Output location, kept as a path relative to the working directory.
OUTPUT_DIR = './datasets/output'
# The raw documents are read directly from the dataset root.
RAW_DATA_DIR = DATA_DIR

In [6]:
# Each sub-directory of RAW_DATA_DIR is treated as one class label.
# os.listdir() returns entries in arbitrary order, so the names are sorted to
# keep the row order reproducible across machines; non-directory entries are
# skipped because the loading step lists the contents of every class path.
classes = sorted(
    entry
    for entry in os.listdir(RAW_DATA_DIR)
    if os.path.isdir(os.path.join(RAW_DATA_DIR, entry))
)
columns = ['id', 'class', 'text']

# Column-oriented accumulator: one list per column, appended to in lock-step
# while the documents are loaded.
data_dict = {column: [] for column in columns}


In [7]:
# Read every document of every class into data_dict.
# A file that cannot be opened or decoded as UTF-8 is skipped, and the reason
# is reported so that systematic problems (e.g. a wrong encoding) are visible
# instead of being hidden behind a generic message.
for label in classes:
    files = os.path.join(RAW_DATA_DIR, label)  # directory holding this class's documents
    # Sorted so the resulting row order does not depend on the file system.
    for f in tqdm(sorted(os.listdir(files)), desc=label):
        id_ = f.split('.')[0]  # file name up to the first dot is used as the document id
        try:
            with open(os.path.join(files, f), encoding='utf-8') as content:
                text = content.read().strip()
        except (OSError, UnicodeError) as err:
            # Only I/O and decoding failures are expected here; anything else
            # (including KeyboardInterrupt) is allowed to propagate.
            # tqdm.write keeps the message from interleaving with the progress bar.
            tqdm.write(f"{label} {id_} Failed to load: {type(err).__name__}: {err}")
            continue
        # Adding corresponding data to the dictionary
        data_dict['id'].append(id_)
        data_dict['class'].append(label)
        data_dict['text'].append(text)


  0%|          | 0/200 [00:00<?, ?it/s]

Agriculture 101 Failed to load
Agriculture 102 Failed to load
Agriculture 103 Failed to load
Agriculture 104 Failed to load
Agriculture 105 Failed to load
Agriculture 106 Failed to load
Agriculture 107 Failed to load
Agriculture 108 Failed to load
Agriculture 109 Failed to load
Agriculture 110 Failed to load
Agriculture 111 Failed to load
Agriculture 112 Failed to load
Agriculture 113 Failed to load
Agriculture 114 Failed to load


  9%|▉         | 18/200 [00:00<00:01, 168.21it/s]

Agriculture 115 Failed to load
Agriculture 116 Failed to load
Agriculture 117 Failed to load
Agriculture 118 Failed to load
Agriculture 119 Failed to load
Agriculture 120 Failed to load
Agriculture 121 Failed to load
Agriculture 122 Failed to load
Agriculture 123 Failed to load
Agriculture 124 Failed to load
Agriculture 125 Failed to load
Agriculture 126 Failed to load
Agriculture 127 Failed to load


 16%|█▌        | 32/200 [00:00<00:01, 156.50it/s]

Agriculture 128 Failed to load
Agriculture 129 Failed to load
Agriculture 130 Failed to load
Agriculture 131 Failed to load
Agriculture 132 Failed to load
Agriculture 133 Failed to load
Agriculture 134 Failed to load
Agriculture 135 Failed to load
Agriculture 136 Failed to load
Agriculture 137 Failed to load
Agriculture 138 Failed to load
Agriculture 139 Failed to load
Agriculture 140 Failed to load


 24%|██▎       | 47/200 [00:00<00:00, 153.53it/s]

Agriculture 141 Failed to load
Agriculture 142 Failed to load
Agriculture 143 Failed to load
Agriculture 144 Failed to load
Agriculture 145 Failed to load
Agriculture 146 Failed to load
Agriculture 147 Failed to load
Agriculture 148 Failed to load
Agriculture 149 Failed to load
Agriculture 150 Failed to load
Agriculture 151 Failed to load
Agriculture 152 Failed to load
Agriculture 153 Failed to load


 30%|███       | 61/200 [00:00<00:00, 148.27it/s]

Agriculture 154 Failed to load
Agriculture 155 Failed to load
Agriculture 156 Failed to load
Agriculture 157 Failed to load
Agriculture 158 Failed to load
Agriculture 159 Failed to load
Agriculture 160 Failed to load
Agriculture 161 Failed to load
Agriculture 162 Failed to load
Agriculture 163 Failed to load
Agriculture 164 Failed to load
Agriculture 165 Failed to load
Agriculture 166 Failed to load


 38%|███▊      | 75/200 [00:00<00:00, 142.13it/s]

Agriculture 167 Failed to load
Agriculture 168 Failed to load
Agriculture 169 Failed to load
Agriculture 170 Failed to load
Agriculture 171 Failed to load
Agriculture 172 Failed to load
Agriculture 173 Failed to load
Agriculture 174 Failed to load
Agriculture 175 Failed to load
Agriculture 176 Failed to load
Agriculture 177 Failed to load
Agriculture 178 Failed to load
Agriculture 179 Failed to load


 45%|████▌     | 90/200 [00:00<00:00, 143.58it/s]

Agriculture 180 Failed to load
Agriculture 181 Failed to load
Agriculture 182 Failed to load
Agriculture 183 Failed to load
Agriculture 184 Failed to load
Agriculture 185 Failed to load
Agriculture 186 Failed to load
Agriculture 187 Failed to load
Agriculture 188 Failed to load
Agriculture 189 Failed to load
Agriculture 190 Failed to load
Agriculture 191 Failed to load
Agriculture 192 Failed to load


 52%|█████▏    | 104/200 [00:00<00:00, 140.77it/s]

Agriculture 193 Failed to load
Agriculture 194 Failed to load
Agriculture 195 Failed to load
Agriculture 196 Failed to load
Agriculture 197 Failed to load
Agriculture 198 Failed to load
Agriculture 199 Failed to load
Agriculture 200 Failed to load


100%|██████████| 200/200 [00:00<00:00, 232.28it/s]
  0%|          | 0/246 [00:00<?, ?it/s]

Automobiles 100 Failed to load
Automobiles 101 Failed to load
Automobiles 102 Failed to load
Automobiles 103 Failed to load
Automobiles 104 Failed to load
Automobiles 105 Failed to load
Automobiles 106 Failed to load
Automobiles 107 Failed to load
Automobiles 108 Failed to load
Automobiles 109 Failed to load
Automobiles 110 Failed to load
Automobiles 111 Failed to load
Automobiles 112 Failed to load
Automobiles 113 Failed to load


  7%|▋         | 17/246 [00:00<00:01, 166.68it/s]

Automobiles 114 Failed to load
Automobiles 115 Failed to load
Automobiles 116 Failed to load
Automobiles 117 Failed to load
Automobiles 118 Failed to load
Automobiles 119 Failed to load
Automobiles 120 Failed to load
Automobiles 121 Failed to load
Automobiles 122 Failed to load
Automobiles 123 Failed to load
Automobiles 124 Failed to load
Automobiles 125 Failed to load
Automobiles 126 Failed to load
Automobiles 127 Failed to load


 13%|█▎        | 32/246 [00:00<00:01, 158.74it/s]

Automobiles 128 Failed to load
Automobiles 129 Failed to load
Automobiles 130 Failed to load
Automobiles 131 Failed to load
Automobiles 132 Failed to load
Automobiles 133 Failed to load
Automobiles 134 Failed to load
Automobiles 135 Failed to load
Automobiles 136 Failed to load
Automobiles 137 Failed to load
Automobiles 138 Failed to load
Automobiles 139 Failed to load
Automobiles 140 Failed to load
Automobiles 141 Failed to load


 20%|█▉        | 48/246 [00:00<00:01, 157.23it/s]

Automobiles 142 Failed to load
Automobiles 143 Failed to load
Automobiles 144 Failed to load
Automobiles 145 Failed to load
Automobiles 146 Failed to load
Automobiles 147 Failed to load
Automobiles 148 Failed to load
Automobiles 149 Failed to load
Automobiles 150 Failed to load
Automobiles 151 Failed to load
Automobiles 152 Failed to load
Automobiles 153 Failed to load
Automobiles 154 Failed to load
Automobiles 155 Failed to load
Automobiles 156 Failed to load
Automobiles 157 Failed to load


 26%|██▋       | 65/246 [00:00<00:01, 160.40it/s]

Automobiles 158 Failed to load
Automobiles 159 Failed to load
Automobiles 160 Failed to load
Automobiles 161 Failed to load
Automobiles 162 Failed to load
Automobiles 163 Failed to load
Automobiles 164 Failed to load
Automobiles 165 Failed to load
Automobiles 166 Failed to load
Automobiles 167 Failed to load
Automobiles 168 Failed to load
Automobiles 169 Failed to load
Automobiles 170 Failed to load
Automobiles 171 Failed to load
Automobiles 172 Failed to load
Automobiles 173 Failed to load
Automobiles 174 Failed to load
Automobiles 175 Failed to load
Automobiles 176 Failed to load
Automobiles 177 Failed to load
Automobiles 178 Failed to load
Automobiles 179 Failed to load


 36%|███▌      | 89/246 [00:00<00:00, 177.74it/s]

Automobiles 180 Failed to load
Automobiles 181 Failed to load
Automobiles 182 Failed to load
Automobiles 183 Failed to load
Automobiles 184 Failed to load
Automobiles 185 Failed to load
Automobiles 186 Failed to load
Automobiles 187 Failed to load
Automobiles 188 Failed to load
Automobiles 189 Failed to load
Automobiles 190 Failed to load
Automobiles 191 Failed to load
Automobiles 192 Failed to load
Automobiles 193 Failed to load
Automobiles 194 Failed to load
Automobiles 195 Failed to load
Automobiles 196 Failed to load


 65%|██████▌   | 161/246 [00:00<00:00, 229.62it/s]

Automobiles 34 Failed to load
Automobiles 60 Failed to load
Automobiles 66 Failed to load
Automobiles 96 Failed to load
Automobiles 97 Failed to load
Automobiles 98 Failed to load
Automobiles 99 Failed to load


100%|██████████| 246/246 [00:00<00:00, 356.52it/s]
  0%|          | 0/617 [00:00<?, ?it/s]

Bank 100 Failed to load


 25%|██▍       | 153/617 [00:00<00:00, 1529.99it/s]

Bank 274 Failed to load
Bank 285 Failed to load
Bank 286 Failed to load
Bank 311 Failed to load


 39%|███▊      | 238/617 [00:00<00:00, 1233.83it/s]

Bank 382 Failed to load


 55%|█████▌    | 342/617 [00:00<00:00, 1164.59it/s]

Bank 426 Failed to load
Bank 427 Failed to load
Bank 428 Failed to load
Bank 429 Failed to load
Bank 430 Failed to load
Bank 431 Failed to load
Bank 432 Failed to load
Bank 433 Failed to load
Bank 434 Failed to load
Bank 435 Failed to load
Bank 436 Failed to load
Bank 437 Failed to load
Bank 438 Failed to load
Bank 439 Failed to load
Bank 440 Failed to load
Bank 441 Failed to load
Bank 442 Failed to load
Bank 443 Failed to load
Bank 444 Failed to load
Bank 445 Failed to load
Bank 446 Failed to load
Bank 447 Failed to load
Bank 448 Failed to load
Bank 449 Failed to load
Bank 450 Failed to load
Bank 451 Failed to load
Bank 452 Failed to load
Bank 453 Failed to load
Bank 454 Failed to load
Bank 455 Failed to load
Bank 456 Failed to load
Bank 457 Failed to load
Bank 458 Failed to load
Bank 459 Failed to load
Bank 460 Failed to load
Bank 461 Failed to load
Bank 462 Failed to load
Bank 463 Failed to load
Bank 464 Failed to load
Bank 465 Failed to load
Bank 466 Failed to load
Bank 467 Failed 

 67%|██████▋   | 414/617 [00:00<00:00, 521.45it/s] 

Bank 472 Failed to load
Bank 473 Failed to load
Bank 474 Failed to load
Bank 475 Failed to load
Bank 476 Failed to load
Bank 477 Failed to load
Bank 478 Failed to load
Bank 479 Failed to load
Bank 480 Failed to load
Bank 481 Failed to load
Bank 482 Failed to load
Bank 483 Failed to load
Bank 484 Failed to load
Bank 485 Failed to load
Bank 486 Failed to load
Bank 487 Failed to load
Bank 488 Failed to load
Bank 489 Failed to load
Bank 490 Failed to load
Bank 491 Failed to load
Bank 492 Failed to load
Bank 493 Failed to load
Bank 494 Failed to load
Bank 495 Failed to load
Bank 496 Failed to load
Bank 497 Failed to load
Bank 498 Failed to load
Bank 499 Failed to load
Bank 500 Failed to load
Bank 501 Failed to load
Bank 502 Failed to load
Bank 503 Failed to load
Bank 504 Failed to load
Bank 505 Failed to load
Bank 506 Failed to load
Bank 507 Failed to load
Bank 508 Failed to load
Bank 509 Failed to load
Bank 510 Failed to load
Bank 511 Failed to load
Bank 512 Failed to load
Bank 513 Failed 

 76%|███████▋  | 471/617 [00:00<00:00, 333.89it/s]

Bank 523 Failed to load
Bank 524 Failed to load
Bank 525 Failed to load
Bank 526 Failed to load
Bank 527 Failed to load
Bank 528 Failed to load
Bank 529 Failed to load
Bank 530 Failed to load
Bank 531 Failed to load
Bank 532 Failed to load
Bank 533 Failed to load
Bank 534 Failed to load
Bank 535 Failed to load
Bank 536 Failed to load
Bank 537 Failed to load
Bank 538 Failed to load
Bank 539 Failed to load
Bank 540 Failed to load
Bank 541 Failed to load
Bank 542 Failed to load
Bank 543 Failed to load
Bank 544 Failed to load
Bank 545 Failed to load
Bank 546 Failed to load
Bank 547 Failed to load
Bank 548 Failed to load
Bank 549 Failed to load
Bank 550 Failed to load
Bank 551 Failed to load
Bank 552 Failed to load
Bank 553 Failed to load
Bank 554 Failed to load
Bank 555 Failed to load
Bank 556 Failed to load
Bank 557 Failed to load
Bank 558 Failed to load
Bank 559 Failed to load
Bank 560 Failed to load
Bank 561 Failed to load
Bank 562 Failed to load
Bank 563 Failed to load
Bank 564 Failed 

 84%|████████▍ | 517/617 [00:01<00:00, 288.51it/s]

Bank 565 Failed to load
Bank 566 Failed to load
Bank 567 Failed to load
Bank 568 Failed to load
Bank 569 Failed to load
Bank 570 Failed to load
Bank 571 Failed to load
Bank 572 Failed to load
Bank 573 Failed to load
Bank 574 Failed to load
Bank 575 Failed to load
Bank 576 Failed to load
Bank 577 Failed to load
Bank 578 Failed to load
Bank 579 Failed to load
Bank 580 Failed to load
Bank 581 Failed to load
Bank 582 Failed to load
Bank 583 Failed to load
Bank 584 Failed to load
Bank 585 Failed to load
Bank 586 Failed to load
Bank 587 Failed to load
Bank 588 Failed to load
Bank 589 Failed to load
Bank 590 Failed to load
Bank 591 Failed to load
Bank 592 Failed to load
Bank 593 Failed to load
Bank 594 Failed to load
Bank 595 Failed to load
Bank 596 Failed to load
Bank 597 Failed to load
Bank 598 Failed to load
Bank 599 Failed to load


 90%|█████████ | 556/617 [00:01<00:00, 265.62it/s]

Bank 600 Failed to load
Bank 601 Failed to load
Bank 602 Failed to load
Bank 603 Failed to load
Bank 604 Failed to load
Bank 605 Failed to load
Bank 606 Failed to load
Bank 607 Failed to load
Bank 608 Failed to load
Bank 609 Failed to load
Bank 610 Failed to load
Bank 611 Failed to load
Bank 612 Failed to load
Bank 613 Failed to load
Bank 614 Failed to load
Bank 615 Failed to load
Bank 616 Failed to load
Bank 617 Failed to load
Bank 67 Failed to load
Bank 68 Failed to load
Bank 69 Failed to load
Bank 70 Failed to load
Bank 71 Failed to load
Bank 72 Failed to load
Bank 73 Failed to load
Bank 74 Failed to load


 96%|█████████▌| 590/617 [00:01<00:00, 261.94it/s]

Bank 89 Failed to load


100%|██████████| 617/617 [00:01<00:00, 419.73it/s]
 68%|██████▊   | 177/259 [00:00<00:00, 1752.50it/s]

Blog 49 Failed to load


100%|██████████| 259/259 [00:00<00:00, 1532.58it/s]
  0%|          | 0/307 [00:00<?, ?it/s]

Business 143 Failed to load
Business 144 Failed to load
Business 145 Failed to load
Business 146 Failed to load
Business 147 Failed to load
Business 148 Failed to load
Business 149 Failed to load
Business 150 Failed to load
Business 151 Failed to load
Business 152 Failed to load
Business 153 Failed to load


 20%|█▉        | 61/307 [00:00<00:00, 592.23it/s]

Business 154 Failed to load
Business 155 Failed to load
Business 156 Failed to load
Business 157 Failed to load
Business 158 Failed to load
Business 160 Failed to load
Business 162 Failed to load
Business 164 Failed to load
Business 166 Failed to load
Business 168 Failed to load
Business 170 Failed to load
Business 172 Failed to load
Business 174 Failed to load
Business 176 Failed to load
Business 178 Failed to load
Business 180 Failed to load


 30%|██▉       | 91/307 [00:00<00:00, 454.13it/s]

Business 182 Failed to load
Business 184 Failed to load
Business 186 Failed to load
Business 188 Failed to load
Business 190 Failed to load
Business 192 Failed to load
Business 194 Failed to load
Business 196 Failed to load
Business 198 Failed to load
Business 200 Failed to load
Business 202 Failed to load
Business 204 Failed to load
Business 206 Failed to load
Business 208 Failed to load
Business 210 Failed to load
Business 212 Failed to load


 41%|████▏     | 127/307 [00:00<00:00, 421.08it/s]

Business 214 Failed to load
Business 216 Failed to load
Business 218 Failed to load
Business 220 Failed to load
Business 222 Failed to load
Business 224 Failed to load
Business 226 Failed to load
Business 228 Failed to load
Business 230 Failed to load
Business 232 Failed to load
Business 234 Failed to load
Business 236 Failed to load
Business 238 Failed to load
Business 240 Failed to load
Business 242 Failed to load
Business 244 Failed to load
Business 246 Failed to load


 53%|█████▎    | 164/307 [00:00<00:00, 397.80it/s]

Business 248 Failed to load
Business 250 Failed to load
Business 252 Failed to load
Business 254 Failed to load
Business 256 Failed to load
Business 258 Failed to load
Business 259 Failed to load
Business 260 Failed to load
Business 261 Failed to load
Business 262 Failed to load
Business 263 Failed to load
Business 264 Failed to load
Business 265 Failed to load
Business 266 Failed to load
Business 267 Failed to load
Business 268 Failed to load
Business 269 Failed to load
Business 270 Failed to load
Business 271 Failed to load
Business 272 Failed to load


 63%|██████▎   | 193/307 [00:00<00:00, 340.28it/s]

Business 273 Failed to load
Business 274 Failed to load
Business 275 Failed to load
Business 276 Failed to load
Business 277 Failed to load
Business 278 Failed to load
Business 279 Failed to load
Business 280 Failed to load
Business 281 Failed to load
Business 282 Failed to load
Business 283 Failed to load
Business 284 Failed to load
Business 285 Failed to load
Business 286 Failed to load
Business 287 Failed to load
Business 288 Failed to load
Business 289 Failed to load
Business 290 Failed to load
Business 291 Failed to load
Business 292 Failed to load
Business 293 Failed to load
Business 294 Failed to load
Business 295 Failed to load
Business 296 Failed to load
Business 297 Failed to load
Business 298 Failed to load


 72%|███████▏  | 221/307 [00:00<00:00, 276.96it/s]

Business 299 Failed to load
Business 300 Failed to load
Business 301 Failed to load
Business 302 Failed to load
Business 303 Failed to load
Business 304 Failed to load
Business 305 Failed to load
Business 306 Failed to load
Business 307 Failed to load
Business 51 Failed to load
Business 62 Failed to load
Business 64 Failed to load


 88%|████████▊ | 269/307 [00:00<00:00, 317.21it/s]

Business 85 Failed to load


100%|██████████| 307/307 [00:00<00:00, 376.67it/s]
  0%|          | 0/600 [00:00<?, ?it/s]

Economy 1 Failed to load
Economy 2 Failed to load


 19%|█▉        | 113/600 [00:00<00:00, 1129.98it/s]

Economy 226 Failed to load
Economy 23 Failed to load
Economy 233 Failed to load
Economy 243 Failed to load
Economy 263 Failed to load


 36%|███▋      | 219/600 [00:00<00:00, 1108.01it/s]

Economy 3 Failed to load
Economy 322 Failed to load
Economy 355 Failed to load
Economy 390 Failed to load


 55%|█████▌    | 330/600 [00:00<00:00, 1105.33it/s]

Economy 4 Failed to load
Economy 505 Failed to load
Economy 506 Failed to load
Economy 507 Failed to load


 76%|███████▌  | 454/600 [00:00<00:00, 1133.16it/s]

Economy 508 Failed to load
Economy 509 Failed to load
Economy 510 Failed to load
Economy 511 Failed to load
Economy 512 Failed to load
Economy 513 Failed to load
Economy 514 Failed to load
Economy 515 Failed to load
Economy 516 Failed to load
Economy 517 Failed to load
Economy 518 Failed to load
Economy 519 Failed to load
Economy 520 Failed to load
Economy 521 Failed to load
Economy 522 Failed to load
Economy 523 Failed to load
Economy 524 Failed to load
Economy 525 Failed to load
Economy 526 Failed to load
Economy 527 Failed to load
Economy 528 Failed to load
Economy 529 Failed to load
Economy 530 Failed to load
Economy 531 Failed to load
Economy 532 Failed to load
Economy 533 Failed to load
Economy 534 Failed to load
Economy 535 Failed to load
Economy 536 Failed to load
Economy 537 Failed to load
Economy 538 Failed to load
Economy 539 Failed to load
Economy 540 Failed to load
Economy 541 Failed to load
Economy 542 Failed to load
Economy 543 Failed to load
Economy 544 Failed to load
E

 90%|█████████ | 541/600 [00:00<00:00, 474.52it/s] 

Economy 587 Failed to load
Economy 588 Failed to load
Economy 589 Failed to load
Economy 590 Failed to load
Economy 591 Failed to load
Economy 592 Failed to load
Economy 593 Failed to load
Economy 594 Failed to load
Economy 595 Failed to load
Economy 596 Failed to load
Economy 597 Failed to load
Economy 598 Failed to load
Economy 599 Failed to load
Economy 600 Failed to load
Economy 81 Failed to load
Economy 89 Failed to load


100%|██████████| 600/600 [00:00<00:00, 632.24it/s]
  0%|          | 0/185 [00:00<?, ?it/s]

Education 137 Failed to load
Education 138 Failed to load
Education 139 Failed to load
Education 140 Failed to load
Education 141 Failed to load
Education 142 Failed to load
Education 143 Failed to load
Education 144 Failed to load
Education 146 Failed to load
Education 147 Failed to load
Education 149 Failed to load
Education 150 Failed to load
Education 151 Failed to load


 32%|███▏      | 59/185 [00:00<00:00, 578.44it/s]

Education 152 Failed to load
Education 153 Failed to load
Education 154 Failed to load
Education 155 Failed to load
Education 156 Failed to load
Education 157 Failed to load
Education 158 Failed to load
Education 159 Failed to load
Education 161 Failed to load
Education 162 Failed to load
Education 163 Failed to load
Education 164 Failed to load
Education 165 Failed to load
Education 166 Failed to load
Education 167 Failed to load
Education 168 Failed to load
Education 169 Failed to load
Education 171 Failed to load


 44%|████▍     | 81/185 [00:00<00:00, 380.47it/s]

Education 172 Failed to load
Education 173 Failed to load
Education 174 Failed to load
Education 175 Failed to load
Education 176 Failed to load
Education 177 Failed to load
Education 178 Failed to load
Education 179 Failed to load
Education 180 Failed to load
Education 181 Failed to load
Education 182 Failed to load
Education 183 Failed to load
Education 184 Failed to load
Education 185 Failed to load
Education 20 Failed to load


100%|██████████| 185/185 [00:00<00:00, 533.14it/s]
  0%|          | 0/304 [00:00<?, ?it/s]

Employment 103 Failed to load
Employment 105 Failed to load
Employment 122 Failed to load
Employment 143 Failed to load
Employment 205 Failed to load


 39%|███▉      | 119/304 [00:00<00:00, 1178.48it/s]

Employment 206 Failed to load
Employment 207 Failed to load
Employment 208 Failed to load
Employment 209 Failed to load
Employment 210 Failed to load
Employment 211 Failed to load
Employment 212 Failed to load
Employment 213 Failed to load
Employment 214 Failed to load
Employment 215 Failed to load
Employment 216 Failed to load
Employment 217 Failed to load
Employment 218 Failed to load
Employment 219 Failed to load
Employment 220 Failed to load
Employment 221 Failed to load
Employment 222 Failed to load
Employment 223 Failed to load
Employment 224 Failed to load
Employment 225 Failed to load
Employment 226 Failed to load
Employment 227 Failed to load
Employment 228 Failed to load
Employment 229 Failed to load
Employment 230 Failed to load
Employment 231 Failed to load
Employment 232 Failed to load
Employment 233 Failed to load
Employment 234 Failed to load
Employment 235 Failed to load
Employment 236 Failed to load
Employment 237 Failed to load
Employment 238 Failed to load


 51%|█████     | 155/304 [00:00<00:00, 471.93it/s] 

Employment 239 Failed to load
Employment 240 Failed to load
Employment 241 Failed to load
Employment 242 Failed to load
Employment 243 Failed to load
Employment 244 Failed to load
Employment 245 Failed to load
Employment 246 Failed to load
Employment 247 Failed to load
Employment 248 Failed to load
Employment 249 Failed to load
Employment 250 Failed to load
Employment 251 Failed to load
Employment 252 Failed to load
Employment 253 Failed to load
Employment 254 Failed to load
Employment 255 Failed to load
Employment 256 Failed to load
Employment 257 Failed to load
Employment 258 Failed to load
Employment 259 Failed to load
Employment 260 Failed to load
Employment 261 Failed to load
Employment 262 Failed to load
Employment 263 Failed to load
Employment 264 Failed to load
Employment 265 Failed to load
Employment 266 Failed to load


 61%|██████    | 186/304 [00:00<00:00, 333.04it/s]

Employment 267 Failed to load
Employment 268 Failed to load
Employment 269 Failed to load
Employment 27 Failed to load
Employment 270 Failed to load
Employment 271 Failed to load
Employment 272 Failed to load
Employment 273 Failed to load
Employment 274 Failed to load
Employment 275 Failed to load
Employment 276 Failed to load
Employment 277 Failed to load
Employment 278 Failed to load
Employment 279 Failed to load
Employment 280 Failed to load
Employment 281 Failed to load
Employment 283 Failed to load
Employment 284 Failed to load
Employment 285 Failed to load
Employment 286 Failed to load
Employment 287 Failed to load
Employment 288 Failed to load
Employment 289 Failed to load
Employment 290 Failed to load
Employment 291 Failed to load


 70%|███████   | 214/304 [00:00<00:00, 280.96it/s]

Employment 292 Failed to load
Employment 293 Failed to load
Employment 294 Failed to load
Employment 295 Failed to load
Employment 296 Failed to load
Employment 297 Failed to load
Employment 298 Failed to load
Employment 299 Failed to load
Employment 300 Failed to load
Employment 301 Failed to load
Employment 302 Failed to load
Employment 303 Failed to load
Employment 304 Failed to load


 88%|████████▊ | 266/304 [00:00<00:00, 325.31it/s]

Employment 88 Failed to load


100%|██████████| 304/304 [00:00<00:00, 428.18it/s]
  0%|          | 0/634 [00:00<?, ?it/s]

Entertainment 1 Failed to load
Entertainment 101 Failed to load
Entertainment 168 Failed to load
Entertainment 2 Failed to load


 21%|██        | 132/634 [00:00<00:00, 1306.95it/s]

Entertainment 3 Failed to load


 42%|████▏     | 264/634 [00:00<00:00, 1310.74it/s]

Entertainment 364 Failed to load
Entertainment 4 Failed to load
Entertainment 402 Failed to load


 60%|██████    | 382/634 [00:00<00:00, 1264.59it/s]

Entertainment 505 Failed to load
Entertainment 506 Failed to load
Entertainment 507 Failed to load
Entertainment 508 Failed to load
Entertainment 509 Failed to load
Entertainment 510 Failed to load
Entertainment 511 Failed to load
Entertainment 512 Failed to load
Entertainment 513 Failed to load
Entertainment 514 Failed to load
Entertainment 515 Failed to load
Entertainment 516 Failed to load


 73%|███████▎  | 464/634 [00:00<00:00, 1011.23it/s]

Entertainment 517 Failed to load
Entertainment 518 Failed to load
Entertainment 519 Failed to load
Entertainment 520 Failed to load
Entertainment 521 Failed to load
Entertainment 522 Failed to load
Entertainment 523 Failed to load
Entertainment 524 Failed to load
Entertainment 525 Failed to load
Entertainment 526 Failed to load
Entertainment 527 Failed to load
Entertainment 528 Failed to load
Entertainment 529 Failed to load
Entertainment 530 Failed to load
Entertainment 531 Failed to load
Entertainment 532 Failed to load
Entertainment 533 Failed to load
Entertainment 534 Failed to load
Entertainment 535 Failed to load
Entertainment 536 Failed to load
Entertainment 537 Failed to load
Entertainment 538 Failed to load
Entertainment 539 Failed to load
Entertainment 540 Failed to load
Entertainment 541 Failed to load
Entertainment 542 Failed to load
Entertainment 543 Failed to load
Entertainment 544 Failed to load
Entertainment 545 Failed to load
Entertainment 546 Failed to load
Entertainm

 86%|████████▌ | 543/634 [00:00<00:00, 438.68it/s] 

Entertainment 84 Failed to load


100%|██████████| 634/634 [00:00<00:00, 700.55it/s]
  0%|          | 0/180 [00:00<?, ?it/s]

Health 1 Failed to load
Health 10 Failed to load
Health 100 Failed to load
Health 101 Failed to load
Health 102 Failed to load
Health 103 Failed to load
Health 104 Failed to load
Health 105 Failed to load
Health 106 Failed to load
Health 107 Failed to load
Health 108 Failed to load
Health 109 Failed to load
Health 11 Failed to load
Health 110 Failed to load
Health 111 Failed to load
Health 112 Failed to load
Health 113 Failed to load
Health 114 Failed to load
Health 115 Failed to load


 11%|█         | 19/180 [00:00<00:00, 188.11it/s]

Health 116 Failed to load
Health 117 Failed to load
Health 118 Failed to load
Health 119 Failed to load
Health 12 Failed to load
Health 120 Failed to load
Health 121 Failed to load
Health 122 Failed to load
Health 123 Failed to load
Health 124 Failed to load
Health 125 Failed to load
Health 126 Failed to load
Health 127 Failed to load
Health 128 Failed to load
Health 129 Failed to load
Health 13 Failed to load
Health 130 Failed to load
Health 131 Failed to load
Health 132 Failed to load


 21%|██        | 38/180 [00:00<00:00, 188.12it/s]

Health 133 Failed to load
Health 134 Failed to load
Health 135 Failed to load
Health 136 Failed to load
Health 137 Failed to load
Health 138 Failed to load
Health 139 Failed to load
Health 14 Failed to load
Health 140 Failed to load
Health 141 Failed to load
Health 142 Failed to load
Health 143 Failed to load
Health 144 Failed to load
Health 145 Failed to load
Health 146 Failed to load
Health 147 Failed to load
Health 148 Failed to load
Health 149 Failed to load
Health 15 Failed to load


 32%|███▏      | 57/180 [00:00<00:00, 187.56it/s]

Health 150 Failed to load
Health 151 Failed to load
Health 152 Failed to load
Health 153 Failed to load
Health 154 Failed to load
Health 155 Failed to load
Health 156 Failed to load
Health 157 Failed to load
Health 158 Failed to load
Health 159 Failed to load
Health 16 Failed to load
Health 160 Failed to load
Health 161 Failed to load
Health 162 Failed to load
Health 163 Failed to load
Health 164 Failed to load
Health 165 Failed to load
Health 166 Failed to load
Health 167 Failed to load
Health 168 Failed to load


 43%|████▎     | 77/180 [00:00<00:00, 188.96it/s]

Health 169 Failed to load
Health 17 Failed to load
Health 170 Failed to load
Health 171 Failed to load
Health 172 Failed to load
Health 173 Failed to load
Health 174 Failed to load
Health 175 Failed to load
Health 176 Failed to load
Health 177 Failed to load
Health 178 Failed to load
Health 179 Failed to load
Health 18 Failed to load
Health 180 Failed to load
Health 19 Failed to load
Health 2 Failed to load
Health 20 Failed to load
Health 21 Failed to load
Health 22 Failed to load


 53%|█████▎    | 96/180 [00:00<00:00, 188.71it/s]

Health 23 Failed to load
Health 24 Failed to load
Health 25 Failed to load
Health 26 Failed to load
Health 27 Failed to load
Health 28 Failed to load
Health 29 Failed to load
Health 3 Failed to load
Health 30 Failed to load
Health 31 Failed to load
Health 32 Failed to load
Health 33 Failed to load
Health 34 Failed to load
Health 35 Failed to load
Health 36 Failed to load
Health 37 Failed to load
Health 38 Failed to load
Health 39 Failed to load


 63%|██████▎   | 114/180 [00:00<00:00, 186.01it/s]

Health 4 Failed to load
Health 40 Failed to load
Health 41 Failed to load
Health 42 Failed to load
Health 43 Failed to load
Health 44 Failed to load
Health 45 Failed to load
Health 46 Failed to load
Health 47 Failed to load
Health 48 Failed to load
Health 49 Failed to load
Health 5 Failed to load
Health 50 Failed to load
Health 51 Failed to load
Health 52 Failed to load
Health 53 Failed to load
Health 54 Failed to load
Health 55 Failed to load
Health 56 Failed to load
Health 57 Failed to load
Health 58 Failed to load


 75%|███████▌  | 135/180 [00:00<00:00, 189.47it/s]

Health 59 Failed to load
Health 6 Failed to load
Health 60 Failed to load
Health 61 Failed to load
Health 62 Failed to load
Health 63 Failed to load
Health 64 Failed to load
Health 65 Failed to load
Health 66 Failed to load
Health 67 Failed to load
Health 68 Failed to load
Health 69 Failed to load
Health 7 Failed to load
Health 70 Failed to load
Health 71 Failed to load
Health 72 Failed to load
Health 73 Failed to load
Health 74 Failed to load
Health 75 Failed to load


 86%|████████▌ | 154/180 [00:00<00:00, 189.07it/s]

Health 76 Failed to load
Health 77 Failed to load
Health 78 Failed to load
Health 79 Failed to load
Health 8 Failed to load
Health 80 Failed to load
Health 81 Failed to load
Health 82 Failed to load
Health 83 Failed to load
Health 84 Failed to load
Health 85 Failed to load
Health 86 Failed to load
Health 87 Failed to load
Health 88 Failed to load
Health 89 Failed to load
Health 9 Failed to load
Health 90 Failed to load
Health 91 Failed to load
Health 92 Failed to load
Health 93 Failed to load


 97%|█████████▋| 174/180 [00:00<00:00, 189.49it/s]

Health 94 Failed to load
Health 95 Failed to load
Health 96 Failed to load
Health 97 Failed to load
Health 98 Failed to load
Health 99 Failed to load


100%|██████████| 180/180 [00:00<00:00, 188.48it/s]
  0%|          | 0/330 [00:00<?, ?it/s]

Interview 1 Failed to load
Interview 109 Failed to load
Interview 122 Failed to load
Interview 125 Failed to load
Interview 159 Failed to load


 28%|██▊       | 93/330 [00:00<00:00, 930.00it/s]

Interview 2 Failed to load
Interview 234 Failed to load
Interview 235 Failed to load
Interview 236 Failed to load
Interview 237 Failed to load
Interview 238 Failed to load
Interview 239 Failed to load
Interview 240 Failed to load
Interview 241 Failed to load
Interview 242 Failed to load
Interview 243 Failed to load


 49%|████▉     | 161/330 [00:00<00:00, 819.45it/s]

Interview 244 Failed to load
Interview 245 Failed to load
Interview 246 Failed to load
Interview 247 Failed to load
Interview 248 Failed to load
Interview 249 Failed to load
Interview 250 Failed to load
Interview 251 Failed to load
Interview 252 Failed to load
Interview 253 Failed to load
Interview 254 Failed to load
Interview 255 Failed to load
Interview 256 Failed to load
Interview 257 Failed to load
Interview 258 Failed to load
Interview 259 Failed to load
Interview 260 Failed to load
Interview 261 Failed to load
Interview 262 Failed to load
Interview 263 Failed to load
Interview 264 Failed to load
Interview 265 Failed to load
Interview 266 Failed to load
Interview 267 Failed to load
Interview 268 Failed to load
Interview 269 Failed to load
Interview 270 Failed to load
Interview 271 Failed to load
Interview 272 Failed to load
Interview 273 Failed to load
Interview 274 Failed to load
Interview 275 Failed to load
Interview 276 Failed to load
Interview 277 Failed to load
Interview 278 

 61%|██████    | 200/330 [00:00<00:00, 439.12it/s]

Interview 280 Failed to load
Interview 281 Failed to load
Interview 282 Failed to load
Interview 283 Failed to load
Interview 284 Failed to load
Interview 285 Failed to load
Interview 286 Failed to load
Interview 287 Failed to load
Interview 288 Failed to load
Interview 289 Failed to load
Interview 290 Failed to load
Interview 291 Failed to load
Interview 292 Failed to load
Interview 293 Failed to load
Interview 294 Failed to load
Interview 295 Failed to load
Interview 296 Failed to load
Interview 297 Failed to load
Interview 298 Failed to load
Interview 299 Failed to load
Interview 3 Failed to load
Interview 300 Failed to load
Interview 301 Failed to load
Interview 302 Failed to load
Interview 303 Failed to load
Interview 304 Failed to load
Interview 305 Failed to load
Interview 306 Failed to load
Interview 307 Failed to load
Interview 308 Failed to load
Interview 309 Failed to load


 71%|███████   | 234/330 [00:00<00:00, 334.63it/s]

Interview 310 Failed to load
Interview 311 Failed to load
Interview 312 Failed to load
Interview 313 Failed to load
Interview 314 Failed to load
Interview 315 Failed to load
Interview 316 Failed to load
Interview 317 Failed to load
Interview 318 Failed to load
Interview 319 Failed to load
Interview 320 Failed to load
Interview 321 Failed to load
Interview 322 Failed to load
Interview 323 Failed to load
Interview 324 Failed to load
Interview 325 Failed to load
Interview 326 Failed to load
Interview 327 Failed to load
Interview 328 Failed to load
Interview 329 Failed to load
Interview 330 Failed to load


 80%|████████  | 264/330 [00:00<00:00, 305.65it/s]

Interview 4 Failed to load
Interview 8 Failed to load


100%|██████████| 330/330 [00:00<00:00, 453.29it/s]
  0%|          | 0/251 [00:00<?, ?it/s]

Literature 110 Failed to load
Literature 111 Failed to load
Literature 112 Failed to load
Literature 113 Failed to load
Literature 114 Failed to load
Literature 115 Failed to load
Literature 116 Failed to load
Literature 117 Failed to load
Literature 118 Failed to load
Literature 119 Failed to load
Literature 120 Failed to load
Literature 121 Failed to load
Literature 122 Failed to load
Literature 123 Failed to load
Literature 124 Failed to load
Literature 125 Failed to load
Literature 126 Failed to load
Literature 127 Failed to load


 13%|█▎        | 32/251 [00:00<00:00, 307.70it/s]

Literature 128 Failed to load
Literature 129 Failed to load
Literature 130 Failed to load
Literature 131 Failed to load
Literature 132 Failed to load
Literature 133 Failed to load
Literature 134 Failed to load
Literature 135 Failed to load
Literature 136 Failed to load
Literature 137 Failed to load
Literature 138 Failed to load
Literature 139 Failed to load
Literature 140 Failed to load
Literature 141 Failed to load
Literature 142 Failed to load
Literature 143 Failed to load
Literature 144 Failed to load
Literature 145 Failed to load
Literature 146 Failed to load


 21%|██        | 53/251 [00:00<00:00, 267.95it/s]

Literature 147 Failed to load
Literature 148 Failed to load
Literature 149 Failed to load
Literature 150 Failed to load
Literature 151 Failed to load
Literature 152 Failed to load
Literature 153 Failed to load
Literature 154 Failed to load
Literature 155 Failed to load
Literature 156 Failed to load
Literature 157 Failed to load


 55%|█████▍    | 137/251 [00:00<00:00, 336.75it/s]

Literature 89 Failed to load
Literature 90 Failed to load
Literature 91 Failed to load
Literature 92 Failed to load
Literature 93 Failed to load


100%|██████████| 251/251 [00:00<00:00, 603.34it/s]
100%|██████████| 111/111 [00:00<00:00, 1681.20it/s]
  0%|          | 0/500 [00:00<?, ?it/s]

Opinion 104 Failed to load
Opinion 119 Failed to load
Opinion 121 Failed to load
Opinion 126 Failed to load
Opinion 142 Failed to load


 10%|█         | 52/500 [00:00<00:00, 519.98it/s]

Opinion 152 Failed to load
Opinion 186 Failed to load
Opinion 188 Failed to load
Opinion 199 Failed to load
Opinion 200 Failed to load


 23%|██▎       | 114/500 [00:00<00:00, 544.99it/s]

Opinion 206 Failed to load
Opinion 210 Failed to load


 40%|███▉      | 198/500 [00:00<00:00, 609.16it/s]

Opinion 31 Failed to load


 56%|█████▋    | 282/500 [00:00<00:00, 662.33it/s]

Opinion 353 Failed to load
Opinion 358 Failed to load
Opinion 369 Failed to load
Opinion 381 Failed to load
Opinion 406 Failed to load


 72%|███████▏  | 362/500 [00:00<00:00, 696.57it/s]

Opinion 432 Failed to load
Opinion 455 Failed to load
Opinion 469 Failed to load
Opinion 474 Failed to load
Opinion 479 Failed to load


 89%|████████▉ | 447/500 [00:00<00:00, 736.45it/s]

Opinion 70 Failed to load
Opinion 78 Failed to load
Opinion 91 Failed to load


100%|██████████| 500/500 [00:00<00:00, 749.62it/s]
  0%|          | 0/550 [00:00<?, ?it/s]

Politics 1 Failed to load
Politics 177 Failed to load
Politics 179 Failed to load
Politics 2 Failed to load


 21%|██        | 113/550 [00:00<00:00, 1118.39it/s]

Politics 3 Failed to load


 43%|████▎     | 235/550 [00:00<00:00, 1143.93it/s]

Politics 316 Failed to load
Politics 4 Failed to load


 61%|██████▏   | 338/550 [00:00<00:00, 1107.15it/s]

Politics 426 Failed to load


 77%|███████▋  | 425/550 [00:00<00:00, 1023.45it/s]

Politics 511 Failed to load
Politics 522 Failed to load


100%|██████████| 550/550 [00:00<00:00, 1080.54it/s]
  0%|          | 0/353 [00:00<?, ?it/s]

Society 10 Failed to load
Society 11 Failed to load
Society 12 Failed to load
Society 13 Failed to load
Society 14 Failed to load
Society 15 Failed to load
Society 16 Failed to load
Society 17 Failed to load
Society 18 Failed to load


 27%|██▋       | 97/353 [00:00<00:00, 960.30it/s]

Society 19 Failed to load
Society 20 Failed to load
Society 21 Failed to load
Society 22 Failed to load
Society 23 Failed to load
Society 24 Failed to load
Society 25 Failed to load
Society 254 Failed to load
Society 255 Failed to load
Society 256 Failed to load
Society 257 Failed to load


 50%|████▉     | 176/353 [00:00<00:00, 898.91it/s]

Society 258 Failed to load
Society 259 Failed to load
Society 26 Failed to load
Society 260 Failed to load
Society 261 Failed to load
Society 262 Failed to load
Society 263 Failed to load
Society 264 Failed to load
Society 265 Failed to load
Society 266 Failed to load
Society 267 Failed to load
Society 268 Failed to load
Society 269 Failed to load
Society 27 Failed to load
Society 270 Failed to load
Society 271 Failed to load
Society 272 Failed to load
Society 273 Failed to load
Society 274 Failed to load
Society 275 Failed to load
Society 276 Failed to load
Society 277 Failed to load
Society 278 Failed to load
Society 279 Failed to load
Society 28 Failed to load
Society 280 Failed to load
Society 281 Failed to load
Society 282 Failed to load
Society 283 Failed to load
Society 284 Failed to load
Society 285 Failed to load
Society 286 Failed to load
Society 287 Failed to load
Society 288 Failed to load
Society 289 Failed to load
Society 29 Failed to load
Society 290 Failed to load
Socie

 62%|██████▏   | 220/353 [00:00<00:00, 351.54it/s]

Society 298 Failed to load
Society 299 Failed to load
Society 3 Failed to load
Society 30 Failed to load
Society 300 Failed to load
Society 301 Failed to load
Society 302 Failed to load
Society 303 Failed to load
Society 304 Failed to load
Society 305 Failed to load
Society 306 Failed to load
Society 307 Failed to load
Society 308 Failed to load
Society 309 Failed to load
Society 31 Failed to load
Society 310 Failed to load
Society 311 Failed to load
Society 312 Failed to load
Society 313 Failed to load
Society 314 Failed to load
Society 315 Failed to load
Society 316 Failed to load
Society 317 Failed to load
Society 318 Failed to load
Society 319 Failed to load
Society 32 Failed to load
Society 320 Failed to load
Society 321 Failed to load
Society 322 Failed to load
Society 323 Failed to load
Society 324 Failed to load
Society 325 Failed to load
Society 326 Failed to load
Society 327 Failed to load
Society 328 Failed to load


 72%|███████▏  | 255/353 [00:00<00:00, 278.90it/s]

Society 329 Failed to load
Society 33 Failed to load
Society 330 Failed to load
Society 331 Failed to load
Society 332 Failed to load
Society 333 Failed to load
Society 334 Failed to load
Society 335 Failed to load
Society 336 Failed to load
Society 337 Failed to load
Society 338 Failed to load
Society 339 Failed to load
Society 34 Failed to load
Society 340 Failed to load
Society 341 Failed to load
Society 342 Failed to load
Society 343 Failed to load
Society 344 Failed to load
Society 345 Failed to load
Society 346 Failed to load
Society 347 Failed to load
Society 348 Failed to load
Society 349 Failed to load
Society 35 Failed to load
Society 350 Failed to load
Society 351 Failed to load
Society 352 Failed to load
Society 353 Failed to load
Society 36 Failed to load
Society 37 Failed to load
Society 38 Failed to load


 81%|████████  | 286/353 [00:00<00:00, 248.78it/s]

Society 39 Failed to load
Society 4 Failed to load
Society 40 Failed to load
Society 41 Failed to load
Society 42 Failed to load
Society 43 Failed to load
Society 44 Failed to load
Society 45 Failed to load
Society 46 Failed to load
Society 47 Failed to load
Society 48 Failed to load
Society 49 Failed to load
Society 5 Failed to load
Society 50 Failed to load
Society 51 Failed to load
Society 52 Failed to load
Society 53 Failed to load
Society 54 Failed to load
Society 55 Failed to load
Society 56 Failed to load
Society 57 Failed to load
Society 58 Failed to load
Society 59 Failed to load
Society 6 Failed to load
Society 60 Failed to load
Society 61 Failed to load
Society 62 Failed to load
Society 63 Failed to load


 89%|████████▉ | 314/353 [00:00<00:00, 226.20it/s]

Society 64 Failed to load
Society 65 Failed to load
Society 66 Failed to load
Society 67 Failed to load
Society 7 Failed to load
Society 8 Failed to load
Society 9 Failed to load


100%|██████████| 353/353 [00:01<00:00, 334.28it/s]
  0%|          | 0/700 [00:00<?, ?it/s]

Sports 139 Failed to load
Sports 172 Failed to load


 30%|███       | 210/700 [00:00<00:00, 1030.03it/s]

Sports 384 Failed to load


100%|██████████| 700/700 [00:00<00:00, 1301.12it/s]
  0%|          | 0/118 [00:00<?, ?it/s]

Technology 108 Failed to load
Technology 109 Failed to load
Technology 111 Failed to load
Technology 112 Failed to load
Technology 113 Failed to load
Technology 114 Failed to load
Technology 115 Failed to load
Technology 116 Failed to load
Technology 117 Failed to load
Technology 118 Failed to load
Technology 3 Failed to load
Technology 34 Failed to load


 40%|███▉      | 47/118 [00:00<00:00, 439.26it/s]

Technology 38 Failed to load
Technology 51 Failed to load
Technology 78 Failed to load


100%|██████████| 118/118 [00:00<00:00, 621.06it/s]
  0%|          | 0/265 [00:00<?, ?it/s]

Tourism 138 Failed to load
Tourism 141 Failed to load
Tourism 142 Failed to load


 43%|████▎     | 113/265 [00:00<00:00, 1118.79it/s]

Tourism 265 Failed to load


100%|██████████| 265/265 [00:00<00:00, 1204.56it/s]
  0%|          | 0/313 [00:00<?, ?it/s]

World 1 Failed to load
World 2 Failed to load


 36%|███▌      | 113/313 [00:00<00:00, 1118.86it/s]

World 213 Failed to load
World 217 Failed to load
World 218 Failed to load
World 219 Failed to load
World 220 Failed to load
World 221 Failed to load
World 222 Failed to load
World 223 Failed to load
World 224 Failed to load
World 225 Failed to load
World 226 Failed to load
World 227 Failed to load
World 228 Failed to load
World 229 Failed to load
World 230 Failed to load


 47%|████▋     | 147/313 [00:00<00:00, 655.49it/s] 

World 231 Failed to load
World 232 Failed to load
World 233 Failed to load
World 234 Failed to load
World 235 Failed to load
World 236 Failed to load
World 237 Failed to load
World 238 Failed to load
World 239 Failed to load
World 240 Failed to load
World 241 Failed to load
World 242 Failed to load
World 243 Failed to load
World 244 Failed to load
World 245 Failed to load
World 246 Failed to load
World 247 Failed to load
World 248 Failed to load
World 249 Failed to load
World 250 Failed to load
World 251 Failed to load
World 252 Failed to load
World 253 Failed to load
World 254 Failed to load
World 255 Failed to load
World 256 Failed to load
World 257 Failed to load
World 258 Failed to load
World 259 Failed to load
World 260 Failed to load
World 261 Failed to load


 58%|█████▊    | 181/313 [00:00<00:00, 390.76it/s]

World 262 Failed to load
World 263 Failed to load
World 264 Failed to load
World 265 Failed to load
World 266 Failed to load
World 267 Failed to load
World 268 Failed to load
World 269 Failed to load
World 270 Failed to load
World 271 Failed to load
World 272 Failed to load
World 273 Failed to load
World 274 Failed to load
World 275 Failed to load
World 276 Failed to load
World 277 Failed to load
World 278 Failed to load
World 279 Failed to load
World 280 Failed to load
World 281 Failed to load
World 282 Failed to load
World 283 Failed to load
World 284 Failed to load
World 285 Failed to load
World 286 Failed to load
World 287 Failed to load
World 288 Failed to load
World 289 Failed to load


 67%|██████▋   | 211/313 [00:00<00:00, 307.56it/s]

World 290 Failed to load
World 291 Failed to load
World 292 Failed to load
World 293 Failed to load
World 294 Failed to load
World 295 Failed to load
World 296 Failed to load
World 297 Failed to load
World 298 Failed to load
World 299 Failed to load
World 3 Failed to load
World 300 Failed to load
World 301 Failed to load
World 302 Failed to load
World 303 Failed to load
World 304 Failed to load
World 305 Failed to load
World 306 Failed to load
World 307 Failed to load
World 308 Failed to load
World 309 Failed to load
World 310 Failed to load
World 311 Failed to load
World 312 Failed to load


 76%|███████▌  | 238/313 [00:00<00:00, 272.86it/s]

World 313 Failed to load
World 4 Failed to load
World 65 Failed to load
World 78 Failed to load


100%|██████████| 313/313 [00:00<00:00, 444.61it/s]


In [8]:
# Assemble the collected records into a DataFrame with a fixed column order
# (id, class, text).
df = pd.DataFrame(data_dict, columns=columns)

# Preview the frame: the last expression of a cell is rendered by Jupyter.
df

Unnamed: 0,id,class,text
0,1,Agriculture,﻿काठमाडौंमा पहिलो पटक स्ट्रबेरीको व्यवसायिक खे...
1,10,Agriculture,"जिल्लाका किसानले लगाएको अदुवामा गानो कुहिने, ग..."
2,100,Agriculture,काभ्रेपलाञ्चोकमा कृषकले एसआरआई प्रविधिमा गरेको...
3,11,Agriculture,राजधानीमा यतिबेला तरकारीको मूल्य आकासिएको छ। क...
4,12,Agriculture,पाल पोल्ट्री तथा लाइभस्टक क्षेत्रको समग्र विका...
5,13,Agriculture,माग अनुसारको आपूर्ति नभएपछि तरकारीको मुल्य दोब...
6,14,Agriculture,नेपाल र चीनबीचको सम्झौतासँगै शुरु भएको परियोजन...
7,15,Agriculture,यस वर्ष अम्बामा देशैभर अम्बामा रोग देखा पर्‍यो...
8,16,Agriculture,लैँचीको कारोबार ठप्प भएपछि चाडबाडका लागि खर्च ...
9,17,Agriculture,बदलिँदो मौसमका कारण मोरङमा उन्नत जातको धानबाली...


In [9]:
# Drop rows with invalid (missing) values, then renumber the index 0..n-1.
# Later cells use the row labels of `df` as row positions in the similarity
# matrix, so the index must stay gap-free after rows are removed.
df = df.dropna().reset_index(drop=True)

## Processing data

In [11]:
from nltk.corpus import stopwords
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import linear_kernel

In [12]:
# Nepali stop words shipped with NLTK.
nepali_stop_words = set(stopwords.words('nepali'))

# TF-IDF vectoriser over space-separated tokens.
#   sublinear_tf   -> use 1 + log(tf) instead of the raw term count
#   max_df=0.5     -> ignore terms that occur in more than half of the documents
#   min_df=10      -> ignore terms that occur in fewer than 10 documents
#   stop_words     -> passed as a sorted list: recent scikit-learn releases
#                     validate this parameter and accept a list, not a set
# NOTE(review): the tokenizer splits on single spaces only, so words separated
# by newlines or tabs stay glued together as one token -- confirm this is intended.
tf = TfidfVectorizer(tokenizer=lambda x: x.split(" "),
                     sublinear_tf=True,
                     encoding='utf-8',
                     decode_error='ignore',
                     max_df=0.5,
                     min_df=10,
                     stop_words=sorted(nepali_stop_words))

# One row per document (same order as the rows of df), one column per term.
tfidf_matrix = tf.fit_transform(df['text'])

# TfidfVectorizer L2-normalises each row by default, so the plain dot product
# computed by linear_kernel is the cosine similarity between documents.
cosine_similarities = linear_kernel(tfidf_matrix, tfidf_matrix)

# Filled by the next cell: item id -> list of (score, id) pairs.
results = {}

  'stop_words.' % sorted(inconsistent))
Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations
  dtype = np.float


In [13]:
# For every document, store its most similar documents as (score, id) pairs,
# best match first, under the document's own id.
# NOTE(review): ids are taken from file names inside each class folder, so the
# same id can occur under several classes; a later row then overwrites the
# entry of an earlier one in `results` -- confirm ids are unique or key by class too.
item_ids = df['id'].tolist()

for idx, item_id in enumerate(item_ids):
    # Row `idx` of the similarity matrix belongs to the idx-th row of df;
    # positions are used throughout so the result does not depend on df's index labels.
    scores = cosine_similarities[idx]

    # Positions of the 99 highest scores, in descending score order.
    similar_indices = scores.argsort()[:-100:-1]

    # Leave out the document itself by position rather than assuming it is
    # the first hit (duplicates or all-zero rows can sort ahead of it).
    similar_items = [(scores[i], item_ids[i]) for i in similar_indices if i != idx]

    results[item_id] = similar_items

print('Completed!')

Completed!


## Displaying Results

In [14]:
def printBold(string):
    """Render `string` as Markdown in the notebook output (e.g. ``**bold**`` text)."""
    rendered = Markdown(string)
    display(rendered)

def item(id):
    """Return the leading part of the text of the news item with the given id.

    Parameters
    ----------
    id : int or str
        Item id; it is converted to ``str`` before being compared with the
        ``id`` column of the global ``df``.

    Returns
    -------
    str
        The item's text up to (not including) the first ``' - '`` separator,
        or the whole text when the separator does not occur. If several rows
        share the id, the first matching row is used.

    Raises
    ------
    IndexError
        If no row of ``df`` has this id.
    """
    id = str(id)
    matches = df.loc[df['id'] == id, 'text']
    if matches.empty:
        # Same exception type as indexing an empty list, but with a usable message.
        raise IndexError("no news item with id " + repr(id))
    return matches.iloc[0].split(' - ')[0]

def recommender(item_id, num):
    """Print up to `num` stored recommendations for the news item `item_id`.

    The (score, id) pairs are read from the global ``results`` under
    ``str(item_id)``. A preview of the query item (first 100 characters) is
    printed first, followed by a numbered preview (first 200 characters) and
    the score of each recommendation.
    """
    print("\n")
    printBold("**Recommendation System**")
    query_preview = item(item_id)[:100]
    print(f"{num!s} news similar to '{query_preview}...'")

    top_matches = results[str(item_id)][:num]
    for rank, (score, rec_id) in enumerate(top_matches, start=1):
        print("\n")
        rec_preview = item(rec_id)[:200]
        print(f"{rank}) '{rec_preview}...' (score:{score!s})")

# Look up the news item the user is currently interacting with (id 69) and
# print its 10 most similar news items.
recommender(item_id=69, num=10)





**Recommendation System**

10 news similar to 'डिष्टिलरी उद्योगबाट छाडिएको दूषित पानीले रौतहटको दक्षिणी भेगका सयौं बिगाहा जग्गामा लगाइएको धानबाली न...'


1) 'अलैँचीको बिरुवा विक्री गरेर राम्रो कमाइ गर्ने उद्देश्यले पूर्वी पहाडी जिल्लाका कृषकले व्यावसायिक रुपमै अलैँचीको बिरुवा उमारे पनि सोचेअनुरुप यस वर्ष बिरुवा विक्री नभएकामा चिन्तित छन् ।
अलैँची खेतीको वि...' (score:0.29983569577803443)


2) '﻿नेपालका लागि टिभिएसका दुई पांगे्र सवारीको आधिकारिक वितरक जगदम्बा मोटर्सले टिभिएस अपाचे आरटिआर २०० ४भी सार्वजनिक गरेको छ।

रेस इडिसन २.० नाम दिइएको अपाचे आटिआर २०० ४भीमा एन्टी रिजर्भ टर्क स्लिप्पर क्ल...' (score:0.2127590569849505)


3) 'सन् २०१० मा रोजगारीको क्रममा कतार पुगेका खेम पौडेलले बालुवा नै बालुवा भएको ठाउँमा कलकलाउँदो हरियाली, तरकारी फलफूलको उत्पादन देखे। त्यो देखेर उनको मनमा प्रश्न उब्जियो, माटो, पानी  मल केही पनि नभएको ठाउ...' (score:0.19362969967347377)


4) '﻿पदम सिंह
बाजुरा, २ चैत – द्वन्द्वकालमा विस्थापित भएकोे कोल्टीमा राष्ट्रिय वाणिज्य बैंकको शाखा पुनःस्थापना नहुँदा त्यस क्षेत्रका ११ गाविस र हुम्ला, जुम्ल