In [4]:
import json
from bs4 import Tag
from tqdm import tqdm
import shangri_latibet_utils
import os
from concurrent.futures import ThreadPoolExecutor, as_completed


In [5]:

class CustomJSONEncoder(json.JSONEncoder):
    def default(self, obj):
        if isinstance(obj, Tag):
            return obj.get_text()
        return str(obj)

def save_json(path, file_name, data):
    try: 
        with open(path + file_name, "w", encoding='utf-8') as outfile:
            json.dump(data, outfile, indent=4, ensure_ascii=False, cls=CustomJSONEncoder)
        print(f"Successfully saved: {file_name}")
    except Exception as e:
        print(f"Error saving {file_name}: {str(e)}")

# def read_json(path, file_name):
#     try:
#         with open(path+file_name, 'r', encoding='utf-8') as openfile:
#             Loaded_file = json.load(openfile)
#             print(f"Successfully loaded: {file_name}")
#         return Loaded_file
#     except Exception as e:
#         print(f"Error loading {file_name}: {str(e)}")
#         return None

def scrape_article(url, page_key_code):
    try:
        article_content = shangri_latibet_utils.scrape_shangri_latibet_article_content(url, tags=page_key_code)
        return article_content
    except Exception as e:
        print(f"Error scraping {url}: {str(e)}")
        return None

def get_content(All_links_data, Total_lenght, page_key_code, page_key_list):
    all_article = {}
    
    with ThreadPoolExecutor(max_workers=10) as executor:
        future_to_url = {}
        start = 1
        for i in range(start, Total_lenght+1):
            page_key = page_key_code + str(i)
            all_link_page = All_links_data[page_key]["Links"]
            
            for url in all_link_page:
                future = executor.submit(scrape_article, url, page_key_code)
                future_to_url[future] = (page_key, url)
        
        for future in tqdm(as_completed(future_to_url), total=len(future_to_url)):
            page_key, url = future_to_url[future]
            try:
                article_content = future.result()
                if article_content:
                    article_key = f"{page_key}_scrape_shangri_Article_{len([k for k in all_article if k.startswith(page_key)]) + 1}"
                    all_article[article_key] = article_content
            except Exception as e:
                print(f"Error processing {url}: {str(e)}")
    
    Failure_count = sum(1 for article in all_article.values() if article["Response"] != 200)
    print(f"Total Failure in the {page_key_list[1]} article: {Failure_count}")
    
    save_file_name = f"scrape_shangri_ALL_content_{page_key_list[1]}.json"
    print(save_file_name)
    path = "./data/parallel_content/"
    save_json(path, save_file_name, all_article)

def process_json_file(file_path):
    try:
        with open(file_path, 'r', encoding='utf-8') as file:
            All_links_data = json.load(file)
            Total_lenght = len(All_links_data)
            print(f"Total page in {os.path.basename(file_path)}: {Total_lenght}")
        
            print(f"page key name: {list(All_links_data.keys())[-1]}")
            page_key_list = list(All_links_data.keys())[-1].split(" ")
            
            page_key_code = "Page "+page_key_list[1]+" "
            print(f"Page key code: {page_key_code}")
            get_content(All_links_data, Total_lenght, page_key_code, page_key_list)
    except json.JSONDecodeError as e:
        print(f"Error decoding JSON in file {os.path.basename(file_path)}: {str(e)}")
    except Exception as e:
        print(f"Error processing file {os.path.basename(file_path)}: {str(e)}")

def get_json_files(directory):
    json_files = [os.path.join(directory, f) for f in os.listdir(directory) if f.endswith('.json')]
    
    with ThreadPoolExecutor(max_workers=10) as executor:
        list(tqdm(executor.map(process_json_file, json_files), total=len(json_files)))
    
    print(f"Processed {len(json_files)} files")


In [10]:
%%time
# Example usage
directory_path = './data/links/'
# directory_path = './data/test_link/'
get_json_files(directory_path)

Total page in shangri_latibet_ALL_link_ས་གནས་གསར་འགྱུར།.json: 150
page key name: Page ས་གནས་གསར་འགྱུར། 150
Page key code: Page ས་གནས་གསར་འགྱུར། 
Total page in shangri_latibet_ALL_link_རྒྱལ་ཕྱི་ནང་གསར་འགྱུར།.json: 29
page key name: Page རྒྱལ་ཕྱི་ནང་གསར་འགྱུར། 29
Page key code: Page རྒྱལ་ཕྱི་ནང་གསར་འགྱུར། 
Total page in shangri_latibet_ALL_link_ཏང་གི་ཚོགས་ཆེན་བཅོ་བརྒྱད་པ།.json: 2
page key name: Page ཏང་གི་ཚོགས་ཆེན་བཅོ་བརྒྱད་པ། 2
Page key code: Page ཏང་གི་ཚོགས་ཆེན་བཅོ་བརྒྱད་པ། 
Total page in shangri_latibet_ALL_link_བོད་ཁུལ་གསར་འགྱུར།.json: 74
page key name: Page བོད་ཁུལ་གསར་འགྱུར། 74
Page key code: Page བོད་ཁུལ་གསར་འགྱུར། 
Total page in shangri_latibet_ALL_link_ཚོགས་ཆེན་གཉིས།.json: 2
page key name: Page ཚོགས་ཆེན་གཉིས། 2
Page key code: Page ཚོགས་ཆེན་གཉིས། 
Total page in shangri_latibet_ALL_link_གལ་ཆེའི་མཛད་སྒོ།.json: 2
page key name: Page གལ་ཆེའི་མཛད་སྒོ། 2
Page key code: Page གལ་ཆེའི་མཛད་སྒོ། 
Total page in shangri_latibet_ALL_link_དཔལ་འབྱོར་འགྱུར་སྟངས།.json: 4
page key name: Page དཔལ་འབ

  0%|          | 0/22 [00:00<?, ?it/s]
  0%|          | 0/49 [00:00<?, ?it/s][A

  0%|          | 0/80 [00:00<?, ?it/s][A[A


  0%|          | 0/33 [00:00<?, ?it/s][A[A[A



  0%|          | 0/40 [00:00<?, ?it/s][A[A[A[A




  0%|          | 0/38 [00:00<?, ?it/s][A[A[A[A[A





  0%|          | 0/27 [00:00<?, ?it/s][A[A[A[A[A[A






  0%|          | 0/37 [00:00<?, ?it/s][A[A[A[A[A[A[A







  0%|          | 0/568 [00:00<?, ?it/s][A[A[A[A[A[A[A[A








  0%|          | 0/1468 [00:00<?, ?it/s][A[A[A[A[A[A[A[A[A









  0%|          | 0/3000 [00:00<?, ?it/s][A[A[A[A[A[A[A[A[A[A









  0%|          | 1/3000 [00:01<1:29:10,  1.78s/it][A[A[A[A[A[A[A[A[A[A








  0%|          | 1/1468 [00:01<45:35,  1.86s/it][A[A[A[A[A[A[A[A[A




  3%|▎         | 1/38 [00:03<01:18,  2.12s/it][A[A[A[A[A
  5%|▍         | 1/22 [00:04<00:55,  2.65s/it][A

  1%|▏         | 1/80 [00:04<03:29,  2.65s/it][A[A







  0%|

Total Failure in the ཏང་གི་ཚོགས་ཆེན་བཅོ་བརྒྱད་པ། article: 0
scrape_shangri_ALL_content_ཏང་གི་ཚོགས་ཆེན་བཅོ་བརྒྱད་པ།.json
Successfully saved: scrape_shangri_ALL_content_ཏང་གི་ཚོགས་ཆེན་བཅོ་བརྒྱད་པ།.json
Total page in shangri_latibet_ALL_link_སློབ་གསོ།.json: 12
page key name: Page སློབ་གསོ། 12
Page key code: Page སློབ་གསོ། 


  0%|          | 0/232 [00:00<?, ?it/s]



 70%|███████   | 28/40 [00:10<00:02,  4.65it/s][A[A[A[A








  2%|▏         | 29/1468 [00:10<04:53,  4.90it/s][A[A[A[A[A[A[A[A[A









  1%|          | 29/3000 [00:10<10:45,  4.60it/s][A[A[A[A[A[A[A[A[A[A





100%|██████████| 27/27 [00:11<00:00,  2.91it/s][A[A[A[A[A[A






 78%|███████▊  | 29/37 [00:11<00:02,  3.19it/s][A[A[A[A[A[A[A



 75%|███████▌  | 30/40 [00:11<00:02,  4.21it/s][A[A[A[A









  1%|          | 30/3000 [00:11<12:31,  3.95it/s][A[A[A[A[A[A[A[A[A[A
 59%|█████▉    | 29/49 [00:11<00:05,  3.40it/s][A

 36%|███▋      | 29/80 [00:11<00:14,  3.43it/s][A[A




 79%|███████▉  | 30/38 [00:11<00:02,  3.91it/s][A[A[A[A[A






 81%|████████  | 30/37 [00:11<00:02,  3.35it/s][A[A[A[A[A[A[A
 61%|██████    | 30/49 [00:11<00:05,  3.63it/s][A

100%|██████████| 27/27 [00:11<00:00,  2.33it/s][A[A


Total Failure in the གལ་ཆེའི་མཛད་སྒོ། article: 0
scrape_shangri_ALL_content_གལ་ཆེའི་མཛད་སྒོ།.json
Successfully saved: scrape_shangri_ALL_content_གལ་ཆེའི་མཛད་སྒོ།.json
Total page in shangri_latibet_ALL_link_རྩོམ་རིག.json: 6
page key name: Page རྩོམ་རིག 6
Page key code: Page རྩོམ་རིག 








  0%|          | 0/114 [00:00<?, ?it/s][A[A[A[A[A[A

 41%|████▏     | 33/80 [00:11<00:08,  5.30it/s][A[A




 82%|████████▏ | 31/38 [00:11<00:01,  3.87it/s][A[A[A[A[A








  2%|▏         | 31/1468 [00:11<06:50,  3.50it/s][A[A[A[A[A[A[A[A[A






 84%|████████▍ | 31/37 [00:11<00:01,  3.17it/s][A[A[A[A[A[A[A







  5%|▌         | 31/568 [00:11<02:32,  3.51it/s][A[A[A[A[A[A[A[A








  2%|▏         | 32/1468 [00:11<06:32,  3.66it/s][A[A[A[A[A[A[A[A[A









  1%|          | 31/3000 [00:11<14:50,  3.33it/s][A[A[A[A[A[A[A[A[A[A




 87%|████████▋ | 33/38 [00:12<00:01,  4.25it/s][A[A[A[A[A
 65%|██████▌   | 32/49 [00:12<00:04,  3.67it/s][A



 78%|███████▊  | 31/40 [00:12<00:02,  3.27it/s][A[A[A[A






 86%|████████▋ | 32/37 [00:12<00:01,  3.10it/s][A[A[A[A[A[A[A








  0%|          | 1/232 [00:02<07:40,  1.99s/it]s][A[A[A[A[A[A[A[A[A









  1%|          | 32/3000 [00:12<17:01,  2.90it/s]

Total Failure in the ཁྱིམ་ཇུས་ནོར་གཉེར། article: 0
scrape_shangri_ALL_content_ཁྱིམ་ཇུས་ནོར་གཉེར།.json
Successfully saved: scrape_shangri_ALL_content_ཁྱིམ་ཇུས་ནོར་གཉེར།.json
Total page in shangri_latibet_ALL_link_ལོ་རྒྱུས།.json: 6
page key name: Page ལོ་རྒྱུས། 6
Page key code: Page ལོ་རྒྱུས། 
Total Failure in the མ་རྩའི་འདེབས་ཕྱོགས། article: 0
scrape_shangri_ALL_content_མ་རྩའི་འདེབས་ཕྱོགས།.json







  0%|          | 0/115 [00:00<?, ?it/s][A[A[A[A[A

Successfully saved: scrape_shangri_ALL_content_མ་རྩའི་འདེབས་ཕྱོགས།.json
Total page in shangri_latibet_ALL_link_གསོ་རིག.json: 25
page key name: Page གསོ་རིག 25
Page key code: Page གསོ་རིག 









  0%|          | 0/492 [00:00<?, ?it/s][A[A[A[A[A[A[A





  4%|▍         | 10/232 [00:04<00:57,  3.86it/s][A[A[A[A[A[A
 86%|████████▌ | 42/49 [00:15<00:01,  4.39it/s][A








  3%|▎         | 42/1468 [00:14<07:22,  3.22it/s][A[A[A[A[A[A[A[A[A



100%|██████████| 40/40 [00:15<00:00,  2.64it/s][A[A[A[A


Total Failure in the ཚོགས་ཆེན་གཉིས། article: 0
scrape_shangri_ALL_content_ཚོགས་ཆེན་གཉིས།.json
Successfully saved: scrape_shangri_ALL_content_ཚོགས་ཆེན་གཉིས།.json
Total page in shangri_latibet_ALL_link_དཔེ་གཟིགས།.json: 2
page key name: Page དཔེ་གཟིགས། 2
Page key code: Page དཔེ་གཟིགས། 






  0%|          | 0/24 [00:00<?, ?it/s][A[A[A[A

 51%|█████▏    | 41/80 [00:15<00:10,  3.60it/s][A[A









  1%|▏         | 41/3000 [00:15<16:00,  3.08it/s][A[A[A[A[A[A[A[A[A[A









  1%|▏         | 42/3000 [00:15<14:01,  3.51it/s][A[A[A[A[A[A[A[A[A[A





  9%|▉         | 10/114 [00:03<00:24,  4.27it/s][A[A[A[A[A[A

 54%|█████▍    | 43/80 [00:15<00:08,  4.26it/s][A[A








  3%|▎         | 44/1468 [00:15<06:44,  3.52it/s][A[A[A[A[A[A[A[A[A









  1%|▏         | 43/3000 [00:15<12:51,  3.83it/s][A[A[A[A[A[A[A[A[A[A
 90%|████████▉ | 44/49 [00:15<00:01,  3.95it/s][A









  5%|▍         | 11/232 [00:05<01:24,  2.63it/s]][A[A[A[A[A[A[A[A[A[A







  7%|▋         | 42/568 [00:15<02:39,  3.30it/s][A[A[A[A[A[A[A[A

 55%|█████▌    | 44/80 [00:16<00:10,  3.38it/s][A[A







  8%|▊         | 44/568 [00:15<02:17,  3.82it/s][A[A[A[A[A[A[A[A

 56%|█████▋    | 45/80 [00:16<00:09,  3.51it/s][A[A



Total Failure in the འབྱོར་ཕྱུག་གཏམ་རྒྱུད། article: 0
scrape_shangri_ALL_content_འབྱོར་ཕྱུག་གཏམ་རྒྱུད།.json
Successfully saved: scrape_shangri_ALL_content_འབྱོར་ཕྱུག་གཏམ་རྒྱུད།.json
Total page in shangri_latibet_ALL_link_མི་རིགས་སྲིད་ཇུས།.json: 1
page key name: Page མི་རིགས་སྲིད་ཇུས། 1
Page key code: Page མི་རིགས་སྲིད་ཇུས། 



  0%|          | 0/18 [00:00<?, ?it/s][A



 29%|██▉       | 7/24 [00:03<00:05,  3.21it/s][A[A[A[A





 18%|█▊        | 20/114 [00:07<00:25,  3.63it/s][A[A[A[A[A[A







 10%|▉         | 54/568 [00:19<02:10,  3.94it/s][A[A[A[A[A[A[A[A



 42%|████▏     | 10/24 [00:04<00:03,  4.55it/s][A[A[A[A









  2%|▏         | 55/3000 [00:20<12:40,  3.87it/s][A[A[A[A[A[A[A[A[A[A

  9%|▉         | 21/232 [00:10<01:20,  2.62it/s][A[A





 18%|█▊        | 21/114 [00:09<00:25,  3.67it/s][A[A[A[A[A[A




 10%|▉         | 11/115 [00:05<00:28,  3.62it/s][A[A[A[A[A








  4%|▍         | 56/1468 [00:20<06:53,  3.41it/s][A[A[A[A[A[A[A[A[A






  2%|▏         | 11/492 [00:05<02:05,  3.83it/s][A[A[A[A[A[A[A







 10%|▉         | 55/568 [00:20<02:23,  3.56it/s][A[A[A[A[A[A[A[A









  2%|▏         | 56/3000 [00:20<22:30,  2.18it/s][A[A[A[A[A[A[A[A[A[A

  9%|▉         | 22/232 [00:10<01:52,  1.86it/s][A[A





 19%|█

Total Failure in the དཔེ་གཟིགས། article: 0
scrape_shangri_ALL_content_དཔེ་གཟིགས།.json
Successfully saved: scrape_shangri_ALL_content_དཔེ་གཟིགས།.json
Total page in shangri_latibet_ALL_link_ཆོས་ལུགས་སྲིད་ཇུས།.json: 1
page key name: Page ཆོས་ལུགས་སྲིད་ཇུས། 1
Page key code: Page ཆོས་ལུགས་སྲིད་ཇུས། 






  0%|          | 0/12 [00:00<?, ?it/s][A[A[A[A





 33%|███▎      | 38/114 [00:13<00:26,  2.84it/s][A[A[A[A[A[A







 13%|█▎        | 74/568 [00:25<02:18,  3.56it/s][A[A[A[A[A[A[A[A






  6%|▌         | 30/492 [00:10<01:45,  4.39it/s][A[A[A[A[A[A[A




 26%|██▌       | 30/115 [00:10<00:18,  4.55it/s][A[A[A[A[A








  5%|▌         | 74/1468 [00:25<07:27,  3.11it/s][A[A[A[A[A[A[A[A[A









  2%|▎         | 75/3000 [00:25<11:00,  4.43it/s][A[A[A[A[A[A[A[A[A[A

 18%|█▊        | 42/232 [00:15<01:10,  2.68it/s][A[A
 94%|█████████▍| 17/18 [00:07<00:00,  3.56it/s][A









  3%|▎         | 76/3000 [00:26<10:14,  4.76it/s][A[A[A[A[A[A[A[A[A[A








  5%|▌         | 75/1468 [00:26<07:13,  3.21it/s][A[A[A[A[A[A[A[A[A







 13%|█▎        | 75/568 [00:26<02:50,  2.88it/s][A[A[A[A[A[A[A[A




 27%|██▋       | 31/115 [00:11<00:25,  3.27it/s][A[A[A[A[A

 91%|█████████▏| 73/80 [00:26<00:02,  2.45it/s

Total Failure in the མི་རིགས་སྲིད་ཇུས། article: 0
scrape_shangri_ALL_content_མི་རིགས་སྲིད་ཇུས།.json
Successfully saved: scrape_shangri_ALL_content_མི་རིགས་སྲིད་ཇུས།.json
Total page in shangri_latibet_ALL_link_ཆོས་ལུགས་རིག་གནས།.json: 2
page key name: Page ཆོས་ལུགས་རིག་གནས། 2
Page key code: Page ཆོས་ལུགས་རིག་གནས། 



  0%|          | 0/31 [00:00<?, ?it/s][A

Total Failure in the དཔལ་འབྱོར་འགྱུར་སྟངས། article: 0
scrape_shangri_ALL_content_དཔལ་འབྱོར་འགྱུར་སྟངས།.json
Successfully saved: scrape_shangri_ALL_content_དཔལ་འབྱོར་འགྱུར་སྟངས།.json
Total page in shangri_latibet_ALL_link_དགོན་སྡེ་ངོ་སྤྲོད།.json: 2
page key name: Page དགོན་སྡེ་ངོ་སྤྲོད། 2
Page key code: Page དགོན་སྡེ་ངོ་སྤྲོད། 




  0%|          | 0/39 [00:00<?, ?it/s][A[A









  3%|▎         | 82/3000 [00:28<12:19,  3.95it/s][A[A[A[A[A[A[A[A[A[A






  8%|▊         | 39/492 [00:13<01:15,  6.04it/s][A[A[A[A[A[A[A



 22%|██▏       | 52/232 [00:17<00:42,  4.21it/s]A[A[A[A









  3%|▎         | 83/3000 [00:28<10:53,  4.46it/s][A[A[A[A[A[A[A[A[A[A



 33%|███▎      | 4/12 [00:02<00:03,  2.00it/s][A[A[A[A








  6%|▌         | 84/1468 [00:28<06:53,  3.35it/s][A[A[A[A[A[A[A[A[A









  3%|▎         | 84/3000 [00:28<09:45,  4.98it/s][A[A[A[A[A[A[A[A[A[A



 42%|████▏     | 5/12 [00:03<00:02,  2.37it/s][A[A[A[A




 32%|███▏      | 37/115 [00:14<00:28,  2.76it/s][A[A[A[A[A








 23%|██▎       | 53/232 [00:18<00:49,  3.62it/s]][A[A[A[A[A[A[A[A[A









  3%|▎         | 85/3000 [00:28<12:15,  3.97it/s][A[A[A[A[A[A[A[A[A[A



 50%|█████     | 6/12 [00:03<00:02,  2.94it/s][A[A[A[A




 33%|███▎      | 38/115 [00:14<

Total Failure in the ཆོས་ལུགས་སྲིད་ཇུས། article: 0
scrape_shangri_ALL_content_ཆོས་ལུགས་སྲིད་ཇུས།.json
Successfully saved: scrape_shangri_ALL_content_ཆོས་ལུགས་སྲིད་ཇུས།.json
Total page in shangri_latibet_ALL_link_སྲོལ་རྒྱུན་དུས་སྟོན།.json: 4
page key name: Page སྲོལ་རྒྱུན་དུས་སྟོན། 4
Page key code: Page སྲོལ་རྒྱུན་དུས་སྟོན། 






  0%|          | 0/73 [00:00<?, ?it/s][A[A[A[A
 35%|███▌      | 11/31 [00:05<00:06,  2.97it/s][A








  7%|▋         | 100/1468 [00:34<06:25,  3.55it/s][A[A[A[A[A[A[A[A[A







 29%|██▉       | 67/232 [00:24<00:48,  3.38it/s][A[A[A[A[A[A[A[A

 28%|██▊       | 11/39 [00:07<00:10,  2.70it/s][A[A






 11%|█         | 53/492 [00:20<02:13,  3.28it/s][A[A[A[A[A[A[A





 56%|█████▌    | 64/114 [00:23<00:13,  3.63it/s][A[A[A[A[A[A




 46%|████▌     | 53/115 [00:20<00:20,  3.09it/s][A[A[A[A[A









  3%|▎         | 96/3000 [00:35<19:18,  2.51it/s][A[A[A[A[A[A[A[A[A[A
 39%|███▊      | 12/31 [00:07<00:07,  2.57it/s][A








  7%|▋         | 101/1468 [00:35<13:54,  1.64it/s][A[A[A[A[A[A[A[A[A







 29%|██▉       | 68/232 [00:24<01:45,  1.55it/s][A[A[A[A[A[A[A[A



  1%|▏         | 1/73 [00:02<02:57,  2.46s/it][A[A[A[A

 31%|███       | 12/39 [00:07<00:19,  1.40it/s][A[A






 11%|█         | 54/492 [00:

Total Failure in the ཆོས་ལུགས་རིག་གནས། article: 0
scrape_shangri_ALL_content_ཆོས་ལུགས་རིག་གནས།.json
Successfully saved: scrape_shangri_ALL_content_ཆོས་ལུགས་རིག་གནས།.json
Total page in shangri_latibet_ALL_link_ཡུལ་སྲོལ་གོམས་གཤིས།.json: 11
page key name: Page ཡུལ་སྲོལ་གོམས་གཤིས། 11
Page key code: Page ཡུལ་སྲོལ་གོམས་གཤིས། 



  0%|          | 0/201 [00:00<?, ?it/s][A




 70%|██████▉   | 80/115 [00:27<00:08,  4.25it/s][A[A[A[A[A



 30%|███       | 22/73 [00:10<00:12,  4.07it/s][A[A[A[A








  9%|▊         | 127/1468 [00:42<05:33,  4.02it/s][A[A[A[A[A[A[A[A[A

 92%|█████████▏| 36/39 [00:14<00:00,  4.00it/s][A[A





 79%|███████▉  | 90/114 [00:31<00:06,  3.71it/s][A[A[A[A[A[A







 22%|██▏       | 124/568 [00:42<01:54,  3.87it/s][A[A[A[A[A[A[A[A









  4%|▍         | 124/3000 [00:42<11:32,  4.15it/s][A[A[A[A[A[A[A[A[A[A






 39%|███▉      | 90/232 [00:32<00:37,  3.76it/s][A[A[A[A[A[A[A




 71%|███████▏  | 82/115 [00:28<00:08,  3.77it/s][A[A[A[A[A



 33%|███▎      | 24/73 [00:10<00:13,  3.73it/s][A[A[A[A








  9%|▊         | 128/1468 [00:42<06:06,  3.66it/s][A[A[A[A[A[A[A[A[A

 95%|█████████▍| 37/39 [00:14<00:00,  3.59it/s][A[A





 80%|███████▉  | 91/114 [00:31<00:06,  3.43it/s][A[A[A[A[A[A







 22%|██▏      

Total Failure in the དགོན་སྡེ་ངོ་སྤྲོད། article: 0
scrape_shangri_ALL_content_དགོན་སྡེ་ངོ་སྤྲོད།.json
Successfully saved: scrape_shangri_ALL_content_དགོན་སྡེ་ངོ་སྤྲོད།.json
Total page in shangri_latibet_ALL_link_མི་རིགས་ཀྱི་ད་ཚུལ།.json: 1
page key name: Page མི་རིགས་ཀྱི་ད་ཚུལ། 1
Page key code: Page མི་རིགས་ཀྱི་ད་ཚུལ། 




 43%|████▎     | 99/232 [00:34<00:27,  4.86it/s]



 45%|████▌     | 33/73 [00:12<00:07,  5.10it/s][A[A[A[A






 18%|█▊        | 88/492 [00:30<01:44,  3.86it/s][A[A[A[A[A[A[A







 23%|██▎       | 133/568 [00:44<01:48,  4.02it/s][A[A[A[A[A[A[A[A




 77%|███████▋  | 89/115 [00:30<00:06,  3.85it/s][A[A[A[A[A








  9%|▉         | 134/1468 [00:44<07:04,  3.15it/s][A[A[A[A[A[A[A[A[A





 89%|████████▊ | 101/114 [00:33<00:02,  4.35it/s][A[A[A[A[A[A




 78%|███████▊  | 90/115 [00:30<00:06,  4.01it/s][A[A[A[A[A






 18%|█▊        | 89/492 [00:30<01:45,  3.83it/s][A[A[A[A[A[A[A
  2%|▏         | 5/201 [00:04<01:43,  1.90it/s][A








  9%|▉         | 135/1468 [00:46<06:58,  3.18it/s][A[A[A[A[A[A[A[A[A









  4%|▍         | 134/3000 [00:46<12:25,  3.85it/s][A[A[A[A[A[A[A[A[A[A







 24%|██▎       | 134/568 [00:46<01:59,  3.64it/s][A[A[A[A[A[A[A[A





 89%|████████▉ | 102/114 [00:35<00:02,  4.01i

Total Failure in the རྩོམ་རིག article: 0
scrape_shangri_ALL_content_རྩོམ་རིག.json


 50%|████▉     | 115/232 [00:40<00:31,  3.77it/s]A[A




 90%|█████████ | 104/115 [00:37<00:03,  3.54it/s][A[A[A[A[A








 10%|█         | 154/1468 [00:51<04:53,  4.48it/s][A[A[A[A[A[A[A[A[A
 11%|█▏        | 23/201 [00:10<00:44,  4.03it/s][A



 68%|██████▊   | 50/73 [00:19<00:05,  4.11it/s][A[A[A[A







 27%|██▋       | 152/568 [00:51<01:43,  4.02it/s][A[A[A[A[A[A[A[A

 83%|████████▎ | 15/18 [00:07<00:00,  3.24it/s][A[A









 50%|█████     | 117/232 [00:41<00:35,  3.22it/s]][A[A[A[A[A[A[A[A[A[A




 91%|█████████▏| 105/115 [00:37<00:03,  2.57it/s][A[A[A[A[A








 11%|█         | 155/1468 [00:51<06:40,  3.28it/s][A[A[A[A[A[A[A[A[A
 12%|█▏        | 24/201 [00:10<00:57,  3.06it/s][A



 70%|██████▉   | 51/73 [00:19<00:07,  3.04it/s][A[A[A[A

 94%|█████████▍| 17/18 [00:07<00:00,  3.29it/s][A[A









  5%|▌         | 153/3000 [00:51<14:11,  3.34it/s][A[A[A[A[A[A[A[A[A[A

Successfully saved: scrape_shangri_ALL_content_རྩོམ་རིག.json
Total page in shangri_latibet_ALL_link_ཆོས་ལུགས་ཀྱི་ད་ཚུལ།.json: 1
page key name: Page ཆོས་ལུགས་ཀྱི་ད་ཚུལ། 1
Page key code: Page ཆོས་ལུགས་ཀྱི་ད་ཚུལ། 


 51%|█████     | 118/232 [00:41<00:35,  3.19it/s]



 74%|███████▍  | 54/73 [00:19<00:04,  4.16it/s][A[A[A[A





  0%|          | 0/18 [00:00<?, ?it/s][A[A[A[A[A[A






 22%|██▏       | 109/492 [00:37<01:47,  3.57it/s][A[A[A[A[A[A[A




 97%|█████████▋| 111/115 [00:37<00:00,  4.48it/s][A[A[A[A[A







 27%|██▋       | 154/568 [00:52<02:14,  3.07it/s][A[A[A[A[A[A[A[A








 52%|█████▏    | 121/232 [00:42<00:28,  3.91it/s]][A[A[A[A[A[A[A[A[A

100%|██████████| 18/18 [00:08<00:00,  2.78it/s][A[A




 98%|█████████▊| 113/115 [00:38<00:00,  4.34it/s][A[A[A[A[A









 53%|█████▎    | 122/232 [00:43<00:31,  3.50it/s]][A[A[A[A[A[A[A[A[A[A



 77%|███████▋  | 56/73 [00:20<00:04,  3.50it/s][A[A[A[A
 14%|█▍        | 29/201 [00:11<00:48,  3.55it/s][A








 11%|█         | 160/1468 [00:53<06:08,  3.54it/s][A[A[A[A[A[A[A[A[A







 27%|██▋       | 155/568 [00:53<02:37,  2.63it/s][A[A[A[A[A[A[A[A






 23%|██▎  

Total Failure in the མི་རིགས་ཀྱི་ད་ཚུལ། article: 0
scrape_shangri_ALL_content_མི་རིགས་ཀྱི་ད་ཚུལ།.json
Successfully saved: scrape_shangri_ALL_content_མི་རིགས་ཀྱི་ད་ཚུལ།.json
Total page in shangri_latibet_ALL_link_གནས་ཁམས་ཆེན།.json: 5
page key name: Page གནས་ཁམས་ཆེན། 5
Page key code: Page གནས་ཁམས་ཆེན། 




  0%|          | 0/94 [00:00<?, ?it/s][A[A







 28%|██▊       | 158/568 [00:53<02:02,  3.35it/s][A[A[A[A[A[A[A[A
 16%|█▌        | 32/201 [00:12<00:46,  3.67it/s][A









  5%|▌         | 162/3000 [00:53<11:26,  4.13it/s][A[A[A[A[A[A[A[A[A[A







 28%|██▊       | 160/568 [00:54<01:41,  4.02it/s][A[A[A[A[A[A[A[A
 16%|█▋        | 33/201 [00:12<00:44,  3.75it/s][A





  6%|▌         | 1/18 [00:02<00:36,  2.14s/it][A[A[A[A[A[A








 11%|█         | 165/1468 [00:54<05:30,  3.94it/s][A[A[A[A[A[A[A[A[A









 55%|█████▍    | 127/232 [00:44<00:30,  3.42it/s]][A[A[A[A[A[A[A[A[A[A






 24%|██▎       | 116/492 [00:40<01:52,  3.34it/s][A[A[A[A[A[A[A







 29%|██▊       | 162/568 [00:55<01:39,  4.07it/s][A[A[A[A[A[A[A[A
 17%|█▋        | 34/201 [00:13<00:49,  3.40it/s][A




100%|██████████| 115/115 [00:40<00:00,  2.45it/s][A[A[A[A[A



 84%|████████▎ | 61/73 [00:22<00:03,  3.30it/s][A[A[A[A





 11%

Total Failure in the ལོ་རྒྱུས། article: 1
scrape_shangri_ALL_content_ལོ་རྒྱུས།.json











 11%|█▏        | 167/1468 [00:55<06:57,  3.11it/s][A[A[A[A[A[A[A[A[A






 24%|██▍       | 120/492 [00:41<01:35,  3.91it/s][A[A[A[A[A[A[A





 39%|███▉      | 7/18 [00:04<00:03,  3.51it/s][A[A[A[A[A[A





 44%|████▍     | 8/18 [00:04<00:04,  2.33it/s][A[A[A[A[A[A









 56%|█████▌    | 130/232 [00:46<00:33,  3.03it/s]][A[A[A[A[A[A[A[A[A[A



 88%|████████▊ | 64/73 [00:23<00:02,  3.08it/s][A[A[A[A

  1%|          | 1/94 [00:02<03:24,  2.20s/it][A[A
 19%|█▉        | 38/201 [00:14<00:48,  3.34it/s][A








 11%|█▏        | 168/1468 [00:56<09:43,  2.23it/s][A[A[A[A[A[A[A[A[A






 25%|██▍       | 121/492 [00:41<02:17,  2.70it/s][A[A[A[A[A[A[A







 29%|██▉       | 164/568 [00:56<02:15,  2.97it/s][A[A[A[A[A[A[A[A









 56%|█████▋    | 131/232 [00:46<00:41,  2.46it/s]][A[A[A[A[A[A[A[A[A[A



 89%|████████▉ | 65/73 [00:23<00:03,  2.55it/s][A[A[A[A

  2%|▏         | 2/94 [00:03<02:00,  1.

Successfully saved: scrape_shangri_ALL_content_ལོ་རྒྱུས།.json
Total page in shangri_latibet_ALL_link_གནས་སྐོར་མཛེས་ལྗོངས།.json: 6
page key name: Page གནས་སྐོར་མཛེས་ལྗོངས། 6
Page key code: Page གནས་སྐོར་མཛེས་ལྗོངས། 



 19%|█▉        | 39/201 [00:15<00:59,  2.74it/s][A








 12%|█▏        | 169/1468 [00:56<08:13,  2.63it/s][A[A[A[A[A[A[A[A[A







 57%|█████▋    | 133/232 [00:46<00:29,  3.34it/s][A[A[A[A[A[A[A[A

  3%|▎         | 3/94 [00:03<01:16,  1.20it/s][A[A



 96%|█████████▌| 70/73 [00:24<00:00,  4.75it/s][A[A[A[A
 20%|█▉        | 40/201 [00:15<00:56,  2.86it/s][A








 12%|█▏        | 170/1468 [00:56<07:47,  2.78it/s][A[A[A[A[A[A[A[A[A







 58%|█████▊    | 134/232 [00:46<00:26,  3.68it/s][A[A[A[A[A[A[A[A




  0%|          | 0/103 [00:00<?, ?it/s][A[A[A[A[A






 25%|██▌       | 123/492 [00:42<01:59,  3.10it/s][A[A[A[A[A[A[A









  6%|▌         | 170/3000 [00:57<17:25,  2.71it/s][A[A[A[A[A[A[A[A[A[A







 30%|██▉       | 170/568 [00:57<01:24,  4.71it/s][A[A[A[A[A[A[A[A
 20%|██        | 41/201 [00:16<00:54,  2.91it/s][A








 12%|█▏        | 174/1468 [00:58<04:22,  4.93it/s][A[A[A[A[A[A[A[A[A

Total Failure in the སྲོལ་རྒྱུན་དུས་སྟོན། article: 0
scrape_shangri_ALL_content_སྲོལ་རྒྱུན་དུས་སྟོན།.json
Successfully saved: scrape_shangri_ALL_content_སྲོལ་རྒྱུན་དུས་སྟོན།.json
Total page in shangri_latibet_ALL_link_སྐྱེ་ཁམས་སྲུང་སྐྱོང་།.json: 10
page key name: Page སྐྱེ་ཁམས་སྲུང་སྐྱོང་། 10
Page key code: Page སྐྱེ་ཁམས་སྲུང་སྐྱོང་། 






  0%|          | 0/195 [00:00<?, ?it/s][A[A[A[A
 24%|██▍       | 49/201 [00:17<00:45,  3.33it/s][A





 61%|██████    | 141/232 [00:49<00:30,  2.96it/s]A[A[A[A[A[A






 27%|██▋       | 133/492 [00:46<01:32,  3.87it/s][A[A[A[A[A[A[A








 12%|█▏        | 182/1468 [01:01<05:11,  4.13it/s][A[A[A[A[A[A[A[A[A







 31%|███▏      | 178/568 [01:01<01:23,  4.68it/s][A[A[A[A[A[A[A[A

 13%|█▎        | 12/94 [00:07<00:39,  2.09it/s][A[A




  3%|▎         | 3/103 [00:04<01:26,  1.16it/s][A[A[A[A[A
 25%|██▍       | 50/201 [00:19<00:52,  2.86it/s][A









  6%|▌         | 180/3000 [01:01<14:46,  3.18it/s][A[A[A[A[A[A[A[A[A[A





 61%|██████    | 142/232 [00:50<00:55,  1.62it/s]A[A[A[A[A[A






 27%|██▋       | 134/492 [00:46<03:02,  1.96it/s][A[A[A[A[A[A[A








 12%|█▏        | 183/1468 [01:01<10:19,  2.07it/s][A[A[A[A[A[A[A[A[A







 32%|███▏      | 179/568 [01:01<02:54,  2.23it/s][A[A[A[A[A[A[A[

Total Failure in the ཆོས་ལུགས་ཀྱི་ད་ཚུལ། article: 0
scrape_shangri_ALL_content_ཆོས་ལུགས་ཀྱི་ད་ཚུལ།.json
Successfully saved: scrape_shangri_ALL_content_ཆོས་ལུགས་ཀྱི་ད་ཚུལ།.json
Total page in shangri_latibet_ALL_link_ཡུལ་སྐོར་འགྱུར་སྟངས།.json: 1
page key name: Page ཡུལ་སྐོར་འགྱུར་སྟངས། 1
Page key code: Page ཡུལ་སྐོར་འགྱུར་སྟངས། 








  0%|          | 0/12 [00:00<?, ?it/s][A[A[A[A[A[A

 21%|██▏       | 20/94 [00:07<00:17,  4.24it/s][A[A








 13%|█▎        | 189/1468 [01:01<04:33,  4.67it/s][A[A[A[A[A[A[A[A[A






 28%|██▊       | 138/492 [00:46<01:43,  3.41it/s][A[A[A[A[A[A[A







 32%|███▏      | 184/568 [01:01<01:38,  3.91it/s][A[A[A[A[A[A[A[A








 13%|█▎        | 191/1468 [01:02<04:12,  5.06it/s][A[A[A[A[A[A[A[A[A



 64%|██████▍   | 149/232 [00:51<00:18,  4.38it/s]A[A[A[A






 28%|██▊       | 139/492 [00:47<01:41,  3.46it/s][A[A[A[A[A[A[A
 27%|██▋       | 55/201 [00:20<00:48,  3.01it/s][A




 11%|█         | 11/103 [00:05<00:27,  3.33it/s][A[A[A[A[A







 33%|███▎      | 185/568 [01:02<01:48,  3.54it/s][A[A[A[A[A[A[A[A









  6%|▋         | 188/3000 [01:02<11:56,  3.93it/s][A[A[A[A[A[A[A[A[A[A

 23%|██▎       | 22/94 [00:08<00:19,  3.68it/s][A[A








 13%|█▎        | 192/1468 [01:02<05:08,  4.14it/s][A[A[

Total Failure in the ཡུལ་སྐོར་འགྱུར་སྟངས། article: 0
scrape_shangri_ALL_content_ཡུལ་སྐོར་འགྱུར་སྟངས།.json
Successfully saved: scrape_shangri_ALL_content_ཡུལ་སྐོར་འགྱུར་སྟངས།.json
Total page in shangri_latibet_ALL_link_བརྙན་གཟུགས་ཟློས་གར།.json: 5
page key name: Page བརྙན་གཟུགས་ཟློས་གར། 5
Page key code: Page བརྙན་གཟུགས་ཟློས་གར། 








  0%|          | 0/99 [00:00<?, ?it/s][A[A[A[A[A[A









  7%|▋         | 206/3000 [01:08<11:12,  4.15it/s][A[A[A[A[A[A[A[A[A[A



 11%|█         | 21/195 [00:09<01:04,  2.71it/s][A[A[A[A




 28%|██▊       | 29/103 [00:12<00:23,  3.12it/s][A[A[A[A[A
 38%|███▊      | 76/201 [00:27<00:34,  3.63it/s][A






 32%|███▏      | 159/492 [00:54<01:35,  3.49it/s][A[A[A[A[A[A[A

 43%|████▎     | 40/94 [00:15<00:12,  4.40it/s][A[A









  7%|▋         | 207/3000 [01:09<12:44,  3.65it/s][A[A[A[A[A[A[A[A[A[A



 11%|█▏        | 22/195 [00:09<01:06,  2.60it/s][A[A[A[A



 12%|█▏        | 23/195 [00:09<01:03,  2.71it/s][A[A[A[A







 36%|███▌      | 205/568 [01:09<02:05,  2.90it/s][A[A[A[A[A[A[A[A








 15%|█▍        | 213/1468 [01:09<05:02,  4.14it/s][A[A[A[A[A[A[A[A[A




 29%|██▉       | 30/103 [00:12<00:26,  2.71it/s][A[A[A[A[A
 38%|███▊      | 77/201 [00:27<00:43,  2.84it/s][A






 33%|███▎      | 160

Total Failure in the གནས་ཁམས་ཆེན། article: 0
scrape_shangri_ALL_content_གནས་ཁམས་ཆེན།.json
Successfully saved: scrape_shangri_ALL_content_གནས་ཁམས་ཆེན།.json
Total page in shangri_latibet_ALL_link_སྙན་དབྱངས་འགྱུར་ཁུག.json: 6
page key name: Page སྙན་དབྱངས་འགྱུར་ཁུག 6
Page key code: Page སྙན་དབྱངས་འགྱུར་ཁུག 




  0%|          | 0/103 [00:00<?, ?it/s][A[A








 18%|█▊        | 271/1468 [01:28<06:21,  3.14it/s][A[A[A[A[A[A[A[A[A





 61%|██████    | 60/99 [00:20<00:06,  5.62it/s][A[A[A[A[A[A









 99%|█████████▉| 230/232 [01:17<00:00,  3.10it/s]][A[A[A[A[A[A[A[A[A[A




 88%|████████▊ | 91/103 [00:32<00:04,  2.67it/s][A[A[A[A[A







 46%|████▋     | 263/568 [01:29<01:36,  3.17it/s][A[A[A[A[A[A[A[A








 19%|█▊        | 272/1468 [01:29<07:00,  2.84it/s][A[A[A[A[A[A[A[A[A






 45%|████▍     | 221/492 [01:14<01:21,  3.33it/s][A[A[A[A[A[A[A



 46%|████▌     | 89/195 [00:30<00:31,  3.36it/s][A[A[A[A









100%|█████████▉| 231/232 [01:18<00:00,  2.64it/s]][A[A[A[A[A[A[A[A[A[A





 62%|██████▏   | 61/99 [00:21<00:10,  3.79it/s][A[A[A[A[A[A
 70%|██████▉   | 140/201 [00:47<00:19,  3.21it/s][A




 89%|████████▉ | 92/103 [00:32<00:04,  2.22it/s][A[A[A[A[A







 46%|████▋     | 264/568 [01:29<01:48,  

Total Failure in the སློབ་གསོ། article: 0
scrape_shangri_ALL_content_སློབ་གསོ།.json
Successfully saved: scrape_shangri_ALL_content_སློབ་གསོ།.json
Total page in shangri_latibet_ALL_link_རོལ་རྩེད།.json: 2
page key name: Page རོལ་རྩེད། 2
Page key code: Page རོལ་རྩེད། 


  0%|          | 0/36 [00:00<?, ?it/s]




 94%|█████████▍| 97/103 [00:32<00:01,  4.72it/s][A[A[A[A[A



 48%|████▊     | 94/195 [00:30<00:20,  4.84it/s][A[A[A[A





 64%|██████▎   | 63/99 [00:21<00:11,  3.18it/s][A[A[A[A[A[A









  9%|▉         | 272/3000 [01:29<10:00,  4.54it/s][A[A[A[A[A[A[A[A[A[A




 95%|█████████▌| 98/103 [00:33<00:01,  4.61it/s][A[A[A[A[A



 49%|████▉     | 96/195 [00:31<00:17,  5.62it/s][A[A[A[A
 72%|███████▏  | 144/201 [00:48<00:15,  3.63it/s][A






 46%|████▌     | 224/492 [01:15<01:35,  2.81it/s][A[A[A[A[A[A[A








 19%|█▉        | 277/1468 [01:30<06:11,  3.20it/s][A[A[A[A[A[A[A[A[A







 47%|████▋     | 269/568 [01:30<01:20,  3.70it/s][A[A[A[A[A[A[A[A









  9%|▉         | 273/3000 [01:30<11:03,  4.11it/s][A[A[A[A[A[A[A[A[A[A

  1%|          | 1/103 [00:02<03:39,  2.15s/it][A[A





 65%|██████▍   | 64/99 [00:22<00:12,  2.91it/s][A[A[A[A[A[A




 96%|█████████▌| 99

Total Failure in the གནས་སྐོར་མཛེས་ལྗོངས། article: 0
scrape_shangri_ALL_content_གནས་སྐོར་མཛེས་ལྗོངས།.json
Successfully saved: scrape_shangri_ALL_content_གནས་སྐོར་མཛེས་ལྗོངས།.json
Total page in shangri_latibet_ALL_link_ཆེད་སྒྲིག.json: 1
page key name: Page ཆེད་སྒྲིག 1
Page key code: Page ཆེད་སྒྲིག 







  0%|          | 0/16 [00:00<?, ?it/s][A[A[A[A[A








 20%|█▉        | 288/1468 [01:33<04:19,  4.55it/s][A[A[A[A[A[A[A[A[A



 25%|██▌       | 9/36 [00:04<00:09,  2.81it/s]/s][A[A[A[A









  9%|▉         | 283/3000 [01:34<12:37,  3.59it/s][A[A[A[A[A[A[A[A[A[A







 49%|████▉     | 281/568 [01:34<01:22,  3.49it/s][A[A[A[A[A[A[A[A






 48%|████▊     | 235/492 [01:19<01:45,  2.44it/s][A[A[A[A[A[A[A








 20%|█▉        | 289/1468 [01:34<05:00,  3.92it/s][A[A[A[A[A[A[A[A[A

 13%|█▎        | 13/103 [00:06<00:27,  3.31it/s][A[A
 79%|███████▊  | 158/201 [00:52<00:10,  4.05it/s][A





 28%|██▊       | 10/36 [00:04<00:09,  2.66it/s][A[A[A[A[A[A









  9%|▉         | 284/3000 [01:34<13:52,  3.26it/s][A[A[A[A[A[A[A[A[A[A







 50%|████▉     | 282/568 [01:34<01:26,  3.30it/s][A[A[A[A[A[A[A[A






 48%|████▊     | 236/492 [01:19<01:36,  2.66it/s][A[A[A[A[A[A[A








 20%|█▉        | 290

Total Failure in the ཆེད་སྒྲིག article: 0
scrape_shangri_ALL_content_ཆེད་སྒྲིག.json
Successfully saved: scrape_shangri_ALL_content_ཆེད་སྒྲིག.json
Total page in shangri_latibet_ALL_link_རང་བྱུང་གི་མཛེས་ལྗོངས།.json: 2
page key name: Page རང་བྱུང་གི་མཛེས་ལྗོངས། 2
Page key code: Page རང་བྱུང་གི་མཛེས་ལྗོངས། 







  0%|          | 0/27 [00:00<?, ?it/s][A[A[A[A[A



 67%|██████▋   | 131/195 [00:42<00:15,  4.25it/s][A[A[A[A









 10%|█         | 308/3000 [01:41<12:08,  3.69it/s][A[A[A[A[A[A[A[A[A[A







 54%|█████▍    | 306/568 [01:41<01:05,  4.01it/s][A[A[A[A[A[A[A[A





100%|██████████| 99/99 [00:34<00:00,  2.72it/s][A[A[A[A[A[A









 10%|█         | 310/3000 [01:42<10:41,  4.19it/s][A[A[A[A[A[A[A[A[A[A



 68%|██████▊   | 132/195 [00:43<00:15,  4.00it/s][A[A[A[A








 22%|██▏       | 316/1468 [01:42<04:47,  4.00it/s][A[A[A[A[A[A[A[A[A

 40%|███▉      | 41/103 [00:14<00:14,  4.23it/s][A[A
 91%|█████████ | 183/201 [01:00<00:04,  3.91it/s][A






 53%|█████▎    | 262/492 [01:27<00:53,  4.27it/s][A[A[A[A[A[A[A







100%|██████████| 99/99 [00:34<00:00,  2.89it/s]s][A[A[A[A[A[A[A[A


Total Failure in the བརྙན་གཟུགས་ཟློས་གར། article: 0
scrape_shangri_ALL_content_བརྙན་གཟུགས་ཟློས་གར།.json
Successfully saved: scrape_shangri_ALL_content_བརྙན་གཟུགས་ཟློས་གར།.json
Total page in shangri_latibet_ALL_link_མི་རིགས་ཀྱི་གོམས་གཤིས།.json: 1
page key name: Page མི་རིགས་ཀྱི་གོམས་གཤིས། 1
Page key code: Page མི་རིགས་ཀྱི་གོམས་གཤིས། 








  0%|          | 0/6 [00:00<?, ?it/s][A[A[A[A[A[A









 10%|█         | 312/3000 [01:42<10:02,  4.46it/s][A[A[A[A[A[A[A[A[A[A








 22%|██▏       | 318/1468 [01:42<04:28,  4.28it/s][A[A[A[A[A[A[A[A[A



 68%|██████▊   | 133/195 [00:43<00:17,  3.64it/s][A[A[A[A







 54%|█████▍    | 308/568 [01:42<01:12,  3.56it/s][A[A[A[A[A[A[A[A
 97%|█████████▋| 35/36 [00:12<00:00,  2.56it/s]s][A



 69%|██████▊   | 134/195 [00:43<00:15,  3.89it/s][A[A[A[A









 10%|█         | 314/3000 [01:42<08:50,  5.06it/s][A[A[A[A[A[A[A[A[A[A







 54%|█████▍    | 309/568 [01:42<01:10,  3.68it/s][A[A[A[A[A[A[A[A

 41%|████      | 42/103 [00:14<00:17,  3.49it/s][A[A








100%|██████████| 36/36 [00:13<00:00,  2.70it/s]/s][A[A[A[A[A[A[A[A[A



100%|██████████| 36/36 [00:13<00:00,  2.71it/s]s][A[A[A[A


Total Failure in the རོལ་རྩེད། article: 0
scrape_shangri_ALL_content_རོལ་རྩེད།.json
Successfully saved: scrape_shangri_ALL_content_རོལ་རྩེད།.json






 70%|██████▉   | 136/195 [00:44<00:13,  4.32it/s][A[A[A[A








 22%|██▏       | 320/1468 [01:43<04:49,  3.96it/s][A[A[A[A[A[A[A[A[A







 55%|█████▍    | 310/568 [01:43<01:15,  3.40it/s][A[A[A[A[A[A[A[A
 92%|█████████▏| 185/201 [01:01<00:05,  3.07it/s][A

 43%|████▎     | 44/103 [00:15<00:15,  3.81it/s][A[A



 70%|███████   | 137/195 [00:44<00:12,  4.83it/s][A[A[A[A









 10%|█         | 315/3000 [01:43<11:58,  3.74it/s][A[A[A[A[A[A[A[A[A[A






 54%|█████▎    | 264/492 [01:28<01:16,  2.96it/s][A[A[A[A[A[A[A

 45%|████▍     | 46/103 [00:15<00:12,  4.52it/s][A[A






 54%|█████▍    | 265/492 [01:29<01:08,  3.33it/s][A[A[A[A[A[A[A

 46%|████▌     | 47/103 [00:15<00:11,  4.88it/s][A[A







 55%|█████▍    | 311/568 [01:43<01:27,  2.92it/s][A[A[A[A[A[A[A[A









 11%|█         | 316/3000 [01:43<12:55,  3.46it/s][A[A[A[A[A[A[A[A[A[A




  4%|▎         | 1/27 [00:02<00:50,  1.94s/it][A[A[A[A[A


Total Failure in the མི་རིགས་ཀྱི་གོམས་གཤིས། article: 0
scrape_shangri_ALL_content_མི་རིགས་ཀྱི་གོམས་གཤིས།.json
Successfully saved: scrape_shangri_ALL_content_མི་རིགས་ཀྱི་གོམས་གཤིས།.json


 54%|█████▍    | 56/103 [00:18<00:10,  4.28it/s][A[A






 56%|█████▌    | 275/492 [01:32<01:07,  3.22it/s][A[A[A[A[A[A[A




 44%|████▍     | 12/27 [00:04<00:02,  5.22it/s][A[A[A[A[A

 55%|█████▌    | 57/103 [00:18<00:09,  4.61it/s][A[A






 56%|█████▌    | 276/492 [01:32<00:59,  3.62it/s][A[A[A[A[A[A[A



 74%|███████▍  | 145/195 [00:47<00:16,  3.05it/s][A[A[A[A







 57%|█████▋    | 322/568 [01:46<00:53,  4.57it/s][A[A[A[A[A[A[A[A






 57%|█████▋    | 279/492 [01:32<00:38,  5.51it/s][A[A[A[A[A[A[A




 48%|████▊     | 13/27 [00:04<00:02,  5.19it/s][A[A[A[A[A








 23%|██▎       | 331/1468 [01:46<04:58,  3.80it/s][A[A[A[A[A[A[A[A[A



 75%|███████▍  | 146/195 [00:47<00:14,  3.28it/s][A[A[A[A
 98%|█████████▊| 196/201 [01:05<00:01,  3.10it/s][A

 57%|█████▋    | 59/103 [00:19<00:10,  4.35it/s][A[A








 23%|██▎       | 332/1468 [01:47<05:02,  3.76it/s][A[A[A[A[A[A[A[A[A









 11%|█         | 325/30

Total Failure in the ཡུལ་སྲོལ་གོམས་གཤིས། article: 0
scrape_shangri_ALL_content_ཡུལ་སྲོལ་གོམས་གཤིས།.json
Successfully saved: scrape_shangri_ALL_content_ཡུལ་སྲོལ་གོམས་གཤིས།.json


 58%|█████▊    | 331/568 [01:49<00:53,  4.46it/s][A[A[A[A[A[A[A[A









 11%|█         | 334/3000 [01:49<15:15,  2.91it/s][A[A[A[A[A[A[A[A[A[A






 58%|█████▊    | 286/492 [01:34<00:57,  3.59it/s][A[A[A[A[A[A[A








 23%|██▎       | 341/1468 [01:49<05:42,  3.29it/s][A[A[A[A[A[A[A[A[A




 81%|████████▏ | 22/27 [00:07<00:01,  3.23it/s][A[A[A[A[A

 63%|██████▎   | 65/103 [00:21<00:13,  2.78it/s][A[A






 58%|█████▊    | 287/492 [01:35<00:50,  4.07it/s][A[A[A[A[A[A[A









 11%|█         | 335/3000 [01:49<13:50,  3.21it/s][A[A[A[A[A[A[A[A[A[A









 11%|█         | 336/3000 [01:49<12:24,  3.58it/s][A[A[A[A[A[A[A[A[A[A




 85%|████████▌ | 23/27 [00:08<00:01,  3.12it/s][A[A[A[A[A



 81%|████████  | 158/195 [00:50<00:10,  3.53it/s][A[A[A[A








 23%|██▎       | 342/1468 [01:50<06:28,  2.90it/s][A[A[A[A[A[A[A[A[A






 59%|█████▊    | 288/492 [01:35<00:55,  3.68it/s][A[A[A[A[A[A[

Total Failure in the རང་བྱུང་གི་མཛེས་ལྗོངས། article: 0
scrape_shangri_ALL_content_རང་བྱུང་གི་མཛེས་ལྗོངས།.json
Successfully saved: scrape_shangri_ALL_content_རང་བྱུང་གི་མཛེས་ལྗོངས།.json






 86%|████████▌ | 167/195 [00:52<00:05,  5.29it/s][A[A[A[A






 60%|█████▉    | 293/492 [01:37<01:20,  2.48it/s][A[A[A[A[A[A[A







 59%|█████▉    | 337/568 [01:52<01:38,  2.34it/s][A[A[A[A[A[A[A[A









 11%|█▏        | 344/3000 [01:52<12:51,  3.44it/s][A[A[A[A[A[A[A[A[A[A








 24%|██▍       | 349/1468 [01:52<07:16,  2.57it/s][A[A[A[A[A[A[A[A[A






 60%|█████▉    | 294/492 [01:38<01:15,  2.63it/s][A[A[A[A[A[A[A







 60%|█████▉    | 338/568 [01:52<01:30,  2.54it/s][A[A[A[A[A[A[A[A








 24%|██▍       | 350/1468 [01:52<06:28,  2.88it/s][A[A[A[A[A[A[A[A[A









 12%|█▏        | 345/3000 [01:52<13:51,  3.19it/s][A[A[A[A[A[A[A[A[A[A

 73%|███████▎  | 75/103 [00:24<00:10,  2.66it/s][A[A



 86%|████████▌ | 168/195 [00:53<00:08,  3.34it/s][A[A[A[A






 60%|█████▉    | 295/492 [01:38<01:15,  2.60it/s][A[A[A[A[A[A[A







 60%|█████▉    | 339/568 [01:52<01:26,  2.66it/s][A[A[A[A

Total Failure in the སྙན་དབྱངས་འགྱུར་ཁུག article: 0
scrape_shangri_ALL_content_སྙན་དབྱངས་འགྱུར་ཁུག.json
Successfully saved: scrape_shangri_ALL_content_སྙན་དབྱངས་འགྱུར་ཁུག.json











 26%|██▌       | 376/1468 [02:00<05:39,  3.21it/s][A[A[A[A[A[A[A[A[A









 12%|█▏        | 370/3000 [02:00<16:30,  2.65it/s][A[A[A[A[A[A[A[A[A[A








 26%|██▌       | 377/1468 [02:00<05:17,  3.44it/s][A[A[A[A[A[A[A[A[A








 26%|██▌       | 378/1468 [02:00<04:49,  3.76it/s][A[A[A[A[A[A[A[A[A



 99%|█████████▉| 194/195 [01:01<00:00,  2.41it/s][A[A[A[A









 12%|█▏        | 373/3000 [02:00<10:21,  4.23it/s][A[A[A[A[A[A[A[A[A[A









 12%|█▏        | 374/3000 [02:00<09:32,  4.59it/s][A[A[A[A[A[A[A[A[A[A







 64%|██████▍   | 366/568 [02:01<01:20,  2.50it/s][A[A[A[A[A[A[A[A



100%|██████████| 195/195 [01:01<00:00,  3.16it/s][A[A[A[A










 12%|█▎        | 375/3000 [02:01<08:32,  5.12it/s][A[A[A[A[A[A[A[A[A[A







 65%|██████▍   | 367/568 [02:01<01:10,  2.85it/s][A[A[A[A[A[A[A[A








 26%|██▌       | 380/1468 [02:01<04:15,  4.26it/s][A[A[A[A[A[A[A[A[A

Total Failure in the སྐྱེ་ཁམས་སྲུང་སྐྱོང་། article: 0
scrape_shangri_ALL_content_སྐྱེ་ཁམས་སྲུང་སྐྱོང་།.json
Successfully saved: scrape_shangri_ALL_content_སྐྱེ་ཁམས་སྲུང་སྐྱོང་།.json









 66%|██████▌   | 324/492 [01:46<01:27,  1.92it/s][A[A[A[A[A[A[A







 65%|██████▍   | 368/568 [02:01<01:06,  3.01it/s][A[A[A[A[A[A[A[A








 26%|██▌       | 381/1468 [02:01<05:12,  3.48it/s][A[A[A[A[A[A[A[A[A







 65%|██████▌   | 370/568 [02:01<00:54,  3.63it/s][A[A[A[A[A[A[A[A






 66%|██████▌   | 325/492 [01:47<01:29,  1.86it/s][A[A[A[A[A[A[A







 65%|██████▌   | 371/568 [02:02<00:52,  3.74it/s][A[A[A[A[A[A[A[A









 13%|█▎        | 377/3000 [02:02<13:18,  3.29it/s][A[A[A[A[A[A[A[A[A[A








 26%|██▌       | 382/1468 [02:02<05:43,  3.16it/s][A[A[A[A[A[A[A[A[A






 66%|██████▋   | 326/492 [01:47<01:15,  2.21it/s][A[A[A[A[A[A[A









 13%|█▎        | 378/3000 [02:02<12:16,  3.56it/s][A[A[A[A[A[A[A[A[A[A








 26%|██▌       | 383/1468 [02:02<05:10,  3.50it/s][A[A[A[A[A[A[A[A[A






 67%|██████▋   | 331/492 [01:47<00:25,  6.23it/s][A[A[A[A[A[A[A







 65

Total Failure in the གསོ་རིག article: 1
scrape_shangri_ALL_content_གསོ་རིག.json
Successfully saved: scrape_shangri_ALL_content_གསོ་རིག.json










 95%|█████████▍| 537/568 [02:50<00:05,  5.50it/s][A[A[A[A[A[A[A[A







 95%|█████████▍| 538/568 [02:50<00:05,  5.79it/s][A[A[A[A[A[A[A[A









 18%|█▊        | 543/3000 [02:50<13:50,  2.96it/s][A[A[A[A[A[A[A[A[A[A








 37%|███▋      | 550/1468 [02:50<05:06,  3.00it/s][A[A[A[A[A[A[A[A[A









 18%|█▊        | 544/3000 [02:50<12:49,  3.19it/s][A[A[A[A[A[A[A[A[A[A








 38%|███▊      | 551/1468 [02:50<04:31,  3.37it/s][A[A[A[A[A[A[A[A[A








 38%|███▊      | 552/1468 [02:51<04:09,  3.68it/s][A[A[A[A[A[A[A[A[A









 18%|█▊        | 545/3000 [02:51<13:10,  3.11it/s][A[A[A[A[A[A[A[A[A[A









 18%|█▊        | 546/3000 [02:51<14:07,  2.90it/s][A[A[A[A[A[A[A[A[A[A








 38%|███▊      | 553/1468 [02:51<05:10,  2.95it/s][A[A[A[A[A[A[A[A[A







 95%|█████████▍| 539/568 [02:51<00:12,  2.41it/s][A[A[A[A[A[A[A[A









 18%|█▊        | 548/3000 [02:51<09:52,  4.

Total Failure in the རྒྱལ་ཕྱི་ནང་གསར་འགྱུར། article: 0
scrape_shangri_ALL_content_རྒྱལ་ཕྱི་ནང་གསར་འགྱུར།.json
Successfully saved: scrape_shangri_ALL_content_རྒྱལ་ཕྱི་ནང་གསར་འགྱུར།.json











 40%|███▉      | 581/1468 [03:00<06:06,  2.42it/s][A[A[A[A[A[A[A[A[A








 40%|███▉      | 582/1468 [03:00<05:25,  2.73it/s][A[A[A[A[A[A[A[A[A








 40%|███▉      | 585/1468 [03:00<03:35,  4.10it/s][A[A[A[A[A[A[A[A[A









 19%|█▉        | 575/3000 [03:00<17:21,  2.33it/s][A[A[A[A[A[A[A[A[A[A









 19%|█▉        | 577/3000 [03:01<12:30,  3.23it/s][A[A[A[A[A[A[A[A[A[A









 19%|█▉        | 579/3000 [03:01<08:44,  4.61it/s][A[A[A[A[A[A[A[A[A[A








 40%|████      | 588/1468 [03:01<03:20,  4.39it/s][A[A[A[A[A[A[A[A[A








 40%|████      | 589/1468 [03:01<03:16,  4.48it/s][A[A[A[A[A[A[A[A[A








 40%|████      | 590/1468 [03:01<03:08,  4.66it/s][A[A[A[A[A[A[A[A[A









 19%|█▉        | 580/3000 [03:01<12:48,  3.15it/s][A[A[A[A[A[A[A[A[A[A









 19%|█▉        | 582/3000 [03:02<10:33,  3.81it/s][A[A[A[A[A[A[A[A[A[A









 19%|█▉        | 583/300

Total Failure in the བོད་ཁུལ་གསར་འགྱུར། article: 3
scrape_shangri_ALL_content_བོད་ཁུལ་གསར་འགྱུར།.json
Successfully saved: scrape_shangri_ALL_content_བོད་ཁུལ་གསར་འགྱུར།.json












 49%|████▉     | 1467/3000 [07:18<07:29,  3.41it/s][A[A[A[A[A[A[A[A[A[A









 49%|████▉     | 1469/3000 [07:19<07:29,  3.40it/s][A[A[A[A[A[A[A[A[A[A









 49%|████▉     | 1470/3000 [07:19<09:08,  2.79it/s][A[A[A[A[A[A[A[A[A[A









 49%|████▉     | 1471/3000 [07:20<08:27,  3.02it/s][A[A[A[A[A[A[A[A[A[A









 49%|████▉     | 1472/3000 [07:20<08:50,  2.88it/s][A[A[A[A[A[A[A[A[A[A









 49%|████▉     | 1473/3000 [07:20<07:12,  3.53it/s][A[A[A[A[A[A[A[A[A[A









 49%|████▉     | 1475/3000 [07:20<04:47,  5.30it/s][A[A[A[A[A[A[A[A[A[A









 49%|████▉     | 1476/3000 [07:21<07:13,  3.52it/s][A[A[A[A[A[A[A[A[A[A









 49%|████▉     | 1477/3000 [07:21<07:09,  3.54it/s][A[A[A[A[A[A[A[A[A[A









 49%|████▉     | 1478/3000 [07:21<06:42,  3.78it/s][A[A[A[A[A[A[A[A[A[A









 49%|████▉     | 1480/3000 [07:23<11:00,  2.30it/s][A[A[A[A[A[A[A[A[A[

Total Failure in the ས་གནས་གསར་འགྱུར། article: 10
scrape_shangri_ALL_content_ས་གནས་གསར་འགྱུར།.json





100%|██████████| 33/33 [14:43<00:00, 26.78s/it]  [A[A[A

Successfully saved: scrape_shangri_ALL_content_ས་གནས་གསར་འགྱུར།.json
Processed 33 files
CPU times: user 3min 52s, sys: 13.7 s, total: 4min 5s
Wall time: 14min 43s





In [None]:
# 14:44

In [7]:
pwd()

'/workspace/web_scrab/new_news_Articles/shangri-latibet'

In [11]:
json_files = [os.path.join(directory, f) for f in os.listdir(directory) if f.endswith('.json')]
json_files

NameError: name 'directory' is not defined