# About this notebook:

- We are collecting articles ID that are related to diseases from [PubMed](https://pubmed.ncbi.nlm.nih.gov/) 
- We will be using [NCBI API (E-utilities)](https://www.ncbi.nlm.nih.gov/books/NBK25497/) to obtain our data

**About PubMed**<br>
PubMed is a database that indexes and provides access to biomedical and life sciences literature, including scientific research articles, clinical studies, and reviews. Scientists are one of the primary users of PubMed, as they rely on the database to find relevant literature and stay up-to-date with the latest developments in their field of study.

PubMed plays a crucial role in the scientific community by providing access to a vast amount of research literature.

# Import Libraries

In [1]:
# Import libaries
import numpy as np 
import pandas as pd 

from IPython.core.interactiveshell import InteractiveShell
InteractiveShell.ast_node_interactivity = "all"

In [1]:
import numpy as np # linear algebra
import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)

from Bio import Entrez
import pandas as pd


import time
from tqdm import tqdm

# Set the email address associated with your NCBI account
Entrez.email = "geok1723@gmail.com"

# Part 1: Create a list of dates
> We will be limiting our articles that are published betweeen 2010-2019.

In [2]:
print("Create a list of Dates")

import datetime

# Define start and end dates
start_date = datetime.date(2010, 1, 1)
end_date = datetime.date(2019, 12, 31)

# Create a list of dates from start to end, inclusive
date_list = [start_date + datetime.timedelta(days=x) for x in range((end_date - start_date).days + 1)]

# Format each date as a string in the desired format
date_strings = [date.strftime("%Y/%m/%d") for date in date_list]


Create a list of Dates


In [3]:
len(date_strings)

3652

# Part 2: Create a dataframe of 'Date' and 'ID'

In [5]:
print("Create a dataframe of 'Date' and 'ID'")


df_DateTracking = pd.DataFrame(columns=['Date', 'total_record'])
id_df = pd.DataFrame(columns=['Date', 'id'])

for date in tqdm(date_strings):
    id_list = []
    num = len(df_DateTracking)
    
    if num<10:
        print(num)
    elif num%10==0:
        print(num)
    
    search_terms = "disease"
    date_filter = f"{date}[PubDate]"
    # Retrieve the total number of records matching the search term and date filter
    handle = Entrez.esearch(db="pubmed", term=search_terms, mindate=date_filter, maxdate=date_filter, retmax=9999)
    record = Entrez.read(handle)
    total_records = int(record["Count"])
    id_list = record["IdList"]
    # Append the date and total_records to the dataframe
    df_DateTracking.loc[len(df_DateTracking)] = [date, total_records]
    id_df.loc[len(id_df)] = [date, id_list]
print(df_DateTracking)
print(id_df)

Create a dataframe of 'Date' and 'ID'


  0%|          | 0/3652 [00:00<?, ?it/s]

0


  0%|          | 1/3652 [00:01<1:50:51,  1.82s/it]

1


  0%|          | 2/3652 [00:03<1:29:50,  1.48s/it]

2


  0%|          | 3/3652 [00:04<1:20:39,  1.33s/it]

3


  0%|          | 4/3652 [00:05<1:16:13,  1.25s/it]

4


  0%|          | 5/3652 [00:06<1:16:14,  1.25s/it]

5


  0%|          | 6/3652 [00:08<1:26:39,  1.43s/it]

6


  0%|          | 7/3652 [00:09<1:22:42,  1.36s/it]

7


  0%|          | 8/3652 [00:10<1:19:37,  1.31s/it]

8


  0%|          | 9/3652 [00:12<1:22:43,  1.36s/it]

9


  0%|          | 10/3652 [00:14<1:33:17,  1.54s/it]

10


  1%|          | 20/3652 [00:27<1:18:25,  1.30s/it]

20


  1%|          | 30/3652 [00:40<1:23:35,  1.38s/it]

30


  1%|          | 40/3652 [00:53<1:19:49,  1.33s/it]

40


  1%|▏         | 50/3652 [01:06<1:21:54,  1.36s/it]

50


  2%|▏         | 60/3652 [01:19<1:17:02,  1.29s/it]

60


  2%|▏         | 70/3652 [01:35<1:24:49,  1.42s/it]

70


  2%|▏         | 80/3652 [01:48<1:18:09,  1.31s/it]

80


  2%|▏         | 90/3652 [02:01<1:19:57,  1.35s/it]

90


  3%|▎         | 100/3652 [02:15<1:21:48,  1.38s/it]

100


  3%|▎         | 110/3652 [02:28<1:16:26,  1.30s/it]

110


  3%|▎         | 120/3652 [02:41<1:18:41,  1.34s/it]

120


  4%|▎         | 130/3652 [02:54<1:15:14,  1.28s/it]

130


  4%|▍         | 140/3652 [03:08<1:17:14,  1.32s/it]

140


  4%|▍         | 150/3652 [03:21<1:15:20,  1.29s/it]

150


  4%|▍         | 160/3652 [03:34<1:11:20,  1.23s/it]

160


  5%|▍         | 170/3652 [03:48<1:20:27,  1.39s/it]

170


  5%|▍         | 180/3652 [04:01<1:16:21,  1.32s/it]

180


  5%|▌         | 190/3652 [04:14<1:19:16,  1.37s/it]

190


  5%|▌         | 200/3652 [04:27<1:12:07,  1.25s/it]

200


  6%|▌         | 210/3652 [04:41<1:18:15,  1.36s/it]

210


  6%|▌         | 220/3652 [04:54<1:15:10,  1.31s/it]

220


  6%|▋         | 230/3652 [05:06<1:15:27,  1.32s/it]

230


  7%|▋         | 240/3652 [05:20<1:19:17,  1.39s/it]

240


  7%|▋         | 250/3652 [05:34<1:10:48,  1.25s/it]

250


  7%|▋         | 260/3652 [05:47<1:13:07,  1.29s/it]

260


  7%|▋         | 270/3652 [06:00<1:09:51,  1.24s/it]

270


  8%|▊         | 280/3652 [06:13<1:13:49,  1.31s/it]

280


  8%|▊         | 290/3652 [06:26<1:12:34,  1.30s/it]

290


  8%|▊         | 300/3652 [06:39<1:14:32,  1.33s/it]

300


  8%|▊         | 310/3652 [06:52<1:15:37,  1.36s/it]

310


  9%|▉         | 320/3652 [07:05<1:11:13,  1.28s/it]

320


  9%|▉         | 330/3652 [07:18<1:15:32,  1.36s/it]

330


  9%|▉         | 340/3652 [07:31<1:09:31,  1.26s/it]

340


 10%|▉         | 350/3652 [07:44<1:11:37,  1.30s/it]

350


 10%|▉         | 360/3652 [07:57<1:11:05,  1.30s/it]

360


 10%|█         | 370/3652 [08:10<1:13:42,  1.35s/it]

370


 10%|█         | 380/3652 [08:23<1:12:32,  1.33s/it]

380


 11%|█         | 390/3652 [08:36<1:12:20,  1.33s/it]

390


 11%|█         | 400/3652 [08:49<1:09:19,  1.28s/it]

400


 11%|█         | 410/3652 [09:02<1:07:58,  1.26s/it]

410


 12%|█▏        | 420/3652 [09:16<1:11:03,  1.32s/it]

420


 12%|█▏        | 430/3652 [09:29<1:12:24,  1.35s/it]

430


 12%|█▏        | 440/3652 [09:43<1:13:07,  1.37s/it]

440


 12%|█▏        | 450/3652 [09:56<1:13:42,  1.38s/it]

450


 13%|█▎        | 460/3652 [10:09<1:09:47,  1.31s/it]

460


 13%|█▎        | 470/3652 [10:22<1:11:53,  1.36s/it]

470


 13%|█▎        | 480/3652 [10:35<1:05:03,  1.23s/it]

480


 13%|█▎        | 490/3652 [10:48<1:08:35,  1.30s/it]

490


 14%|█▎        | 500/3652 [11:01<1:07:39,  1.29s/it]

500


 14%|█▍        | 510/3652 [11:15<1:11:06,  1.36s/it]

510


 14%|█▍        | 520/3652 [11:28<1:09:59,  1.34s/it]

520


 15%|█▍        | 530/3652 [11:41<1:03:51,  1.23s/it]

530


 15%|█▍        | 540/3652 [11:55<1:11:18,  1.37s/it]

540


 15%|█▌        | 550/3652 [12:08<1:05:33,  1.27s/it]

550


 15%|█▌        | 560/3652 [12:21<1:07:27,  1.31s/it]

560


 16%|█▌        | 570/3652 [12:34<1:06:57,  1.30s/it]

570


 16%|█▌        | 580/3652 [12:48<1:07:45,  1.32s/it]

580


 16%|█▌        | 590/3652 [13:01<1:09:27,  1.36s/it]

590


 16%|█▋        | 600/3652 [13:14<1:06:15,  1.30s/it]

600


 17%|█▋        | 610/3652 [13:27<1:11:25,  1.41s/it]

610


 17%|█▋        | 620/3652 [13:40<1:04:00,  1.27s/it]

620


 17%|█▋        | 630/3652 [13:54<1:10:07,  1.39s/it]

630


 18%|█▊        | 640/3652 [14:08<1:09:07,  1.38s/it]

640


 18%|█▊        | 650/3652 [14:21<1:07:44,  1.35s/it]

650


 18%|█▊        | 660/3652 [14:34<1:08:45,  1.38s/it]

660


 18%|█▊        | 670/3652 [14:47<1:05:27,  1.32s/it]

670


 19%|█▊        | 680/3652 [15:01<1:08:48,  1.39s/it]

680


 19%|█▉        | 690/3652 [15:14<1:03:24,  1.28s/it]

690


 19%|█▉        | 700/3652 [15:27<1:07:30,  1.37s/it]

700


 19%|█▉        | 710/3652 [15:40<1:01:02,  1.24s/it]

710


 20%|█▉        | 720/3652 [15:54<1:05:49,  1.35s/it]

720


 20%|█▉        | 730/3652 [16:07<1:03:08,  1.30s/it]

730


 20%|██        | 740/3652 [16:21<1:05:16,  1.34s/it]

740


 21%|██        | 750/3652 [16:35<1:07:27,  1.39s/it]

750


 21%|██        | 760/3652 [16:49<1:02:26,  1.30s/it]

760


 21%|██        | 770/3652 [17:02<1:03:55,  1.33s/it]

770


 21%|██▏       | 780/3652 [17:16<1:03:47,  1.33s/it]

780


 22%|██▏       | 790/3652 [17:29<59:07,  1.24s/it]

790


 22%|██▏       | 800/3652 [17:43<1:03:54,  1.34s/it]

800


 22%|██▏       | 810/3652 [17:56<1:03:20,  1.34s/it]

810


 22%|██▏       | 820/3652 [18:11<1:14:08,  1.57s/it]

820


 23%|██▎       | 830/3652 [18:24<1:01:01,  1.30s/it]

830


 23%|██▎       | 840/3652 [18:38<1:05:42,  1.40s/it]

840


 23%|██▎       | 850/3652 [18:52<1:01:32,  1.32s/it]

850


 24%|██▎       | 860/3652 [19:05<1:01:25,  1.32s/it]

860


 24%|██▍       | 870/3652 [19:18<1:02:33,  1.35s/it]

870


 24%|██▍       | 880/3652 [19:32<1:07:29,  1.46s/it]

880


 24%|██▍       | 890/3652 [19:46<1:05:22,  1.42s/it]

890


 25%|██▍       | 900/3652 [20:00<58:43,  1.28s/it]  

900


 25%|██▍       | 910/3652 [20:14<1:04:23,  1.41s/it]

910


 25%|██▌       | 920/3652 [20:27<1:01:28,  1.35s/it]

920


 25%|██▌       | 930/3652 [20:41<1:02:00,  1.37s/it]

930


 26%|██▌       | 940/3652 [20:55<1:04:36,  1.43s/it]

940


 26%|██▌       | 950/3652 [21:08<1:00:02,  1.33s/it]

950


 26%|██▋       | 960/3652 [21:21<59:10,  1.32s/it]

960


 27%|██▋       | 970/3652 [21:35<57:23,  1.28s/it]

970


 27%|██▋       | 980/3652 [21:48<59:39,  1.34s/it]

980


 27%|██▋       | 990/3652 [22:02<59:14,  1.34s/it]  

990


 27%|██▋       | 1000/3652 [22:15<59:49,  1.35s/it]

1000


 28%|██▊       | 1010/3652 [22:29<58:02,  1.32s/it]

1010


 28%|██▊       | 1020/3652 [22:42<58:39,  1.34s/it]

1020


 28%|██▊       | 1030/3652 [22:56<1:01:04,  1.40s/it]

1030


 28%|██▊       | 1040/3652 [23:09<55:52,  1.28s/it]

1040


 29%|██▉       | 1050/3652 [23:23<57:28,  1.33s/it]

1050


 29%|██▉       | 1060/3652 [23:36<54:37,  1.26s/it]

1060


 29%|██▉       | 1070/3652 [23:49<1:00:06,  1.40s/it]

1070


 30%|██▉       | 1080/3652 [24:03<59:48,  1.40s/it]

1080


 30%|██▉       | 1090/3652 [24:16<55:21,  1.30s/it]

1090


 30%|███       | 1100/3652 [24:29<59:17,  1.39s/it]

1100


 30%|███       | 1110/3652 [24:42<53:38,  1.27s/it]

1110


 31%|███       | 1120/3652 [24:55<57:01,  1.35s/it]

1120


 31%|███       | 1130/3652 [25:09<55:18,  1.32s/it]

1130


 31%|███       | 1140/3652 [25:23<1:05:11,  1.56s/it]

1140


 31%|███▏      | 1150/3652 [25:36<55:57,  1.34s/it]

1150


 32%|███▏      | 1160/3652 [25:50<56:16,  1.36s/it]

1160


 32%|███▏      | 1170/3652 [26:04<57:06,  1.38s/it]

1170


 32%|███▏      | 1180/3652 [26:17<53:19,  1.29s/it]

1180


 33%|███▎      | 1190/3652 [26:31<56:28,  1.38s/it]

1190


 33%|███▎      | 1200/3652 [26:44<55:22,  1.36s/it]

1200


 33%|███▎      | 1210/3652 [26:59<57:20,  1.41s/it]

1210


 33%|███▎      | 1220/3652 [27:12<54:28,  1.34s/it]

1220


 34%|███▎      | 1230/3652 [27:25<49:34,  1.23s/it]

1230


 34%|███▍      | 1240/3652 [27:39<56:29,  1.41s/it]

1240


 34%|███▍      | 1250/3652 [27:53<52:32,  1.31s/it]

1250


 35%|███▍      | 1260/3652 [28:07<52:54,  1.33s/it]

1260


 35%|███▍      | 1270/3652 [28:20<50:38,  1.28s/it]

1270


 35%|███▌      | 1280/3652 [28:34<56:12,  1.42s/it]

1280


 35%|███▌      | 1290/3652 [28:48<56:13,  1.43s/it]

1290


 36%|███▌      | 1300/3652 [29:03<58:12,  1.48s/it]

1300


 36%|███▌      | 1310/3652 [29:17<1:05:57,  1.69s/it]

1310


 36%|███▌      | 1320/3652 [29:30<49:05,  1.26s/it]

1320


 36%|███▋      | 1330/3652 [29:45<56:36,  1.46s/it]

1330


 37%|███▋      | 1340/3652 [29:58<49:49,  1.29s/it]

1340


 37%|███▋      | 1350/3652 [30:12<52:37,  1.37s/it]

1350


 37%|███▋      | 1360/3652 [30:25<51:21,  1.34s/it]

1360


 38%|███▊      | 1370/3652 [30:39<51:26,  1.35s/it]

1370


 38%|███▊      | 1380/3652 [30:54<58:29,  1.54s/it]  

1380


 38%|███▊      | 1390/3652 [31:07<48:01,  1.27s/it]

1390


 38%|███▊      | 1400/3652 [31:21<51:50,  1.38s/it]

1400


 39%|███▊      | 1410/3652 [31:34<48:52,  1.31s/it]

1410


 39%|███▉      | 1420/3652 [31:48<52:42,  1.42s/it]

1420


 39%|███▉      | 1430/3652 [32:02<49:35,  1.34s/it]

1430


 39%|███▉      | 1440/3652 [32:15<50:01,  1.36s/it]

1440


 40%|███▉      | 1450/3652 [32:28<52:13,  1.42s/it]

1450


 40%|███▉      | 1460/3652 [32:41<45:41,  1.25s/it]

1460


 40%|████      | 1470/3652 [32:55<50:01,  1.38s/it]

1470


 41%|████      | 1480/3652 [33:08<49:21,  1.36s/it]

1480


 41%|████      | 1490/3652 [33:22<49:32,  1.37s/it]

1490


 41%|████      | 1500/3652 [33:36<49:57,  1.39s/it]

1500


 41%|████▏     | 1510/3652 [33:49<48:02,  1.35s/it]

1510


 42%|████▏     | 1520/3652 [34:03<51:37,  1.45s/it]

1520


 42%|████▏     | 1530/3652 [34:17<46:08,  1.30s/it]

1530


 42%|████▏     | 1540/3652 [34:30<49:54,  1.42s/it]

1540


 42%|████▏     | 1550/3652 [34:44<48:32,  1.39s/it]

1550


 43%|████▎     | 1560/3652 [34:58<47:50,  1.37s/it]

1560


 43%|████▎     | 1570/3652 [35:12<47:04,  1.36s/it]

1570


 43%|████▎     | 1580/3652 [35:26<46:50,  1.36s/it]

1580


 44%|████▎     | 1590/3652 [35:40<50:35,  1.47s/it]

1590


 44%|████▍     | 1600/3652 [35:53<43:34,  1.27s/it]

1600


 44%|████▍     | 1610/3652 [36:07<47:34,  1.40s/it]

1610


 44%|████▍     | 1620/3652 [36:21<46:26,  1.37s/it]

1620


 45%|████▍     | 1630/3652 [36:34<46:05,  1.37s/it]

1630


 45%|████▍     | 1640/3652 [36:48<47:19,  1.41s/it]

1640


 45%|████▌     | 1650/3652 [37:01<43:33,  1.31s/it]

1650


 45%|████▌     | 1660/3652 [37:15<50:41,  1.53s/it]

1660


 46%|████▌     | 1670/3652 [37:29<42:47,  1.30s/it]

1670


 46%|████▌     | 1680/3652 [37:42<43:21,  1.32s/it]

1680


 46%|████▋     | 1690/3652 [37:56<43:52,  1.34s/it]

1690


 47%|████▋     | 1700/3652 [38:09<45:29,  1.40s/it]

1700


 47%|████▋     | 1710/3652 [38:23<45:47,  1.41s/it]

1710


 47%|████▋     | 1720/3652 [38:37<44:32,  1.38s/it]

1720


 47%|████▋     | 1730/3652 [38:51<46:53,  1.46s/it]

1730


 48%|████▊     | 1740/3652 [39:04<41:50,  1.31s/it]

1740


 48%|████▊     | 1750/3652 [39:18<44:03,  1.39s/it]

1750


 48%|████▊     | 1760/3652 [39:32<43:10,  1.37s/it]

1760


 48%|████▊     | 1770/3652 [39:45<42:40,  1.36s/it]

1770


 49%|████▊     | 1780/3652 [40:00<44:04,  1.41s/it]

1780


 49%|████▉     | 1790/3652 [40:13<42:32,  1.37s/it]

1790


 49%|████▉     | 1800/3652 [40:28<46:42,  1.51s/it]

1800


 50%|████▉     | 1810/3652 [40:41<38:13,  1.24s/it]

1810


 50%|████▉     | 1820/3652 [40:56<42:12,  1.38s/it]

1820


 50%|█████     | 1830/3652 [41:09<39:25,  1.30s/it]

1830


 50%|█████     | 1840/3652 [41:26<49:40,  1.65s/it]

1840


 51%|█████     | 1850/3652 [41:40<42:07,  1.40s/it]

1850


 51%|█████     | 1860/3652 [41:56<46:43,  1.56s/it]

1860


 51%|█████     | 1870/3652 [42:10<41:54,  1.41s/it]

1870


 51%|█████▏    | 1880/3652 [42:25<43:34,  1.48s/it]

1880


 52%|█████▏    | 1890/3652 [42:40<42:32,  1.45s/it]

1890


 52%|█████▏    | 1900/3652 [42:53<40:14,  1.38s/it]

1900


 52%|█████▏    | 1910/3652 [43:07<39:42,  1.37s/it]

1910


 53%|█████▎    | 1920/3652 [43:21<39:44,  1.38s/it]

1920


 53%|█████▎    | 1930/3652 [43:34<38:45,  1.35s/it]

1930


 53%|█████▎    | 1940/3652 [43:49<40:35,  1.42s/it]

1940


 53%|█████▎    | 1950/3652 [44:03<38:10,  1.35s/it]

1950


 54%|█████▎    | 1960/3652 [44:17<38:17,  1.36s/it]

1960


 54%|█████▍    | 1970/3652 [44:30<37:40,  1.34s/it]

1970


 54%|█████▍    | 1980/3652 [44:44<38:57,  1.40s/it]

1980


 54%|█████▍    | 1990/3652 [44:58<39:42,  1.43s/it]

1990


 55%|█████▍    | 2000/3652 [45:12<38:12,  1.39s/it]

2000


 55%|█████▌    | 2010/3652 [45:26<38:54,  1.42s/it]

2010


 55%|█████▌    | 2020/3652 [45:39<32:55,  1.21s/it]

2020


 56%|█████▌    | 2030/3652 [45:53<37:34,  1.39s/it]

2030


 56%|█████▌    | 2040/3652 [46:08<39:30,  1.47s/it]

2040


 56%|█████▌    | 2050/3652 [46:23<45:30,  1.70s/it]

2050


 56%|█████▋    | 2060/3652 [46:38<41:57,  1.58s/it]

2060


 57%|█████▋    | 2070/3652 [46:51<36:37,  1.39s/it]

2070


 57%|█████▋    | 2080/3652 [47:05<34:54,  1.33s/it]

2080


 57%|█████▋    | 2090/3652 [47:18<33:53,  1.30s/it]

2090


 58%|█████▊    | 2100/3652 [47:33<37:59,  1.47s/it]

2100


 58%|█████▊    | 2110/3652 [47:47<34:56,  1.36s/it]

2110


 58%|█████▊    | 2120/3652 [48:00<35:47,  1.40s/it]

2120


 58%|█████▊    | 2130/3652 [48:14<36:16,  1.43s/it]

2130


 59%|█████▊    | 2140/3652 [48:28<33:45,  1.34s/it]

2140


 59%|█████▉    | 2150/3652 [48:42<36:17,  1.45s/it]

2150


 59%|█████▉    | 2160/3652 [48:56<32:24,  1.30s/it]

2160


 59%|█████▉    | 2170/3652 [49:09<33:08,  1.34s/it]

2170


 60%|█████▉    | 2180/3652 [49:23<35:16,  1.44s/it]

2180


 60%|█████▉    | 2190/3652 [49:37<33:16,  1.37s/it]

2190


 60%|██████    | 2200/3652 [49:50<33:58,  1.40s/it]

2200


 61%|██████    | 2210/3652 [50:04<32:29,  1.35s/it]

2210


 61%|██████    | 2220/3652 [50:18<33:49,  1.42s/it]

2220


 61%|██████    | 2230/3652 [50:31<31:11,  1.32s/it]

2230


 61%|██████▏   | 2240/3652 [50:45<34:28,  1.46s/it]

2240


 62%|██████▏   | 2250/3652 [50:59<32:48,  1.40s/it]

2250


 62%|██████▏   | 2260/3652 [51:13<31:35,  1.36s/it]

2260


 62%|██████▏   | 2270/3652 [51:27<33:56,  1.47s/it]

2270


 62%|██████▏   | 2280/3652 [51:41<29:20,  1.28s/it]

2280


 63%|██████▎   | 2290/3652 [51:55<32:18,  1.42s/it]

2290


 63%|██████▎   | 2300/3652 [52:08<29:16,  1.30s/it]

2300


 63%|██████▎   | 2310/3652 [52:22<31:21,  1.40s/it]

2310


 64%|██████▎   | 2320/3652 [52:36<30:36,  1.38s/it]

2320


 64%|██████▍   | 2330/3652 [52:50<31:56,  1.45s/it]

2330


 64%|██████▍   | 2340/3652 [53:04<31:47,  1.45s/it]

2340


 64%|██████▍   | 2350/3652 [53:18<28:23,  1.31s/it]

2350


 65%|██████▍   | 2360/3652 [53:31<30:14,  1.40s/it]

2360


 65%|██████▍   | 2370/3652 [53:45<28:09,  1.32s/it]

2370


 65%|██████▌   | 2380/3652 [54:00<32:46,  1.55s/it]

2380


 65%|██████▌   | 2390/3652 [54:14<29:00,  1.38s/it]

2390


 66%|██████▌   | 2400/3652 [54:27<27:10,  1.30s/it]

2400


 66%|██████▌   | 2410/3652 [54:42<29:04,  1.40s/it]

2410


 66%|██████▋   | 2420/3652 [54:55<28:09,  1.37s/it]

2420


 67%|██████▋   | 2430/3652 [55:09<31:04,  1.53s/it]

2430


 67%|██████▋   | 2440/3652 [55:23<26:34,  1.32s/it]

2440


 67%|██████▋   | 2450/3652 [55:37<28:02,  1.40s/it]

2450


 67%|██████▋   | 2460/3652 [55:50<27:22,  1.38s/it]

2460


 68%|██████▊   | 2470/3652 [56:04<28:02,  1.42s/it]

2470


 68%|██████▊   | 2480/3652 [56:18<26:43,  1.37s/it]

2480


 68%|██████▊   | 2490/3652 [56:33<32:31,  1.68s/it]

2490


 68%|██████▊   | 2500/3652 [56:48<28:36,  1.49s/it]

2500


 69%|██████▊   | 2510/3652 [57:02<26:25,  1.39s/it]

2510


 69%|██████▉   | 2520/3652 [57:17<26:33,  1.41s/it]

2520


 69%|██████▉   | 2530/3652 [57:30<25:30,  1.36s/it]

2530


 70%|██████▉   | 2540/3652 [57:44<26:21,  1.42s/it]

2540


 70%|██████▉   | 2550/3652 [57:58<25:28,  1.39s/it]

2550


 70%|███████   | 2560/3652 [58:11<24:09,  1.33s/it]

2560


 70%|███████   | 2570/3652 [58:26<25:32,  1.42s/it]

2570


 71%|███████   | 2580/3652 [58:39<23:13,  1.30s/it]

2580


 71%|███████   | 2590/3652 [58:55<25:32,  1.44s/it]

2590


 71%|███████   | 2600/3652 [59:09<24:05,  1.37s/it]

2600


 71%|███████▏  | 2610/3652 [59:23<23:28,  1.35s/it]

2610


 72%|███████▏  | 2620/3652 [59:37<24:53,  1.45s/it]

2620


 72%|███████▏  | 2630/3652 [59:50<23:26,  1.38s/it]

2630


 72%|███████▏  | 2640/3652 [1:00:05<24:20,  1.44s/it]

2640


 73%|███████▎  | 2650/3652 [1:00:18<21:54,  1.31s/it]

2650


 73%|███████▎  | 2660/3652 [1:00:33<23:55,  1.45s/it]

2660


 73%|███████▎  | 2670/3652 [1:00:47<22:34,  1.38s/it]

2670


 73%|███████▎  | 2680/3652 [1:01:00<21:51,  1.35s/it]

2680


 74%|███████▎  | 2690/3652 [1:01:15<23:33,  1.47s/it]

2690


 74%|███████▍  | 2700/3652 [1:01:28<21:34,  1.36s/it]

2700


 74%|███████▍  | 2710/3652 [1:01:42<22:19,  1.42s/it]

2710


 74%|███████▍  | 2720/3652 [1:01:56<20:38,  1.33s/it]

2720


 75%|███████▍  | 2730/3652 [1:02:11<23:04,  1.50s/it]

2730


 75%|███████▌  | 2740/3652 [1:02:25<21:00,  1.38s/it]

2740


 75%|███████▌  | 2750/3652 [1:02:38<20:27,  1.36s/it]

2750


 76%|███████▌  | 2760/3652 [1:02:53<21:23,  1.44s/it]

2760


 76%|███████▌  | 2770/3652 [1:03:06<18:47,  1.28s/it]

2770


 76%|███████▌  | 2780/3652 [1:03:20<20:19,  1.40s/it]

2780


 76%|███████▋  | 2790/3652 [1:03:33<18:35,  1.29s/it]

2790


 77%|███████▋  | 2800/3652 [1:03:47<19:32,  1.38s/it]

2800


 77%|███████▋  | 2810/3652 [1:04:01<19:05,  1.36s/it]

2810


 77%|███████▋  | 2820/3652 [1:04:15<19:14,  1.39s/it]

2820


 77%|███████▋  | 2830/3652 [1:04:29<19:21,  1.41s/it]

2830


 78%|███████▊  | 2840/3652 [1:04:42<17:25,  1.29s/it]

2840


 78%|███████▊  | 2850/3652 [1:04:57<19:29,  1.46s/it]

2850


 78%|███████▊  | 2860/3652 [1:05:10<17:32,  1.33s/it]

2860


 79%|███████▊  | 2870/3652 [1:05:25<18:56,  1.45s/it]

2870


 79%|███████▉  | 2880/3652 [1:05:39<18:23,  1.43s/it]

2880


 79%|███████▉  | 2890/3652 [1:05:53<18:10,  1.43s/it]

2890


 79%|███████▉  | 2900/3652 [1:06:07<18:00,  1.44s/it]

2900


 80%|███████▉  | 2910/3652 [1:06:23<19:33,  1.58s/it]

2910


 80%|███████▉  | 2920/3652 [1:06:37<15:49,  1.30s/it]

2920


 80%|████████  | 2930/3652 [1:06:50<15:48,  1.31s/it]

2930


 81%|████████  | 2940/3652 [1:07:04<16:25,  1.38s/it]

2940


 81%|████████  | 2950/3652 [1:07:18<16:03,  1.37s/it]

2950


 81%|████████  | 2960/3652 [1:07:33<17:39,  1.53s/it]

2960


 81%|████████▏ | 2970/3652 [1:07:47<16:28,  1.45s/it]

2970


 82%|████████▏ | 2980/3652 [1:08:01<15:22,  1.37s/it]

2980


 82%|████████▏ | 2990/3652 [1:08:15<15:55,  1.44s/it]

2990


 82%|████████▏ | 3000/3652 [1:08:29<14:04,  1.30s/it]

3000


 82%|████████▏ | 3010/3652 [1:08:44<15:11,  1.42s/it]

3010


 83%|████████▎ | 3020/3652 [1:08:58<14:22,  1.36s/it]

3020


 83%|████████▎ | 3030/3652 [1:09:12<16:11,  1.56s/it]

3030


 83%|████████▎ | 3040/3652 [1:09:26<14:41,  1.44s/it]

3040


 84%|████████▎ | 3050/3652 [1:09:40<14:33,  1.45s/it]

3050


 84%|████████▍ | 3060/3652 [1:09:54<14:17,  1.45s/it]

3060


 84%|████████▍ | 3070/3652 [1:10:09<12:37,  1.30s/it]

3070


 84%|████████▍ | 3080/3652 [1:10:23<13:29,  1.41s/it]

3080


 85%|████████▍ | 3090/3652 [1:10:36<12:48,  1.37s/it]

3090


 85%|████████▍ | 3100/3652 [1:10:51<13:12,  1.44s/it]

3100


 85%|████████▌ | 3110/3652 [1:11:05<12:46,  1.41s/it]

3110


 85%|████████▌ | 3120/3652 [1:11:18<11:47,  1.33s/it]

3120


 86%|████████▌ | 3130/3652 [1:11:33<12:32,  1.44s/it]

3130


 86%|████████▌ | 3140/3652 [1:11:47<11:26,  1.34s/it]

3140


 86%|████████▋ | 3150/3652 [1:12:02<12:42,  1.52s/it]

3150


 87%|████████▋ | 3160/3652 [1:12:16<11:38,  1.42s/it]

3160


 87%|████████▋ | 3170/3652 [1:12:30<10:55,  1.36s/it]

3170


 87%|████████▋ | 3180/3652 [1:12:43<11:11,  1.42s/it]

3180


 87%|████████▋ | 3190/3652 [1:12:57<10:33,  1.37s/it]

3190


 88%|████████▊ | 3200/3652 [1:13:11<10:57,  1.46s/it]

3200


 88%|████████▊ | 3210/3652 [1:13:25<09:33,  1.30s/it]

3210


 88%|████████▊ | 3220/3652 [1:13:38<09:41,  1.35s/it]

3220


 88%|████████▊ | 3230/3652 [1:13:52<09:04,  1.29s/it]

3230


 89%|████████▊ | 3240/3652 [1:14:06<09:41,  1.41s/it]

3240


 89%|████████▉ | 3250/3652 [1:14:21<10:12,  1.52s/it]

3250


 89%|████████▉ | 3260/3652 [1:14:35<08:20,  1.28s/it]

3260


 90%|████████▉ | 3270/3652 [1:14:49<09:34,  1.50s/it]

3270


 90%|████████▉ | 3280/3652 [1:15:03<08:49,  1.42s/it]

3280


 90%|█████████ | 3290/3652 [1:15:15<07:41,  1.27s/it]

3290


 90%|█████████ | 3300/3652 [1:15:30<08:13,  1.40s/it]

3300


 91%|█████████ | 3310/3652 [1:15:44<08:05,  1.42s/it]

3310


 91%|█████████ | 3320/3652 [1:15:59<08:12,  1.48s/it]

3320


 91%|█████████ | 3330/3652 [1:16:12<07:15,  1.35s/it]

3330


 91%|█████████▏| 3340/3652 [1:16:26<07:02,  1.35s/it]

3340


 92%|█████████▏| 3350/3652 [1:16:40<06:33,  1.30s/it]

3350


 92%|█████████▏| 3360/3652 [1:16:54<06:59,  1.44s/it]

3360


 92%|█████████▏| 3370/3652 [1:17:08<06:23,  1.36s/it]

3370


 93%|█████████▎| 3380/3652 [1:17:22<06:28,  1.43s/it]

3380


 93%|█████████▎| 3390/3652 [1:17:36<06:25,  1.47s/it]

3390


 93%|█████████▎| 3400/3652 [1:17:51<05:58,  1.42s/it]

3400


 93%|█████████▎| 3410/3652 [1:18:04<05:33,  1.38s/it]

3410


 94%|█████████▎| 3420/3652 [1:18:18<05:17,  1.37s/it]

3420


 94%|█████████▍| 3430/3652 [1:18:32<05:11,  1.40s/it]

3430


 94%|█████████▍| 3440/3652 [1:18:46<04:37,  1.31s/it]

3440


 94%|█████████▍| 3450/3652 [1:18:59<04:34,  1.36s/it]

3450


 95%|█████████▍| 3460/3652 [1:19:14<05:06,  1.60s/it]

3460


 95%|█████████▌| 3470/3652 [1:19:28<04:17,  1.42s/it]

3470


 95%|█████████▌| 3480/3652 [1:19:42<04:01,  1.40s/it]

3480


 96%|█████████▌| 3490/3652 [1:19:56<03:46,  1.40s/it]

3490


 96%|█████████▌| 3500/3652 [1:20:10<03:40,  1.45s/it]

3500


 96%|█████████▌| 3510/3652 [1:20:24<03:13,  1.36s/it]

3510


 96%|█████████▋| 3520/3652 [1:20:38<03:06,  1.41s/it]

3520


 97%|█████████▋| 3530/3652 [1:20:53<02:58,  1.47s/it]

3530


 97%|█████████▋| 3540/3652 [1:21:07<02:38,  1.41s/it]

3540


 97%|█████████▋| 3550/3652 [1:21:20<02:20,  1.38s/it]

3550


 97%|█████████▋| 3560/3652 [1:21:34<02:02,  1.34s/it]

3560


 98%|█████████▊| 3570/3652 [1:21:49<02:04,  1.51s/it]

3570


 98%|█████████▊| 3580/3652 [1:22:02<01:38,  1.37s/it]

3580


 98%|█████████▊| 3590/3652 [1:22:16<01:26,  1.39s/it]

3590


 99%|█████████▊| 3600/3652 [1:22:30<01:16,  1.46s/it]

3600


 99%|█████████▉| 3610/3652 [1:22:45<00:58,  1.40s/it]

3610


 99%|█████████▉| 3620/3652 [1:22:59<00:42,  1.33s/it]

3620


 99%|█████████▉| 3630/3652 [1:23:13<00:28,  1.31s/it]

3630


100%|█████████▉| 3640/3652 [1:23:27<00:17,  1.43s/it]

3640


100%|█████████▉| 3650/3652 [1:23:41<00:02,  1.37s/it]

3650


100%|██████████| 3652/3652 [1:23:44<00:00,  1.38s/it]

            Date total_record
0     2010/01/01         3455
1     2010/01/02          333
2     2010/01/03            0
3     2010/01/04            0
4     2010/01/05          504
...          ...          ...
3647  2019/12/27          576
3648  2019/12/28          904
3649  2019/12/29          537
3650  2019/12/30            2
3651  2019/12/31         1206

[3652 rows x 2 columns]
            Date                                                 id
0     2010/01/01  [33897310, 33467806, 32809304, 32688721, 32288...
1     2010/01/02  [20044808, 20044807, 20044806, 20044801, 20044...
2     2010/01/03                                                 []
3     2010/01/04                                                 []
4     2010/01/05  [27713240, 27713239, 20047197, 20047183, 20047...
...          ...                                                ...
3647  2019/12/27  [34316618, 33693170, 31877613, 31877605, 31877...
3648  2019/12/28  [33693217, 31881556, 31881554, 31881553, 31881...
364




In [6]:
df_DateTracking.to_csv('df_DateTracking.csv',index=False)

In [7]:
data_list = []

for index, row in id_df.iterrows():
    for i, id in enumerate(row['id']):
        data_list.append({'Date': row['Date'], 'ID': id})

id_df = pd.DataFrame(data_list)
id_df.to_csv('id_df.csv',index=False)
id_df

Unnamed: 0,Date,ID
0,2010/01/01,33897310
1,2010/01/01,33467806
2,2010/01/01,32809304
3,2010/01/01,32688721
4,2010/01/01,32288940
...,...,...
2699263,2019/12/31,31883521
2699264,2019/12/31,31883520
2699265,2019/12/31,31883515
2699266,2019/12/31,31883514
