In [41]:
# Cell 1: Imports and environment checks

import sqlite3
import pandas as pd
import os

# Optional display tweaks so DataFrames render in full inside Jupyter:
# setting both options to None lifts the limit on the number of columns shown
# and on the width of each column's text.
for _display_option in ('display.max_columns', 'display.max_colwidth'):
    pd.set_option(_display_option, None)

In [43]:
# Cell 2: Set up the database path and connect

# The database location defaults to ~/Desktop/patents/data/patent.db, with "~"
# expanded to the current user's home directory. To use a different file
# without editing this cell, set the PATENT_DB_PATH environment variable,
# for example: "/Users/your_username/Desktop/patents/data/patent.db"

db_path = os.path.expanduser(
    os.environ.get("PATENT_DB_PATH", "~/Desktop/patents/data/patent.db")
)

# sqlite3.connect() creates a new, empty database when the file is missing,
# which would only surface later as confusing "no such table" errors in the
# query cells. Fail fast with a clear message instead.
if not os.path.isfile(db_path):
    raise FileNotFoundError(f"SQLite database not found at {db_path}")

# Connect to the SQLite database
conn = sqlite3.connect(db_path)

print(f"Connected to database at {db_path}")

Connected to database at /Users/yuxiangwang/Desktop/patents/data/patent.db


In [45]:
# Cell 3: Explore more tables

# sqlite_master is SQLite's schema catalog: select the name of every entry of
# type 'table', sorted alphabetically, and show the result as a DataFrame.
tables_query = """
SELECT name 
FROM sqlite_master 
WHERE type='table' 
ORDER BY name;
"""
df_tables = pd.read_sql(sql=tables_query, con=conn)
df_tables

Unnamed: 0,name
0,applications_claiming_priority
1,assignees
2,child_applications
3,cited_by
4,claims
5,classifications
6,concepts
7,error_logs
8,events
9,external_links


In [47]:
# Cell 4: Quick look at the main 'patents' table

# Read every row and column of `patents` into a DataFrame, then display it as
# the cell's output.
query = "SELECT * FROM patents"
df_patents = pd.read_sql(sql=query, con=conn)
df_patents

Unnamed: 0,patent_id,title,type,pdf_link,publication_number,country,application_number,priority_date,filing_date,publication_date,prior_art_date,family_id,abstract,description_link
0,US20190160148A1,Combination of pembrolizumab and abemaciclib for the treatment of cancer,patent,https://patentimages.storage.googleapis.com/22/ef/4c/7eee828934d5ed/US20190160148A1.pdf,US20190160148A1,United States,"US16/301,835",2016-05-23 00:00:00,2017-05-19 00:00:00,2019-05-30 00:00:00,2016-05-23 00:00:00,59021571,"The present invention relates to a combination of abemaciclib and pembrolizumab and methods of using the combination to treat certain disorders, such as breast cancer and non-small cell lung cancer.",https://serpapi.com/searches/67cb376a460263e0dd05923f/google_patents_details/description.html
1,US20210347889A1,Dosing regimen of anti-lag3 antibody and combination therapy with anti-pd-1 antibody for treating cancer,patent,https://patentimages.storage.googleapis.com/16/d4/e8/578718e90ac2cc/US20210347889A1.pdf,US20210347889A1,United States,"US17/289,810",2018-11-05 00:00:00,2019-11-04 00:00:00,2021-11-11 00:00:00,2018-11-05 00:00:00,70611084,"The present invention relates to dosing regimens of an anti-LAG3 antibody useful for the treatment of cancer. In particular, the invention relates to the dosing regimen in a combination therapy which comprises administering an antibody of a Programmed Death 1 protein (PD-1) or Programmed Death Ligand 1 (PD-L1) and an antibody of Lymphocyte-Activation Gene 3 (LAG3). The invention also provides a method for treating cancer in a patient comprising administering to the patient an anti-LAG3 antibody and an anti-PD-1 antibody, wherein the tumor tissue section of the patient is PD-L 1 expression positive, and optionally LAG3 expression positive.",https://serpapi.com/searches/67cb376b39e4a8f068a55c1f/google_patents_details/description.html
2,US20180333503A1,Anti-folr1 immunoconjugates and anti-pd-1 antibody combinations,patent,https://patentimages.storage.googleapis.com/62/ec/90/67d092982661c0/US20180333503A1.pdf,US20180333503A1,United States,"US15/979,989",2017-05-16 00:00:00,2018-05-15 00:00:00,2018-11-22 00:00:00,2017-05-16 00:00:00,64269828,"Therapeutic combinations of immunoconjugates that bind to FOLR1 (e.g., IMGN853) with anti-PD-1 antibodies or antigen-binding fragments thereof (e.g., pembrolizumab) are provided. Methods of administering the combinations to treat cancers, e.g., ovarian, peritoneal, or fallopian tube cancers, with greater clinical efficacy and/or decreased toxicity are also provided.",https://serpapi.com/searches/67cb376cb7b03808798bfa8a/google_patents_details/description.html
3,US20210403557A1,Dosing regimen of anti-tigit antibody for treatment of cancer,patent,https://patentimages.storage.googleapis.com/af/00/bb/a9e1b627545c6a/US20210403557A1.pdf,US20210403557A1,United States,"US17/288,641",2018-11-05 00:00:00,2019-11-04 00:00:00,2021-12-30 00:00:00,2018-11-05 00:00:00,70611082,"The present invention relates to dosing regimens of an anti-TIGIT antibody useful for the treatment of cancer. In particular, the invention relates to the dosing regimen in a combination therapy which comprises administering an antibody of a Programmed Death 1 protein (PD-1) or Programmed Death Ligand 1 (PD-L1) and an anti-TIGIT antibody.",https://serpapi.com/searches/67cb376ebc84b8472472ff5b/google_patents_details/description.html
4,US20170089914A1,Anti-pembrolizumab antibodies,patent,https://patentimages.storage.googleapis.com/8c/6b/a3/cfa14432c1dc01/US20170089914A1.pdf,US20170089914A1,United States,"US15/274,330",2015-09-25 00:00:00,2016-09-23 00:00:00,2017-03-30 00:00:00,2015-09-25 00:00:00,58408842,"The present invention provides antibodies and antigen-binding fragments thereof that bind to the antibody pembrolizumab (pembrolizumab). These antibodies are useful, for example, for use as positive controls in assays for detecting the presence of anti-drug antibodies in a sample, e.g., the blood of a patient who has been administered pembrolizumab.",https://serpapi.com/searches/67cb37703dca69e505f1441d/google_patents_details/description.html
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
61,US20200361931A1,Prmt5 inhibitors,patent,https://patentimages.storage.googleapis.com/1b/c1/9e/f29a0a5b8413f6/US20200361931A1.pdf,US20200361931A1,United States,"US16/762,201",2017-11-08 00:00:00,2018-11-05 00:00:00,2020-11-19 00:00:00,2017-11-08 00:00:00,66438946,"The present invention provides a compound of Formula (I) or the pharmaceutically acceptable salts thereof, which are PRMT5 inhibitors.",https://serpapi.com/searches/67cb37e656f17df444dbeca3/google_patents_details/description.html
62,US20190241655A1,Ilt3 ligand,patent,https://patentimages.storage.googleapis.com/50/bf/c2/1e4cdc39a6b193/US20190241655A1.pdf,US20190241655A1,United States,"US16/342,582",2016-11-10 00:00:00,2017-11-06 00:00:00,2019-08-08 00:00:00,2016-11-10 00:00:00,62109704,"The present invention provides antibodies and antigen-binding fragments thereof that bind ILT3, ILT3 ligand (i.e., PI16) or a complex between ILT3 and the ILT3 ligand. Methods for determining whether ILT3 and the ILT3 ligand bind together or whether a substance agonizes or antagonizes such binding are also provided.",https://serpapi.com/searches/67cb37e9e8a9fadbfc854d66/google_patents_details/description.html
63,US20220267369A1,Methods of separating host cell lipases from a production protein in chromatographic processes,patent,https://patentimages.storage.googleapis.com/e9/fb/b2/19e87f2fec41dc/US20220267369A1.pdf,US20220267369A1,United States,"US17/261,365",2018-07-25 00:00:00,2019-07-24 00:00:00,2022-08-25 00:00:00,2018-07-25 00:00:00,69180557,Provided herein are methods of separating host cell lipases from a production protein in chromatographic processes and methods of improving polysorbate-80 stability in a production protein formulation by separating host cell lipases from the production protein using chromatographic processes. Also provided are pharmaceutical compositions comprising less than 1 ppm of a host cell lipase.,https://serpapi.com/searches/67cb37eb4ef4fde4be2d9fcb/google_patents_details/description.html
64,US20200048258A1,Kdm5 inhibitors,patent,https://patentimages.storage.googleapis.com/a9/78/25/da053ed4a2005f/US20200048258A1.pdf,US20200048258A1,United States,"US16/341,313",2016-10-12 00:00:00,2017-10-06 00:00:00,2020-02-13 00:00:00,2016-10-12 00:00:00,61905936,"The present invention provides a compound of Formula (I) (represented as tautomers Ia and Ib) or the pharmaceutically acceptable salts thereof, which are KDM5 inhibitors.",https://serpapi.com/searches/67cb37eda0fdbcf7aa5ba4a8/google_patents_details/description.html


In [51]:
# Cell 5: Quick look at the 'claims' table

# Keep the claims in their own DataFrame. Assigning them to `df_patents` would
# overwrite the patents table loaded in Cell 4 and leave a misleading name
# behind for anything that runs afterwards.
query = "SELECT * FROM claims"
df_claims = pd.read_sql(query, conn)
df_claims

Unnamed: 0,id,patent_id,claim_no,claim_txt
0,1,US20190160148A1,1,"1. A method of treating breast cancer, comprising administering to a patient 200 mg of an anti-PD-1 antibody or antigen binding fragment thereof comprising three light chain CDRs (CDRL1, CDRL2 and CDRL3) and three heavy chain CDRs (CDRH1, CDRH2, and CDRH3), wherein CDRL1 comprises the amino acid sequence set forth in SEQ ID NO:5, CDRL2 comprises the amino acid sequence set forth in SEQ ID NO:6, CDRL3 comprises the amino acid sequence set forth in SEQ ID NO:7, CDRH1 comprises the amino acid sequence set forth in SEQ ID NO:8, CDRH2 comprises the amino acid sequence set forth in SEQ ID NO:9, and CDRH3 comprises the amino acid sequence set forth in SEQ ID NO:10 on day 1 of a 21-day cycle and 150 mg of abemaciclib or a pharmaceutically acceptable salt thereof twice daily on days 1-21 of the 21-day cycle."
1,2,US20190160148A1,2,"2. A method of treating breast cancer, comprising administering to a patient 200 mg of an anti-PD-1 antibody or antigen binding fragment thereof comprising three light chain CDRs (CDRL1, CDRL2 and CDRL3) and three heavy chain CDRs (CDRH1, CDRH2, and CDRH3), wherein CDRL1 comprises the amino acid sequence set forth in SEQ ID NO:5, CDRL2 comprises the amino acid sequence set forth in SEQ ID NO:6 , CDRL3 comprises the amino acid sequence set forth in SEQ ID NO:7, CDRH1 comprises the amino acid sequence set forth in SEQ ID NO:8, CDRH2 comprises the amino acid sequence set forth in SEQ ID NO:9, and CDRH3 comprises the amino acid sequence set forth in SEQ ID NO:10 in combination with 150 mg of abemaciclib or a pharmaceutically acceptable salt thereof wherein initial administration of the abemaciclib or the salt thereof is administered to the patient without the antibody or the antigen binding fragment thereof for at least 24 hours and the abemaciclib or the salt thereof is then administered to the patient in combination with the antibody or the antigen binding fragment thereof."
2,3,US20190160148A1,3,"3. The method according to claim 1, wherein the antibody or antigen binding fragment thereof comprises a light chain variable region (LCVR) amino acid sequence of SEQ ID NO:1 and a heavy chain variable region (HCVR) amino acid sequence of SEQ ID NO: 2."
3,4,US20190160148A1,4,4. (canceled)
4,5,US20190160148A1,5,5. (canceled)
...,...,...,...,...
2165,2166,US20220380469A1,12,"12. The method of claim 1, wherein the anti-PD-1 antibody or antigen-binding fragment thereof is administered to the patient by intravenous or subcutaneous administration."
2166,2167,US20220380469A1,13,"13. The method of claim 1, wherein the anti-PD-1 antibody or antigen-binding fragment thereof is pembrolizumab."
2167,2168,US20220380469A1,14,"14. The method of claim 1, wherein the method comprises administering:\n(i) about 200 mg of an anti-PD-1 antibody, or antigen binding fragment thereof, to the patient every approximately three weeks; or (ii) about 400 mg of an anti-PD-1 antibody, or antigen binding fragment thereof, to the patient every approximately six weeks."
2168,2169,US20220380469A1,15,"15. The method of claim 8, wherein the patient has disease progression following the at least two prior systemic treatments."
