# Libraries

In [14]:
import pandas as pd
import requests

pd.set_option('display.max_columns', None) # display all columns in DF

# Uploading data

In [47]:
df_orangebook = pd.read_excel('Searchable Database of Orange Book Drug Patents.xlsx', skiprows = 1)
df_openFDA = pd.read_excel('raw_openFDA_data.xlsx')  
df_medicaid = pd.read_csv('raw_medicaid_data.csv')

In [48]:
len(df_openFDA)

25374

# Data manipulation

### OpenFDA

In [49]:
df = df_openFDA
len(df)

25374

In [52]:
df.dtypes

submissions                   object
application_number            object
sponsor_name                  object
products                      object
openfda.application_number    object
openfda.brand_name            object
openfda.generic_name          object
openfda.manufacturer_name     object
openfda.product_ndc           object
openfda.product_type          object
openfda.route                 object
openfda.substance_name        object
openfda.rxcui                 object
openfda.spl_id                object
openfda.spl_set_id            object
openfda.package_ndc           object
openfda.unii                  object
openfda.nui                   object
openfda.pharm_class_epc       object
openfda.pharm_class_cs        object
openfda.pharm_class_moa       object
openfda.pharm_class_pe        object
dtype: object

In [53]:
df = df.explode('openfda.product_ndc') # unpacking lists
len(df)

25374

In [54]:
df.head()

Unnamed: 0,submissions,application_number,sponsor_name,products,openfda.application_number,openfda.brand_name,openfda.generic_name,openfda.manufacturer_name,openfda.product_ndc,openfda.product_type,openfda.route,openfda.substance_name,openfda.rxcui,openfda.spl_id,openfda.spl_set_id,openfda.package_ndc,openfda.unii,openfda.nui,openfda.pharm_class_epc,openfda.pharm_class_cs,openfda.pharm_class_moa,openfda.pharm_class_pe
0,"[{'submission_type': 'SUPPL', 'submission_numb...",ANDA206552,FRESENIUS KABI USA,"[{'product_number': '001', 'reference_drug': '...",['ANDA206552'],['HEPARIN SODIUM'],['HEPARIN SODIUM'],"['Fresenius Kabi USA, LLC']",['76045-108'],['HUMAN PRESCRIPTION DRUG'],"['INTRAVENOUS', 'SUBCUTANEOUS']",['HEPARIN SODIUM'],['1798389'],['151a54ec-f7e5-4e6d-9810-cbfa75a16a22'],['07438e10-1589-4683-9f26-e5494d076cf0'],"['76045-108-00', '76045-108-10']",['ZZ45AB24CA'],,,,,
1,"[{'submission_type': 'SUPPL', 'submission_numb...",NDA019532,LANNETT CO INC,"[{'product_number': '001', 'reference_drug': '...",,,,,,,,,,,,,,,,,,
2,"[{'submission_type': 'SUPPL', 'submission_numb...",NDA019594,ALLERGAN,"[{'product_number': '001', 'reference_drug': '...",['NDA019594'],['URSODIOL'],['URSODIOL'],"['Actavis Pharma, Inc.']",['0591-3159'],['HUMAN PRESCRIPTION DRUG'],['ORAL'],['URSODIOL'],['858747'],['9f386262-71fb-48f0-b992-773d35e952c5'],['a061bb07-a85d-4b08-877f-ce02156f0de7'],['0591-3159-01'],['724L30Y2QR'],"['N0000175802', 'M0002475']",['Bile Acid [EPC]'],['Bile Acids and Salts [CS]'],,
3,"[{'submission_type': 'SUPPL', 'submission_numb...",BLA125509,ELUSYS THERAPEUTICS INC,"[{'product_number': '001', 'reference_drug': '...",['BLA125509'],['ANTHIM'],['OBILTOXAXIMAB'],"['Elusys Therapeutics, Inc.']",['69604-204'],['HUMAN PRESCRIPTION DRUG'],['INTRAVENOUS'],['OBILTOXAXIMAB'],"['1746910', '1746915']",['9a6bcd22-1783-400b-b87a-c825315f600c'],['39ad8799-00a4-4fc8-9852-c0536350c474'],['69604-204-02'],['29Z5DNL48C'],"['N0000192703', 'N0000192702']",['Anthrax Protective Antigen-directed Antibody...,,['Anthrax Protective Antigen-directed Antibody...,
4,"[{'submission_type': 'ORIG', 'submission_numbe...",ANDA200884,SUN PHARM,"[{'product_number': '002', 'reference_drug': '...",['ANDA200884'],['FENOFIBRATE'],['FENOFIBRATE'],"['Sun Pharmaceutical Industries, Inc.']","['63304-448', '63304-449']",['HUMAN PRESCRIPTION DRUG'],['ORAL'],['FENOFIBRATE'],"['477560', '477562']",['5f5e6f81-fe5a-4ad6-be4e-0cf5f28a0f00'],['125bbd7e-86a2-4209-90a5-ad353e572d1b'],"['63304-448-30', '63304-448-90', '63304-448-05...",['U202363UOS'],"['N0000175596', 'N0000175375', 'M0199111']",['Peroxisome Proliferator Receptor alpha Agoni...,['PPAR alpha [CS]'],['Peroxisome Proliferator-activated Receptor a...,


### Medicaid

In [39]:
df_medicaid['labeler_code'] = pd.to_numeric(df_medicaid['labeler_code'])
df_medicaid['labeler_code'] = pd.to_numeric(df_medicaid['product_code'])

# Merging data

### Orange Book and OpenFDA

Creating a commen key

In [40]:
df_openFDA['NDA #'] = df_openFDA['application_number'].str.replace(r'\D', '') # cleaning application_number
df_openFDA['NDA #'] = pd.to_numeric(df_openFDA['NDA #'])

Merging

In [41]:
df = pd.merge(df_openFDA, df_orangebook, on="NDA #", how="left")

### Orange Book, OpenFDA and Medicaid

In [43]:
df.head(10)

Unnamed: 0,submissions,application_number,sponsor_name,products,openfda.application_number,openfda.brand_name,openfda.generic_name,openfda.manufacturer_name,openfda.product_ndc,openfda.product_type,openfda.route,openfda.substance_name,openfda.rxcui,openfda.spl_id,openfda.spl_set_id,openfda.package_ndc,openfda.unii,openfda.nui,openfda.pharm_class_epc,openfda.pharm_class_cs,openfda.pharm_class_moa,openfda.pharm_class_pe,NDA #,Ingredient(s),Company,Product Name,Approval Date,Earliest Protection DateEarliest Prot. Date,Latest Protection DateLatest Prot. Date,dsad,Months of Additional Protection TimeMonths Add. Prot. Time,Total Number of ProtectionsNum. Prot.,Unique Patents,Number of Orphan Drug ExclusivitiesNum. ODE's,Extensions
0,"[{'submission_type': 'SUPPL', 'submission_numb...",ANDA206552,FRESENIUS KABI USA,"[{'product_number': '001', 'reference_drug': '...",['ANDA206552'],['HEPARIN SODIUM'],['HEPARIN SODIUM'],"['Fresenius Kabi USA, LLC']",['76045-108'],['HUMAN PRESCRIPTION DRUG'],"['INTRAVENOUS', 'SUBCUTANEOUS']",['HEPARIN SODIUM'],['1798389'],['151a54ec-f7e5-4e6d-9810-cbfa75a16a22'],['07438e10-1589-4683-9f26-e5494d076cf0'],"['76045-108-00', '76045-108-10']",['ZZ45AB24CA'],,,,,,206552,,,,,,,,,,,,
1,"[{'submission_type': 'SUPPL', 'submission_numb...",NDA019532,LANNETT CO INC,"[{'product_number': '001', 'reference_drug': '...",,,,,,,,,,,,,,,,,,,19532,,,,,,,,,,,,
2,"[{'submission_type': 'SUPPL', 'submission_numb...",NDA019594,ALLERGAN,"[{'product_number': '001', 'reference_drug': '...",['NDA019594'],['URSODIOL'],['URSODIOL'],"['Actavis Pharma, Inc.']",['0591-3159'],['HUMAN PRESCRIPTION DRUG'],['ORAL'],['URSODIOL'],['858747'],['9f386262-71fb-48f0-b992-773d35e952c5'],['a061bb07-a85d-4b08-877f-ce02156f0de7'],['0591-3159-01'],['724L30Y2QR'],"['N0000175802', 'M0002475']",['Bile Acid [EPC]'],['Bile Acids and Salts [CS]'],,,19594,,,,,,,,,,,,
3,"[{'submission_type': 'SUPPL', 'submission_numb...",BLA125509,ELUSYS THERAPEUTICS INC,"[{'product_number': '001', 'reference_drug': '...",['BLA125509'],['ANTHIM'],['OBILTOXAXIMAB'],"['Elusys Therapeutics, Inc.']",['69604-204'],['HUMAN PRESCRIPTION DRUG'],['INTRAVENOUS'],['OBILTOXAXIMAB'],"['1746910', '1746915']",['9a6bcd22-1783-400b-b87a-c825315f600c'],['39ad8799-00a4-4fc8-9852-c0536350c474'],['69604-204-02'],['29Z5DNL48C'],"['N0000192703', 'N0000192702']",['Anthrax Protective Antigen-directed Antibody...,,['Anthrax Protective Antigen-directed Antibody...,,125509,,,,,,,,,,,,
4,"[{'submission_type': 'ORIG', 'submission_numbe...",ANDA200884,SUN PHARM,"[{'product_number': '002', 'reference_drug': '...",['ANDA200884'],['FENOFIBRATE'],['FENOFIBRATE'],"['Sun Pharmaceutical Industries, Inc.']","['63304-448', '63304-449']",['HUMAN PRESCRIPTION DRUG'],['ORAL'],['FENOFIBRATE'],"['477560', '477562']",['5f5e6f81-fe5a-4ad6-be4e-0cf5f28a0f00'],['125bbd7e-86a2-4209-90a5-ad353e572d1b'],"['63304-448-30', '63304-448-90', '63304-448-05...",['U202363UOS'],"['N0000175596', 'N0000175375', 'M0199111']",['Peroxisome Proliferator Receptor alpha Agoni...,['PPAR alpha [CS]'],['Peroxisome Proliferator-activated Receptor a...,,200884,,,,,,,,,,,,
5,"[{'submission_type': 'ORIG', 'submission_numbe...",ANDA201687,ANCHEN PHARMS,"[{'product_number': '001', 'reference_drug': '...",['ANDA201687'],['TRETINOIN'],['TRETINOIN'],"['Par Pharmaceutical, Inc.']",['10370-268'],['HUMAN PRESCRIPTION DRUG'],['ORAL'],['TRETINOIN'],['199159'],['a3f53b5e-8c97-4d1d-be93-f09c740cc803'],['9c4ae9d9-c2a0-4995-a27a-e3f0f0284db9'],['10370-268-01'],['5688UTC01R'],"['N0000175607', 'M0018962']",['Retinoid [EPC]'],['Retinoids [CS]'],,,201687,,,,,,,,,,,,
6,"[{'submission_type': 'SUPPL', 'submission_numb...",ANDA202204,HIKMA,"[{'product_number': '001', 'reference_drug': '...",,,,,,,,,,,,,,,,,,,202204,,,,,,,,,,,,
7,"[{'submission_type': 'SUPPL', 'submission_numb...",ANDA202553,ACCORD HLTHCARE,"[{'product_number': '003', 'reference_drug': '...",,,,,,,,,,,,,,,,,,,202553,,,,,,,,,,,,
8,"[{'submission_type': 'SUPPL', 'submission_numb...",ANDA202906,DR REDDYS LABS LTD,"[{'product_number': '001', 'reference_drug': '...",['ANDA202906'],['MONTELUKAST SODIUM'],['MONTELUKAST SODIUM'],"[""Dr.Reddy's Laboratories Limited""]",['55111-763'],['HUMAN PRESCRIPTION DRUG'],['ORAL'],['MONTELUKAST SODIUM'],['351246'],['1d9ac31e-956b-897f-2d41-da76d70dd40c'],['3d3df874-d710-7fa4-bb21-434977518337'],"['55111-763-07', '55111-763-03']",['U1O3J18SFL'],,,,,,202906,,,,,,,,,,,,
9,"[{'submission_type': 'ORIG', 'submission_numbe...",ANDA203299,AKORN,"[{'product_number': '001', 'reference_drug': '...",['ANDA203299'],['BIMATOPROST'],['BIMATOPROST'],"['Hi-Tech Pharmacal Co., Inc.']",['50383-908'],['HUMAN PRESCRIPTION DRUG'],['OPHTHALMIC'],['BIMATOPROST'],['308739'],['2726cb5a-56a3-4736-9020-b2ccc7caca83'],['ce5c7f22-ade3-41ea-8dd8-3ec0399d3279'],"['50383-908-02', '50383-908-05', '50383-908-07']",['QXS94885MZ'],"['N0000175454', 'M0017805']",['Prostaglandin Analog [EPC]'],['Prostaglandins [CS]'],,,203299,,,,,,,,,,,,
