### Importing

In [11]:
from CB_IPO import scrape

### Initializing

In [12]:
# Create the scraper object; every later cell in this notebook calls its methods.
scraper = scrape()

### Scraping for recent IPO filings (S-1)

In [16]:
# Fetch the most recent filings. The argument 5 matches the five names and
# five dates in the recorded output, so it looks like a result count
# (TODO confirm against the CB_IPO documentation).
company_names, file_dates, form_types = scraper.edgar_scrape(5)

# A single print call with a newline separator emits the same three lines as
# printing each value on its own.
print(company_names, file_dates, form_types, sep="\n")


['Allarity Therapeutics, Inc.  (ALLR) ', 'Greenwave Technology Solutions, Inc.  (GWAV) ', 'APPlife Digital Solutions Inc  (ALDS) ', 'MAIA Biotechnology, Inc.  (MAIA) ', 'Neolara Corp. ']
['2023-04-04', '2023-04-04', '2023-04-04', '2023-04-04', '2023-04-04']
{'S-1/A'}


### Formatting into a DataFrame

In [17]:
# Build a table of the scraped filings; the recorded output shows a "names"
# column and a "filing date" column.
# NOTE(review): the meaning of the two arguments (5, 1) is not visible here -
# presumably a result count and a page count; confirm against the library.
df = scraper.generate_df(5,1)
print(df)

                                           names filing date
0           Allarity Therapeutics, Inc.  (ALLR)   2023-04-04
1  Greenwave Technology Solutions, Inc.  (GWAV)   2023-04-04
2         APPlife Digital Solutions Inc  (ALDS)   2023-04-04
3              MAIA Biotechnology, Inc.  (MAIA)   2023-04-04
4                                 Neolara Corp.   2023-04-04


### Modifying Search Dates

In [20]:
# Restrict the search window to 2021-01-01 through 2023-03-31. The call is made
# on the shared scraper object, so the scrapes below appear to use this window
# (the recorded dates all fall on the window's last day).
# NOTE(review): the execution counts show this cell (In [20]) was run after the
# form-types cell (In [19]), so the recorded output may include the 10-K/10-Q
# forms added there. Re-run from a fresh kernel, top to bottom, to confirm.
scraper.set_search_date("2021-01-01", "2023-03-31")

company_names, file_dates, form_types = scraper.edgar_scrape(5)
print(file_dates)

df = scraper.generate_df(5, 1)
print(df)

['2023-03-31', '2023-03-31', '2023-03-31', '2023-03-31', '2023-03-31']
                                               names filing date
0           Intuitive Machines, Inc.  (LUNR, LUNRW)   2023-03-31
1                     Nuburu, Inc.  (BURU, BURU-WT)   2023-03-31
2                           SOLIGENIX, INC.  (SNGX)   2023-03-31
3              NovaBay Pharmaceuticals, Inc.  (NBY)   2023-03-31
4  Artificial Intelligence Technology Solutions I...  2023-03-31


### Modifying Form Types

In [19]:
# reset_url presumably restores the scraper's default search (e.g. clearing a
# previously set date window) - TODO confirm. After that, search for annual
# (10-K) and quarterly (10-Q) reports; the recorded form_types set contains
# exactly those two form types.
scraper.reset_url()
scraper.add_forms(['10-K', '10-Q'])

company_names, file_dates, form_types = scraper.edgar_scrape(5)
print(form_types)

df = scraper.generate_df(5, 1)
print(df)

{'10-Q', '10-K'}
                                               names filing date
0  Compute Health Acquisition Corp.  (CPUH, CPUH-...  2023-04-04
1                     DARDEN RESTAURANTS INC  (DRI)   2023-04-04
2                               LINDSAY CORP  (LNN)   2023-04-04
3                SMART Global Holdings, Inc.  (SGH)   2023-04-04
4  ACCRETION ACQUISITION CORP.  (ENER, ENERR, ENE...  2023-04-04


### Generating Reference Codes and Accession Numbers

In [30]:
# SEC Central Index Key (CIK) for Pfizer, zero-padded to ten digits.
cik = '0000078003'

# get_refs returns the filing reference file names and the company name for a
# CIK. The 3 matches the three entries in the recorded output, so it looks
# like a limit on how many filings are returned (TODO confirm).
references, name = scraper.get_refs(cik, 3)

# get_anums returns the accession numbers for the same CIK.
# NOTE(review): accession_numbers is never printed or used in this cell; the
# accession-number list at the top of the recorded output is emitted before
# the print below runs, so presumably one of the two scraper calls prints it.
accession_numbers = scraper.get_anums(cik, 3)

# Same two output lines as printing references and name separately.
print(references, name, sep="\n")

['000007800323000024', '000007800322000027', '000007800321000038']
['pfe-20221231.htm', 'pfe-20211231.htm', 'pfe-20201231.htm']
PFIZER INC  (PFE) 


### Finding XBRL Links for a Company

In [39]:
# Build the filing URLs for the CIK defined in the previous cell; the recorded
# output shows three sec.gov inline-viewer ("ix?doc=") links, matching the 3.
# c_name receives the second return value (presumably the company name) and is
# not used afterwards in this notebook.
links,c_name = scraper.create_links(cik, 3)

# Print one URL per line. The accession-number list at the top of the recorded
# output is not printed by this cell - presumably create_links prints it.
for link in links:
    print(link)

['000007800323000024', '000007800322000027', '000007800321000038']
https://www.sec.gov/ix?doc=/Archives/edgar/data/0000078003/000007800323000024/pfe-20221231.htm
https://www.sec.gov/ix?doc=/Archives/edgar/data/0000078003/000007800322000027/pfe-20211231.htm
https://www.sec.gov/ix?doc=/Archives/edgar/data/0000078003/000007800321000038/pfe-20201231.htm


### Scraping Link for Financial Info

In [40]:
# For each filing link built in the previous cell, pull three headline figures
# and print them, with a blank line separating one filing from the next.
# NOTE(review): the recorded values are comma-formatted with no units shown -
# presumably as reported in the filing (millions of USD for Pfizer); confirm.
for link in links:
    total_assets, total_liabilities, net_income = scraper.scrape_xbrl(link)
    print('Assets: ', total_assets)
    print('Liabilities: ', total_liabilities)
    print('NI: ', net_income)
    print()

Assets:  197,205
Liabilities:  101,288
NI:  31,407

Assets:  181,476
Liabilities:  104,013
NI:  22,025

Assets:  154,229
Liabilities:  90,756
NI:  9,652

