In [1]:
pip install linkedin-jobs-scraper



[1m[[0m[34;49mnotice[0m[1;39;49m][0m[39;49m A new release of pip available: [0m[31;49m22.1.2[0m[39;49m -> [0m[32;49m22.2[0m
[1m[[0m[34;49mnotice[0m[1;39;49m][0m[39;49m To update, run: [0m[32;49mpip install --upgrade pip[0m
Note: you may need to restart the kernel to use updated packages.


In [40]:
from bs4 import BeautifulSoup as bs


In [4]:
import logging
from linkedin_jobs_scraper import LinkedinScraper
from linkedin_jobs_scraper.events import Events, EventData, EventMetrics
from linkedin_jobs_scraper.query import Query, QueryOptions, QueryFilters
from linkedin_jobs_scraper.filters import RelevanceFilters, TimeFilters, TypeFilters, ExperienceLevelFilters, RemoteFilters




In [5]:
# Changing root logger level (default is WARN)
logging.basicConfig(level = logging.INFO)

In [6]:
# Fired once for each successfully processed job
def on_data(data: EventData):
    print('[ON_DATA]', data.title, data.company, data.company_link, data.date, data.link, data.insights, len(data.description))

# Fired once for each page (25 jobs)
def on_metrics(metrics: EventMetrics):
  print('[ON_METRICS]', str(metrics))

def on_error(error):
    print('[ON_ERROR]', error)

def on_end():
    print('[ON_END]')

In [24]:
scraper = LinkedinScraper(
    chrome_executable_path=None,  
    chrome_options=None,  
    headless=True,  # Overrides headless mode only if chrome_options is None
    max_workers=1,  
    slow_mo=1.3,  # Slows scraper to avoid 'Too many requests 429' errors 
    page_load_timeout=20  # Page load timeout    
)

INFO:li:scraper:('Using strategy AnonymousStrategy',)


In [25]:
# Adding event listeners
scraper.on(Events.DATA, on_data)
scraper.on(Events.ERROR, on_error)
scraper.on(Events.END, on_end)

In [26]:
# obtaining job listings from linkedin
queries = [
    Query(
        options=QueryOptions(            
            limit=27  # Limit the number of jobs to scrape.            
        )
    ),
    Query(
        query='Data',
        options=QueryOptions(
            locations=['United States'],            
            apply_link = True,  # Try to extract apply link (easy applies are skipped). Default to False.
            limit=5,
            filters=QueryFilters(              
                company_jobs_url='https://www.linkedin.com/jobs/search/?f_C=1441%2C17876832%2C791962%2C2374003%2C18950635%2C16140%2C10440912&geoId=92000000',  # Filter by companies.
                relevance=RelevanceFilters.RECENT,
                time=TimeFilters.WEEK,
                type=[TypeFilters.FULL_TIME],
                experience=[ExperienceLevelFilters.ENTRY_LEVEL],                
            )
        )
    ),
]

scraper.run(queries)

INFO:li:scraper:('Starting new query', "Query(query= options=QueryOptions(limit=27 locations=['Worldwide'] optimize=False apply_link=False))")
INFO:li:scraper:('Chrome debugger url', 'http://localhost:59262')
INFO:li:scraper:('[][Worldwide]', 'Opening https://www.linkedin.com/jobs/search?location=Worldwide')
INFO:li:scraper:('[][Worldwide]', 'Trying first selectors set')
INFO:li:scraper:('[][Worldwide]', 'Trying second selectors set')
INFO:li:scraper:('[][Worldwide]', 'OK')
INFO:li:scraper:('[][Worldwide]', 'Starting pagination loop')
INFO:li:scraper:('[][Worldwide]', 'Found 25 jobs')
INFO:li:scraper:('[][Worldwide][1]', 'Processed')


[ON_DATA] Sr. Operations Analyst REQ-220412 ICE Mortgage Technology  2022-07-02 https://www.linkedin.com/jobs/view/sr-operations-analyst-req-220412-at-ice-mortgage-technology-3187226469?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=UyZhk82vrl0yZp4M86ucUQ%3D%3D&position=1&pageNum=0&trk=public_jobs_jserp-result_search-card [] 4045


INFO:li:scraper:('[][Worldwide][2]', 'Processed')


[ON_DATA] Sr. Operations Analyst REQ-220412 ICE Mortgage Technology  2022-07-02 https://www.linkedin.com/jobs/view/sr-operations-analyst-req-220412-at-ice-mortgage-technology-3187223717?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=Y3GqT3On5nuT9ptDyFxgVg%3D%3D&position=2&pageNum=0&trk=public_jobs_jserp-result_search-card [] 4045


ERROR:li:scraper:('[][Worldwide][3]', 'Timeout on loading job details')
NoneType: None
INFO:li:scraper:('[][Worldwide][3]', 'Processed')


[ON_DATA] Interior Designer Actalent  2022-07-24 https://www.linkedin.com/jobs/view/interior-designer-at-actalent-3187129924?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=9Xq49BqXT1fIi9fW%2F3%2BGxg%3D%3D&position=4&pageNum=0&trk=public_jobs_jserp-result_search-card [] 1636


INFO:li:scraper:('[][Worldwide][4]', 'Processed')


[ON_DATA] Interior Designer Actalent  2022-07-24 https://www.linkedin.com/jobs/view/interior-designer-at-actalent-3187133821?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=%2FfIh8l%2FlUrgMyraA1FYasA%3D%3D&position=5&pageNum=0&trk=public_jobs_jserp-result_search-card [] 1695


INFO:li:scraper:('[][Worldwide][5]', 'Processed')


[ON_DATA] Sr. Operations Analyst REQ-220412 ICE Mortgage Technology  2022-07-02 https://www.linkedin.com/jobs/view/sr-operations-analyst-req-220412-at-ice-mortgage-technology-3187230133?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=kiG9BffMZTvYKznrfLHlsw%3D%3D&position=6&pageNum=0&trk=public_jobs_jserp-result_search-card [] 4045


INFO:li:scraper:('[][Worldwide][6]', 'Processed')


[ON_DATA] Interior Designer Actalent  2022-07-24 https://www.linkedin.com/jobs/view/interior-designer-at-actalent-3187137468?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=U8BRDDzEHLzg0VolyokXbA%3D%3D&position=7&pageNum=0&trk=public_jobs_jserp-result_search-card [] 1928


INFO:li:scraper:('[][Worldwide][7]', 'Processed')


[ON_DATA] Sr. Operations Analyst REQ-220412 ICE Mortgage Technology  2022-07-02 https://www.linkedin.com/jobs/view/sr-operations-analyst-req-220412-at-ice-mortgage-technology-3187222977?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=T7O%2FV2AQ59FkLdxBujPqKw%3D%3D&position=8&pageNum=0&trk=public_jobs_jserp-result_search-card [] 4045


INFO:li:scraper:('[][Worldwide][8]', 'Processed')


[ON_DATA] Sharepoint Admin Dice  2022-07-24 https://www.linkedin.com/jobs/view/sharepoint-admin-at-dice-3187223670?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=66ewsCzxgt3Oa0sFSE%2FMjg%3D%3D&position=9&pageNum=0&trk=public_jobs_jserp-result_search-card [] 3788


INFO:li:scraper:('[][Worldwide][9]', 'Processed')


[ON_DATA] Vice President of Marketing TMX Finance Family of Companies  2022-07-24 https://www.linkedin.com/jobs/view/vice-president-of-marketing-at-tmx-finance-family-of-companies-3187226751?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=2%2Bo%2FZcxt7iF5XybPpFSffw%3D%3D&position=10&pageNum=0&trk=public_jobs_jserp-result_search-card [] 6461


INFO:li:scraper:('[][Worldwide][10]', 'Processed')


[ON_DATA] Sr. Operations Analyst REQ-220412 ICE Mortgage Technology  2022-07-02 https://www.linkedin.com/jobs/view/sr-operations-analyst-req-220412-at-ice-mortgage-technology-3187223691?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=irvbnAyDdz%2FRA%2FQaMP%2BJ%2Bg%3D%3D&position=11&pageNum=0&trk=public_jobs_jserp-result_search-card [] 4045


INFO:li:scraper:('[][Worldwide][11]', 'Processed')


[ON_DATA] Interior Designer Actalent  2022-07-24 https://www.linkedin.com/jobs/view/interior-designer-at-actalent-3187133341?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=mUJ7AVWMnYUXE3LPMHTa4A%3D%3D&position=12&pageNum=0&trk=public_jobs_jserp-result_search-card [] 5189


INFO:li:scraper:('[][Worldwide][12]', 'Processed')


[ON_DATA] Interior Architect Actalent  2022-07-24 https://www.linkedin.com/jobs/view/interior-architect-at-actalent-3187106458?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=74cjCP2lbYmf1T5KZJtlSg%3D%3D&position=13&pageNum=0&trk=public_jobs_jserp-result_search-card [] 1649


INFO:li:scraper:('[][Worldwide][13]', 'Processed')


[ON_DATA] Sr. Operations Analyst REQ-220412 ICE Mortgage Technology  2022-07-02 https://www.linkedin.com/jobs/view/sr-operations-analyst-req-220412-at-ice-mortgage-technology-3187222853?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=WBWg8J25Ewxm8S7DjQubpA%3D%3D&position=14&pageNum=0&trk=public_jobs_jserp-result_search-card [] 4045


ERROR:li:scraper:('[][Worldwide][14]', 'Timeout on loading job details')
NoneType: None
INFO:li:scraper:('[][Worldwide][14]', 'Processed')


[ON_DATA] Sr. Operations Analyst REQ-220412 ICE Mortgage Technology  2022-07-02 https://www.linkedin.com/jobs/view/sr-operations-analyst-req-220412-at-ice-mortgage-technology-3187221829?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=ukIPxm7NeSBdl%2FQqZYPuoQ%3D%3D&position=16&pageNum=0&trk=public_jobs_jserp-result_search-card [] 4045


INFO:li:scraper:('[][Worldwide][15]', 'Processed')


[ON_DATA] PCB Layout Designer Trenton Systems  2022-07-24 https://www.linkedin.com/jobs/view/pcb-layout-designer-at-trenton-systems-3187171274?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=AXGqg3RHBICdG3kXzEAtmw%3D%3D&position=17&pageNum=0&trk=public_jobs_jserp-result_search-card [] 1271


INFO:li:scraper:('[][Worldwide][16]', 'Processed')


[ON_DATA] Sr. Operations Analyst REQ-220412 ICE Mortgage Technology  2022-07-02 https://www.linkedin.com/jobs/view/sr-operations-analyst-req-220412-at-ice-mortgage-technology-3187229131?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=sRLSIQsCvv49W5FQAW%2FhRA%3D%3D&position=18&pageNum=0&trk=public_jobs_jserp-result_search-card [] 4045


INFO:li:scraper:('[][Worldwide][17]', 'Processed')


[ON_DATA] Sr. Operations Analyst REQ-220412 ICE Mortgage Technology  2022-07-02 https://www.linkedin.com/jobs/view/sr-operations-analyst-req-220412-at-ice-mortgage-technology-3187225477?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=x3fioz%2BbmYs7vJjp%2FcNSvQ%3D%3D&position=19&pageNum=0&trk=public_jobs_jserp-result_search-card [] 4045


INFO:li:scraper:('[][Worldwide][18]', 'Processed')


[ON_DATA] Team Member-Franchise - 4005 - Stellhorn Rd-Ft Wayne, IN (Fort Wayne, IN) Checkers & Rally’s Drive-In Restaurants  2022-07-24 https://www.linkedin.com/jobs/view/team-member-franchise-4005-stellhorn-rd-ft-wayne-in-fort-wayne-in-at-checkers-rally%E2%80%99s-drive-in-restaurants-3187114025?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=z7JkQnm2%2FKr%2BJdJwkC25Vg%3D%3D&position=20&pageNum=0&trk=public_jobs_jserp-result_search-card [] 295


ERROR:li:scraper:('[][Worldwide][19]', 'Timeout on loading job details')
NoneType: None
INFO:li:scraper:('[][Worldwide][19]', 'Processed')


[ON_DATA] Interior Designer Actalent  2022-07-24 https://www.linkedin.com/jobs/view/interior-designer-at-actalent-3187131778?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=lECQPpM8wsWfawwK%2Bz8rFw%3D%3D&position=22&pageNum=0&trk=public_jobs_jserp-result_search-card [] 1636


INFO:li:scraper:('[][Worldwide][20]', 'Processed')


[ON_DATA] Architectural Interior Designer Actalent  2022-07-24 https://www.linkedin.com/jobs/view/architectural-interior-designer-at-actalent-3187107129?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=0qbm2QNeMl%2F4T6f4VVsrSA%3D%3D&position=23&pageNum=0&trk=public_jobs_jserp-result_search-card [] 3849


INFO:li:scraper:('[][Worldwide][21]', 'Processed')


[ON_DATA] Entry Level HR Admin Aston Carter  2022-07-24 https://www.linkedin.com/jobs/view/entry-level-hr-admin-at-aston-carter-3187108100?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=TTGQLe2KXv1f4cL0iQ8NNA%3D%3D&position=24&pageNum=0&trk=public_jobs_jserp-result_search-card [] 3708


INFO:li:scraper:('[][Worldwide][22]', 'Processed')


[ON_DATA] SAP Warranty Management Consultant Dice  2022-07-24 https://www.linkedin.com/jobs/view/sap-warranty-management-consultant-at-dice-3187221636?refId=bbdM5%2F3Labj2Z0Clh%2Bs0Vw%3D%3D&trackingId=j%2Bik%2BhJDdRcuZzx1HNumvA%3D%3D&position=25&pageNum=0&trk=public_jobs_jserp-result_search-card [] 3555


INFO:li:scraper:('[][Worldwide][23]', 'Processed')


[ON_DATA] SAP Warranty Management Consultant Dice  2022-07-24 https://www.linkedin.com/jobs/view/sap-warranty-management-consultant-at-dice-3187221636?refId=s2D5PpiXW1bCPcB0ALPPWg%3D%3D&trackingId=AeI5yJJw15gjydUIbIS2RA%3D%3D&position=1&pageNum=1&trk=public_jobs_jserp-result_search-card [] 3555


ERROR:li:scraper:('[][Worldwide][24]', 'Timeout on loading job details')
NoneType: None
INFO:li:scraper:('[][Worldwide][24]', 'Processed')


[ON_DATA] Interior Designer (NCIDQ Not Required) Actalent  2022-07-24 https://www.linkedin.com/jobs/view/interior-designer-ncidq-not-required-at-actalent-3186987290?refId=s2D5PpiXW1bCPcB0ALPPWg%3D%3D&trackingId=vmYITmmYs4A1jARimukf%2BA%3D%3D&position=3&pageNum=1&trk=public_jobs_jserp-result_search-card [] 3849


INFO:li:scraper:('[][Worldwide][25]', 'Processed')


[ON_DATA] Interior Architect Actalent  2022-07-24 https://www.linkedin.com/jobs/view/interior-architect-at-actalent-3187106313?refId=s2D5PpiXW1bCPcB0ALPPWg%3D%3D&trackingId=AAAqoLpawoEVXObJymh%2FRw%3D%3D&position=4&pageNum=1&trk=public_jobs_jserp-result_search-card [] 1945


ERROR:li:scraper:('[][Worldwide][26]', 'Timeout on loading job details')
NoneType: None
INFO:li:scraper:('[][Worldwide][26]', 'Processed')


[ON_DATA] Interior Architect Actalent  2022-07-24 https://www.linkedin.com/jobs/view/interior-architect-at-actalent-3187108188?refId=s2D5PpiXW1bCPcB0ALPPWg%3D%3D&trackingId=qdz5hEbFQ2CvXgVZUT2NiQ%3D%3D&position=6&pageNum=1&trk=public_jobs_jserp-result_search-card [] 1601


INFO:li:scraper:('[][Worldwide][27]', 'Processed')


[ON_DATA] Assistant Maintenance Supervisor - Cobble Court Apartments Tarragon Property Services  2022-07-24 https://www.linkedin.com/jobs/view/assistant-maintenance-supervisor-cobble-court-apartments-at-tarragon-property-services-3187248642?refId=s2D5PpiXW1bCPcB0ALPPWg%3D%3D&trackingId=LD%2Byjatk%2BS7eAm5lKjK2xA%3D%3D&position=7&pageNum=1&trk=public_jobs_jserp-result_search-card [] 5421


INFO:li:scraper:('Starting new query', "Query(query=Data options=QueryOptions(limit=5 locations=['United States'] filters=QueryFilters(company_jobs_url=https://www.linkedin.com/jobs/search/?f_C=1441%2C17876832%2C791962%2C2374003%2C18950635%2C16140%2C10440912&geoId=92000000 relevance=RelevanceFilters.RECENT time=TimeFilters.WEEK type=[<TypeFilters.FULL_TIME: 'F'>] experience=[<ExperienceLevelFilters.ENTRY_LEVEL: '2'>]) optimize=False apply_link=True))")


[ON_END]


INFO:li:scraper:('Chrome debugger url', 'http://localhost:59628')
INFO:li:scraper:('[Data][United States]', 'Opening https://www.linkedin.com/jobs/search?keywords=Data&location=United+States&f_C=1441%2C17876832%2C791962%2C2374003%2C18950635%2C16140%2C10440912&sortBy=DD&f_TPR=r604800&f_JT=F&f_E=2&start=0')
INFO:li:scraper:('[Data][United States]', 'Trying first selectors set')
INFO:li:scraper:('[Data][United States]', 'Trying second selectors set')
INFO:li:scraper:('[Data][United States]', 'OK')
INFO:li:scraper:('[Data][United States]', 'Starting pagination loop')
INFO:li:scraper:('[Data][United States]', 'No jobs found, skip')


[ON_END]


In [41]:
# parsing obtained data to json
json = []
 for job in job_lists:
            job_info = extract_job_info(job)
            json.append(job_info)
            39

import json
   
# Data to be written
#dictionary ={
 # "locations": "04",
  #"apply_link": "sunil",
  #"company_jobs_url", 
#}
   
# Serializing json 
#json_object = json.dumps(dictionary, indent = 4)
#print(json_object)

job_lists = soup.find_all("div", {"class": "job_seen_beacon"})
for job in job_lists:
            job_info = extract_job_info(job)
            json.append(job_info)
            
job_lists = job_lists = soup.find_all("div", {"class": "job_seen_beacon"})

for job in job_lists:
            job_info = extract_job_info(job)
            json.append(job_info)

job_info = {
        "job_id":job_id,
        "company_name":company_name,
        "role": role_name,
        "location":location,
        "salary_estimated": salary_estimated,
        "job_description": job_description,
        "url": prefix+hyperlink,
    }




NameError: name 'soup' is not defined