## Importing Dependencies

In [1]:
import shutil
import time
from urllib.parse import urljoin

import pandas as pd
import requests
from bs4 import BeautifulSoup as bs
from splinter import Browser

## Setting Up Splinter

In [2]:
# For macOS users: print the location of the chromedriver binary found on PATH.
# The path printed here is the one passed as `executable_path` in the next cell.
!which chromedriver

/usr/local/bin/chromedriver


In [3]:
# Resolve chromedriver from PATH so the notebook is not tied to one machine's
# directory layout; if the lookup finds nothing, fall back to the location
# this notebook originally hard-coded.
executable_path = {
    'executable_path': shutil.which('chromedriver') or '/usr/local/bin/chromedriver'
}
# headless=False: drive Chrome with its window shown rather than in headless mode.
browser = Browser('chrome', **executable_path, headless=False)

In [4]:
# For Windows users: uncomment the two lines below and run this cell instead of the macOS cell above
# executable_path = {'executable_path': 'chromedriver.exe'}
# browser = Browser('chrome', **executable_path, headless = False)

## World Economic Forum

In [5]:
# Load the World Economic Forum search results for "digital economics".
wef_url = 'https://www.weforum.org/search?query=digital+economics'
browser.visit(wef_url)
# Pause BEFORE snapshotting the page: a sleep placed after `browser.html` has
# been read cannot change what gets parsed, so the wait must come first to
# give any late-loading content time to appear.
time.sleep(3)
wef_html = browser.html
wef_soup = bs(wef_html, 'html.parser')

In [6]:
# First 'gs-title' div on the page; its anchor and text are read below.
wef_content = wef_soup.find('div', attrs={'class': 'gs-title'})

# Build the record field by field: link, then title, then snippet.
wef = {}
wef['link'] = wef_content.find('a')['data-ctorig']
wef['title'] = wef_content.get_text().strip()
# The snippet is looked up from the whole page (first match), not from
# inside `wef_content`.
wef['snippet'] = wef_soup.find(
    'div', attrs={'class': 'gs-bidi-start-align gs-snippet'}
).get_text().strip()

print(wef)

{'link': 'https://www.weforum.org/platforms/shaping-the-future-of-digital-economy-and-new-value-creation', 'title': 'Shaping the Future of Digital Economy and New Value Creation ...', 'snippet': "Currently, about 50% of the world's population does not currently participate in \nthe digital economy at all – and growth in internet adoption is slowing. The G20's\n\xa0..."}


## McKinsey & Company

In [7]:
# Load the McKinsey search results for "digital economy".
mckinsey_url = 'https://www.mckinsey.com/search?q=digital%20economy'
browser.visit(mckinsey_url)
# Pause BEFORE snapshotting the page: a sleep placed after `browser.html` has
# been read cannot change what gets parsed, so the wait must come first to
# give any late-loading content time to appear.
time.sleep(3)
mckinsey_html = browser.html
mckinsey_soup = bs(mckinsey_html, 'html.parser')

In [8]:
# Narrow to the results container, then to the first 'text-wrapper' inside it.
mckinsey_body = mckinsey_soup.find('div', attrs={'class': 'search-results'})
mckinsey_content = mckinsey_body.find('div', attrs={'class': 'text-wrapper'})

# Build the record field by field: link, then title, then snippet.
mckinsey = {}
mckinsey['link'] = mckinsey_content.find('a')['href']
mckinsey['title'] = mckinsey_content.find('h3').get_text().strip()
# The description is searched from the results container (first match),
# not from inside `mckinsey_content`.
mckinsey['snippet'] = mckinsey_body.find(
    'div', attrs={'class': 'description'}
).get_text().strip()

print(mckinsey)

{'link': 'https://www.mckinsey.com/business-functions/mckinsey-digital/our-insights/powering-the-digital-economy', 'title': 'Powering the digital economy', 'snippet': 'The economics of energy are changing: cheaper storage is bending the electricity cost curve, giving a boost to charging stations. Utilities meanwhile are refining...  strategies and raising their digital game.'}


## Visual Capitalist

In [9]:
# Load the Visual Capitalist search results for "digital transformation".
vc_url = 'https://www.visualcapitalist.com/?s=digital+transformation'
browser.visit(vc_url)
# Pause BEFORE snapshotting the page: a sleep placed after `browser.html` has
# been read cannot change what gets parsed, so the wait must come first to
# give any late-loading content time to appear.
time.sleep(3)
vc_html = browser.html
vc_soup = bs(vc_html, 'html.parser')

In [10]:
# First list item whose class attribute matches the story-wrapper string.
vc_content = vc_soup.find(
    'li', attrs={'class': 'mvp-blog-story-wrap left relative infinite-post'}
)

# Build the record field by field; no snippet is extracted for this site,
# so the field is stored as an empty string.
vc = {}
vc['link'] = vc_content.find('a')['href']
vc['title'] = vc_content.find('h2').get_text().strip()
vc['snippet'] = ''

print(vc)

{'link': 'https://www.visualcapitalist.com/how-technology-is-disrupting-the-construction-industry/', 'title': 'How Technology is Disrupting the Construction Industry', 'snippet': ''}


## Harvard Business Review (HBR)

In [11]:
# Load the HBR search results for "digital economy".
hbr_url = 'https://hbr.org/search?search_type=&term=digital+economy'
browser.visit(hbr_url)
# Pause BEFORE snapshotting the page: a sleep placed after `browser.html` has
# been read cannot change what gets parsed, so the wait must come first to
# give any late-loading content time to appear.
time.sleep(3)
hbr_html = browser.html
hbr_soup = bs(hbr_html, 'html.parser')

In [12]:
# First <stream-item> element whose class attribute matches the given string.
hbr_content = hbr_soup.find('stream-item', class_='stream-item overflow-hidden')

hbr = {}
hbr_link = hbr_content.h3.a['href']
# Resolve the href against the site root with urljoin instead of string
# concatenation: a root-relative href ('/2018/...') yields the same URL as
# before, while an already-absolute href or one without a leading slash is
# handled correctly rather than producing a malformed link.
hbr['link'] = urljoin('https://hbr.org', hbr_link)
hbr['title'] = hbr_content.h3.text.strip()
hbr['snippet'] = hbr_content.find('div', class_='dek hide-for-small').text.strip()

print(hbr)

{'link': 'https://hbr.org/2018/12/what-big-consumer-brands-can-do-to-compete-in-a-digital-economy', 'title': 'What Big Consumer Brands Can Do to Compete in a Digital Economy', 'snippet': 'Companies like P&G need to adapt to compete with the likes of Amazon.'}


## Forbes

In [13]:
# Load the Forbes search results for "digital economy".
forbes_url = 'https://www.forbes.com/search/?q=digital+economy'
browser.visit(forbes_url)
# Pause BEFORE snapshotting the page: a sleep placed after `browser.html` has
# been read cannot change what gets parsed, so the wait must come first to
# give any late-loading content time to appear.
time.sleep(3)
forbes_html = browser.html
forbes_soup = bs(forbes_html, 'html.parser')

In [14]:
# First 'stream-item__text' div on the page; its anchor and <h2> are read below.
forbes_content = forbes_soup.find('div', attrs={'class': 'stream-item__text'})

# Build the record field by field; no snippet is extracted for this site,
# so the field is stored as an empty string.
forbes = {}
forbes['link'] = forbes_content.find('a')['href']
forbes['title'] = forbes_content.find('h2').get_text().strip()
forbes['snippet'] = ''

print(forbes)

{'link': 'https://www.forbes.com/sites/baxiabhishek/2019/09/25/google-pay-is-evolving-into-a-platform-to-grab-a-slice-of-indias-growing-digital-economy/', 'title': "Google Pay Is Evolving Into A Platform To Grab A Slice Of India's Growing Digital Economy", 'snippet': ''}


## Summary

In [15]:
# Collect the five per-site records, in the order the sites were scraped,
# and wrap the list in a dict under the single key 'articles'.
articles = [wef, mckinsey, vc, hbr, forbes]
summary = dict(articles=articles)

print(summary)

{'articles': [{'link': 'https://www.weforum.org/platforms/shaping-the-future-of-digital-economy-and-new-value-creation', 'title': 'Shaping the Future of Digital Economy and New Value Creation ...', 'snippet': "Currently, about 50% of the world's population does not currently participate in \nthe digital economy at all – and growth in internet adoption is slowing. The G20's\n\xa0..."}, {'link': 'https://www.mckinsey.com/business-functions/mckinsey-digital/our-insights/powering-the-digital-economy', 'title': 'Powering the digital economy', 'snippet': 'The economics of energy are changing: cheaper storage is bending the electricity cost curve, giving a boost to charging stations. Utilities meanwhile are refining...  strategies and raising their digital game.'}, {'link': 'https://www.visualcapitalist.com/how-technology-is-disrupting-the-construction-industry/', 'title': 'How Technology is Disrupting the Construction Industry', 'snippet': ''}, {'link': 'https://hbr.org/2018/12/what-big-cons