In [1]:
import pandas as pd

import plotly.express as px
import plotly.graph_objs as go

In [2]:
def plot_trend(data, x, y, legend, title=None):
    """Render an interactive Plotly line chart with one colored line per group.

    Parameters
    ----------
    data
        Tabular data handed straight to ``plotly.express.line``; every caller
        in this notebook passes a long-format pandas DataFrame.
    x : str
        Name of the column plotted on the horizontal axis.
    y : str
        Name of the column plotted on the vertical axis.
    legend : str
        Name of the column whose distinct values each get their own line
        color and legend entry.
    title : str, optional
        Figure title. Defaults to ``None``, which leaves the chart untitled
        exactly as before this parameter existed.

    Returns
    -------
    None
        The figure is displayed via ``fig.show()`` and deliberately not
        returned, so a cell ending in ``plot_trend(...)`` renders it only once.
    """
    fig = px.line(data, x=x, y=y, color=legend, title=title)
    fig.show()

# Load data

## Stock price

### NYSE stock closing price

In [3]:
# NYSE energy-company closing prices; 'Date' is parsed to datetime at load time.
stock_nyse = pd.read_csv(
    '../sample_dataset/nyse-energy-company-stock-closing-prices-2020.csv',
    parse_dates=['Date'],
)
print(stock_nyse.shape)
display(stock_nyse.head())

(2502, 13)


Unnamed: 0,Value,Date,Super Region,Ticker,Time Level,Source,Stock Name,Sub-Sector,Stock Attribute,Currency,Data Provider,Stock Exchange,Location
0,41.22,2020-12-31,GLOBAL DATA,XOM,DAILY,WORLDDATA.AI,EXXON MOBIL CORPORATION,GLOBAL STOCK EXCHANGE DATA,CLOSING PRICE,USD,NEW YORK STOCK EXCHANGE,NEW YORK STOCK EXCHANGE - STOCK PRICES,AMERICA-NEW_YORK
1,41.36,2020-12-31,GLOBAL DATA,MPC,DAILY,WORLDDATA.AI,MARATHON PETROLEUM CORPORATION,GLOBAL STOCK EXCHANGE DATA,CLOSING PRICE,USD,NEW YORK STOCK EXCHANGE,NEW YORK STOCK EXCHANGE - STOCK PRICES,AMERICA-NEW_YORK
2,69.94,2020-12-31,GLOBAL DATA,PSX,DAILY,WORLDDATA.AI,PHILLIPS 66,GLOBAL STOCK EXCHANGE DATA,CLOSING PRICE,USD,NEW YORK STOCK EXCHANGE,NEW YORK STOCK EXCHANGE - STOCK PRICES,AMERICA-NEW_YORK
3,56.57,2020-12-31,GLOBAL DATA,VLO,DAILY,WORLDDATA.AI,VALERO ENERGY CORPORATION,GLOBAL STOCK EXCHANGE DATA,CLOSING PRICE,USD,NEW YORK STOCK EXCHANGE,NEW YORK STOCK EXCHANGE - STOCK PRICES,AMERICA-NEW_YORK
4,17.31,2020-12-31,GLOBAL DATA,OXY,DAILY,WORLDDATA.AI,OCCIDENTAL PETROLEUM CORPORATION,GLOBAL STOCK EXCHANGE DATA,CLOSING PRICE,USD,NEW YORK STOCK EXCHANGE,NEW YORK STOCK EXCHANGE - STOCK PRICES,AMERICA-NEW_YORK


In [4]:
# Closing price over time, one line per ticker.
plot_trend(stock_nyse, x='Date', y='Value', legend='Ticker')

### Stock index

1. <b>Dow Jones Utility Average</b> (DJUA) is a stock index from S&P Dow Jones Indices that tracks the performance of 15 prominent utility companies traded in the United States.
2. <b>Dow Jones Transportation Average</b> (DJTA) is a price-weighted average of 20 transportation stocks traded in the United States.
3. <b>Dow Jones Industrial Average</b> (DJIA) is a stock market index that measures the stock performance of 30 large companies listed on stock exchanges in the United States.
4. <b>Dow Jones Composite Average</b> is a stock index from S&P Dow Jones Indices that tracks 65 prominent companies. Its components include every stock from the Dow Jones Industrial Average (30 components), the Dow Jones Transportation Average (20), and the Dow Jones Utility Average (15).
5. <b>S&P 500 (Standard & Poor's 500)</b> is a stock market index that measures the stock performance of 500 large companies listed on stock exchanges in the United States. It is one of the most commonly followed equity indices.

In [5]:
# Stock market indicators/indices; 'Date' is parsed to datetime at load time.
stock_index = pd.read_csv(
    '../sample_dataset/some-stock-market-indicators-&-index-2020.csv',
    parse_dates=['Date'],
)
print(stock_index.shape)
display(stock_index.head())

(1265, 10)


Unnamed: 0,Value,Date,Sub-Sector,Super Region,Description,Time Level,Category 2,Seasonal Adjustment,Unit,Source
0,864.64,2020-12-31,STOCK MARKET INDICATORS & INDEX,UNITED STATES,DOW JONES UTILITY AVERAGE,DAILY,FINANCIAL INDICATORS,NOT SEASONALLY ADJUSTED,INDEX,FEDERAL RESERVE ECONOMIC DATA-FRED
1,3756.07,2020-12-31,STOCK MARKET INDICATORS & INDEX,UNITED STATES,S&P 500,DAILY,FINANCIAL INDICATORS,NOT SEASONALLY ADJUSTED,INDEX,FEDERAL RESERVE ECONOMIC DATA-FRED
2,10108.71,2020-12-31,STOCK MARKET INDICATORS & INDEX,UNITED STATES,DOW JONES COMPOSITE AVERAGE,DAILY,FINANCIAL INDICATORS,NOT SEASONALLY ADJUSTED,INDEX,FEDERAL RESERVE ECONOMIC DATA-FRED
3,30606.48,2020-12-31,STOCK MARKET INDICATORS & INDEX,UNITED STATES,DOW JONES INDUSTRIAL AVERAGE,DAILY,FINANCIAL INDICATORS,NOT SEASONALLY ADJUSTED,INDEX,FEDERAL RESERVE ECONOMIC DATA-FRED
4,12506.93,2020-12-31,STOCK MARKET INDICATORS & INDEX,UNITED STATES,DOW JONES TRANSPORTATION AVERAGE,DAILY,FINANCIAL INDICATORS,NOT SEASONALLY ADJUSTED,INDEX,FEDERAL RESERVE ECONOMIC DATA-FRED


In [6]:
# Index level over time, one line per index ('Description' column).
plot_trend(stock_index, x='Date', y='Value', legend='Description')

## Crude oil related prices

### Commodity Prices

In [7]:
# Crude-oil commodity prices; 'Date' is parsed to datetime at load time.
price_commodity = pd.read_csv(
    '../sample_dataset/crude-oil-commodity-prices-2020.csv',
    parse_dates=['Date'],
)
print(price_commodity.shape)
display(price_commodity.head())

(2014, 8)


Unnamed: 0,Value,Date,Sub-Sector,Super Region,Commodity And Exchange,Frequency,Source,Indicator
0,0.12,2020-12-31,COMMODITY PRICES,GLOBAL DATA,NYMEX CRUDE OIL FUTURES,DAILY,COMMODITY EXCHANGE,CHANGE
1,364939.0,2020-12-31,COMMODITY PRICES,GLOBAL DATA,NYMEX CRUDE OIL FUTURES,DAILY,COMMODITY EXCHANGE,PREVIOUS DAY OPEN INTEREST
2,48.35,2020-12-31,COMMODITY PRICES,GLOBAL DATA,NYMEX CRUDE OIL FUTURES,DAILY,COMMODITY EXCHANGE,OPEN
3,48.52,2020-12-31,COMMODITY PRICES,GLOBAL DATA,NYMEX CRUDE OIL FUTURES,DAILY,COMMODITY EXCHANGE,SETTLE
4,0.17,2020-12-31,COMMODITY PRICES,GLOBAL DATA,ICE BRENT CRUDE OIL FUTURES,DAILY,COMMODITY EXCHANGE,CHANGE


In [9]:
# Which indicator types does the 'Indicator' column contain?
price_commodity['Indicator'].unique()

array(['CHANGE', 'PREVIOUS DAY OPEN INTEREST', 'OPEN', 'SETTLE', 'VALUE',
       'PREV# DAY OPEN INTEREST'], dtype=object)

In [12]:
# Keep only the 'SETTLE' rows and draw one line per 'Commodity And Exchange' value.
plot_trend(
    price_commodity.loc[price_commodity['Indicator'].eq('SETTLE')],
    x='Date',
    y='Value',
    legend='Commodity And Exchange',
)

### Futures Prices

In [13]:
# ICE crude-oil-related product futures prices; 'Date Value' is parsed to datetime.
price_future = pd.read_csv(
    '../sample_dataset/crude-oil-related-product-future-prices-from-ice-2020.csv',
    parse_dates=['Date Value'],
)
print(price_future.shape)
display(price_future.head())

(59100, 16)


Unnamed: 0,Sub-Sector,Product Id,ProductID_Contract,Exchange City,Super Region,Product Type,Sector,Time Level,Exchange Country,Unit,Product Description,Source,Super Region.1,Value,Date Value,Period Value
0,ENERGY FUTURES PRICES,1886,1886_JUN21,SINGAPORE,GLOBAL DATA,CRUDE OIL AND REFINED,FINANCIAL MARKET,DAILY,SINGAPORE,PRICE,NAPHTHA C+F JAPAN CARGO SWAP,INTERCONTINENTAL EXCHANGE - ICE,GLOBAL DATA,455.28,2020-12-31,d
1,ENERGY FUTURES PRICES,5631,5631_FEB21,SINGAPORE,GLOBAL DATA,CRUDE OIL AND REFINED,FINANCIAL MARKET,DAILY,SINGAPORE,PRICE,URALS MED VS DATED BRENT SWAP,INTERCONTINENTAL EXCHANGE - ICE,GLOBAL DATA,-0.4,2020-12-31,d
2,ENERGY FUTURES PRICES,5631,5631_APR21,SINGAPORE,GLOBAL DATA,CRUDE OIL AND REFINED,FINANCIAL MARKET,DAILY,SINGAPORE,PRICE,URALS MED VS DATED BRENT SWAP,INTERCONTINENTAL EXCHANGE - ICE,GLOBAL DATA,-1.0,2020-12-31,d
3,ENERGY FUTURES PRICES,20031,20031_APR21,SINGAPORE,GLOBAL DATA,CRUDE OIL AND REFINED,FINANCIAL MARKET,DAILY,SINGAPORE,PRICE,SINGAPORE GASOIL SWAP,INTERCONTINENTAL EXCHANGE - ICE,GLOBAL DATA,56.73,2020-12-31,d
4,ENERGY FUTURES PRICES,23490,23490_MAR21,SINGAPORE,GLOBAL DATA,CRUDE OIL AND REFINED,FINANCIAL MARKET,DAILY,SINGAPORE,PRICE,MARINE FUEL 0.5% FOB ROTTERDAM BARGE SWAP,INTERCONTINENTAL EXCHANGE - ICE,GLOBAL DATA,370.5,2020-12-31,d


In [16]:
# Distinct products present in the futures data.
price_future.loc[:, 'Product Description'].unique()

array(['NAPHTHA C+F JAPAN CARGO SWAP', 'URALS MED  VS DATED BRENT SWAP',
       'SINGAPORE GASOIL SWAP',
       'MARINE FUEL 0.5% FOB ROTTERDAM BARGE SWAP',
       'NEW YORK 1% FUEL OIL SWAP', 'URALS NWE  VS DATED BRENT SWAP',
       'USGC HSFO FUEL OIL SWAP', 'MARINE FUEL 0.5% FOB SINGAPORE SWAP',
       'USGC HSFO FUEL OIL VS BRENT 1ST LINE SWAP',
       'GASOIL 0.1% CIF NWE CARGOES VS LOW SULPHUR GASOIL 1ST LINE SWAP',
       'NEW YORK 1% FUEL OIL VS FUEL OIL 1% FOB NWE CARGOES SWAP',
       'NEW YORK 1% FUEL OIL VS BRENT 1ST LINE SWAP',
       'JET FOB ROTTERDAM BARGES VS LOW SULPHUR GASOIL 1ST LINE SWAP',
       'GASOIL 0.1% CIF MED CARGOES VS LOW SULPHUR GASOIL 1ST LINE SWAP',
       'DIESEL 10PPM FOB ARA BARGES VS LOW SULPHUR GASOIL 1ST LINE SWAP',
       'FUEL OIL 1% FOB ROTTERDAM BARGES VS 1% FOB NWE CARGOES SWAP',
       'FUEL OIL 1% FOB ROTTERDAM BARGES SWAP',
       'FUEL OIL 180 CST SINGAPORE SWAP',
       'NAPHTHA CIF NWE CARGOES VS BRENT 1ST LINE SWAP',
       'FUEL OIL 

In [15]:
# Each product is quoted for several contract months on the same day (the
# preview of price_future shows 5631_FEB21 and 5631_APR21 both dated
# 2020-12-31). Plotting the raw rows colored only by product would give every
# line multiple y-values per date and make it zigzag, so first collapse to one
# value per (date, product) by averaging across contracts.
price_future_daily = price_future.groupby(
    ['Date Value', 'Product Description'], as_index=False
)['Value'].mean()
plot_trend(price_future_daily, 'Date Value', 'Value', 'Product Description')

## Financial Statement

In [17]:
# Energy-company financial statements; 'Date Value' is parsed to datetime.
financial_statement = pd.read_csv(
    '../sample_dataset/some-energy-company-financial-statements-2020.csv',
    parse_dates=['Date Value'],
)
print(financial_statement.shape)
display(financial_statement.head())

(557, 19)


Unnamed: 0,Super Region,Sector,Ticker,Time Level,Unit,Source,Exchange,Sub-Sector,Company Name,Industry Level 2,Industry Level 1,Company Website,Statement Type,Market Cap,Financial Metric,Super Region.1,Value,Date Value,Period Value
0,UNITED STATES,FINANCIAL MARKET,VLO,QUARTER,USD,COMPANY SEC FILINGS,NEW YORK STOCK EXCHANGE,FINANCIAL STATEMENT,VALERO ENERGY CORPORATION,OIL & GAS - REFINING & MARKETING,ENERGY,HTTP://WWW.VALERO.COM,INCOME-STATEMENT,GREATER THAN $1BILLION MARKET CAP,INCOME TAX EXPENSE,UNITED STATES,-337000000.0,2020-09-30,d
1,UNITED STATES,FINANCIAL MARKET,VLO,QUARTER,USD,COMPANY SEC FILINGS,NEW YORK STOCK EXCHANGE,FINANCIAL STATEMENT,VALERO ENERGY CORPORATION,OIL & GAS - REFINING & MARKETING,ENERGY,HTTP://WWW.VALERO.COM,INCOME-STATEMENT,GREATER THAN $1BILLION MARKET CAP,EPS,UNITED STATES,-2.62,2020-09-30,d
2,UNITED STATES,FINANCIAL MARKET,VLO,QUARTER,USD,COMPANY SEC FILINGS,NEW YORK STOCK EXCHANGE,FINANCIAL STATEMENT,VALERO ENERGY CORPORATION,OIL & GAS - REFINING & MARKETING,ENERGY,HTTP://WWW.VALERO.COM,INCOME-STATEMENT,GREATER THAN $1BILLION MARKET CAP,OPERATING INCOME,UNITED STATES,-621000000.0,2020-09-30,d
3,UNITED STATES,FINANCIAL MARKET,PSX,QUARTER,USD,COMPANY SEC FILINGS,NEW YORK STOCK EXCHANGE,FINANCIAL STATEMENT,PHILLIPS 66,OIL & GAS - REFINING & MARKETING,ENERGY,HTTP://WWW.PHILLIPS66.COM,INCOME-STATEMENT,GREATER THAN $1BILLION MARKET CAP,GROSS PROFIT,UNITED STATES,1068000000.0,2020-09-30,d
4,UNITED STATES,FINANCIAL MARKET,PSX,QUARTER,USD,COMPANY SEC FILINGS,NEW YORK STOCK EXCHANGE,FINANCIAL STATEMENT,PHILLIPS 66,OIL & GAS - REFINING & MARKETING,ENERGY,HTTP://WWW.PHILLIPS66.COM,INCOME-STATEMENT,GREATER THAN $1BILLION MARKET CAP,EPS DILUTED,UNITED STATES,-1.82,2020-09-30,d


In [18]:
# Distinct financial metrics available in the statements.
financial_statement.loc[:, 'Financial Metric'].unique()

array(['INCOME TAX EXPENSE', 'EPS', 'OPERATING INCOME', 'GROSS PROFIT',
       'EPS DILUTED', 'OPERATING EXPENSES', 'NET PROFIT MARGIN',
       'NET INCOME COM', 'EBIT', 'EBIT MARGIN', 'COST OF REVENUE',
       'EBITDA', 'WEIGHTED AVERAGE SHS OUT', 'GROSS MARGIN',
       'EBITDA MARGIN', 'DIVIDEND PER SHARE', 'PROFIT MARGIN',
       'SG&A EXPENSE', 'REVENUE GROWTH', 'INTEREST EXPENSE',
       'EARNINGS BEFORE TAX', 'REVENUE', 'NET INCOME',
       'WEIGHTED AVERAGE SHS OUT (DIL)', 'CONSOLIDATED INCOME',
       'EARNINGS BEFORE TAX MARGIN', 'FREE CASH FLOW MARGIN',
       'R&D EXPENSES'], dtype=object)

In [26]:
# Metrics to plot; extend this list to compare more than one metric.
filter_list = ['REVENUE']
plot_trend(
    financial_statement.loc[financial_statement['Financial Metric'].isin(filter_list)],
    x='Date Value',
    y='Value',
    legend='Ticker',
)

## Interest rate

In [29]:
# OECD interest rates; 'Date' is parsed to datetime at load time.
interest_rate = pd.read_csv(
    '../sample_dataset/oecd-interest-rates.csv',
    parse_dates=['Date'],
)
print(interest_rate.shape)
display(interest_rate.head(), interest_rate.describe())

(1376, 10)


Unnamed: 0,Value,Date,Sub-Sector,Super Region,Measure,Frequency,Region,Source,Indicator,Subject
0,1.64,2020-12-31,INTEREST RATES,GLOBAL DATA,PERCENT PER ANNUM,Q,EURO AREA(16 COUNTRIES),OECD,LONG-TERM INTEREST RATES FORECAST,TOTAL
1,4.35,2020-12-31,INTEREST RATES,GLOBAL DATA,PERCENT PER ANNUM,Q,CHINA,OECD,SHORT-TERM INTEREST RATES FORECAST,TOTAL
2,6.3,2020-12-31,INTEREST RATES,GLOBAL DATA,PERCENT PER ANNUM,Q,INDIA,OECD,LONG-TERM INTEREST RATES FORECAST,TOTAL
3,0.28,2020-12-31,INTEREST RATES,GLOBAL DATA,PERCENT PER ANNUM,Q,EURO AREA(16 COUNTRIES),OECD,SHORT-TERM INTEREST RATES FORECAST,TOTAL
4,1.77,2020-12-31,INTEREST RATES,GLOBAL DATA,PERCENT PER ANNUM,Q,UNITED STATES,OECD,SHORT-TERM INTEREST RATES FORECAST,TOTAL


Unnamed: 0,Value
count,1376.0
mean,4.345974
std,3.596752
min,-0.52
25%,1.83
50%,4.15
75%,6.25
max,50.19


In [30]:
# Which rate series does the 'Indicator' column contain?
interest_rate['Indicator'].unique()

array(['LONG-TERM INTEREST RATES FORECAST',
       'SHORT-TERM INTEREST RATES FORECAST', 'LONG-TERM INTEREST RATES',
       'SHORT-TERM INTEREST RATES'], dtype=object)

In [36]:
# United States rows only, one line per indicator.
plot_trend(
    interest_rate.loc[interest_rate['Region'].eq('UNITED STATES')],
    x='Date',
    y='Value',
    legend='Indicator',
)

In [31]:
# Long-term interest rates only, one line per region.
plot_trend(
    interest_rate.loc[interest_rate['Indicator'].eq('LONG-TERM INTEREST RATES')],
    x='Date',
    y='Value',
    legend='Region',
)

## Inventory outlook

In [34]:
# Short-term crude-oil inventory outlook; 'Date' is parsed to datetime.
inventory = pd.read_csv(
    '../sample_dataset/short-term-crude-oil-inventory-outlook.csv',
    parse_dates=['Date'],
)
print(inventory.shape)
display(inventory.head(), inventory.describe())

(448, 10)


Unnamed: 0,Value,Date,Sub-Sector,Super Region,Timelevel,Frequency,Region,Parameter,Unit,Source
0,455.91,2021-12-31,SHORT-TERM ENERGY OUTLOOK,GLOBAL DATA,MONTHLY,M,UNITED STATES,CRUDE OIL INVENTORY (EXCLUDING SPR),"MILLION BARRELS, END-OF-PERIOD",U.S.ENERGY INFORMATION ADMINISTRATION
1,455.91,2021-12-31,SHORT-TERM ENERGY OUTLOOK,GLOBAL DATA,QUARTERLY,Q,UNITED STATES,CRUDE OIL INVENTORY (EXCLUDING SPR),"MILLION BARRELS, END-OF-PERIOD",U.S.ENERGY INFORMATION ADMINISTRATION
2,469.81,2021-11-30,SHORT-TERM ENERGY OUTLOOK,GLOBAL DATA,MONTHLY,M,UNITED STATES,CRUDE OIL INVENTORY (EXCLUDING SPR),"MILLION BARRELS, END-OF-PERIOD",U.S.ENERGY INFORMATION ADMINISTRATION
3,470.17,2021-10-31,SHORT-TERM ENERGY OUTLOOK,GLOBAL DATA,MONTHLY,M,UNITED STATES,CRUDE OIL INVENTORY (EXCLUDING SPR),"MILLION BARRELS, END-OF-PERIOD",U.S.ENERGY INFORMATION ADMINISTRATION
4,457.92,2021-09-30,SHORT-TERM ENERGY OUTLOOK,GLOBAL DATA,MONTHLY,M,UNITED STATES,CRUDE OIL INVENTORY (EXCLUDING SPR),"MILLION BARRELS, END-OF-PERIOD",U.S.ENERGY INFORMATION ADMINISTRATION


Unnamed: 0,Value
count,448.0
mean,352.546496
std,66.543891
min,268.39
25%,307.885
50%,332.345
75%,362.4375
max,538.6


In [45]:
# Check which units the inventory values are reported in.
inventory.loc[:, 'Unit'].unique()

array(['MILLION BARRELS, END-OF-PERIOD'], dtype=object)

In [46]:
# Monthly rows only (Frequency == 'M'); 'Unit' supplies the legend label.
# NOTE(review): if the monthly rows span more than one Region/Parameter they
# would share a single line here — confirm against the data.
plot_trend(
    inventory.loc[inventory['Frequency'].eq('M')],
    x='Date',
    y='Value',
    legend='Unit',
)

## Oil demand

In [47]:
# JODI oil demand; 'Date' is parsed to datetime at load time.
oil_demand = pd.read_csv(
    '../sample_dataset/jodi-oil-demand-2020.csv',
    parse_dates=['Date'],
)
print(oil_demand.shape)
display(oil_demand.head(), oil_demand.describe())

(392, 10)


Unnamed: 0,Value,Date,Sub-Sector,Super Region,Energy Product,Flow Breakdown,Time Level,Country,Unit of Measurement,Source
0,24.66,2020-07-01,JODI OIL-WORLD DATABASE,GLOBAL DATA,TOTAL OIL PRODUCTS,DEMAND,MONTHLY,BRUNEI DARUSSALAM,THOUSAND BARRELS PER DAY(KB-D),JOINT ORGANISATIONS DATA INITIATIVE - JODI
1,2075.0,2020-07-01,JODI OIL-WORLD DATABASE,GLOBAL DATA,TOTAL OIL PRODUCTS,DEMAND,MONTHLY,GERMANY,THOUSAND BARRELS PER DAY(KB-D),JOINT ORGANISATIONS DATA INITIATIVE - JODI
2,55.9,2020-07-01,JODI OIL-WORLD DATABASE,GLOBAL DATA,TOTAL OIL PRODUCTS,DEMAND,MONTHLY,CYPRUS,THOUSAND BARRELS PER DAY(KB-D),JOINT ORGANISATIONS DATA INITIATIVE - JODI
3,187.0,2020-07-01,JODI OIL-WORLD DATABASE,GLOBAL DATA,TOTAL OIL PRODUCTS,DEMAND,MONTHLY,SWITZERLAND,THOUSAND BARRELS PER DAY(KB-D),JOINT ORGANISATIONS DATA INITIATIVE - JODI
4,18309.48,2020-07-01,JODI OIL-WORLD DATABASE,GLOBAL DATA,TOTAL OIL PRODUCTS,DEMAND,MONTHLY,UNITED STATES,THOUSAND BARRELS PER DAY(KB-D),JOINT ORGANISATIONS DATA INITIATIVE - JODI


Unnamed: 0,Value
count,392.0
mean,1144.385714
std,3037.775847
min,1.0
25%,56.56
50%,208.5
75%,982.75
max,20508.41


In [48]:
# Oil demand over time, one line per country.
plot_trend(oil_demand, x='Date', y='Value', legend='Country')

## Mobility data

### Apple

In [49]:
# Apple mobility index for California (Excel workbook); 'Date' is parsed to datetime.
mobility_apple = pd.read_excel(
    '../sample_dataset/apple-mobility-california-2020.xlsx',
    parse_dates=['Date'],
)
print(mobility_apple.shape)
display(mobility_apple.head(), mobility_apple.describe())

(1060, 11)


Unnamed: 0,Value,Date,Sub-Sector,Super Region,Frequency,Region,Country,Unit,Geography Type,Transportation Type,Source
0,33.65,2020-12-31,APPLE MOBILITY INDEX,GLOBAL DATA,DAILY,CALIFORNIA,UNITED STATES,INDEX,SUB-REGION,TRANSIT,"APPLE, INC."
1,91.63,2020-12-31,APPLE MOBILITY INDEX,GLOBAL DATA,DAILY,CALIFORNIA,UNITED STATES,INDEX,SUB-REGION,DRIVING,"APPLE, INC."
2,93.16,2020-12-31,APPLE MOBILITY INDEX,GLOBAL DATA,DAILY,CALIFORNIA,UNITED STATES,INDEX,SUB-REGION,WALKING,"APPLE, INC."
3,39.23,2020-12-30,APPLE MOBILITY INDEX,GLOBAL DATA,DAILY,CALIFORNIA,UNITED STATES,INDEX,SUB-REGION,TRANSIT,"APPLE, INC."
4,100.03,2020-12-30,APPLE MOBILITY INDEX,GLOBAL DATA,DAILY,CALIFORNIA,UNITED STATES,INDEX,SUB-REGION,DRIVING,"APPLE, INC."


Unnamed: 0,Value
count,1060.0
mean,81.731406
std,33.969962
min,18.39
25%,46.1475
50%,93.37
75%,108.0475
max,158.4


In [50]:
# Mobility index over time, one line per transportation type.
plot_trend(mobility_apple, x='Date', y='Value', legend='Transportation Type')

### Google

In [52]:
# Google mobility index for Los Angeles County; 'Date' is parsed to datetime.
mobility_google = pd.read_csv(
    '../sample_dataset/google-mobility-index-la-county-2020.csv',
    parse_dates=['Date'],
)
print(mobility_google.shape)
display(mobility_google.head(), mobility_google.describe())

(1900, 11)


Unnamed: 0,Value,Date,Sub-Sector,Super Region,Sub Region 2,Frequency,Country Region,Sub Region 1,Unit,Source,Indicator
0,-52,2020-12-31,GOOGLE MOBILITY INDEX,GLOBAL DATA,LOS ANGELES COUNTY,DAILY,UNITED STATES,CALIFORNIA,INDEX,GOOGLE LLC,TRANSIT STATIONS PERCENT CHANGE FROM BASELINE
1,-32,2020-12-31,GOOGLE MOBILITY INDEX,GLOBAL DATA,LOS ANGELES COUNTY,DAILY,UNITED STATES,CALIFORNIA,INDEX,GOOGLE LLC,PARKS PERCENT CHANGE FROM BASELINE
2,20,2020-12-31,GOOGLE MOBILITY INDEX,GLOBAL DATA,LOS ANGELES COUNTY,DAILY,UNITED STATES,CALIFORNIA,INDEX,GOOGLE LLC,RESIDENTIAL PERCENT CHANGE FROM BASELINE
3,-30,2020-12-31,GOOGLE MOBILITY INDEX,GLOBAL DATA,LOS ANGELES COUNTY,DAILY,UNITED STATES,CALIFORNIA,INDEX,GOOGLE LLC,RETAIL AND RECREATION PERECENT CHANGE FROM BAS...
4,-58,2020-12-31,GOOGLE MOBILITY INDEX,GLOBAL DATA,LOS ANGELES COUNTY,DAILY,UNITED STATES,CALIFORNIA,INDEX,GOOGLE LLC,WORKPLACES PERCENT CHANGE FROM BASELINE


Unnamed: 0,Value
count,1900.0
mean,-20.753684
std,21.94755
min,-83.0
25%,-39.0
50%,-24.0
75%,-4.0
max,37.0


In [53]:
# Percent change from baseline over time, one line per indicator.
plot_trend(mobility_google, x='Date', y='Value', legend='Indicator')

## News sentiment

In [59]:
# Daily news sentiment for Exxon; 'DateTime' is parsed to datetime.
# A constant 'Unit' column is appended so plot_trend has a column to use for
# its legend/color grouping.
news_sentiment = pd.read_csv(
    '../sample_dataset/ave-daily-news-sentiment-exxon-2020.csv',
    parse_dates=['DateTime'],
).assign(Unit='score')

print(news_sentiment.shape)
display(news_sentiment.head(), news_sentiment.describe())

(101, 3)


Unnamed: 0,DateTime,Daily News Sentiment,Unit
0,2020-12-31,-0.1,score
1,2020-12-30,-0.4,score
2,2020-12-29,-0.5,score
3,2020-12-24,-0.2,score
4,2020-12-22,0.3,score


Unnamed: 0,Daily News Sentiment
count,101.0
mean,-0.198218
std,0.228173
min,-0.8
25%,-0.35
50%,-0.2
75%,-0.1
max,0.3


In [60]:
# Sentiment score over time; the constant 'Unit' column yields a single line.
plot_trend(news_sentiment, x='DateTime', y='Daily News Sentiment', legend='Unit')

# Data preparation