In [1]:
from bs4 import BeautifulSoup
import pandas as pd
import time
from splinter import Browser
import requests

In [2]:
# Start a visible (non-headless) Chrome session through the local chromedriver binary.
# NOTE(review): the driver path is machine-specific; adjust it if chromedriver lives elsewhere.
executable_path = dict(executable_path='/usr/local/bin/chromedriver')
browser = Browser('chrome', headless=False, **executable_path)

# NASA Mars News

In [3]:
# Point the automated browser at the NASA Mars news listing
news_url = "https://mars.nasa.gov/news/"
browser.visit(news_url)

In [4]:
# Poll (for up to 10 s) until the first article block is in the DOM instead of
# sleeping a fixed interval: a fixed sleep is either wasted time or too short
# when the page is slow. The selector matches the element read by the next cell.
# NOTE(review): the article list appears to be rendered client-side — confirm.
browser.is_element_present_by_css('div.list_text', wait_time=10)

# Assign the HTML content of the page to a variable
news_html = browser.html

# Parse HTML with Beautifulsoup
soup = BeautifulSoup(news_html, 'html.parser')

In [5]:
# Pull the headline and teaser out of the first article block on the page
# (find() returns the first match, which the page lists as the latest story).
latest_article = soup.find('div', class_="list_text")

news_title = latest_article.a.get_text()
teaser_block = latest_article.find('div', class_="article_teaser_body")
news_p = teaser_block.get_text()

print(f"news_title: {news_title}")
print(f"news_p: {news_p}")

news_title: NASA's Mars Rover Drivers Need Your Help
news_p: Using an online tool to label Martian terrain types, you can train an artificial intelligence algorithm that could improve the way engineers guide the Curiosity rover.


# JPL Mars Space Images - Featured Image

In [6]:
# Open the JPL space-images gallery filtered to the Mars category
img_url = "https://www.jpl.nasa.gov/spaceimages/?search=&category=Mars"
browser.visit(img_url)

In [7]:
# Pause briefly so the page can finish loading before it is read
time.sleep(4)

# Snapshot the browser's current DOM and parse it with BeautifulSoup
imgs_html = browser.html
soup = BeautifulSoup(markup=imgs_html, features='html.parser')

In [8]:
# Find the image url for the current Featured Mars Image
img_result = soup.find('article', class_="carousel_item")['style']

# The style attribute looks like "background-image: url('/path/to/image.jpg');".
# Take whatever sits between "url(" and the next ")" and trim quotes/spaces, so a
# change in quote style or spacing cannot silently leave CSS residue in the URL.
url_and_rest = img_result.partition("url(")[2]
if not url_and_rest:
    raise ValueError(f"No url(...) found in carousel style attribute: {img_result!r}")

img_url = url_and_rest.partition(")")[0].strip("'\" ")
featured_image_url = f"https://www.jpl.nasa.gov{img_url}"

print(featured_image_url)

https://www.jpl.nasa.gov/spaceimages/images/wallpaper/PIA18273-1920x1200.jpg


# Mars Weather

In [9]:
# Open the Mars weather report Twitter timeline
weather_url = "https://twitter.com/marswxreport?lang=en"
browser.visit(weather_url)

In [10]:
# Pause briefly so the timeline can finish loading before it is read
time.sleep(4)

# Snapshot the browser's current DOM and parse it with BeautifulSoup
weather_html = browser.html
soup = BeautifulSoup(markup=weather_html, features='html.parser')

In [11]:
# NOTE(review): these are auto-generated Twitter class names and will likely
# change over time — confirm the selector still matches before relying on it.
span_class = "css-901oao css-16my406 r-1qd0xha r-ad9z0x r-bcqeeo r-qvutc0"
results = soup.body.find_all("span", class_=span_class)

# Retrieve the latest Mars weather tweet from the page: the first span whose
# text mentions "InSight". Defaulting to None means a re-run can never pick up
# a stale value from an earlier execution, and later cells never hit a NameError.
mars_weather = next(
    (span.text for span in results if "InSight" in span.text),
    None,
)

if mars_weather is not None:
    print(mars_weather)
else:
    print("No InSight weather tweet found on the page.")

InSight sol 549 (2020-06-12) low -91.8ºC (-133.3ºF) high -1.5ºC (29.3ºF)
winds from the SW at 4.5 m/s (10.1 mph) gusting to 18.2 m/s (40.6 mph)
pressure at 7.40 hPa


# Mars Facts

In [12]:
# Load the Mars facts page in the browser
facts_url = "https://space-facts.com/mars/"
browser.visit(facts_url)

# read_html is handed the URL (not browser.html), so pandas fetches the page
# itself and returns one DataFrame per <table>; the first one is used here.
facts_tables = pd.read_html(facts_url)
facts_df = facts_tables[0]
facts_df.columns = ["Description", "Value"]

# Index by the fact name and display the result
idx_df = facts_df.set_index("Description")
idx_df

Unnamed: 0_level_0,Value
Description,Unnamed: 1_level_1
Equatorial Diameter:,"6,792 km"
Polar Diameter:,"6,752 km"
Mass:,6.39 × 10^23 kg (0.11 Earths)
Moons:,2 (Phobos & Deimos)
Orbit Distance:,"227,943,824 km (1.38 AU)"
Orbit Period:,687 days (1.9 years)
Surface Temperature:,-87 to -5 °C
First Record:,2nd millennium BC
Recorded By:,Egyptian astronomers


In [13]:
## Export to a HTML file
# DataFrame.to_html returns None when it is given a path, which left mars_df
# empty. Render to a string first so mars_df actually holds the table markup,
# then write that string to disk.
mars_df = idx_df.to_html(border="1", justify="left")

# UTF-8 with newline="" so the file is written without newline translation
with open("table.html", "w", encoding="utf-8", newline="") as table_file:
    table_file.write(mars_df)

# Mars Hemispheres

In [14]:
# Open the USGS Astrogeology search results for the enhanced Mars hemisphere images
hemisphere_url = "https://astrogeology.usgs.gov/search/results?q=hemisphere+enhanced&k1=target&v1=Mars"
browser.visit(hemisphere_url)

In [15]:
# Pause briefly so the results page can finish loading before it is read
time.sleep(4)

# Snapshot the browser's current DOM and parse it with BeautifulSoup
hemisphere_html = browser.html
soup = BeautifulSoup(markup=hemisphere_html, features='html.parser')

In [16]:
# Build the absolute detail-page URL for every hemisphere in the search results.
# Each result is a <div class="item"> whose "itemLink" anchor holds a
# site-relative href, so the site root is prefixed to it.
main_url = "https://astrogeology.usgs.gov"
items = soup.find_all("div", class_="item")

hemisphere_urls = [
    f"{main_url}{entry.find('a', class_='itemLink')['href']}"
    for entry in items
]

print("\n".join(hemisphere_urls))

https://astrogeology.usgs.gov/search/map/Mars/Viking/cerberus_enhanced
https://astrogeology.usgs.gov/search/map/Mars/Viking/schiaparelli_enhanced
https://astrogeology.usgs.gov/search/map/Mars/Viking/syrtis_major_enhanced
https://astrogeology.usgs.gov/search/map/Mars/Viking/valles_marineris_enhanced


In [17]:
# Create a list to store one {"title", "img_url"} record per hemisphere
hemisphere_image_urls = []

# Loop through each hemisphere detail page
for url in hemisphere_urls:
    # Navigate to the page
    browser.visit(url)

    # Poll (for up to 10 s) until the full-size image is in the DOM, rather than
    # sleeping a fixed 4 s on every page whether or not it is already loaded.
    browser.is_element_present_by_css('img.wide-image', wait_time=10)

    # Assign the HTML content of the page to a variable
    hemisphere_html = browser.html
    # Parse HTML with Beautifulsoup
    soup = BeautifulSoup(hemisphere_html, 'html.parser')

    img_tag = soup.find('img', class_="wide-image")
    title_tag = soup.find('h2', class_="title")
    if img_tag is None or title_tag is None:
        # Fail with the offending URL instead of an opaque NoneType error
        raise RuntimeError(f"Could not find the image or title on {url}")

    img_url = img_tag['src']
    title = title_tag.text

    # The src is site-relative; reuse main_url (the same root used to build
    # hemisphere_urls) rather than repeating the literal.
    hemisphere_image_urls.append({"title": title, "img_url": f"{main_url}{img_url}"})

In [18]:
# Display the collected list of {"title", "img_url"} records, one per hemisphere page visited
hemisphere_image_urls

[{'title': 'Cerberus Hemisphere Enhanced',
  'img_url': 'https://astrogeology.usgs.gov/cache/images/f5e372a36edfa389625da6d0cc25d905_cerberus_enhanced.tif_full.jpg'},
 {'title': 'Schiaparelli Hemisphere Enhanced',
  'img_url': 'https://astrogeology.usgs.gov/cache/images/3778f7b43bbbc89d6e3cfabb3613ba93_schiaparelli_enhanced.tif_full.jpg'},
 {'title': 'Syrtis Major Hemisphere Enhanced',
  'img_url': 'https://astrogeology.usgs.gov/cache/images/555e6403a6ddd7ba16ddb0e471cadcf7_syrtis_major_enhanced.tif_full.jpg'},
 {'title': 'Valles Marineris Hemisphere Enhanced',
  'img_url': 'https://astrogeology.usgs.gov/cache/images/b3c7c6c9138f57b4756be9b9c43e3a48_valles_marineris_enhanced.tif_full.jpg'}]

In [19]:
# Shut down the browser session that was opened at the top of the notebook
browser.quit()