In [4]:
from splinter import Browser
from bs4 import BeautifulSoup
import requests
import pymongo
import pandas as pd
import re
from selenium import webdriver

### NASA Mars News

* Scrape the [NASA Mars News Site](https://mars.nasa.gov/news/) and collect the latest News Title and Paragraph Text. Assign the text to variables that you can reference later.

```python
# Example:
news_title = "NASA's Next Mars Mission to Investigate Interior of Red Planet"

news_p = "Preparation of NASA's next spacecraft to Mars, InSight, has ramped up this summer, on course for launch next May from Vandenberg Air Force Base in central California -- the first interplanetary launch in history from America's West Coast."

In [11]:
url = 'https://mars.nasa.gov/news'

In [12]:
executable_path = {'executable_path':'chromedriver.exe'}

browser = Browser('chrome', **executable_path, headless = False)

browser.visit(url)

soup = BeautifulSoup(browser.html, 'lxml')

In [13]:
latest_article_text = soup.find('div', class_ = 'article_teaser_body').text
latest_article_title = soup.find('div', class_ = 'content_title').a.text

In [14]:
latest_article_text

"One month since increasing their commanding frequency, engineers have yet to hear from NASA's Opportunity rover."

### JPL Mars Space Images - Featured Image

* Visit the url for JPL Featured Space Image [here](https://www.jpl.nasa.gov/spaceimages/?search=&category=Mars).

* Use splinter to navigate the site and find the image url for the current Featured Mars Image and assign the url string to a variable called `featured_image_url`.

* Make sure to find the image url to the full size `.jpg` image.

* Make sure to save a complete url string for this image.


In [47]:
executable_path = {'executable_path':'chromedriver.exe'}

browser = Browser('chrome', **executable_path, headless = False)

url = 'https://www.jpl.nasa.gov/spaceimages/?search=&category=Mars'

browser.visit(url)

html = browser.html

soup = BeautifulSoup(html, 'html.parser')

string = soup.find('article', class_ = 'carousel_item')['style']

string_split = string.split('\'')

featured_image_url = 'https://www.jpl.nasa.gov/' + string_split[1]

print(featured_image_url)

browser.visit(featured_image_url)

https://www.jpl.nasa.gov//spaceimages/images/wallpaper/PIA18816-1920x1200.jpg


### Mars Weather

* Visit the Mars Weather twitter account [here](https://twitter.com/marswxreport?lang=en) and scrape the latest Mars weather tweet from the page. Save the tweet text for the weather report as a variable called `mars_weather`.


In [10]:
url = 'https://twitter.com/marswxreport?lang=en'

In [11]:
response = requests.get(url)

In [12]:
soup = BeautifulSoup(response.text, 'lxml')

In [13]:
tweets = soup.find_all('p', class_='TweetTextSize TweetTextSize--normal js-tweet-text tweet-text')

for tweet in tweets:
    if 'Sol' in tweet.text:
        mars_weather = tweet.text
        break
        

### Mars Facts

* Visit the Mars Facts webpage [here](http://space-facts.com/mars/) and use Pandas to scrape the table containing facts about the planet including Diameter, Mass, etc.

* Use Pandas to convert the data to a HTML table string.

In [14]:
url = 'https://space-facts.com/mars/'

In [15]:
df = pd.read_html(url)

In [16]:
df[0].to_html()

'<table border="1" class="dataframe">\n  <thead>\n    <tr style="text-align: right;">\n      <th></th>\n      <th>0</th>\n      <th>1</th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>0</th>\n      <td>Equatorial Diameter:</td>\n      <td>6,792 km</td>\n    </tr>\n    <tr>\n      <th>1</th>\n      <td>Polar Diameter:</td>\n      <td>6,752 km</td>\n    </tr>\n    <tr>\n      <th>2</th>\n      <td>Mass:</td>\n      <td>6.42 x 10^23 kg (10.7% Earth)</td>\n    </tr>\n    <tr>\n      <th>3</th>\n      <td>Moons:</td>\n      <td>2 (Phobos &amp; Deimos)</td>\n    </tr>\n    <tr>\n      <th>4</th>\n      <td>Orbit Distance:</td>\n      <td>227,943,824 km (1.52 AU)</td>\n    </tr>\n    <tr>\n      <th>5</th>\n      <td>Orbit Period:</td>\n      <td>687 days (1.9 years)</td>\n    </tr>\n    <tr>\n      <th>6</th>\n      <td>Surface Temperature:</td>\n      <td>-153 to 20 °C</td>\n    </tr>\n    <tr>\n      <th>7</th>\n      <td>First Record:</td>\n      <td>2nd millennium BC</td>\n    

### Mars Hemispheres

* Visit the USGS Astrogeology site [here](https://astrogeology.usgs.gov/search/results?q=hemisphere+enhanced&k1=target&v1=Mars) to obtain high resolution images for each of Mar's hemispheres.

* You will need to click each of the links to the hemispheres in order to find the image url to the full resolution image.

* Save both the image url string for the full resolution hemisphere image, and the Hemisphere title containing the hemisphere name. Use a Python dictionary to store the data using the keys `img_url` and `title`.

* Append the dictionary with the image url string and the hemisphere title to a list. This list will contain one dictionary for each hemisphere.

In [66]:
url4 = 'https://astrogeology.usgs.gov/search/results?q=hemisphere+enhanced&k1=target&v1=Mars'

browser = Browser('chrome', **executable_path, headless = False)

browser.visit(url4)

In [67]:
html = browser.html

big_soup = BeautifulSoup(html, 'html.parser')

links = big_soup.find_all('h3')

hemispheres = []

for link in links :
    browser.click_link_by_partial_text(link.text)
    img_dict = {}
    lil_soup = BeautifulSoup(browser.html, 'html.parser')
    img_dict['img_url'] = lil_soup.find('a', text = re.compile('Original'))["href"]
    img_dict['title'] = link.text
    hemispheres.append(img_dict)
    browser.click_link_by_partial_text('Back')

[{'img_url': 'http://astropedia.astrogeology.usgs.gov/download/Mars/Viking/cerberus_enhanced.tif',
  'title': 'Cerberus Hemisphere Enhanced'},
 {'img_url': 'http://astropedia.astrogeology.usgs.gov/download/Mars/Viking/schiaparelli_enhanced.tif',
  'title': 'Schiaparelli Hemisphere Enhanced'},
 {'img_url': 'http://astropedia.astrogeology.usgs.gov/download/Mars/Viking/syrtis_major_enhanced.tif',
  'title': 'Syrtis Major Hemisphere Enhanced'},
 {'img_url': 'http://astropedia.astrogeology.usgs.gov/download/Mars/Viking/valles_marineris_enhanced.tif',
  'title': 'Valles Marineris Hemisphere Enhanced'}]