In [69]:
# https://splinter.readthedocs.io/en/latest/drivers/chrome.html
import os
from urllib.parse import urljoin

import pandas as pd
import pymongo
import requests
from bs4 import BeautifulSoup
from splinter import Browser

# ### NASA Mars News

* Scrape the [NASA Mars News Site](https://mars.nasa.gov/news/) and collect the latest News Title and Paragraph Text. Assign the text to variables that you can reference later.

```python
# Example:
news_title = "NASA's Next Mars Mission to Investigate Interior of Red Planet"

news_p = "Preparation of NASA's next spacecraft to Mars, InSight, has ramped up this summer, on course for launch next May from Vandenberg Air Force Base in central California -- the first interplanetary launch in history from America's West Coast."
```

In [70]:
# Open a client connection to the MongoDB server running on this machine
conn = 'mongodb://localhost:27017'
client = pymongo.MongoClient(host=conn)

In [71]:
# Pick the database and the collection that stores the scraped news
db = client["mars_db"]
collection = db["mars_news"]

In [74]:
# Start a visible Chrome window and load the NASA Mars news page
url = 'https://mars.nasa.gov/news/'
browser = Browser(driver_name='chrome', headless=False)
browser.visit(url)


In [76]:
# Capture the page source from the browser and parse it with BeautifulSoup
html = browser.html
soup = BeautifulSoup(markup=html, features='html.parser')

In [77]:
# Latest news title: text of the first <div class="content_title"> on the page
title = soup.find("div", attrs={"class": "content_title"}).get_text()
print(title)

NASA's Next Mars Lander Spreads its Solar Wings


In [78]:
# Teaser paragraph: text of the first <div class="article_teaser_body"> on the page
paragraph = soup.find("div", attrs={"class": "article_teaser_body"}).get_text()
print(paragraph)

NASA's next mission to Mars passed a key test Tuesday, extending the solar arrays that will power the InSight spacecraft once it lands on the Red Planet this November.


In [79]:
# Bundle the scraped headline and teaser into one document for MongoDB
news = {}
news["Latest News"] = title
news["Information"] = paragraph

news

{'Information': "NASA's next mission to Mars passed a key test Tuesday, extending the solar arrays that will power the InSight spacecraft once it lands on the Red Planet this November.",
 'Latest News': "NASA's Next Mars Lander Spreads its Solar Wings"}

In [80]:
# Store the news document through the collection handle defined earlier
collection.insert_one(news)

<pymongo.results.InsertOneResult at 0x2292d007e08>

In [88]:
# Display items in MongoDB collection
latest_news = db.mars_news.find()

# Use a dedicated loop variable so the notebook-level `news` dict is not
# rebound to the last document fetched from MongoDB.
for news_doc in latest_news:
    print(news_doc)

{'_id': ObjectId('5a6a85d4db82562e14f66102'), 'Latest News': "NASA's Next Mars Lander Spreads its Solar Wings", 'Information': "NASA's next mission to Mars passed a key test Tuesday, extending the solar arrays that will power the InSight spacecraft once it lands on the Red Planet this November."}


# ### JPL Mars Space Images - Featured Image
* Visit the url for JPL's Featured Space Image [here](https://www.jpl.nasa.gov/spaceimages/?search=&category=Mars).
* Use splinter to navigate the site and find the image url for the current Featured Mars Image and assign the url string to a variable called `featured_image_url`.
* Make sure to find the image url to the full size `.jpg` image.
* Make sure to save a complete url string for this image.

In [89]:
# Handle to the `mars_image` collection of the database
mars_image = db["mars_image"]

In [16]:
# Reuse the Chrome session that is already open instead of launching another
# window (each extra Browser() leaves a Chrome process that is never quit),
# then load the JPL space-images page filtered to Mars.
url = 'https://www.jpl.nasa.gov/spaceimages/?search=&category=Mars'
browser.visit(url)

In [17]:
# Follow the link whose text contains 'FULL IMAGE' on the page loaded above
browser.click_link_by_partial_text('FULL IMAGE')

In [18]:
# Follow the link whose text contains 'more info'
# (presumably the featured image's detail page — TODO confirm)
browser.click_link_by_partial_text('more info')

In [19]:
# XPath of the anchor inside the 7th <li> of the first <aside> under the
# element with id "secondary_column".
# NOTE(review): an earlier comment described this as the "Mars in natural
# color in 2007" image link — confirm it targets the intended image.
xpath = (
    '//*[@id="secondary_column"]'
    '/aside[1]/ul/li[7]/div/p/a'
)


In [20]:
# Find the elements matching the XPath and click the first match
# to bring up the full resolution image
results = browser.find_by_xpath(xpath)
img = results.first
img.click()

In [22]:
html = browser.html
soup = BeautifulSoup(html, 'html.parser')

# Take the first <img> on the current page; fail with a clear message when
# there is none instead of an opaque TypeError from subscripting None.
img_tag = soup.find("img")
if img_tag is None or not img_tag.get("src"):
    raise ValueError("No <img> with a src attribute found on " + browser.url)

# Resolve against the page address so a relative src still yields a complete
# URL; an already-absolute src is left as it is.
img_url = urljoin(browser.url, img_tag["src"])
featured_image_url = img_url  # variable name requested by the assignment text
img_url

'https://photojournal.jpl.nasa.gov/jpeg/PIA14924.jpg'

In [90]:
# Wrap the image URL in a document ready for insertion
image = {}
image["Featured Mars Image"] = img_url

In [91]:
# Store the featured-image document in the `mars_image` collection
db.mars_image.insert_one(image)

<pymongo.results.InsertOneResult at 0x2292cf18588>

# ### Mars Weather

* Visit the Mars Weather twitter account [here](https://twitter.com/marswxreport?lang=en) and scrape the latest Mars weather tweet from the page. Save the tweet text for the weather report as a variable called `mars_weather`.

```python
# Example:
mars_weather = 'Sol 1801 (Aug 30, 2017), Sunny, high -21C/-5F, low -80C/-112F, pressure at 8.82 hPa, daylight 06:09-17:55'
```

In [None]:
# Handle to the `mars_weather` collection of the database
mars_weather = db["mars_weather"]

In [92]:
# Reuse the Chrome session that is already open instead of launching another
# window (each extra Browser() leaves a Chrome process that is never quit),
# then load the Mars Weather Twitter page.
url = 'https://twitter.com/marswxreport?lang=en'
browser.visit(url)


In [24]:
# Capture the page source from the browser and parse it with BeautifulSoup
html = browser.html
soup = BeautifulSoup(markup=html, features='html.parser')

In [26]:
# Text of the first tweet container on the page. The container's text is
# wrapped in newlines, so strip them to keep only the tweet itself.
weather = soup.find("div", class_="js-tweet-text-container").text.strip()
print(weather)


Happy 14th anniversary @MarsRovers Opportunity, here’s to another 7.4 more (Mars years).  That’s a lot of kilometers (45 to be exact) behind you.pic.twitter.com/BvaE6rEZ9I



# ### Mars Facts

* Visit the Mars Facts webpage [here](http://space-facts.com/mars/) and use Pandas to scrape the table containing facts about the planet including Diameter, Mass, etc.

* Use Pandas to convert the data to a HTML table string.

In [27]:
# Reuse the Chrome session that is already open instead of launching another
# window (each extra Browser() leaves a Chrome process that is never quit),
# then load the Mars facts page.
url = 'https://space-facts.com/mars/'
browser.visit(url)

In [28]:
# Capture the page source from the browser and parse it with BeautifulSoup
html = browser.html
soup = BeautifulSoup(markup=html, features='html.parser')

In [32]:
# Locate the body of the facts table once; both results below are built from it.
facts_tbody = soup.find("table", class_="tablepress tablepress-id-mars").tbody

# Flattened text of every cell with newlines removed (kept as before).
table = facts_tbody.text.replace("\n","")
print(table)

# The flattened string loses the row/column boundaries, so also keep the
# structure: one list of cell strings per table row.
fact_rows = [
    [cell.get_text(strip=True) for cell in row.find_all(["th", "td"])]
    for row in facts_tbody.find_all("tr")
]

# HTML table string produced with pandas, without index or header rows.
mars_facts_html = pd.DataFrame(fact_rows).to_html(index=False, header=False)

Equatorial Diameter:6,792 kmPolar Diameter:6,752 kmMass:6.42 x 10^23 kg (10.7% Earth)Moons:2 (Phobos & Deimos)Orbit Distance:227,943,824 km (1.52 AU)Orbit Period:687 days (1.9 years)Surface Temperature: -153 to 20 °CFirst Record:2nd millennium BCRecorded By:Egyptian astronomers


# ### Mars Hemispheres

* Visit the USGS Astrogeology site [here](https://astrogeology.usgs.gov/search/results?q=hemisphere+enhanced&k1=target&v1=Mars) to obtain high resolution images for each of Mars's hemispheres.

* You will need to click each of the links to the hemispheres in order to find the image url to the full resolution image.

* Save both the image url string for the full resolution hemisphere image, and the Hemisphere title containing the hemisphere name. Use a Python dictionary to store the data using the keys `img_url` and `title`.

* Append the dictionary with the image url string and the hemisphere title to a list. This list will contain one dictionary for each hemisphere.

```python
# Example:
hemisphere_image_urls = [
    {"title": "Valles Marineris Hemisphere", "img_url": "..."},
    {"title": "Cerberus Hemisphere", "img_url": "..."},
    {"title": "Schiaparelli Hemisphere", "img_url": "..."},
    {"title": "Syrtis Major Hemisphere", "img_url": "..."},
]
```

In [65]:
# Link texts used to open each hemisphere page, in visiting order
hem_list = [
    "Cerberus",
    "Schiaparelli",
    "Syrtis Major",
    "Valles Marineris",
]

# XPath string and empty containers initialised for the hemisphere scrape
xpath1 = '//*[@id="wide-image"]/div/ul/li[1]/a'
hem_dic = {}
hem_tite = []
url_list = []

In [66]:
# Reuse the Chrome session that is already open instead of launching another
# window (each extra Browser() leaves a Chrome process that is never quit),
# then load the USGS hemisphere search results.
url = 'https://astrogeology.usgs.gov/search/results?q=hemisphere+enhanced&k1=target&v1=Mars'
browser.visit(url)

In [67]:
# Visit each hemisphere page, record its title and image link, then go back
# to the results list for the next one.
hemisphere_image_urls = []  # reset here so re-running the cell does not duplicate entries
for hem in hem_list:
    browser.click_link_by_partial_text(hem)
    html = browser.html
    soup = BeautifulSoup(html, 'html.parser')
    # href of the first link in the first list item of the "downloads" block
    img_url = soup.find("div", class_="downloads").ul.li.a["href"]
    # Text of the first <h2> in the page body is used as the title
    text = soup.body.find('h2').text
    # Rebound on every pass, so after the loop this holds the last hemisphere only
    hem_dic = {"Title": text,
               "Image URL": img_url}
    # Accumulate every hemisphere under the `title` / `img_url` keys that the
    # assignment text asks for, so earlier results are not lost.
    hemisphere_image_urls.append({"title": text, "img_url": img_url})
    browser.click_link_by_partial_text("Back")

In [68]:
# Shows a single hemisphere: the loop rebinds hem_dic on every iteration,
# so only the record from the final pass remains.
hem_dic

{'Image URL': 'http://astropedia.astrogeology.usgs.gov/download/Mars/Viking/valles_marineris_enhanced.tif/full.jpg',
 'Title': 'Valles Marineris Hemisphere Enhanced'}

In [64]:
# NOTE(review): the recorded output is a list of hemisphere titles, but the
# only visible assignment to `title` is the news-headline string — presumably
# leftover kernel state from a cell no longer in the notebook; confirm or remove.
title

['Cerberus Hemisphere Enhanced',
 'Schiaparelli Hemisphere Enhanced',
 'Syrtis Major Hemisphere Enhanced',
 'Valles Marineris Hemisphere Enhanced']