In [1]:
# https://splinter.readthedocs.io/en/latest/drivers/chrome.html
from splinter import Browser
from bs4 import BeautifulSoup
import pymongo
import requests
import os
import pandas as pd

# ### NASA Mars News

* Scrape the [NASA Mars News Site](https://mars.nasa.gov/news/) and collect the latest News Title and Paragraph Text. Assign the text to variables that you can reference later.

```python
# Example:
news_title = "NASA's Next Mars Mission to Investigate Interior of Red Planet"

news_p = "Preparation of NASA's next spacecraft to Mars, InSight, has ramped up this summer, on course for launch next May from Vandenberg Air Force Base in central California -- the first interplanetary launch in history from America's West Coast."
```

In [7]:
# Launch a visible (non-headless) Chrome window through splinter and load
# the NASA Mars News page.
url = 'https://mars.nasa.gov/news/'
browser = Browser('chrome', headless=False)
browser.visit(url)


In [8]:
# Snapshot the page source currently held by the browser and parse it with
# the 'html.parser' backend so the news elements can be searched.
html = browser.html
soup = BeautifulSoup(html, features='html.parser')

In [13]:
# Latest news title: the link text inside the first "content_title" div.
# Kept in `title` so later cells can reference it.
headline_div = soup.find("div", class_="content_title")
title = headline_div.a.text
title


"NASA's Next Mars Lander Spreads its Solar Wings"

In [15]:
# Teaser paragraph: text of the first "article_teaser_body" div.
teaser_div = soup.find("div", class_="article_teaser_body")
paragraph = teaser_div.text
paragraph

"NASA's next mission to Mars passed a key test Tuesday, extending the solar arrays that will power the InSight spacecraft once it lands on the Red Planet this November."

In [16]:
# Results dictionary that the following sections keep adding to.
# Start it with the news headline and its teaser text.
mars = {}
mars["Latest News"] = title
mars["Information"] = paragraph


# ### JPL Mars Space Images - Featured Image
* Visit the url for JPL's Featured Space Image [here](https://www.jpl.nasa.gov/spaceimages/?search=&category=Mars).
* Use splinter to navigate the site and find the image url for the current Featured Mars Image and assign the url string to a variable called `featured_image_url`.
* Make sure to find the image url to the full size `.jpg` image.
* Make sure to save a complete url string for this image.

In [17]:
# Reuse the Chrome session opened for the news scrape instead of launching a
# second window: rebinding `browser` to a new Browser would leave the
# previous window open with nothing left referring to it.
url = 'https://www.jpl.nasa.gov/spaceimages/?search=&category=Mars'
browser.visit(url)

In [18]:
# Click the link whose text contains 'FULL IMAGE' (the featured-image button).
browser.click_link_by_partial_text('FULL IMAGE')

In [19]:
# Follow the link whose text contains 'more info'
# (presumably leads to the image's detail page; confirm against the live site).
browser.click_link_by_partial_text('more info')

In [20]:
# Follow the link whose text contains '.jpg' to reach the full-size image file.
browser.click_link_by_partial_text('.jpg')

In [21]:
# Parse whatever page the browser ended up on after the clicks above and take
# the `src` attribute of the first <img> tag as the featured image URL.
html = browser.html
soup = BeautifulSoup(html, features='html.parser')
img_url = soup.img['src']


In [22]:
# Record the featured image URL in the results dictionary.
mars["Feature Photo"] = img_url

# ### Mars Weather

* Visit the Mars Weather twitter account [here](https://twitter.com/marswxreport?lang=en) and scrape the latest Mars weather tweet from the page. Save the tweet text for the weather report as a variable called `mars_weather`.

```python
# Example:
mars_weather = 'Sol 1801 (Aug 30, 2017), Sunny, high -21C/-5F, low -80C/-112F, pressure at 8.82 hPa, daylight 06:09-17:55'
```

In [39]:
# Reuse the Chrome session that is already open instead of launching another
# window: rebinding `browser` to a new Browser would leave the previous
# window open with nothing left referring to it.
url = 'https://twitter.com/marswxreport?lang=en'
browser.visit(url)


In [40]:
# Snapshot the page source currently held by the browser and parse it with
# the 'html.parser' backend so the tweet elements can be searched.
html = browser.html
soup = BeautifulSoup(html, features='html.parser')

In [41]:
# Latest weather tweet: text of the first "js-tweet-text-container" div,
# with leading and trailing whitespace removed.
tweet_div = soup.find("div", class_="js-tweet-text-container")
weather = tweet_div.text.strip()
print(weather)

Sol 1945 (Jan 25, 2018), Sunny, high -22C/-7F, low -78C/-108F, pressure at 7.51 hPa, daylight 05:43-17:28


In [26]:
# Record the weather tweet text in the results dictionary.
mars["Current Weather"] = weather

# ### Mars Facts

* Visit the Mars Facts webpage [here](http://space-facts.com/mars/) and use Pandas to scrape the table containing facts about the planet including Diameter, Mass, etc.

* Use Pandas to convert the data to an HTML table string.

In [27]:
# Reuse the Chrome session that is already open instead of launching another
# window: rebinding `browser` to a new Browser would leave the previous
# window open with nothing left referring to it.
# `url` is also what pandas reads the facts table from in a later cell.
url = 'https://space-facts.com/mars/'
browser.visit(url)

In [28]:
# Snapshot the page source currently held by the browser and parse it with
# the 'html.parser' backend.
html = browser.html
soup = BeautifulSoup(html, features='html.parser')

In [29]:
# Let pandas fetch `url` itself and parse the HTML tables it finds.
# The result is a list of DataFrames, which the next cell indexes into.
table = pd.read_html(url)


In [30]:
# Take the first table parsed from the page
# (assumed to be the Mars facts table; confirm if the page layout changes).
table_df = pd.DataFrame(table[0])


In [31]:
# Give the two columns descriptive names.
table_df.columns = ["Stat", "Value"]
# set_index returns a new frame that is only displayed here; it is not
# assigned back, so table_df keeps "Stat" as a regular column.
table_df.set_index("Stat")

Unnamed: 0_level_0,Value
Stat,Unnamed: 1_level_1
Equatorial Diameter:,"6,792 km"
Polar Diameter:,"6,752 km"
Mass:,6.42 x 10^23 kg (10.7% Earth)
Moons:,2 (Phobos & Deimos)
Orbit Distance:,"227,943,824 km (1.52 AU)"
Orbit Period:,687 days (1.9 years)
Surface Temperature:,-153 to 20 °C
First Record:,2nd millennium BC
Recorded By:,Egyptian astronomers


In [32]:
# Pull the two columns out of the facts table as separate Series:
# the fact labels and their corresponding values.
fact_list = table_df["Stat"]
value_list = table_df["Value"]


In [47]:
# Fact labels with every space removed, e.g. "Orbit Distance:" -> "OrbitDistance:".
slim_facts = [label.replace(" ", "") for label in fact_list]
    

In [33]:
# Pair each fact label with its value.
# Materialized as a list because a bare zip object is a one-shot iterator:
# once a cell has looped over it, re-running that cell would silently add
# nothing. A list can be iterated any number of times.
fact_value = list(zip(fact_list, value_list))

<zip object at 0x0000022453DC9BC8>


In [34]:
# Add every (label, value) pair from the facts table to the results dictionary.
mars.update(fact_value)


# ### Mars Hemispheres

* Visit the USGS Astrogeology site [here](https://astrogeology.usgs.gov/search/results?q=hemisphere+enhanced&k1=target&v1=Mars) to obtain high resolution images for each of Mars's hemispheres.

* You will need to click each of the links to the hemispheres in order to find the image url to the full resolution image.

* Save both the image url string for the full resolution hemisphere image, and the Hemisphere title containing the hemisphere name. Use a Python dictionary to store the data using the keys `img_url` and `title`.

* Append the dictionary with the image url string and the hemisphere title to a list. This list will contain one dictionary for each hemisphere.

# # Example:
hemisphere_image_urls = [
    {"title": "Valles Marineris Hemisphere", "img_url": "..."},
    {"title": "Cerberus Hemisphere", "img_url": "..."},
    {"title": "Schiaparelli Hemisphere", "img_url": "..."},
    {"title": "Syrtis Major Hemisphere", "img_url": "..."},
]

In [None]:
# Hemisphere names, used as partial link text when clicking through the
# search results page.
hem_list = [
    "Cerberus",
    "Schiaparelli",
    "Syrtis Major",
    "Valles Marineris",
]
# XPath to the <a> inside the first <li> under the element with id "wide-image".
# NOTE(review): not referenced by any cell visible here; confirm it is still needed.
xpath1 = '//*[@id="wide-image"]/div/ul/li[1]/a'
# Accumulators filled by the scraping loop: image URLs and page titles.
url_list, hem_title = [], []


In [None]:
# Reuse the Chrome session that is already open instead of launching another
# window: rebinding `browser` to a new Browser would leave the previous
# window open with nothing left referring to it.
url = 'https://astrogeology.usgs.gov/search/results?q=hemisphere+enhanced&k1=target&v1=Mars'
browser.visit(url)

In [None]:
# Visit each hemisphere's detail page in turn and record its title and the
# href of the first link in the "downloads" list.
# The accumulators are rebuilt here so that re-running this cell does not
# append duplicate entries.
hem_title = []
url_list = []
for hem in hem_list:
    # Open the detail page via the link whose text contains the hemisphere name.
    browser.click_link_by_partial_text(hem)
    html = browser.html
    soup = BeautifulSoup(html, 'html.parser')
    # First link in the "downloads" list (presumably the full-resolution
    # image; confirm against the live page). A dedicated name is used so the
    # featured-image `img_url` from the JPL section is not overwritten.
    hem_img_url = soup.find("div", class_="downloads").ul.li.a["href"]
    # The page title is taken from the first <h2> in the body.
    text = soup.body.find('h2').text
    hem_title.append(text)
    url_list.append(hem_img_url)
    # Return to the results page through the browser history rather than
    # relying on a link labelled "Back" being present on the detail page.
    browser.back()
    
    
    
    
    

In [None]:
# Pair each hemisphere title with its image URL.
# Materialized as a list because a bare zip object is a one-shot iterator:
# once a cell has looped over it, re-running that cell would silently add
# nothing. A list can be iterated any number of times.
hem_url = list(zip(hem_title, url_list))

In [None]:
# Add one entry per hemisphere (title -> image URL) to the results dictionary.
# Distinct loop names are used so the notebook-level `title` (news headline)
# and `url` (last visited page) are not overwritten by the loop variables.
for hem_name, hem_img in hem_url:
    mars[hem_name] = hem_img
    


In [37]:
# Display everything collected in the results dictionary so far.
mars

{'Current Weather': '\nSol 1945 (Jan 25, 2018), Sunny, high -22C/-7F, low -78C/-108F, pressure at 7.51 hPa, daylight 05:43-17:28\n',
 'Equatorial Diameter:': '6,792 km',
 'Feature Photo': 'https://photojournal.jpl.nasa.gov/jpeg/PIA16837.jpg',
 'First Record:': '2nd millennium BC',
 'Information': "NASA's next mission to Mars passed a key test Tuesday, extending the solar arrays that will power the InSight spacecraft once it lands on the Red Planet this November.",
 'Latest News': "NASA's Next Mars Lander Spreads its Solar Wings",
 'Mass:': '6.42 x 10^23 kg (10.7% Earth)',
 'Moons:': '2 (Phobos & Deimos)',
 'Orbit Distance:': '227,943,824 km (1.52 AU)',
 'Orbit Period:': '687 days (1.9 years)',
 'Polar Diameter:': '6,752 km',
 'Recorded By:': 'Egyptian astronomers',
 'Surface Temperature:': '-153 to 20 °C'}