Skip to content

Commit

Permalink
Update scraper.py
Browse files (browse the repository at this point in the history)
  • Loading branch information
Brandhunt committed Jan 26, 2020
1 parent 96ff6ed commit 021ca27
Showing 1 changed file with 3 additions and 2 deletions.
5 changes: 3 additions & 2 deletions scraper.py
Expand Up @@ -348,8 +348,9 @@ def doesscrapeurlexist(scrapesitelist, scrapeurl):
if matches:
prod_url = matches[0]
if prod_url is None or prod_url == '':
- print(prod_url_html)
- matches = re.search(r'href\=\"\K(.*?)\"', prod_url_html)
+ #print(prod_url_html)
+ #matches = re.search(r'href\=\"\K(.*?)\"', prod_url_html)
+ matches = re.search(r'href\=\"(.*?)\"', prod_url_html)
prod_url = matches[1]
new_prod_url = urljoin(scrapsite['scrapeurl'], prod_url)
if prod_url != new_prod_url:
Expand Down

0 comments on commit 021ca27

Please sign in to comment.