Skip to content

Commit

Permalink
Update scraper.py
Browse files Browse the repository at this point in the history
  • Loading branch information
Brandhunt committed Jan 26, 2020
1 parent 42daba4 commit acc7255
Showing 1 changed file with 4 additions and 4 deletions.
8 changes: 4 additions & 4 deletions scraper.py
@@ -436,15 +436,15 @@ def doesscrapeurlexist(scrapesitelist, scrapeurl):
#print(scrapsite['scrapefield']['priceselector'])
if scrapsite['scrapefield']['priceselector'].find('[multiple],') != -1:
scrapsite['scrapefield']['priceselector'].replace('[multiple],', '')
prod_price_elements = root.cssselect(scrapsite['scrapefield']['priceselector'])
prod_price_elements = prod_root.cssselect(scrapsite['scrapefield']['priceselector'])
for el in prod_price_elements:
if el is None:
continue
prod_price = prod_price + el.text + ' '
if prod_price != '':
prod_price = re.sub(r'([^a-zA-Z]\w+\%+)', '', prod_price)
else:
prod_price_elements = root.cssselect(scrapsite['scrapefield']['priceselector'])
prod_price_elements = prod_root.cssselect(scrapsite['scrapefield']['priceselector'])
if prod_price_elements:
for price_el in prod_price_elements:
if price_el.text is not None:
@@ -470,7 +470,7 @@ def doesscrapeurlexist(scrapesitelist, scrapeurl):
if scrapsite['scrapefield']['salespriceselector']:
try:
scrapsite['scrapefield']['salespriceselector'] = scrapsite['scrapefield']['salespriceselector'].encode().decode("unicode-escape")
prod_salesprice_elements = root.cssselect(scrapsite['scrapefield']['salespriceselector'])
prod_salesprice_elements = prod_root.cssselect(scrapsite['scrapefield']['salespriceselector'])
if prod_salesprice_elements:
if any(char.isdigit() for char in prod_salesprice_elements[0].text):
prod_salesprice = prod_salesprice_elements[0].text
@@ -656,7 +656,7 @@ def doesscrapeurlexist(scrapesitelist, scrapeurl):
try:
scrapsite['scrapefield']['imageselector'] = scrapsite['scrapefield']['imageselector'].encode().decode("unicode-escape")
#image_urls = ''
image_elements = root.cssselect(scrapsite['scrapefield']['imageselector'])
image_elements = prod_root.cssselect(scrapsite['scrapefield']['imageselector'])
if image_elements:
for i in range(len(image_elements)):
image_elements[i] = str(etree.tostring(image_elements[i]))
Expand Down

0 comments on commit acc7255

Please sign in to comment.