# -*- coding: utf-8 -*-
"""
Scrape the comments of a YouTube video and save them to a CSV file.

The script opens the video page in Chrome through Selenium, scrolls the page
so that the comment section gets a chance to load, collects the author name
and the text of every comment element found, and writes them to a CSV file
with the columns ``Author`` and ``Comment``.

Created on Tue Jul 21 16:55:39 2020

@author: hp
"""

from selenium import webdriver
from selenium.webdriver.common.by import By
import csv
import time

# Collected rows; each entry is a dict with the keys 'Author' and 'Comment'.
items = []

# NOTE(review): the chromedriver path is passed positionally, exactly as in
# the original script; confirm this matches the installed Selenium version.
driver = webdriver.Chrome(r"C:/Users/hp/Anaconda3/chromedriver.exe")

try:
    driver.get('https://www.youtube.com/watch?v=iFPMz36std4')

    # Scroll a little so the page starts loading the comment section.
    driver.execute_script('window.scrollTo(1, 500);')

    # Now wait to let the comments load.
    time.sleep(5)

    # Scroll further down the page.
    # NOTE(review): the elements are collected right after this scroll with no
    # additional wait, so content triggered by it may not be present yet.
    driver.execute_script('window.scrollTo(1, 3000);')

    # find_elements(By.XPATH, ...) replaces the deprecated
    # find_elements_by_xpath helper.
    username_elems = driver.find_elements(By.XPATH, '//*[@id="author-text"]')
    comment_elems = driver.find_elements(By.XPATH, '//*[@id="content-text"]')

    # Read the element text while the browser session is still open.
    # zip() pairs authors and comments positionally and stops at the shorter
    # of the two lists.
    for username, comment in zip(username_elems, comment_elems):
        items.append({'Author': username.text, 'Comment': comment.text})
finally:
    # Always close the browser and stop the driver, even if scraping failed.
    driver.quit()

filename = 'C:/Users/hp/Desktop/commentlist.csv'
# newline='' lets the csv module control line endings itself.
with open(filename, 'w', newline='', encoding='utf-8') as f:
    w = csv.DictWriter(f, ['Author', 'Comment'])
    w.writeheader()
    w.writerows(items)