try:
    from urllib.request import urlopen as ureq  # Python 3
except ImportError:
    from urllib2 import urlopen as ureq  # Python 2 fallback

import bs4
from bs4 import BeautifulSoup as soup
# Newegg listing page to scrape (taken verbatim from the original script).
url = 'https://www.newegg.com/Xbox-One-Video-Games/SubCategory/ID-3218?Tid=21799&cm_sp=Cat_Xbox-One_2--VisNav--Xbox-One-Games'
# Destination CSV file; the original defined this name but opened a
# differently spelled hard-coded path instead.
filename = 'products.csv'
# Header line written once at the top of the CSV.
headers = 'brand, product_name'


def format_row(brand, product_name):
    """Return one newline-terminated CSV line for a product.

    Commas inside either field are replaced with ``|`` so they cannot be
    mistaken for the column separator.
    """
    return brand.replace(",", "|") + "," + product_name.replace(",", "|") + "\n"


def write_products(products, out):
    """Write the header line followed by one row per product to *out*.

    ``products`` is an iterable of ``(brand, product_name)`` pairs and
    ``out`` is any object with a ``write`` method (an open text file).
    """
    out.write(headers + "\n")
    for brand, product_name in products:
        out.write(format_row(brand, product_name))


def extract_product(container):
    """Return ``(brand, product_name)`` for one item container.

    Returns ``None`` when the container has no ``a.item-title`` link.
    When the nested brand image is missing, the brand is an empty string
    so that one odd item does not abort the whole run.
    """
    try:
        brand = container.div.div.a.img["title"]
    except (AttributeError, TypeError, KeyError):
        # Some part of the div > div > a > img chain (or its title) is absent.
        brand = ""

    # find() returns a single tag (or None), not a list.
    title_container = container.find("a", {"class": "item-title"})
    if title_container is None:
        return None
    return brand, title_container.text.strip()


def main():
    """Download the listing page, print each product and save them as CSV."""
    my_url = ureq(url)
    try:
        page_html = my_url.read()
    finally:
        # Release the connection even if the read fails.
        my_url.close()

    page_soup = soup(page_html, "html.parser")
    print(page_soup.h1)

    containers = page_soup.findAll("div", {"class": "item-container"})
    products = []
    for container in containers:
        product = extract_product(container)
        if product is None:
            continue
        brand, product_name = product
        print("brand:" + brand)
        print("product_name:" + product_name)
        products.append(product)

    # The context manager guarantees the file is flushed and closed.
    with open(filename, "w") as f:
        write_products(products, f)


if __name__ == "__main__":
    main()