LXML HTML Parsing Usage Example


from lxml.html import fromstring

# Extract product names and result URLs from locally saved HTML pages.
#
# Input:  files named "0" .. "999" in the current working directory, each
#         parsed as an HTML document.
# Output: one record per page appended to "result_urls":
#             Product Name: <value of every `tr input` element, one per line>
#             URLS:
#             <href of every `h3 a` element, one per line>
#
# A missing input file still raises and stops the run, as before.
with open("result_urls", "a+") as f:
    for x in range(0, 1000):
        # Close each page as soon as it has been read instead of leaving up
        # to 1000 file handles for the garbage collector to reclaim.
        with open(str(x)) as page:
            mySearchTree = fromstring(page.read())

        f.write("Product Name: ")
        for a in mySearchTree.cssselect('tr input'):
            # get() returns None for a missing attribute, which write()
            # rejects with TypeError; fall back to an empty string so one
            # attribute-less element does not abort the whole run.
            f.write(a.get('value', ''))  # product_name
            f.write("\n")

        f.write("URLS:")
        f.write("\n")
        for a in mySearchTree.cssselect('h3 a'):
            f.write(a.get('href', ''))  # url
            f.write("\n")

        # Flush per page so results gathered so far survive a later failure.
        f.flush()

Leave a comment