And here's the main chunk of the code to get the URLs.
Thanks.
Code:
if __name__ == "__main__":
    # Script entry point: download a Yahoo search-results page, feed it to
    # URLLister (defined elsewhere in this file), then fetch every entry of
    # parser.urls and save each response body to its own numbered text file.
    import urllib

    usock = urllib.urlopen("http://uk.search.yahoo.com/search?p=cinemas+in+dublin&fr=yfp-t-501&ei=UTF-8&meta=vc%3D")
    try:
        parser = URLLister()
        parser.feed(usock.read())
        parser.close()
    finally:
        # Release the connection even if reading or parsing fails.
        usock.close()

    path = u"c:\\Users\\Neil\\Desktop\\"

    # enumerate() supplies both the index used in the file name and the URL
    # itself.  The original kept a manual counter that was never advanced, so
    # every pass re-downloaded parser.urls[0] and overwrote test0.txt; its
    # bounds guard (i <= len) was also off by one and is no longer needed.
    for i, url in enumerate(parser.urls):
        print(i)
        print(url)

        response = urllib.urlopen(url)
        try:
            page = response.read()
        finally:
            # The original never closed the per-URL response.
            response.close()

        f = open(path + u"test" + str(i) + u".txt", "w+")
        try:
            # Same output as `print >> f, page`: the body plus a newline.
            f.write(page)
            f.write("\n")
        finally:
            f.close()

        print("Html file successfully printed to file!")