import HTMLParser, urllib
class linkParser(HTMLParser.HTMLParser):
def __init__(self):
HTMLParser.HTMLParser.__init__(self)
self.links = []
def handle_starttag(self, tag, attrs):
if tag=='a':
self.links.append(dict(attrs)['href'])
htmlSource = urllib.urlopen("http://www.sharejs.com").read(200000)
p = linkParser()
p.feed(htmlSource)
for link in p.links:
print link
#//python/207