import HTMLParser
class TMP(HTMLParser.HTMLParser):
    """Debugging HTML parser that prints an indented trace of a document.

    Every start tag, end tag and text node fed to the parser is printed on
    its own line, indented with one tab per nesting level.

    Attributes:
        level: Current nesting depth (0 outside of any element).
        links: ``href`` values of the ``<a>`` tags seen so far, in document
            order.  An ``href`` written without a value is stored as None.
    """

    # Not referenced inside this class; kept in case other code reads them.
    INI = 0
    DIV = 1
    OTH = 2

    # Void elements never have an end tag.  Counting them as an open level
    # would push the indentation deeper after every <br>, <img>, <meta>, ...
    # The parser hands tag names over in lower case.
    _VOID_TAGS = frozenset((
        'area', 'base', 'br', 'col', 'embed', 'hr', 'img', 'input',
        'link', 'meta', 'param', 'source', 'track', 'wbr',
    ))

    def __init__(self):
        # Explicit base-class call: the Python 2 HTMLParser is an old-style
        # class, so super() cannot be used here.
        HTMLParser.HTMLParser.__init__(self)
        self.level = 0
        self.links = []

    def handle_starttag(self, tag, attrs):
        """Print the opening tag with its attributes and descend one level.

        Args:
            tag: Tag name as reported by the parser.
            attrs: List of ``(name, value)`` attribute pairs.
        """
        attrs = dict(attrs)
        if tag == 'a' and 'href' in attrs:
            self.links.append(attrs['href'])
        if tag in self._VOID_TAGS:
            # Printed one level deep like any child, but nothing is opened.
            depth = self.level + 1
        else:
            self.level += 1
            depth = self.level
        print('%s%r: %r' % ('\t' * depth, tag, attrs))

    def handle_endtag(self, tag):
        """Print the closing tag and climb back up one level.

        Args:
            tag: Tag name as reported by the parser.
        """
        if tag in self._VOID_TAGS:
            # Reached for self-closing forms such as <br/>; the matching
            # start tag did not change the level, so neither does this.
            print('%sclose tag: %r' % ('\t' * (self.level + 1), tag))
            return
        print('%sclose tag: %r' % ('\t' * self.level, tag))
        self.level -= 1

    def handle_data(self, data):
        """Print a text node, indented one level below its parent element.

        Args:
            data: The text between tags.
        """
        print('%sdata: %r' % ('\t' * (self.level + 1), data))
import mechanize
def show_site(url):
    """Fetch *url*, print its response headers and an indented tag trace.

    Args:
        url: Address of the page to open.

    Returns:
        The list of links collected by the TMP parser, or an empty list
        when the parser does not expose a ``links`` attribute.
    """
    browser = mechanize.Browser()
    response = browser.open(url)
    try:
        print(response.info())
        parser = TMP()
        parser.feed(response.read())
    finally:
        # Release the connection even if printing or parsing fails.
        response.close()
    # Always hand back an iterable so callers can filter or loop over it.
    return getattr(parser, 'links', [])
# Ask for a URL, dump the page, and keep only the non-empty results.
# Guard against show_site() returning None, which filter() cannot iterate.
a = filter(None, show_site(raw_input('url? ')) or [])