def __init__(self):
    """Set up parser state, then run the base ``HTMLParser`` initializer.

    Attributes created here:
        data: an initially empty ``set``.
        href: an integer initialised to ``0``.
        patt: compiled regex matching strings of the form ``?p=<digits>``,
            anchored at both ends.
    """
    # NOTE(review): presumably ``data`` collects matched link targets and
    # ``href`` tracks whether the parser is inside a link -- the handlers
    # are not visible here, so confirm against them.
    self.data = set()
    self.href = 0
    self.patt = re.compile(r'^\?p=\d+$')
    # Kept last, and as an explicit base-class call, to preserve the
    # original order: the base initializer calls reset(), which a subclass
    # override could expect to run after the attributes above exist.
    HTMLParser.__init__(self)