import re

def striptags(text):
    """Return *text* with every ``<...>`` span removed.

    A span starts at ``<`` and runs to the next ``>``; the characters in
    between (including newlines) are dropped along with the brackets.
    A ``<`` with no later ``>`` is left untouched.
    """
    tag_pattern = r'<[^>]*>'
    return re.sub(tag_pattern, '', text)

def go(m):
    """Pick the replacement text for a matched anchor.

    Returns the text captured by group 1 of match *m* (the ``.html``
    suffix, leaving the link with no anchor) when that group is
    non-empty; otherwise returns ``'#'``, i.e. a link to the top of
    the page.
    """
    suffix = m.group(1)
    if suffix:
        return suffix
    return '#'

def strip_toplevel_anchors(text):
    """Return *text* with ``#<name>-toplevel`` anchors removed.

    Each fragment of the form ``#<name>-toplevel`` (where ``<name>`` is
    made of word characters and hyphens), optionally preceded by
    ``.html``, is passed to ``go`` and replaced by whatever it returns.
    """
    anchor_pattern = r'(\.html)?#[-\w]+-toplevel'
    return re.sub(anchor_pattern, go, text)