blob: dc2e27245a292b320cfcd5ce573de55cc13b8bfa (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
|
import re
# Matches one markup tag: '<', any run of non-'>' characters, then '>'.
# Compiled once at import time instead of on every call.
_TAG_RE = re.compile(r'<[^>]*>')


def striptags(text: str) -> str:
    """Return *text* with every ``<...>`` tag removed.

    A tag is any span that starts with ``<`` and runs to the next ``>``.
    Text between tags is kept unchanged; a ``<`` with no following ``>``
    is not a tag and is left in place.
    """
    return _TAG_RE.sub('', text)
def go(m: "re.Match") -> str:
    """Return the replacement text for one regex match.

    Yields the text captured by group 1 when that group matched something;
    otherwise yields ``'#'``.
    """
    # .html with no anchor if present, otherwise "#" for top of page
    return m.group(1) or '#'
# Matches an optional ".html" (captured as group 1) followed by a fragment
# of the form "#<name>-toplevel", where <name> is one or more word
# characters or hyphens. Compiled once at import time.
_TOPLEVEL_ANCHOR_RE = re.compile(r'(\.html)?#[-\w]+-toplevel')


def strip_toplevel_anchors(text: str) -> str:
    """Return *text* with every ``#<name>-toplevel`` fragment removed.

    Each match is replaced by whatever ``go`` returns for it: the captured
    ``.html`` when the fragment directly follows one, otherwise ``'#'``.
    """
    return _TOPLEVEL_ANCHOR_RE.sub(go, text)
|