|
|
@ -86,6 +86,8 @@ def clean_up(html): |
|
|
|
""" |
|
|
|
html = re.sub(r'\[.*edit.*\]', '', html) # remove the [edit] |
|
|
|
html = re.sub(r'href="/book/index.php\?title=', 'href="#', html) # remove the internal wiki links |
|
|
|
html = re.sub(r'[(?=\d)', '', html) # remove left footnote bracket [ |
|
|
|
html = re.sub(r'(?<=\d)]', '', html) # remove right footnote bracket ] |
|
|
|
return html |
|
|
|
|
|
|
|
def parse_page(pagename, wiki): |
|
|
|