Add bodystart and bodyend comments to removal list.

This commit is contained in:
Ethan Dalool 2020-01-26 15:01:06 -08:00
parent 205bbf61a2
commit aa19d49ffc

View file

@@ -77,6 +77,8 @@ def remove_header_br(html):
@html_cleaner
def remove_misc_strings(html):
    """Strip assorted leftover markers from the HTML text.

    Removes, in order: the epub pagebreak attribute, the BodyStart and
    BodyEnd comments, and title attributes whose value consists solely of
    the lowercase letters i, v, x or solely of digits.

    Returns the text with every such occurrence deleted.
    """
    # Exact substrings that are deleted wherever they appear.
    literal_junk = (
        'epub:type="pagebreak"',
        '<!-- BodyStart-->',
        '<!-- BodyEnd-->',
    )
    # Patterns are applied one after another, after the literal removals.
    title_patterns = (
        r'title="[ivx]+"',
        r'title="\d+"',
    )

    for junk in literal_junk:
        html = html.replace(junk, '')
    for pattern in title_patterns:
        html = re.sub(pattern, '', html)
    return html