diff --git a/ox/html.py b/ox/html.py index bae9bd9..8f30609 100644 --- a/ox/html.py +++ b/ox/html.py @@ -318,5 +318,7 @@ def sanitize_fragment(html): ''' import lxml.html body = lxml.html.document_fromstring(html).find('body') - return lxml.html.tostring(body, encoding='utf-8')[6:-7].decode('utf-8') - + html = lxml.html.tostring(body, encoding='utf-8')[6:-7].decode('utf-8') + if html.startswith('<p>') and html.endswith('</p>'): + html = html[3:-4] + return html