diff --git a/ox/html.py b/ox/html.py
index bae9bd9..8f30609 100644
--- a/ox/html.py
+++ b/ox/html.py
@@ -318,5 +318,7 @@ def sanitize_fragment(html):
     '''
     import lxml.html
     body = lxml.html.document_fromstring(html).find('body')
-    return lxml.html.tostring(body, encoding='utf-8')[6:-7].decode('utf-8')
-
+    html = lxml.html.tostring(body, encoding='utf-8')[6:-7].decode('utf-8')
+    if html.startswith('<p>') and html.endswith('</p>'):
+        html = html[3:-4]
+    return html