diff --git a/ox/html.py b/ox/html.py
index 549e32f..7da078f 100644
--- a/ox/html.py
+++ b/ox/html.py
@@ -398,8 +398,5 @@ def sanitize_fragment(html):
     if not html:
         return u''
     import lxml.html
-    body = lxml.html.document_fromstring(html).find('body')
-    html = lxml.html.tostring(body, encoding='utf-8')[6:-7].decode('utf-8')
-    if html.startswith('<p>') and html.endswith('</p>'):
-        html = html[3:-4]
-    return html
+    html = lxml.html.fragment_fromstring(html, create_parent=False)
+    return lxml.html.tostring(html, encoding='utf-8').decode('utf-8')