use fragment_fromstring instead of document_fromstring

2014-02-04 10:40:01 +00:00 · 2014-02-04 10:40:01 +00:00 · 8bda86c17d
commit 8bda86c17d
parent 7577b319ce
1 changed file with 2 additions and 5 deletions
--- a/ox/html.py
+++ b/ox/html.py
@@ -398,8 +398,5 @@ def sanitize_fragment(html):
    if not html:
        return u''
    import lxml.html
-    body = lxml.html.document_fromstring(html).find('body')
-    html = lxml.html.tostring(body, encoding='utf-8')[6:-7].decode('utf-8')
-    if html.startswith('<p>') and html.endswith('</p>'):
-        html = html[3:-4]
-    return html
+    html = lxml.html.fragment_fromstring(html, create_parent=False)
+    return lxml.html.tostring(html, encoding='utf-8').decode('utf-8')