Revert change: fragment_fromstring only parses a single element
This commit is contained in:
parent
8bda86c17d
commit
34691832eb
1 changed file with 5 additions and 2 deletions
|
@@ -398,5 +398,8 @@ def sanitize_fragment(html):
|
|||
if not html:
|
||||
return u''
|
||||
import lxml.html
|
||||
html = lxml.html.fragment_fromstring(html, create_parent=False)
|
||||
return lxml.html.tostring(html, encoding='utf-8').decode('utf-8')
|
||||
body = lxml.html.document_fromstring(html).find('body')
|
||||
html = lxml.html.tostring(body, encoding='utf-8')[6:-7].decode('utf-8')
|
||||
if html.startswith('<p>') and html.endswith('</p>'):
|
||||
html = html[3:-4]
|
||||
return html
|
||||
|
|
Loading…
Reference in a new issue