import text not html

This commit is contained in:
j 2016-01-08 15:52:07 +05:30
commit 84c15c690a
3 changed files with 15 additions and 1 deletion

View file

@@ -24,3 +24,13 @@ def find_isbns(text):
def get_language(lang):
    """Look up a language for the leading part of a language tag.

    Only the portion of ``lang`` before the first ``-`` is passed to
    ``ox.iso.codeToLang``. If that lookup yields a falsy result, the
    original ``lang`` value is returned unchanged.
    """
    primary_code = lang.split('-')[0]
    return ox.iso.codeToLang(primary_code) or lang
def decode_html_data(data):
    """Recursively run ``ox.decode_html`` over the strings nested in ``data``.

    * ``str`` values are passed through ``ox.decode_html``.
    * ``list`` values are rebuilt as a new list of processed items.
    * ``dict`` values are updated in place (values only; keys are left
      untouched) and the same dict object is returned.
    * Any other value is returned unchanged.
    """
    if isinstance(data, str):
        return ox.decode_html(data)
    if isinstance(data, list):
        return [decode_html_data(item) for item in data]
    if isinstance(data, dict):
        # Reassigning existing keys does not change the dict's size, so
        # updating values while iterating over the keys is safe.
        for key in data:
            data[key] = decode_html_data(data[key])
    return data