Import text, not HTML
This commit is contained in:
parent
97006b0b3e
commit
84c15c690a
3 changed files with 15 additions and 1 deletions
|
|
@ -24,3 +24,13 @@ def find_isbns(text):
|
|||
|
||||
def get_language(lang):
    """Map a language tag to the value returned by ``ox.iso.codeToLang``.

    Only the part of ``lang`` before the first ``-`` is passed to the
    lookup (e.g. ``'en'`` for ``'en-US'``). When the lookup result is
    falsy, the original ``lang`` argument is returned unchanged.
    """
    # Everything before the first hyphen; the whole string when there is none.
    primary_code = lang.split('-')[0]
    # NOTE(review): presumably returns a human-readable language name and a
    # falsy value for unknown codes -- confirm against the ox library.
    resolved = ox.iso.codeToLang(primary_code)
    if resolved:
        return resolved
    return lang
|
||||
|
||||
def decode_html_data(data):
    """Recursively run ``ox.decode_html`` over every string in ``data``.

    Handling by type:

    * ``dict`` -- each value is replaced in place by its processed form
      (keys are left untouched) and the same dict object is returned.
    * ``list`` -- a new list of processed items is returned; the input
      list itself is not modified.
    * ``str``  -- the result of ``ox.decode_html(data)`` is returned.
    * anything else is returned unchanged.
    """
    if isinstance(data, dict):
        # Only existing keys are reassigned, so the dict's size never
        # changes while it is being iterated.
        for field in data:
            data[field] = decode_html_data(data[field])
        return data
    if isinstance(data, list):
        return [decode_html_data(item) for item in data]
    if isinstance(data, str):
        # NOTE(review): presumably decodes HTML entities to plain text --
        # confirm against the ox library.
        return ox.decode_html(data)
    return data
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue