imdb: parse technical info
This commit is contained in:
parent
0b9a3966b0
commit
da38ba3839
1 changed files with 19 additions and 0 deletions
|
@ -90,6 +90,20 @@ def parse_aspectratio(value):
|
||||||
value = '.'.join(value.strip().split('.')[:2])
|
value = '.'.join(value.strip().split('.')[:2])
|
||||||
return value
|
return value
|
||||||
|
|
||||||
|
|
||||||
|
def technical(label):
    """Build the scraping spec for one row of the 'technical' page.

    The returned dict has the keys 'page', 're' and 'type'. 're' is a
    two-item list: a regular expression that captures the contents of the
    ``<td>`` cell following the ``<td class="label">`` cell whose text is
    *label*, and a callable that turns the captured text into a list of
    values.

    label -- text of the label cell to look for; it is interpolated into
             the regular expression unescaped, so regex metacharacters in
             it stay active.

    NOTE(review): how the spec is consumed (regex flags, fetching of the
    page) is decided by the parser class using it and is not visible here.
    """

    def split_values(data):
        # An empty or missing capture yields an empty list.
        if not data:
            return []
        # Values inside a cell are separated by <br>; runs of whitespace
        # inside each value are collapsed to a single space.
        return [
            re.sub(r'\s+', ' ', d.strip())
            for d in data.strip().split('<br>')
        ]

    return {
        'page': 'technical',
        're': [
            # Raw string: '\s' in a plain literal is an invalid escape
            # sequence and triggers a warning on current Python versions.
            r'<td class="label">\s*?%s\s*?</td>.*?<td>\s*?(.*?)\s*?</td>' % label,
            split_values,
        ],
        'type': 'list'
    }
|
||||||
|
|
||||||
|
|
||||||
'''
|
'''
|
||||||
'posterIds': {
|
'posterIds': {
|
||||||
'page': 'posters',
|
'page': 'posters',
|
||||||
|
@ -300,6 +314,11 @@ class Imdb(SiteParser):
|
||||||
],
|
],
|
||||||
'type': 'list'
|
'type': 'list'
|
||||||
},
|
},
|
||||||
|
'laboratory': technical('Laboratory'),
|
||||||
|
'camera': technical('Camera'),
|
||||||
|
'negative format': technical('Negative Format'),
|
||||||
|
'cinematographic process': technical('Cinematographic Process'),
|
||||||
|
'printed film format': technical('Printed Film Format'),
|
||||||
}
|
}
|
||||||
|
|
||||||
def read_url(self, url, timeout):
|
def read_url(self, url, timeout):
|
||||||
|
|
Loading…
Reference in a new issue