cast and genre cleanup
This commit is contained in:
parent
ef49aae822
commit
f3eaf4404f
1 changed file with 4 additions and 2 deletions
|
@@ -84,7 +84,8 @@ def getMovieInfo(imdbId, timeout=-1):
|
||||||
for i in re.compile('<h5>(.*?):</h5>(.*?)<div class="info"', re.DOTALL).findall(data):
|
for i in re.compile('<h5>(.*?):</h5>(.*?)<div class="info"', re.DOTALL).findall(data):
|
||||||
title = stripTags(i[0]).strip().lower()
|
title = stripTags(i[0]).strip().lower()
|
||||||
if title in ('genre', ):
|
if title in ('genre', ):
|
||||||
txt = i[1].split('</div>')[0]
|
txt = i[1].split('<a class="tn15more')[0].split('</div>')[0]
|
||||||
|
print txt
|
||||||
else:
|
else:
|
||||||
txt= i[1]
|
txt= i[1]
|
||||||
txt = stripTags(txt).strip()
|
txt = stripTags(txt).strip()
|
||||||
|
@@ -277,7 +278,8 @@ def getMovieCredits(imdbId):
|
||||||
data = readUrlUnicode(url)
|
data = readUrlUnicode(url)
|
||||||
groups = data.split('<h5>')
|
groups = data.split('<h5>')
|
||||||
for g in groups:
|
for g in groups:
|
||||||
section = re.compile('''name="(.*?)".*? href="/Glossary''').findall(g)
|
#<a class="glossary" name="writers" href="/glossary/W#writer">Writing credits</a>
|
||||||
|
section = re.compile('''name="(.*?)".*? href="/Glossary''', re.IGNORECASE).findall(g)
|
||||||
if section:
|
if section:
|
||||||
credits[section[0]] = creditList(g, section[0])
|
credits[section[0]] = creditList(g, section[0])
|
||||||
return credits
|
return credits
|
||||||
|
|
Loading…
Reference in a new issue