diff --git a/ox/criterion.py b/ox/criterion.py index 5062503..3e6e653 100644 --- a/ox/criterion.py +++ b/ox/criterion.py @@ -6,6 +6,10 @@ from oxutils.html import stripTags from oxutils.text import findRe def getPosterUrl(title, director): + # imdb module is currently broken + ''' + imdbId = imdb.getMovieId(title, director) + ''' html = getUrl('http://criterion.com/asp/list.asp?sort=spine') strings = findRe(html, '(.*?)
').split('') strings.pop(0) @@ -14,13 +18,10 @@ def getPosterUrl(title, director): criterionTitle = findRe(string, 'class="title">(.*?)') criterionTitle = re.sub('(?<=\\w)
(?=\\w)', ' / ', criterionTitle) criterionTitle = criterionTitle.replace('
', '') - criteriondirector = stripTags(findRe(string, '.*?(.*?)')).strip() - print '%s %s (%s)' % (criterionId, criterionTitle, criterionDirector) - # imdb module is currently broken + criterionDirector = stripTags(findRe(string, '.*?(.*?)')).strip() + print '%s: %s (%s)' % (criterionId, criterionTitle, criterionDirector) ''' - imdbId = imdb.getMovieId(title, director) - imdbData = imdb.getMovieData(imdbId) - if imdbData['title'] == title and imdbData['director'] == director: + if imdb.getMovieId(criterionTitle, criterionDirector) == imdbId: return 'http://criterion.com/content/images/full_boxshot/%s_box_348x490.jpg' % criterionId ''' return '' @@ -29,4 +30,4 @@ def test(): return if __name__ == '__main__': - getPosterUrl('Le Mepris', 'Jean-Luc Godard') \ No newline at end of file + getPosterUrl('Le mepris', 'Jean-Luc Godard') \ No newline at end of file diff --git a/ox/imdb.py b/ox/imdb.py index e1d9c67..78b84b7 100644 --- a/ox/imdb.py +++ b/ox/imdb.py @@ -25,7 +25,6 @@ def getMovieId(title, director='', year=''): query = 'site:imdb.com %s "%s"' % (director, title) else: query = 'site:imdb.com "%s"' % title - print google.find(query, 3) for (name, url, desc) in google.find(query, 3): if url.startswith('http://www.imdb.com/title/tt'): return url[28:35]