From 84dc6241c0c444b5147510cd65ffa9e2798c3025 Mon Sep 17 00:00:00 2001 From: j <0x006A@0x2620.org> Date: Thu, 12 Apr 2007 12:57:46 +0000 Subject: [PATCH] years --- scrapeit/imdb.py | 10 +++++++--- 1 file changed, 7 insertions(+), 3 deletions(-) diff --git a/scrapeit/imdb.py b/scrapeit/imdb.py index db063ae..395130a 100644 --- a/scrapeit/imdb.py +++ b/scrapeit/imdb.py @@ -164,9 +164,13 @@ class IMDb: IMDbDict['year'] = html_title[0][1] IMDbDict['title'] = stripTags(title).strip() else: - title = _getTerm(data, '(.*?)').split('(') - year = title[-1].split(')')[0].strip() - title = title[0].strip().decode('utf-8') + title = _getTerm(data, '(.*?)') + m = re.compile('\((\d+)\)').findall(title) + if m: + year = m[0] + else: + year = title.split('(')[-1].split(')')[0].strip() + title = title.split('(')[0].strip().decode('utf-8') IMDbDict['title'] = title IMDbDict['year'] = year IMDbDict['title'] = htmldecode(IMDbDict['title'])