diff --git a/scrapeit/imdb.py b/scrapeit/imdb.py
index 628eed7..cb202f1 100644
--- a/scrapeit/imdb.py
+++ b/scrapeit/imdb.py
@@ -159,9 +159,9 @@ class IMDb:
             html_title = str(html_title[0])
             title = stripTags(html_title)
             title = re.sub('\(\d\d\d\d\)', '', title)
-            title = re.sub('\(TV\)', '', title)
-            title = re.sub('\(V\)', '', title)
-            title = re.sub('\(VG\)', '', title)
+            title = re.sub(r'\(\d\d\d\d/I\)', '', title)
+            for t in ('TV-Series', '(mini)', '(VG)', '(V)', '(TV)'):
+                title = title.replace(t, '')
         return title.strip()
 
     def parseYear(self):
@@ -174,6 +174,8 @@ class IMDb:
         if html_title:
             html_title = str(html_title[0])
             year = re.compile('(\d\d\d\d)').findall(html_title)
+            if not year:
+                year = re.compile('(\d\d\d\d/I)').findall(html_title)
             if year: year = year[0]
             else: year = ''
 