From 2ad0c0b499ea505b105c1fc6c65c4a0c57b0820e Mon Sep 17 00:00:00 2001 From: j Date: Tue, 25 Sep 2018 10:24:27 +0200 Subject: [PATCH] fix year parsing, ref #3168 --- ox/web/imdb.py | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/ox/web/imdb.py b/ox/web/imdb.py index 6c5ae90..e310c88 100644 --- a/ox/web/imdb.py +++ b/ox/web/imdb.py @@ -285,7 +285,10 @@ class Imdb(SiteParser): 'writer': reference_section('writers'), 'year': { 'page': 'reference', - 're': '(\d+)', + 're': [ + '(.*?)', + '(\d+)[- ]*<', + ], 'type': 'int' }, 'credits': { @@ -444,7 +447,7 @@ class Imdb(SiteParser): if 'year' in series: self['seriesYear'] = series['year'] - if not 'year' in self: + if 'year' not in self: self['year'] = series['year'] if 'year' in self: