diff --git a/ox/web/criterion.py b/ox/web/criterion.py index 6b3ac8c..2d5aa86 100644 --- a/ox/web/criterion.py +++ b/ox/web/criterion.py @@ -82,12 +82,12 @@ def get_ids(page=None): ids = [] if page: url = "http://www.criterion.com/library/expanded_view?m=dvd&p=%s&pp=50&s=spine" % page - html = read_url(url) + html = read_url(url, unicode=True) results = re.compile("films/(\d+)").findall(html) ids += results results = re.compile("boxsets/(.*?)\"").findall(html) for result in results: - html = read_url("http://www.criterion.com/boxsets/" + result) + html = read_url("http://www.criterion.com/boxsets/" + result, unicode=True) results = re.compile("films/(\d+)").findall(html) ids += results return set(ids)