Only extract the numeric ID from Criterion film URLs
This commit is contained in:
parent
b3345523b4
commit
2050c9deae
1 changed file with 2 additions and 2 deletions
|
@ -75,13 +75,13 @@ def getIds():
|
||||||
def getIdsByPage(page):
    """Collect the Criterion film ids linked from one page of the DVD library.

    Fetches the library listing for ``page``, gathers the numeric ids found
    in ``films/<id>`` links, then follows every ``boxsets/<name>`` link found
    on that listing and gathers the film ids from each box set page as well.

    Args:
        page: Page number substituted into the listing URL with ``%s``.

    Returns:
        A set of the film id strings matched by ``films/(\\d+)``, with
        duplicates removed.
    """
    # Raw strings keep ``\d`` a regex escape instead of an (invalid) string
    # escape; both patterns are compiled once rather than per box set.
    film_id_pattern = re.compile(r"films/(\d+)")
    boxset_pattern = re.compile(r'boxsets/(.*?)"')

    listing_html = readUrlUnicode("http://www.criterion.com/library/dvd?page=%s" % page)
    ids = set(film_id_pattern.findall(listing_html))

    # Each box set link is followed so the films on its page are included too.
    # Distinct loop names avoid rebinding the sequence being iterated.
    for boxset in boxset_pattern.findall(listing_html):
        boxset_html = readUrlUnicode("http://www.criterion.com/boxsets/" + boxset)
        ids.update(film_id_pattern.findall(boxset_html))
    return ids
|
||||||
|
|
Loading…
Reference in a new issue