impawards: every hour is all I want; kg should only allow imdbIds with digits, nothing else

2009-08-19 19:53:19 +02:00 · 2009-08-19 19:53:19 +02:00 · ddae01323a
commit ddae01323a
parent 0600d39198
2 changed files with 2 additions and 2 deletions
--- a/oxweb/impawards.py
+++ b/oxweb/impawards.py
@@ -55,7 +55,7 @@ def getId(url):

 def getIds():
    ids = []
-    html = getUrlUnicode('http://www.impawards.com/archives/latest.html', timeout = 0)
+    html = getUrlUnicode('http://www.impawards.com/archives/latest.html', timeout = 60*60)
    pages = int(findRe(html, '<a href= page(.*?).html>')) + 1
    for page in range(pages, 0, -1):
        for id in getIdsByPage(page):
--- a/oxweb/karagarga.py
+++ b/oxweb/karagarga.py
@@ -38,7 +38,7 @@ def getData(id):
        if string:
            data['genre'].append(string)
    data['id'] = id
-    data['imdbId'] = findRe(html, 'imdb.com/title/tt(.*?)/?"')
+    data['imdbId'] = findRe(html, 'imdb.com/title/tt(\d{7})')
    data['language'] = stripTags(parseTable(html, 'Language'))
    data['leechers'] = int(findRe(html, 'seeder\(s\), (.*?) leecher\(s\)'))
    data['link'] = stripTags(parseTable(html, 'Internet Link'))