update count after index was updated
This commit is contained in:
parent
d47f1c6a61
commit
ccff7572d0
1 changed file with 16 additions and 15 deletions
|
@ -66,6 +66,7 @@ def get_film_count(year, month=None, day=None):
|
|||
total = re.compile('<span>([\d,]+) titles.</span>', re.DOTALL).findall(data)
|
||||
if total:
|
||||
return int(total[0].replace(',', ''))
|
||||
if year > 1900:
|
||||
print('no movies', url)
|
||||
ox.web.imdb.delete_url(url)
|
||||
return 0
|
||||
|
@ -83,24 +84,23 @@ def print_info(key, film_count, film_counts):
|
|||
extra = ''
|
||||
print('update', key, 'now has', film_count, 'films', extra)
|
||||
|
||||
def update_year(year, film_counts):
|
||||
key = '%s' % year
|
||||
if film_counts[key] > MAX_PER_RANGE:
|
||||
def update_year(year, year_count, film_counts):
|
||||
if year_count > MAX_PER_RANGE:
|
||||
for month in range(1, 13):
|
||||
key = '%04d-%02d' % (year, month)
|
||||
film_count = get_film_count(year, month)
|
||||
if film_count != film_counts.get(key):
|
||||
print_info(key, film_count, film_counts)
|
||||
update_month(year, month, film_count, film_counts)
|
||||
film_counts[key] = film_count
|
||||
update_month(year, month, film_counts)
|
||||
else:
|
||||
r = update_ids(year)
|
||||
film_counts['%s' % year] = year_count
|
||||
save_film_counts(film_counts)
|
||||
|
||||
def update_month(year, month, film_counts):
|
||||
def update_month(year, month, month_count, film_counts):
|
||||
key = '%04d-%02d' % (year, month)
|
||||
if film_counts[key] > MAX_PER_RANGE:
|
||||
month_total = film_counts[key]
|
||||
if month_count > MAX_PER_RANGE:
|
||||
days_total = 0
|
||||
days = calendar.monthrange(year, month)[1]
|
||||
for day in range(1, days + 1):
|
||||
|
@ -109,13 +109,15 @@ def update_month(year, month, film_counts):
|
|||
days_total += film_count
|
||||
if film_count != film_counts.get(key):
|
||||
print_info(key, film_count, film_counts)
|
||||
film_counts[key] = film_count
|
||||
r = update_ids(year, month, day, expected=film_count)
|
||||
film_counts[key] = film_count
|
||||
save_film_counts(film_counts)
|
||||
if days_total != month_total:
|
||||
if days_total != month_count:
|
||||
print('!! month and days don\'t add up: %s month vs %s days total' % (month_total, days_total))
|
||||
else:
|
||||
r = update_ids(year, month)
|
||||
key = '%04d-%02d' % (year, month)
|
||||
film_counts[key] = month_count
|
||||
save_film_counts(film_counts)
|
||||
|
||||
def parse_cast(string):
|
||||
|
@ -263,8 +265,7 @@ def update_index(from_year=None):
|
|||
key = '%s' % year
|
||||
if film_count != film_counts.get(key):
|
||||
print_info(key, film_count, film_counts)
|
||||
film_counts[key] = film_count
|
||||
update_year(year, film_counts)
|
||||
update_year(year, film_count, film_counts)
|
||||
save_film_counts(film_counts)
|
||||
|
||||
def get_unknown_ids(known_ids):
|
||||
|
|
Loading…
Reference in a new issue