Update stored film counts only after the index has been updated

This commit is contained in:
j 2019-08-05 19:42:08 +02:00
parent d47f1c6a61
commit ccff7572d0

View file

@ -66,6 +66,7 @@ def get_film_count(year, month=None, day=None):
total = re.compile('<span>([\d,]+) titles.</span>', re.DOTALL).findall(data)
if total:
return int(total[0].replace(',', ''))
if year > 1900:
print('no movies', url)
ox.web.imdb.delete_url(url)
return 0
@ -83,24 +84,23 @@ def print_info(key, film_count, film_counts):
extra = ''
print('update', key, 'now has', film_count, 'films', extra)
def update_year(year, film_counts):
key = '%s' % year
if film_counts[key] > MAX_PER_RANGE:
def update_year(year, year_count, film_counts):
if year_count > MAX_PER_RANGE:
for month in range(1, 13):
key = '%04d-%02d' % (year, month)
film_count = get_film_count(year, month)
if film_count != film_counts.get(key):
print_info(key, film_count, film_counts)
update_month(year, month, film_count, film_counts)
film_counts[key] = film_count
update_month(year, month, film_counts)
else:
r = update_ids(year)
film_counts['%s' % year] = year_count
save_film_counts(film_counts)
def update_month(year, month, film_counts):
def update_month(year, month, month_count, film_counts):
key = '%04d-%02d' % (year, month)
if film_counts[key] > MAX_PER_RANGE:
month_total = film_counts[key]
if month_count > MAX_PER_RANGE:
days_total = 0
days = calendar.monthrange(year, month)[1]
for day in range(1, days + 1):
@ -109,13 +109,15 @@ def update_month(year, month, film_counts):
days_total += film_count
if film_count != film_counts.get(key):
print_info(key, film_count, film_counts)
film_counts[key] = film_count
r = update_ids(year, month, day, expected=film_count)
film_counts[key] = film_count
save_film_counts(film_counts)
if days_total != month_total:
if days_total != month_count:
print('!! month and days don\'t add up: %s month vs %s days total' % (month_total, days_total))
else:
r = update_ids(year, month)
key = '%04d-%02d' % (year, month)
film_counts[key] = month_count
save_film_counts(film_counts)
def parse_cast(string):
@ -263,8 +265,7 @@ def update_index(from_year=None):
key = '%s' % year
if film_count != film_counts.get(key):
print_info(key, film_count, film_counts)
film_counts[key] = film_count
update_year(year, film_counts)
update_year(year, film_count, film_counts)
save_film_counts(film_counts)
def get_unknown_ids(known_ids):