Log the size of received batches from pushshift.

master
Ethan Dalool 2020-09-06 21:41:44 -07:00
parent 83d5a8e70e
commit e136aeea4e
1 changed files with 2 additions and 0 deletions

View File

@ -109,6 +109,7 @@ def _pagination_core(url, params, dummy_type, lower=None, upper=None):
setify = lambda items: set(item['id'] for item in items)
prev_batch_ids = set()
while True:
for retry in range(5):
try:
@ -120,6 +121,7 @@ def _pagination_core(url, params, dummy_type, lower=None, upper=None):
else:
break
common.log.debug('Got batch of %d items.', len(batch))
batch_ids = setify(batch)
if len(batch_ids) == 0 or batch_ids.issubset(prev_batch_ids):
break