Default to 3 retry_attempts and a 5-minute request timeout

This commit is contained in:
James Turk 2011-09-20 16:07:24 -04:00
parent c31faa3fb7
commit 376d27a8ff
2 changed files with 11 additions and 8 deletions

View File

@@ -49,11 +49,9 @@ class Client(object):
requests_per_minute=rpm,
follow_robots=False,
raise_errors=True,
timeout=timeout,
# disable scrapelib's retries
retry_attempts=0,
retry_wait_seconds=0,
)
timeout=timeout)
self.retry_attempts = retry_attempts
self.retry_wait_minutes = retry_wait_minutes
@@ -136,7 +134,10 @@ class Client(object):
if error:
c_errors = doc.get('consecutive_errors', 0)
doc['consecutive_errors'] = c_errors + 1
if c_errors <= self.retry_attempts:
update_mins = self.retry_wait_minutes * (2**c_errors)
else:
update_mins = doc['update_mins']
else:
doc['consecutive_errors'] = 0
update_mins = doc['update_mins']

View File

@@ -7,6 +7,8 @@ MONGO_LOG_MAXSIZE = 100000000
# scrapelib
USER_AGENT = 'oyster'
REQUESTS_PER_MINUTE = 300
REQUEST_TIMEOUT = 0
RETRY_ATTEMPTS = 0
REQUEST_TIMEOUT = 300
# other
RETRY_ATTEMPTS = 3
RETRY_WAIT_MINUTES = 60