mirror of
https://github.com/unitedstates/congress.git
synced 2025-12-25 01:00:04 -05:00
update scrapelib to 0.10, remove non-backwards-compatible follow_robots arg.
This commit is contained in:
@@ -37,7 +37,7 @@ else:
|
||||
eastern_time_zone = timezone('US/Eastern')
|
||||
|
||||
# scraper should be instantiated at class-load time, so that it can rate limit appropriately
|
||||
scraper = scrapelib.Scraper(requests_per_minute=120, follow_robots=False, retry_attempts=3)
|
||||
scraper = scrapelib.Scraper(requests_per_minute=120, retry_attempts=3)
|
||||
scraper.user_agent = "unitedstates/congress (https://github.com/unitedstates/congress)"
|
||||
|
||||
|
||||
|
||||
Reference in New Issue
Block a user