mirror of
https://github.com/internetarchive/brozzler.git
synced 2025-02-24 08:39:59 -05:00
Correctly handle a site with no pages (which means the seed was blocked by robots.txt) in frontier.seed_page()
This commit is contained in:
parent
317a5eb99d
commit
c6e0e7c507
@ -313,6 +313,8 @@ class RethinkDbFrontier:
|
||||
if len(pages) > 1:
|
||||
self.logger.warn(
|
||||
"more than one seed page for site_id %s ?", site_id)
|
||||
if len(pages) < 1:
|
||||
return None
|
||||
return brozzler.Page(**pages[0])
|
||||
|
||||
def site_pages(self, site_id, unbrozzled_only=False):
|
||||
|
Loading…
x
Reference in New Issue
Block a user