mirror of
https://github.com/internetarchive/brozzler.git
synced 2025-06-08 07:03:06 -04:00
use nlevitt fork of surt library for less stupid handling of mailto: urls, etc
This commit is contained in:
parent
ee50818dca
commit
231d019659
2 changed files with 2 additions and 2 deletions
|
@@ -44,7 +44,7 @@ def is_permitted_by_robots(site, url):
|
||||||
raise e.args[0]
|
raise e.args[0]
|
||||||
else:
|
else:
|
||||||
if tries_left > 0:
|
if tries_left > 0:
|
||||||
logging.warn("caught exception %s fetching robots.txt (%s tries left) for %s", repr(e), tries_left, url)
|
logging.warn("caught exception fetching robots.txt (%s tries left) for %s: %s", tries_left, url, repr(e))
|
||||||
tries_left -= 1
|
tries_left -= 1
|
||||||
else:
|
else:
|
||||||
logging.error("caught exception fetching robots.txt (0 tries left) for %s: %s", url, repr(e), exc_info=True)
|
logging.error("caught exception fetching robots.txt (0 tries left) for %s: %s", url, repr(e), exc_info=True)
|
||||||
|
|
|
@@ -1,6 +1,6 @@
|
||||||
argparse
|
argparse
|
||||||
PyYAML
|
PyYAML
|
||||||
git+https://github.com/ikreymer/surt.git@py3
|
git+https://github.com/nlevitt/surt.git@py3
|
||||||
# youtube_dl
|
# youtube_dl
|
||||||
git+https://github.com/nlevitt/youtube-dl.git@brozzler
|
git+https://github.com/nlevitt/youtube-dl.git@brozzler
|
||||||
git+https://github.com/seomoz/reppy.git
|
git+https://github.com/seomoz/reppy.git
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue