mirror of
https://github.com/internetarchive/brozzler.git
synced 2025-02-24 00:29:53 -05:00
skip .pdf
This commit is contained in:
parent
48681e2a93
commit
88223cee59
@@ -198,7 +198,7 @@ class BrozzlerWorker:
|
|||||||
self.logger.info("brozzling {}".format(page))
|
self.logger.info("brozzling {}".format(page))
|
||||||
ydl_fetches = None
|
ydl_fetches = None
|
||||||
outlinks = set()
|
outlinks = set()
|
||||||
if enable_youtube_dl:
|
if enable_youtube_dl and not page.url.lower().endswith(".pdf"):
|
||||||
try:
|
try:
|
||||||
ydl_fetches, outlinks = ydl.do_youtube_dl(self, site, page)
|
ydl_fetches, outlinks = ydl.do_youtube_dl(self, site, page)
|
||||||
except brozzler.ReachedLimit as e:
|
except brozzler.ReachedLimit as e:
|
||||||
|
Loading…
x
Reference in New Issue
Block a user