mirror of
https://github.com/internetarchive/brozzler.git
synced 2025-02-24 00:29:53 -05:00
WT-2950 fix typos
This commit is contained in:
parent
6fdc2b9a57
commit
12db06ae8c
@ -329,7 +329,7 @@ class BrozzlerWorker:
|
||||
|
||||
def _is_pdf(self, page_headers) -> bool:
|
||||
"""
|
||||
Determinse if the page's Content-Type header specifies that it is a PDF.
|
||||
Determines if the page's Content-Type header specifies that it is a PDF.
|
||||
"""
|
||||
return (
|
||||
"content-type" in page_headers
|
||||
|
@ -117,7 +117,7 @@ seeds starving out other jobs.
|
||||
Limits capture to PDFs based on MIME type. This value will only impact
|
||||
processing of outlinks within Brozzler. Fully limiting a crawl to only PDFs
|
||||
requires an additional entry in the Warcprox-Meta header ``mime-type-filters``
|
||||
key to fully block videos by MIME type.
|
||||
key.
|
||||
|
||||
``seeds``
|
||||
~~~~~~~~~
|
||||
|
Loading…
x
Reference in New Issue
Block a user