mirror of
https://github.com/internetarchive/brozzler.git
synced 2025-08-11 16:00:38 -04:00
fix behaviors.yaml, switch simpledo behavior to jinja2 template
This commit is contained in:
parent
3851daa27d
commit
01f5343b48
2 changed files with 88 additions and 88 deletions
|
@ -17,85 +17,88 @@
|
||||||
#
|
#
|
||||||
|
|
||||||
# first matched behavior is used, so order matters here
|
# first matched behavior is used, so order matters here
|
||||||
behaviors:
|
-
|
||||||
-
|
|
||||||
url_regex: '^https?://(?:www\.)?facebook\.com/.*$'
|
url_regex: '^https?://(?:www\.)?facebook\.com/.*$'
|
||||||
behavior_js_template: facebook.js.template
|
behavior_js_template: facebook.js
|
||||||
# default_parameters:
|
|
||||||
# parameter_username: jdoe@example.com
|
|
||||||
# parameter_password: abcd1234
|
|
||||||
request_idle_timeout_sec: 30
|
request_idle_timeout_sec: 30
|
||||||
-
|
-
|
||||||
url_regex: '^https?://(?:www\.)?marquette\.edu/.*$'
|
url_regex: '^https?://(?:www\.)?marquette\.edu/.*$'
|
||||||
behavior_js: marquette_edu.js
|
behavior_js_template: marquette_edu.js
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
-
|
-
|
||||||
url_regex: '^https?://(?:www\.)?vimeo\.com/.*$'
|
url_regex: '^https?://(?:www\.)?vimeo\.com/.*$'
|
||||||
behavior_js: vimeo.js
|
behavior_js_template: vimeo.js
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
-
|
-
|
||||||
url_regex: '^https?://(?:www\.)?psu24.psu.edu/.*$'
|
url_regex: '^https?://(?:www\.)?psu24.psu.edu/.*$'
|
||||||
behavior_js: psu24.js
|
behavior_js_template: psu24.js
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
-
|
-
|
||||||
url_regex: '^https?://(?:www\.)?instagram\.com/.*$'
|
url_regex: '^https?://(?:www\.)?instagram\.com/.*$'
|
||||||
behavior_js: instagram.js
|
behavior_js_template: instagram.js
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
-
|
-
|
||||||
url_regex: '^https?://(?:www\.)?brooklynmuseum\.org/exhibitions/.*$'
|
url_regex: '^https?://(?:www\.)?brooklynmuseum\.org/exhibitions/.*$'
|
||||||
behavior_js_template: simpleclicks.js.template
|
behavior_js_template: simpleclicks.js.j2
|
||||||
default_parameters:
|
default_parameters:
|
||||||
click_css_selector: img.img-responsive
|
click_css_selector: img.img-responsive
|
||||||
|
click_until_hard_timeout: False
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
- # acalog https://webarchive.jira.com/browse/ARI-3775
|
- # acalog https://webarchive.jira.com/browse/ARI-3775
|
||||||
url_regex: '^https?://.*[?&]catoid=[^?]*$'
|
url_regex: '^https?://.*[?&]catoid=[^?]*$'
|
||||||
behavior_js_template: simpleclicks.js.template
|
behavior_js_template: simpleclicks.js.j2
|
||||||
default_parameters:
|
default_parameters:
|
||||||
click_css_selector: a[onclick]
|
click_css_selector: a[onclick]
|
||||||
|
click_until_hard_timeout: False
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
- # https://webarchive.jira.com/browse/ARI-3956
|
- # https://webarchive.jira.com/browse/ARI-3956
|
||||||
url_regex: '^https?://(?:www\.)?usask.ca/.*$'
|
url_regex: '^https?://(?:www\.)?usask.ca/.*$'
|
||||||
behavior_js_template: simpleclicks.js.template
|
behavior_js_template: simpleclicks.js.j2
|
||||||
default_parameters:
|
default_parameters:
|
||||||
click_css_selector: a[id='feature-next']
|
click_css_selector: a[id='feature-next']
|
||||||
|
click_until_hard_timeout: False
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
- # https://webarchive.jira.com/browse/AITFIVE-451
|
- # https://webarchive.jira.com/browse/AITFIVE-451
|
||||||
url_regex: '^https?://(?:www\.)?soundcloud.com/.*$'
|
url_regex: '^https?://(?:www\.)?soundcloud.com/.*$'
|
||||||
behavior_js_template: simpledo.js.template
|
behavior_js_template: simpledo.js.j2
|
||||||
default_parameters:
|
default_parameters:
|
||||||
sdo_css_selector: button.sc-button-play, button.playButton
|
sdo_css_selector: button.sc-button-play, button.playButton
|
||||||
sdo_action: click
|
sdo_action: click
|
||||||
|
sdo_until_hard_timeout: False
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
- # https://webarchive.jira.com/browse/AITFIVE-463
|
- # https://webarchive.jira.com/browse/AITFIVE-463
|
||||||
url_regex: '^https?://(?:www\.)?christophercerrone.com/.*$'
|
url_regex: '^https?://(?:www\.)?christophercerrone.com/.*$'
|
||||||
behavior_js_template: simpleclicks.js.template
|
behavior_js_template: simpleclicks.js.j2
|
||||||
default_parameters:
|
default_parameters:
|
||||||
click_css_selector: button.playButton.medium
|
click_css_selector: button.playButton.medium
|
||||||
|
click_until_hard_timeout: False
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
- # https://webarchive.jira.com/browse/ARI-4690
|
- # https://webarchive.jira.com/browse/ARI-4690
|
||||||
url_regex: '^https?://(?:www\.)?youtube.com/.*$'
|
url_regex: '^https?://(?:www\.)?youtube.com/.*$'
|
||||||
behavior_js_template: simpleclicks.js.template
|
behavior_js_template: simpleclicks.js.j2
|
||||||
default_parameters:
|
default_parameters:
|
||||||
click_css_selector: span.load-more-text
|
click_css_selector: span.load-more-text
|
||||||
|
click_until_hard_timeout: False
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
- # https://webarchive.jira.com/browse/ARI-4725
|
- # https://webarchive.jira.com/browse/ARI-4725
|
||||||
url_regex: '^https?://(?:www\.)?moma.org/.*$'
|
url_regex: '^https?://(?:www\.)?moma.org/.*$'
|
||||||
behavior_js_template: simpleclicks.js.template
|
behavior_js_template: simpleclicks.js.j2
|
||||||
default_parameters:
|
default_parameters:
|
||||||
click_css_selector: button[data-more-results-bottom-button]
|
click_css_selector: button[data-more-results-bottom-button]
|
||||||
click_until_hard_timeout: True
|
click_until_hard_timeout: True
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
- # https://webarchive.jira.com/browse/ARI-4692
|
- # https://webarchive.jira.com/browse/ARI-4692
|
||||||
url_regex: '^https?://(?:www\.)?fec.gov/data/.*$'
|
url_regex: '^https?://(?:www\.)?fec.gov/data/.*$'
|
||||||
behavior_js: fec_gov.js
|
behavior_js_template: fec_gov.js
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
- url_regex: '^https?://(?:www\.)?news\.com\.au/.*$'
|
- url_regex: '^https?://(?:www\.)?news\.com\.au/.*$'
|
||||||
behavior_js_template: simpledo.js.template
|
behavior_js_template: simpledo.js.j2
|
||||||
default_parameters:
|
default_parameters:
|
||||||
sdo_css_selector: .menu-item a
|
sdo_css_selector: .menu-item a
|
||||||
sdo_action: mouseover
|
sdo_action: mouseover
|
||||||
|
sdo_until_hard_timeout: False
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
- # default fallback behavior
|
- # default fallback behavior
|
||||||
url_regex: '^.*$'
|
url_regex: '^.*$'
|
||||||
request_idle_timeout_sec: 10
|
request_idle_timeout_sec: 10
|
||||||
behavior_js: default.js
|
behavior_js_template: default.js
|
||||||
|
|
|
@ -26,12 +26,9 @@ var umbraBehavior = {
|
||||||
var didSomething = false;
|
var didSomething = false;
|
||||||
var somethingLeftBelow = false;
|
var somethingLeftBelow = false;
|
||||||
var somethingLeftAbove = false;
|
var somethingLeftAbove = false;
|
||||||
var cssSelector = "${sdo_css_selector}";
|
var cssSelector = {{sdo_css_selector}};
|
||||||
var doAction = "${sdo_action}"; // currently supports click, mouseover
|
var doAction = {{sdo_action}}; // currently supports click, mouseover
|
||||||
var doUntilTimeout = "${sdo_until_hard_timeout}";
|
var doUntilTimeout = {{sdo_until_hard_timeout}};
|
||||||
|
|
||||||
//handle Python to JavaScript boolean conversion
|
|
||||||
doUntilTimeout == "True" ? doUntilTimeout = true : doUntilTimeout = false;
|
|
||||||
|
|
||||||
var iframes = document.querySelectorAll("iframe");
|
var iframes = document.querySelectorAll("iframe");
|
||||||
var documents = Array(iframes.length + 1);
|
var documents = Array(iframes.length + 1);
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue