mirror of
https://github.com/webrecorder/browsertrix-crawler.git
synced 2025-12-08 06:09:48 +00:00
Adds support for autoclick behavior:
- Adds a new `autoclick` behavior option to `--behaviors`, but does not
enable it by default
- Adds support for new exposed function `__bx_addSet` which allows
autoclick behavior to persist state about links that have already been
clicked to avoid duplicates, only used if link has an href
- Adds a new pageFinished flag on the worker state.
- Adds an on('dialog') handler to reject onbeforeunload page navigations
while behaviors are running (page not finished), but accept them once the page is finished -
to allow navigation away only when behaviors are done
- Update to browsertrix-behaviors 0.7.0, which supports autoclick
- Add --clickSelector option to customize elements that will be clicked,
defaulting to `a`.
- Add --linkSelector as alias for --selectLinks for consistency
- Unknown options for --behaviors are now printed as warnings instead of causing a hard
exit, for forward compatibility with new behavior types in the future
Fixes #728, also #216, #665, #31
| | | |
|---|---|---|
| .. | ||
| custom-behaviors | ||
| fixtures | ||
| invalid-behaviors | ||
| .DS_Store | ||
| adblockrules.test.js | ||
| add-exclusion.test.js | ||
| basic_crawl.test.js | ||
| blockrules.test.js | ||
| brave-query-redir.test.js | ||
| collection_name.test.js | ||
| config_file.test.js | ||
| config_stdin.test.js | ||
| crawl_overwrite.js | ||
| custom-behavior.test.js | ||
| custom_driver.test.js | ||
| custom_selector.test.js | ||
| dryrun.test.js | ||
| extra_hops_depth.test.js | ||
| file_stats.test.js | ||
| http-auth.test.js | ||
| limit_reached.test.js | ||
| log_filtering.test.js | ||
| mult_url_crawl_with_favicon.test.js | ||
| multi-instance-crawl.test.js | ||
| non-html-crawl.test.js | ||
| pageinfo-records.test.js | ||
| proxy.test.js | ||
| qa_compare.test.js | ||
| rollover-writer.test.js | ||
| saved-state.test.js | ||
| scopes.test.js | ||
| screenshot.test.js | ||
| seeds.test.js | ||
| sitemap-parse.test.js | ||
| storage.test.js | ||
| text-extract.test.js | ||
| url_file_list.test.js | ||
| warcinfo.test.js | ||