mirror of
https://github.com/webrecorder/browsertrix-crawler.git
synced 2025-12-08 06:09:48 +00:00
1529 lines
No EOL
93 KiB
HTML
1529 lines
No EOL
93 KiB
HTML
|
|
<!doctype html>
|
|
<html lang="en" class="no-js">
|
|
<head>
|
|
|
|
<meta charset="utf-8">
|
|
<meta name="viewport" content="width=device-width,initial-scale=1">
|
|
|
|
|
|
|
|
|
|
<link rel="prev" href="../qa/">
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<link rel="icon" href="../../assets/brand/browsertrix-crawler-icon-color-dynamic.svg">
|
|
<meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.7.0">
|
|
|
|
|
|
|
|
<title>All Command-Line Options - Browsertrix Crawler Docs</title>
|
|
|
|
|
|
|
|
<link rel="stylesheet" href="../../assets/stylesheets/main.618322db.min.css">
|
|
|
|
|
|
<link rel="stylesheet" href="../../assets/stylesheets/palette.ab4e12ef.min.css">
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<style>:root{--md-admonition-icon--note:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-pencil-fill%22%20viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M12.854.146a.5.5%200%200%200-.707%200L10.5%201.793%2014.207%205.5l1.647-1.646a.5.5%200%200%200%200-.708l-3-3zm.646%206.061L9.793%202.5%203.293%209H3.5a.5.5%200%200%201%20.5.5v.5h.5a.5.5%200%200%201%20.5.5v.5h.5a.5.5%200%200%201%20.5.5v.5h.5a.5.5%200%200%201%20.5.5v.207l6.5-6.5zm-7.468%207.468A.5.5%200%200%201%206%2013.5V13h-.5a.5.5%200%200%201-.5-.5V12h-.5a.5.5%200%200%201-.5-.5V11h-.5a.5.5%200%200%201-.5-.5V10h-.5a.499.499%200%200%201-.175-.032l-.179.178a.5.5%200%200%200-.11.168l-2%205a.5.5%200%200%200%20.65.65l5-2a.5.5%200%200%200%20.168-.11l.178-.178z%22/%3E%3C/svg%3E');--md-admonition-icon--abstract:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-file-earmark-text-fill%22%20viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M9.293%200H4a2%202%200%200%200-2%202v12a2%202%200%200%200%202%202h8a2%202%200%200%200%202-2V4.707A1%201%200%200%200%2013.707%204L10%20.293A1%201%200%200%200%209.293%200zM9.5%203.5v-2l3%203h-2a1%201%200%200%201-1-1zM4.5%209a.5.5%200%200%201%200-1h7a.5.5%200%200%201%200%201h-7zM4%2010.5a.5.5%200%200%201%20.5-.5h7a.5.5%200%200%201%200%201h-7a.5.5%200%200%201-.5-.5zm.5%202.5a.5.5%200%200%201%200-1h4a.5.5%200%200%201%200%201h-4z%22/%3E%3C/svg%3E');--md-admonition-icon--info:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-info-circle-fill%22%20viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M8%2016A8%208%200%201%200%208%200a8%208%200%200%200%200%2016zm.93-9.412-1%204.705c-.07.34.029.533.304.5
33.194%200%20.487-.07.686-.246l-.088.416c-.287.346-.92.598-1.465.598-.703%200-1.002-.422-.808-1.319l.738-3.468c.064-.293.006-.399-.287-.47l-.451-.081.082-.381%202.29-.287zM8%205.5a1%201%200%201%201%200-2%201%201%200%200%201%200%202z%22/%3E%3C/svg%3E');--md-admonition-icon--tip:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-exclamation-circle-fill%22%20viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M16%208A8%208%200%201%201%200%208a8%208%200%200%201%2016%200zM8%204a.905.905%200%200%200-.9.995l.35%203.507a.552.552%200%200%200%201.1%200l.35-3.507A.905.905%200%200%200%208%204zm.002%206a1%201%200%201%200%200%202%201%201%200%200%200%200-2z%22/%3E%3C/svg%3E');--md-admonition-icon--success:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-check-circle-fill%22%20viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M16%208A8%208%200%201%201%200%208a8%208%200%200%201%2016%200zm-3.97-3.03a.75.75%200%200%200-1.08.022L7.477%209.417%205.384%207.323a.75.75%200%200%200-1.06%201.06L6.97%2011.03a.75.75%200%200%200%201.079-.02l3.992-4.99a.75.75%200%200%200-.01-1.05z%22/%3E%3C/svg%3E');--md-admonition-icon--question:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-question-circle-fill%22%20viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M16%208A8%208%200%201%201%200%208a8%208%200%200%201%2016%200zM5.496%206.033h.825c.138%200%20.248-.113.266-.25.09-.656.54-1.134%201.342-1.134.686%200%201.314.343%201.314%201.168%200%20.635-.374.927-.965%201.371-.673.489-1.206%201.06-1.168%201.987l.003.217a.25.25%200%200%200%20.25.246h.811a.25.25%200%200%200%20.25-.25v-.105c0-.718.273-.927%201.01-1.486.
609-.463%201.244-.977%201.244-2.056%200-1.511-1.276-2.241-2.673-2.241-1.267%200-2.655.59-2.75%202.286a.237.237%200%200%200%20.241.247zm2.325%206.443c.61%200%201.029-.394%201.029-.927%200-.552-.42-.94-1.029-.94-.584%200-1.009.388-1.009.94%200%20.533.425.927%201.01.927z%22/%3E%3C/svg%3E');--md-admonition-icon--warning:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-exclamation-triangle-fill%22%20viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M8.982%201.566a1.13%201.13%200%200%200-1.96%200L.165%2013.233c-.457.778.091%201.767.98%201.767h13.713c.889%200%201.438-.99.98-1.767L8.982%201.566zM8%205c.535%200%20.954.462.9.995l-.35%203.507a.552.552%200%200%201-1.1%200L7.1%205.995A.905.905%200%200%201%208%205zm.002%206a1%201%200%201%201%200%202%201%201%200%200%201%200-2z%22/%3E%3C/svg%3E');--md-admonition-icon--failure:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-x-octagon-fill%22%20viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M11.46.146A.5.5%200%200%200%2011.107%200H4.893a.5.5%200%200%200-.353.146L.146%204.54A.5.5%200%200%200%200%204.893v6.214a.5.5%200%200%200%20.146.353l4.394%204.394a.5.5%200%200%200%20.353.146h6.214a.5.5%200%200%200%20.353-.146l4.394-4.394a.5.5%200%200%200%20.146-.353V4.893a.5.5%200%200%200-.146-.353L11.46.146zm-6.106%204.5L8%207.293l2.646-2.647a.5.5%200%200%201%20.708.708L8.707%208l2.647%202.646a.5.5%200%200%201-.708.708L8%208.707l-2.646%202.647a.5.5%200%200%201-.708-.708L7.293%208%204.646%205.354a.5.5%200%201%201%20.708-.708z%22/%3E%3C/svg%3E');--md-admonition-icon--danger:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-exclamation-diamond-fill%22%20
viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M9.05.435c-.58-.58-1.52-.58-2.1%200L.436%206.95c-.58.58-.58%201.519%200%202.098l6.516%206.516c.58.58%201.519.58%202.098%200l6.516-6.516c.58-.58.58-1.519%200-2.098L9.05.435zM8%204c.535%200%20.954.462.9.995l-.35%203.507a.552.552%200%200%201-1.1%200L7.1%204.995A.905.905%200%200%201%208%204zm.002%206a1%201%200%201%201%200%202%201%201%200%200%201%200-2z%22/%3E%3C/svg%3E');--md-admonition-icon--bug:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-bug-fill%22%20viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M4.978.855a.5.5%200%201%200-.956.29l.41%201.352A4.985%204.985%200%200%200%203%206h10a4.985%204.985%200%200%200-1.432-3.503l.41-1.352a.5.5%200%201%200-.956-.29l-.291.956A4.978%204.978%200%200%200%208%201a4.979%204.979%200%200%200-2.731.811l-.29-.956z%22/%3E%20%20%3Cpath%20d%3D%22M13%206v1H8.5v8.975A5%205%200%200%200%2013%2011h.5a.5.5%200%200%201%20.5.5v.5a.5.5%200%201%200%201%200v-.5a1.5%201.5%200%200%200-1.5-1.5H13V9h1.5a.5.5%200%200%200%200-1H13V7h.5A1.5%201.5%200%200%200%2015%205.5V5a.5.5%200%200%200-1%200v.5a.5.5%200%200%201-.5.5H13zm-5.5%209.975V7H3V6h-.5a.5.5%200%200%201-.5-.5V5a.5.5%200%200%200-1%200v.5A1.5%201.5%200%200%200%202.5%207H3v1H1.5a.5.5%200%200%200%200%201H3v1h-.5A1.5%201.5%200%200%200%201%2011.5v.5a.5.5%200%201%200%201%200v-.5a.5.5%200%200%201%20.5-.5H3a5%205%200%200%200%204.5%204.975z%22/%3E%3C/svg%3E');--md-admonition-icon--example:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-mortarboard-fill%22%20viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M8.211%202.047a.5.5%200%200%200-.422%200l-7.5%203.5a.5.5%200%200%200%20.025.917l7.5%203a.5.5%200%200%200%20.372%200L14%207.14V13a1%201%200%200%200-1%201v2h3v-2a1%201%200%200%200
-1-1V6.739l.686-.275a.5.5%200%200%200%20.025-.917l-7.5-3.5Z%22/%3E%20%20%3Cpath%20d%3D%22M4.176%209.032a.5.5%200%200%200-.656.327l-.5%201.7a.5.5%200%200%200%20.294.605l4.5%201.8a.5.5%200%200%200%20.372%200l4.5-1.8a.5.5%200%200%200%20.294-.605l-.5-1.7a.5.5%200%200%200-.656-.327L8%2010.466%204.176%209.032Z%22/%3E%3C/svg%3E');--md-admonition-icon--quote:url('data:image/svg+xml;charset=utf-8,%3Csvg%20xmlns%3D%22http%3A//www.w3.org/2000/svg%22%20width%3D%2216%22%20height%3D%2216%22%20fill%3D%22currentColor%22%20class%3D%22bi%20bi-quote%22%20viewBox%3D%220%200%2016%2016%22%3E%20%20%3Cpath%20d%3D%22M12%2012a1%201%200%200%200%201-1V8.558a1%201%200%200%200-1-1h-1.388c0-.351.021-.703.062-1.054.062-.372.166-.703.31-.992.145-.29.331-.517.559-.683.227-.186.516-.279.868-.279V3c-.579%200-1.085.124-1.52.372a3.322%203.322%200%200%200-1.085.992%204.92%204.92%200%200%200-.62%201.458A7.712%207.712%200%200%200%209%207.558V11a1%201%200%200%200%201%201h2Zm-6%200a1%201%200%200%200%201-1V8.558a1%201%200%200%200-1-1H4.612c0-.351.021-.703.062-1.054.062-.372.166-.703.31-.992.145-.29.331-.517.559-.683.227-.186.516-.279.868-.279V3c-.579%200-1.085.124-1.52.372a3.322%203.322%200%200%200-1.085.992%204.92%204.92%200%200%200-.62%201.458A7.712%207.712%200%200%200%203%207.558V11a1%201%200%200%200%201%201h2Z%22/%3E%3C/svg%3E');}</style>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
|
|
<link rel="stylesheet" href="https://fonts.googleapis.com/css?family=Roboto:300,300i,400,400i,700,700i%7CRoboto+Mono:400,400i,700,700i&display=fallback">
|
|
<style>:root{--md-text-font:"Roboto";--md-code-font:"Roboto Mono"}</style>
|
|
|
|
|
|
|
|
<link rel="stylesheet" href="../../stylesheets/extra.css">
|
|
|
|
<script>__md_scope=new URL("../..",location),__md_hash=e=>[...e].reduce(((e,_)=>(e<<5)-e+_.charCodeAt(0)),0),__md_get=(e,_=localStorage,t=__md_scope)=>JSON.parse(_.getItem(t.pathname+"."+e)),__md_set=(e,_,t=localStorage,a=__md_scope)=>{try{t.setItem(a.pathname+"."+e,JSON.stringify(_))}catch(e){}}</script>
|
|
|
|
|
|
|
|
|
|
|
|
</head>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<body dir="ltr" data-md-color-scheme="webrecorder" data-md-color-primary="indigo" data-md-color-accent="indigo">
|
|
|
|
|
|
<input class="md-toggle" data-md-toggle="drawer" type="checkbox" id="__drawer" autocomplete="off">
|
|
<input class="md-toggle" data-md-toggle="search" type="checkbox" id="__search" autocomplete="off">
|
|
<label class="md-overlay" for="__drawer"></label>
|
|
<div data-md-component="skip">
|
|
|
|
|
|
<a href="#all-command-line-options" class="md-skip">
|
|
Skip to content
|
|
</a>
|
|
|
|
</div>
|
|
<div data-md-component="announce">
|
|
|
|
</div>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<header class="md-header md-header--shadow md-header--lifted" data-md-component="header">
|
|
<nav class="md-header__inner md-grid" aria-label="Header">
|
|
<a href="../.." title="Browsertrix Crawler Docs" class="md-header__button md-logo" aria-label="Browsertrix Crawler Docs" data-md-component="logo">
|
|
|
|
<!-- The link is named by its aria-label; the logo image is decorative here, so its alt text is empty. -->
<img src="../../assets/brand/browsertrix-crawler-white.svg" alt="">
|
|
|
|
</a>
|
|
<label class="md-header__button md-icon" for="__drawer">
|
|
|
|
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M3 6h18v2H3zm0 5h18v2H3zm0 5h18v2H3z"/></svg>
|
|
</label>
|
|
<div class="md-header__title" data-md-component="header-title">
|
|
<div class="md-header__ellipsis">
|
|
<div class="md-header__topic">
|
|
<span class="md-ellipsis">
|
|
Browsertrix Crawler Docs
|
|
</span>
|
|
</div>
|
|
<div class="md-header__topic" data-md-component="header-topic">
|
|
<span class="md-ellipsis">
|
|
|
|
All Command-Line Options
|
|
|
|
</span>
|
|
</div>
|
|
</div>
|
|
</div>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<label class="md-header__button md-icon" for="__search">
|
|
|
|
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M9.5 3A6.5 6.5 0 0 1 16 9.5c0 1.61-.59 3.09-1.56 4.23l.27.27h.79l5 5-1.5 1.5-5-5v-.79l-.27-.27A6.52 6.52 0 0 1 9.5 16 6.5 6.5 0 0 1 3 9.5 6.5 6.5 0 0 1 9.5 3m0 2C7 5 5 7 5 9.5S7 14 9.5 14 14 12 14 9.5 12 5 9.5 5"/></svg>
|
|
</label>
|
|
<div class="md-search" data-md-component="search" role="dialog">
|
|
<label class="md-search__overlay" for="__search"></label>
|
|
<div class="md-search__inner" role="search">
|
|
<form class="md-search__form" name="search">
|
|
<input type="text" class="md-search__input" name="query" aria-label="Search" placeholder="Search" autocapitalize="off" autocorrect="off" autocomplete="off" spellcheck="false" data-md-component="search-query" required>
|
|
<label class="md-search__icon md-icon" for="__search">
|
|
|
|
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M9.5 3A6.5 6.5 0 0 1 16 9.5c0 1.61-.59 3.09-1.56 4.23l.27.27h.79l5 5-1.5 1.5-5-5v-.79l-.27-.27A6.52 6.52 0 0 1 9.5 16 6.5 6.5 0 0 1 3 9.5 6.5 6.5 0 0 1 9.5 3m0 2C7 5 5 7 5 9.5S7 14 9.5 14 14 12 14 9.5 12 5 9.5 5"/></svg>
|
|
|
|
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M20 11v2H8l5.5 5.5-1.42 1.42L4.16 12l7.92-7.92L13.5 5.5 8 11z"/></svg>
|
|
</label>
|
|
<nav class="md-search__options" aria-label="Search">
|
|
|
|
<button type="reset" class="md-search__icon md-icon" title="Clear" aria-label="Clear" tabindex="-1">
|
|
|
|
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M19 6.41 17.59 5 12 10.59 6.41 5 5 6.41 10.59 12 5 17.59 6.41 19 12 13.41 17.59 19 19 17.59 13.41 12z"/></svg>
|
|
</button>
|
|
</nav>
|
|
|
|
<div class="md-search__suggest" data-md-component="search-suggest"></div>
|
|
|
|
</form>
|
|
<div class="md-search__output">
|
|
<div class="md-search__scrollwrap" tabindex="0" data-md-scrollfix>
|
|
<div class="md-search-result" data-md-component="search-result">
|
|
<div class="md-search-result__meta">
|
|
Initializing search
|
|
</div>
|
|
<ol class="md-search-result__list" role="presentation"></ol>
|
|
</div>
|
|
</div>
|
|
</div>
|
|
</div>
|
|
</div>
|
|
|
|
|
|
|
|
<div class="md-header__source">
|
|
<a href="https://github.com/webrecorder/browsertrix-crawler/" title="Go to repository" class="md-source" data-md-component="source">
|
|
<div class="md-source__icon md-icon">
|
|
|
|
<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-github" viewBox="0 0 16 16">
|
|
<path d="M8 0C3.58 0 0 3.58 0 8c0 3.54 2.29 6.53 5.47 7.59.4.07.55-.17.55-.38 0-.19-.01-.82-.01-1.49-2.01.37-2.53-.49-2.69-.94-.09-.23-.48-.94-.82-1.13-.28-.15-.68-.52-.01-.53.63-.01 1.08.58 1.23.82.72 1.21 1.87.87 2.33.66.07-.52.28-.87.51-1.07-1.78-.2-3.64-.89-3.64-3.95 0-.87.31-1.59.82-2.15-.08-.2-.36-1.02.08-2.12 0 0 .67-.21 2.2.82.64-.18 1.32-.27 2-.27.68 0 1.36.09 2 .27 1.53-1.04 2.2-.82 2.2-.82.44 1.1.16 1.92.08 2.12.51.56.82 1.27.82 2.15 0 3.07-1.87 3.75-3.65 3.95.29.25.54.73.54 1.48 0 1.07-.01 1.93-.01 2.2 0 .21.15.46.55.38A8.012 8.012 0 0 0 16 8c0-4.42-3.58-8-8-8z"/>
|
|
</svg>
|
|
</div>
|
|
<div class="md-source__repository">
|
|
Browsertrix Crawler
|
|
</div>
|
|
</a>
|
|
</div>
|
|
|
|
</nav>
|
|
|
|
|
|
|
|
<nav class="md-tabs" aria-label="Tabs" data-md-component="tabs">
|
|
<div class="md-grid">
|
|
<ul class="md-tabs__list">
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-tabs__item">
|
|
<a href="../.." class="md-tabs__link">
|
|
|
|
|
|
|
|
|
|
|
|
Home
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-tabs__item">
|
|
<a href="../../develop/" class="md-tabs__link">
|
|
|
|
|
|
|
|
|
|
|
|
Develop
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-tabs__item md-tabs__item--active">
|
|
<a href="../" class="md-tabs__link">
|
|
|
|
|
|
|
|
|
|
|
|
User Guide
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
</ul>
|
|
</div>
|
|
</nav>
|
|
|
|
|
|
</header>
|
|
|
|
<div class="md-container" data-md-component="container">
|
|
|
|
|
|
|
|
|
|
<main class="md-main" data-md-component="main">
|
|
<div class="md-main__inner md-grid">
|
|
|
|
|
|
|
|
<div class="md-sidebar md-sidebar--primary" data-md-component="sidebar" data-md-type="navigation" >
|
|
<div class="md-sidebar__scrollwrap">
|
|
<div class="md-sidebar__inner">
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<nav class="md-nav md-nav--primary md-nav--lifted" aria-label="Navigation" data-md-level="0">
|
|
<label class="md-nav__title" for="__drawer">
|
|
<a href="../.." title="Browsertrix Crawler Docs" class="md-nav__button md-logo" aria-label="Browsertrix Crawler Docs" data-md-component="logo">
|
|
|
|
<!-- The link is named by its aria-label; the logo image is decorative here, so its alt text is empty. -->
<img src="../../assets/brand/browsertrix-crawler-white.svg" alt="">
|
|
|
|
</a>
|
|
Browsertrix Crawler Docs
|
|
</label>
|
|
|
|
<div class="md-nav__source">
|
|
<a href="https://github.com/webrecorder/browsertrix-crawler/" title="Go to repository" class="md-source" data-md-component="source">
|
|
<div class="md-source__icon md-icon">
|
|
|
|
<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-github" viewBox="0 0 16 16">
|
|
<path d="M8 0C3.58 0 0 3.58 0 8c0 3.54 2.29 6.53 5.47 7.59.4.07.55-.17.55-.38 0-.19-.01-.82-.01-1.49-2.01.37-2.53-.49-2.69-.94-.09-.23-.48-.94-.82-1.13-.28-.15-.68-.52-.01-.53.63-.01 1.08.58 1.23.82.72 1.21 1.87.87 2.33.66.07-.52.28-.87.51-1.07-1.78-.2-3.64-.89-3.64-3.95 0-.87.31-1.59.82-2.15-.08-.2-.36-1.02.08-2.12 0 0 .67-.21 2.2.82.64-.18 1.32-.27 2-.27.68 0 1.36.09 2 .27 1.53-1.04 2.2-.82 2.2-.82.44 1.1.16 1.92.08 2.12.51.56.82 1.27.82 2.15 0 3.07-1.87 3.75-3.65 3.95.29.25.54.73.54 1.48 0 1.07-.01 1.93-.01 2.2 0 .21.15.46.55.38A8.012 8.012 0 0 0 16 8c0-4.42-3.58-8-8-8z"/>
|
|
</svg>
|
|
</div>
|
|
<div class="md-source__repository">
|
|
Browsertrix Crawler
|
|
</div>
|
|
</a>
|
|
</div>
|
|
|
|
<ul class="md-nav__list" data-md-scrollfix>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item">
|
|
<a href="../.." class="md-nav__link">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
Home
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item md-nav__item--nested">
|
|
|
|
|
|
|
|
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_2" >
|
|
|
|
|
|
<div class="md-nav__link md-nav__container">
|
|
<a href="../../develop/" class="md-nav__link ">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
Develop
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
|
|
|
|
<label class="md-nav__link " for="__nav_2" id="__nav_2_label" tabindex="0">
|
|
<span class="md-nav__icon md-icon"></span>
|
|
</label>
|
|
|
|
</div>
|
|
|
|
<nav class="md-nav" data-md-level="1" aria-labelledby="__nav_2_label" aria-expanded="false">
|
|
<label class="md-nav__title" for="__nav_2">
|
|
<span class="md-nav__icon md-icon"></span>
|
|
|
|
|
|
Develop
|
|
|
|
|
|
</label>
|
|
<ul class="md-nav__list" data-md-scrollfix>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item">
|
|
<a href="../../develop/docs/" class="md-nav__link">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
Documentation
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
</ul>
|
|
</nav>
|
|
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item md-nav__item--active md-nav__item--section md-nav__item--nested">
|
|
|
|
|
|
|
|
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_3" checked>
|
|
|
|
|
|
<div class="md-nav__link md-nav__container">
|
|
<a href="../" class="md-nav__link ">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
User Guide
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
|
|
|
|
<!-- Toggle label for the "User Guide" section checkbox (__nav_3). No tabindex: an empty tabindex value is invalid and is ignored by browsers. -->
<label class="md-nav__link " for="__nav_3" id="__nav_3_label">
|
|
<span class="md-nav__icon md-icon"></span>
|
|
</label>
|
|
|
|
</div>
|
|
|
|
<nav class="md-nav" data-md-level="1" aria-labelledby="__nav_3_label" aria-expanded="true">
|
|
<label class="md-nav__title" for="__nav_3">
|
|
<span class="md-nav__icon md-icon"></span>
|
|
|
|
|
|
User Guide
|
|
|
|
|
|
</label>
|
|
<ul class="md-nav__list" data-md-scrollfix>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item">
|
|
<a href="../outputs/" class="md-nav__link">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
Outputs
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item">
|
|
<a href="../exit-codes/" class="md-nav__link">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
Exit codes
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item">
|
|
<a href="../common-options/" class="md-nav__link">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
Commonly-Used Options
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item">
|
|
<a href="../crawl-scope/" class="md-nav__link">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
Crawl Scope
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item">
|
|
<a href="../yaml-config/" class="md-nav__link">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
YAML Crawl Config
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item">
|
|
<a href="../browser-profiles/" class="md-nav__link">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
Creating and Using Browser Profiles
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item">
|
|
<a href="../proxies/" class="md-nav__link">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
Crawling with Proxies
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item">
|
|
<a href="../behaviors/" class="md-nav__link">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
Browser Behaviors
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item">
|
|
<a href="../qa/" class="md-nav__link">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
Quality Assurance
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
</li>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<li class="md-nav__item md-nav__item--active">
|
|
|
|
<input class="md-nav__toggle md-toggle" type="checkbox" id="__toc">
|
|
|
|
|
|
|
|
|
|
|
|
<label class="md-nav__link md-nav__link--active" for="__toc">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
All Command-Line Options
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
<span class="md-nav__icon md-icon"></span>
|
|
</label>
|
|
|
|
<a href="./" class="md-nav__link md-nav__link--active">
|
|
|
|
|
|
|
|
<span class="md-ellipsis">
|
|
|
|
|
|
All Command-Line Options
|
|
|
|
|
|
|
|
</span>
|
|
|
|
|
|
|
|
</a>
|
|
|
|
|
|
|
|
<nav class="md-nav md-nav--secondary" aria-label="Table of contents">
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<label class="md-nav__title" for="__toc">
|
|
<span class="md-nav__icon md-icon"></span>
|
|
Table of contents
|
|
</label>
|
|
<ul class="md-nav__list" data-md-component="toc" data-md-scrollfix>
|
|
|
|
<li class="md-nav__item">
|
|
<a href="#crawler" class="md-nav__link">
|
|
<span class="md-ellipsis">
|
|
|
|
crawler
|
|
|
|
</span>
|
|
</a>
|
|
|
|
</li>
|
|
|
|
<li class="md-nav__item">
|
|
<a href="#create-login-profile" class="md-nav__link">
|
|
<span class="md-ellipsis">
|
|
|
|
create-login-profile
|
|
|
|
</span>
|
|
</a>
|
|
|
|
</li>
|
|
|
|
</ul>
|
|
|
|
</nav>
|
|
|
|
</li>
|
|
|
|
|
|
|
|
|
|
</ul>
|
|
</nav>
|
|
|
|
</li>
|
|
|
|
|
|
|
|
</ul>
|
|
</nav>
|
|
</div>
|
|
</div>
|
|
</div>
|
|
|
|
|
|
|
|
<div class="md-sidebar md-sidebar--secondary" data-md-component="sidebar" data-md-type="toc" >
|
|
<div class="md-sidebar__scrollwrap">
|
|
<div class="md-sidebar__inner">
|
|
|
|
|
|
<nav class="md-nav md-nav--secondary" aria-label="Table of contents">
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<label class="md-nav__title" for="__toc">
|
|
<span class="md-nav__icon md-icon"></span>
|
|
Table of contents
|
|
</label>
|
|
<ul class="md-nav__list" data-md-component="toc" data-md-scrollfix>
|
|
|
|
<li class="md-nav__item">
|
|
<a href="#crawler" class="md-nav__link">
|
|
<span class="md-ellipsis">
|
|
|
|
crawler
|
|
|
|
</span>
|
|
</a>
|
|
|
|
</li>
|
|
|
|
<li class="md-nav__item">
|
|
<a href="#create-login-profile" class="md-nav__link">
|
|
<span class="md-ellipsis">
|
|
|
|
create-login-profile
|
|
|
|
</span>
|
|
</a>
|
|
|
|
</li>
|
|
|
|
</ul>
|
|
|
|
</nav>
|
|
</div>
|
|
</div>
|
|
</div>
|
|
|
|
|
|
|
|
<div class="md-content" data-md-component="content">
|
|
|
|
<article class="md-content__inner md-typeset">
|
|
|
|
|
|
|
|
|
|
|
|
<!-- Icon-only "edit" link: aria-label supplies the accessible name; the pencil SVG is decorative and hidden from assistive technology. -->
<a href="https://github.com/webrecorder/browsertrix-crawler/edit/main/docs/docs/user-guide/cli-options.md" title="Edit this page" class="md-content__button md-icon" rel="edit" aria-label="Edit this page">
|
|
|
|
<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-pencil" viewBox="0 0 16 16" aria-hidden="true">
|
|
<path d="M12.146.146a.5.5 0 0 1 .708 0l3 3a.5.5 0 0 1 0 .708l-10 10a.5.5 0 0 1-.168.11l-5 2a.5.5 0 0 1-.65-.65l2-5a.5.5 0 0 1 .11-.168l10-10zM11.207 2.5 13.5 4.793 14.793 3.5 12.5 1.207 11.207 2.5zm1.586 3L10.5 3.207 4 9.707V10h.5a.5.5 0 0 1 .5.5v.5h.5a.5.5 0 0 1 .5.5v.5h.293l6.5-6.5zm-9.761 5.175-.106.106-1.528 3.821 3.821-1.528.106-.106A.5.5 0 0 1 5 12.5V12h-.5a.5.5 0 0 1-.5-.5V11h-.5a.5.5 0 0 1-.468-.325z"/>
|
|
</svg>
|
|
</a>
|
|
|
|
|
|
|
|
|
|
<h1 id="all-command-line-options">All Command-Line Options<a class="headerlink" href="#all-command-line-options" title="Permanent link">¶</a></h1>
|
|
<p>The Browsertrix Crawler Docker image currently accepts the following parameters, broken down by entrypoint:</p>
|
|
<h2 id="crawler">crawler<a class="headerlink" href="#crawler" title="Permanent link">¶</a></h2>
|
|
<div class="highlight"><pre><span></span><code><a id="__codelineno-0-1" name="__codelineno-0-1" href="#__codelineno-0-1"></a>Options:
|
|
<a id="__codelineno-0-2" name="__codelineno-0-2" href="#__codelineno-0-2"></a> --help Show help [boolean]
|
|
<a id="__codelineno-0-3" name="__codelineno-0-3" href="#__codelineno-0-3"></a> --version Show version number [boolean]
|
|
<a id="__codelineno-0-4" name="__codelineno-0-4" href="#__codelineno-0-4"></a> --seeds, --url The URL to start crawling from
|
|
<a id="__codelineno-0-5" name="__codelineno-0-5" href="#__codelineno-0-5"></a> [array] [default: []]
|
|
<a id="__codelineno-0-6" name="__codelineno-0-6" href="#__codelineno-0-6"></a> --seedFile, --urlFile If set, read a list of seed urls, on
|
|
<a id="__codelineno-0-7" name="__codelineno-0-7" href="#__codelineno-0-7"></a> e per line, from the specified
|
|
<a id="__codelineno-0-8" name="__codelineno-0-8" href="#__codelineno-0-8"></a> [string]
|
|
<a id="__codelineno-0-9" name="__codelineno-0-9" href="#__codelineno-0-9"></a> -w, --workers The number of workers to run in para
|
|
<a id="__codelineno-0-10" name="__codelineno-0-10" href="#__codelineno-0-10"></a> llel [number] [default: 1]
|
|
<a id="__codelineno-0-11" name="__codelineno-0-11" href="#__codelineno-0-11"></a> --crawlId, --id A user provided ID for this crawl or
|
|
<a id="__codelineno-0-12" name="__codelineno-0-12" href="#__codelineno-0-12"></a> crawl configuration (can also be se
|
|
<a id="__codelineno-0-13" name="__codelineno-0-13" href="#__codelineno-0-13"></a> t via CRAWL_ID env var), defaults to
|
|
<a id="__codelineno-0-14" name="__codelineno-0-14" href="#__codelineno-0-14"></a> combination of Docker container hos
|
|
<a id="__codelineno-0-15" name="__codelineno-0-15" href="#__codelineno-0-15"></a> tname and collection [string]
|
|
<a id="__codelineno-0-16" name="__codelineno-0-16" href="#__codelineno-0-16"></a> --waitUntil Puppeteer page.goto() condition to w
|
|
<a id="__codelineno-0-17" name="__codelineno-0-17" href="#__codelineno-0-17"></a> ait for before continuing, can be mu
|
|
<a id="__codelineno-0-18" name="__codelineno-0-18" href="#__codelineno-0-18"></a> ltiple separated by ','
|
|
<a id="__codelineno-0-19" name="__codelineno-0-19" href="#__codelineno-0-19"></a> [array] [choices: "load", "domcontentloaded", "networkidle0", "networkidle2"]
|
|
<a id="__codelineno-0-20" name="__codelineno-0-20" href="#__codelineno-0-20"></a> [default: ["load","networkidle2"]]
|
|
<a id="__codelineno-0-21" name="__codelineno-0-21" href="#__codelineno-0-21"></a> --depth The depth of the crawl for all seeds
|
|
<a id="__codelineno-0-22" name="__codelineno-0-22" href="#__codelineno-0-22"></a> [number] [default: -1]
|
|
<a id="__codelineno-0-23" name="__codelineno-0-23" href="#__codelineno-0-23"></a> --extraHops Number of extra 'hops' to follow, be
|
|
<a id="__codelineno-0-24" name="__codelineno-0-24" href="#__codelineno-0-24"></a> yond the current scope
|
|
<a id="__codelineno-0-25" name="__codelineno-0-25" href="#__codelineno-0-25"></a> [number] [default: 0]
|
|
<a id="__codelineno-0-26" name="__codelineno-0-26" href="#__codelineno-0-26"></a> --pageLimit, --limit Limit crawl to this number of pages
|
|
<a id="__codelineno-0-27" name="__codelineno-0-27" href="#__codelineno-0-27"></a> [number] [default: 0]
|
|
<a id="__codelineno-0-28" name="__codelineno-0-28" href="#__codelineno-0-28"></a> --maxPageLimit Maximum pages to crawl, overriding
|
|
<a id="__codelineno-0-29" name="__codelineno-0-29" href="#__codelineno-0-29"></a> pageLimit if both are set
|
|
<a id="__codelineno-0-30" name="__codelineno-0-30" href="#__codelineno-0-30"></a> [number] [default: 0]
|
|
<a id="__codelineno-0-31" name="__codelineno-0-31" href="#__codelineno-0-31"></a> --pageLoadTimeout, --timeout Timeout for each page to load (in se
|
|
<a id="__codelineno-0-32" name="__codelineno-0-32" href="#__codelineno-0-32"></a> conds) [number] [default: 90]
|
|
<a id="__codelineno-0-33" name="__codelineno-0-33" href="#__codelineno-0-33"></a> --scopeType A predefined scope of the crawl. For
|
|
<a id="__codelineno-0-34" name="__codelineno-0-34" href="#__codelineno-0-34"></a> more customization, use 'custom' an
|
|
<a id="__codelineno-0-35" name="__codelineno-0-35" href="#__codelineno-0-35"></a> d set scopeIncludeRx regexes
|
|
<a id="__codelineno-0-36" name="__codelineno-0-36" href="#__codelineno-0-36"></a> [string] [choices: "page", "page-spa", "prefix", "host", "domain", "any", "cus
|
|
<a id="__codelineno-0-37" name="__codelineno-0-37" href="#__codelineno-0-37"></a> tom"]
|
|
<a id="__codelineno-0-38" name="__codelineno-0-38" href="#__codelineno-0-38"></a> --scopeIncludeRx, --include Regex of page URLs that should be in
|
|
<a id="__codelineno-0-39" name="__codelineno-0-39" href="#__codelineno-0-39"></a> cluded in the crawl (defaults to the
|
|
<a id="__codelineno-0-40" name="__codelineno-0-40" href="#__codelineno-0-40"></a> immediate directory of URL)[string]
|
|
<a id="__codelineno-0-41" name="__codelineno-0-41" href="#__codelineno-0-41"></a> --scopeExcludeRx, --exclude Regex of page URLs that should be ex
|
|
<a id="__codelineno-0-42" name="__codelineno-0-42" href="#__codelineno-0-42"></a> cluded from the crawl. [string]
|
|
<a id="__codelineno-0-43" name="__codelineno-0-43" href="#__codelineno-0-43"></a> --allowHashUrls Allow Hashtag URLs, useful for singl
|
|
<a id="__codelineno-0-44" name="__codelineno-0-44" href="#__codelineno-0-44"></a> e-page-application crawling or when
|
|
<a id="__codelineno-0-45" name="__codelineno-0-45" href="#__codelineno-0-45"></a> different hashtags load dynamic cont
|
|
<a id="__codelineno-0-46" name="__codelineno-0-46" href="#__codelineno-0-46"></a> ent
|
|
<a id="__codelineno-0-47" name="__codelineno-0-47" href="#__codelineno-0-47"></a> --selectLinks, --linkSelector One or more selectors for extracting
|
|
<a id="__codelineno-0-48" name="__codelineno-0-48" href="#__codelineno-0-48"></a> links, in the format [css selector]
|
|
<a id="__codelineno-0-49" name="__codelineno-0-49" href="#__codelineno-0-49"></a> ->[property to use],[css selector]->
|
|
<a id="__codelineno-0-50" name="__codelineno-0-50" href="#__codelineno-0-50"></a> @[attribute to use]
|
|
<a id="__codelineno-0-51" name="__codelineno-0-51" href="#__codelineno-0-51"></a> [array] [default: ["a[href]->href"]]
|
|
<a id="__codelineno-0-52" name="__codelineno-0-52" href="#__codelineno-0-52"></a> --clickSelector Selector for elements to click when
|
|
<a id="__codelineno-0-53" name="__codelineno-0-53" href="#__codelineno-0-53"></a> using the autoclick behavior
|
|
<a id="__codelineno-0-54" name="__codelineno-0-54" href="#__codelineno-0-54"></a> [string] [default: "a"]
|
|
<a id="__codelineno-0-55" name="__codelineno-0-55" href="#__codelineno-0-55"></a> --blockRules Additional rules for blocking certai
|
|
<a id="__codelineno-0-56" name="__codelineno-0-56" href="#__codelineno-0-56"></a> n URLs from being loaded, by URL reg
|
|
<a id="__codelineno-0-57" name="__codelineno-0-57" href="#__codelineno-0-57"></a> ex and optionally via text match in
|
|
<a id="__codelineno-0-58" name="__codelineno-0-58" href="#__codelineno-0-58"></a> an iframe [array] [default: []]
|
|
<a id="__codelineno-0-59" name="__codelineno-0-59" href="#__codelineno-0-59"></a> --blockMessage If specified, when a URL is blocked,
|
|
<a id="__codelineno-0-60" name="__codelineno-0-60" href="#__codelineno-0-60"></a> a record with this error message is
|
|
<a id="__codelineno-0-61" name="__codelineno-0-61" href="#__codelineno-0-61"></a> added instead[string] [default: ""]
|
|
<a id="__codelineno-0-62" name="__codelineno-0-62" href="#__codelineno-0-62"></a> --blockAds, --blockads If set, block advertisements from be
|
|
<a id="__codelineno-0-63" name="__codelineno-0-63" href="#__codelineno-0-63"></a> ing loaded (based on Steven Black's
|
|
<a id="__codelineno-0-64" name="__codelineno-0-64" href="#__codelineno-0-64"></a> blocklist)
|
|
<a id="__codelineno-0-65" name="__codelineno-0-65" href="#__codelineno-0-65"></a> [boolean] [default: false]
|
|
<a id="__codelineno-0-66" name="__codelineno-0-66" href="#__codelineno-0-66"></a> --adBlockMessage If specified, when an ad is blocked,
|
|
<a id="__codelineno-0-67" name="__codelineno-0-67" href="#__codelineno-0-67"></a> a record with this error message is
|
|
<a id="__codelineno-0-68" name="__codelineno-0-68" href="#__codelineno-0-68"></a> added instead[string] [default: ""]
|
|
<a id="__codelineno-0-69" name="__codelineno-0-69" href="#__codelineno-0-69"></a> -c, --collection Collection name / directory to crawl
|
|
<a id="__codelineno-0-70" name="__codelineno-0-70" href="#__codelineno-0-70"></a> into[string] [default: "crawl-@ts"]
|
|
<a id="__codelineno-0-71" name="__codelineno-0-71" href="#__codelineno-0-71"></a> --headless Run in headless mode, otherwise star
|
|
<a id="__codelineno-0-72" name="__codelineno-0-72" href="#__codelineno-0-72"></a> t xvfb [boolean] [default: false]
|
|
<a id="__codelineno-0-73" name="__codelineno-0-73" href="#__codelineno-0-73"></a> --driver Custom driver for the crawler, if an
|
|
<a id="__codelineno-0-74" name="__codelineno-0-74" href="#__codelineno-0-74"></a> y [string]
|
|
<a id="__codelineno-0-75" name="__codelineno-0-75" href="#__codelineno-0-75"></a> --generateCDX, --generatecdx, --gene If set, generate merged index in CDX
|
|
<a id="__codelineno-0-76" name="__codelineno-0-76" href="#__codelineno-0-76"></a> rateCdx J format [boolean] [default: false]
|
|
<a id="__codelineno-0-77" name="__codelineno-0-77" href="#__codelineno-0-77"></a> --combineWARC, --combinewarc, --comb If set, combine the warcs
|
|
<a id="__codelineno-0-78" name="__codelineno-0-78" href="#__codelineno-0-78"></a> ineWarc [boolean] [default: false]
|
|
<a id="__codelineno-0-79" name="__codelineno-0-79" href="#__codelineno-0-79"></a> --rolloverSize If set, declare the rollover size
|
|
<a id="__codelineno-0-80" name="__codelineno-0-80" href="#__codelineno-0-80"></a> [number] [default: 1000000000]
|
|
<a id="__codelineno-0-81" name="__codelineno-0-81" href="#__codelineno-0-81"></a> --generateWACZ, --generatewacz, --ge If set, generate WACZ on disk
|
|
<a id="__codelineno-0-82" name="__codelineno-0-82" href="#__codelineno-0-82"></a> nerateWacz [boolean] [default: false]
|
|
<a id="__codelineno-0-83" name="__codelineno-0-83" href="#__codelineno-0-83"></a> --useSHA1 If set, sha-1 instead of sha-256 has
|
|
<a id="__codelineno-0-84" name="__codelineno-0-84" href="#__codelineno-0-84"></a> hes will be used for creating record
|
|
<a id="__codelineno-0-85" name="__codelineno-0-85" href="#__codelineno-0-85"></a> s [boolean] [default: false]
|
|
<a id="__codelineno-0-86" name="__codelineno-0-86" href="#__codelineno-0-86"></a> --logging Logging options for crawler, can inc
|
|
<a id="__codelineno-0-87" name="__codelineno-0-87" href="#__codelineno-0-87"></a> lude: stats (enabled by default), js
|
|
<a id="__codelineno-0-88" name="__codelineno-0-88" href="#__codelineno-0-88"></a> errors, debug
|
|
<a id="__codelineno-0-89" name="__codelineno-0-89" href="#__codelineno-0-89"></a> [array] [default: ["stats"]]
|
|
<a id="__codelineno-0-90" name="__codelineno-0-90" href="#__codelineno-0-90"></a> --logLevel Comma-separated list of log levels t
|
|
<a id="__codelineno-0-91" name="__codelineno-0-91" href="#__codelineno-0-91"></a> o include in logs
|
|
<a id="__codelineno-0-92" name="__codelineno-0-92" href="#__codelineno-0-92"></a> [array] [default: []]
|
|
<a id="__codelineno-0-93" name="__codelineno-0-93" href="#__codelineno-0-93"></a> --context, --logContext Comma-separated list of contexts to
|
|
<a id="__codelineno-0-94" name="__codelineno-0-94" href="#__codelineno-0-94"></a> include in logs
|
|
<a id="__codelineno-0-95" name="__codelineno-0-95" href="#__codelineno-0-95"></a> [array] [choices: "general", "worker", "recorder", "recorderNetwork", "writer"
|
|
<a id="__codelineno-0-96" name="__codelineno-0-96" href="#__codelineno-0-96"></a> , "state", "redis", "storage", "text", "exclusion", "screenshots", "screencast
|
|
<a id="__codelineno-0-97" name="__codelineno-0-97" href="#__codelineno-0-97"></a> ", "originOverride", "healthcheck", "browser", "blocking", "behavior", "behavi
|
|
<a id="__codelineno-0-98" name="__codelineno-0-98" href="#__codelineno-0-98"></a> orScript", "behaviorScriptCustom", "jsError", "fetch", "pageStatus", "memorySt
|
|
<a id="__codelineno-0-99" name="__codelineno-0-99" href="#__codelineno-0-99"></a> atus", "crawlStatus", "links", "sitemap", "wacz", "replay", "proxy", "scope",
|
|
<a id="__codelineno-0-100" name="__codelineno-0-100" href="#__codelineno-0-100"></a> "robots"] [default: []]
|
|
<a id="__codelineno-0-101" name="__codelineno-0-101" href="#__codelineno-0-101"></a> --logExcludeContext Comma-separated list of contexts to
|
|
<a id="__codelineno-0-102" name="__codelineno-0-102" href="#__codelineno-0-102"></a> NOT include in logs
|
|
<a id="__codelineno-0-103" name="__codelineno-0-103" href="#__codelineno-0-103"></a> [array] [choices: "general", "worker", "recorder", "recorderNetwork", "writer"
|
|
<a id="__codelineno-0-104" name="__codelineno-0-104" href="#__codelineno-0-104"></a> , "state", "redis", "storage", "text", "exclusion", "screenshots", "screencast
|
|
<a id="__codelineno-0-105" name="__codelineno-0-105" href="#__codelineno-0-105"></a> ", "originOverride", "healthcheck", "browser", "blocking", "behavior", "behavi
|
|
<a id="__codelineno-0-106" name="__codelineno-0-106" href="#__codelineno-0-106"></a> orScript", "behaviorScriptCustom", "jsError", "fetch", "pageStatus", "memorySt
|
|
<a id="__codelineno-0-107" name="__codelineno-0-107" href="#__codelineno-0-107"></a> atus", "crawlStatus", "links", "sitemap", "wacz", "replay", "proxy", "scope",
|
|
<a id="__codelineno-0-108" name="__codelineno-0-108" href="#__codelineno-0-108"></a> "robots"] [default: ["recorderNetwork","jsError","screencast"]]
|
|
<a id="__codelineno-0-109" name="__codelineno-0-109" href="#__codelineno-0-109"></a> --text Extract initial (default) or final t
|
|
<a id="__codelineno-0-110" name="__codelineno-0-110" href="#__codelineno-0-110"></a> ext to pages.jsonl or WARC resource
|
|
<a id="__codelineno-0-111" name="__codelineno-0-111" href="#__codelineno-0-111"></a> record(s)
|
|
<a id="__codelineno-0-112" name="__codelineno-0-112" href="#__codelineno-0-112"></a> [array] [choices: "to-pages", "to-warc", "final-to-warc"]
|
|
<a id="__codelineno-0-113" name="__codelineno-0-113" href="#__codelineno-0-113"></a> --cwd Crawl working directory for captures
|
|
<a id="__codelineno-0-114" name="__codelineno-0-114" href="#__codelineno-0-114"></a> . If not set, defaults to process.cw
|
|
<a id="__codelineno-0-115" name="__codelineno-0-115" href="#__codelineno-0-115"></a> d() [string] [default: "/crawls"]
|
|
<a id="__codelineno-0-116" name="__codelineno-0-116" href="#__codelineno-0-116"></a> --mobileDevice Emulate mobile device by name from:
|
|
<a id="__codelineno-0-117" name="__codelineno-0-117" href="#__codelineno-0-117"></a> https://github.com/puppeteer/puppete
|
|
<a id="__codelineno-0-118" name="__codelineno-0-118" href="#__codelineno-0-118"></a> er/blob/main/src/common/DeviceDescri
|
|
<a id="__codelineno-0-119" name="__codelineno-0-119" href="#__codelineno-0-119"></a> ptors.ts [string]
|
|
<a id="__codelineno-0-120" name="__codelineno-0-120" href="#__codelineno-0-120"></a> --userAgent Override user-agent with specified s
|
|
<a id="__codelineno-0-121" name="__codelineno-0-121" href="#__codelineno-0-121"></a> tring [string]
|
|
<a id="__codelineno-0-122" name="__codelineno-0-122" href="#__codelineno-0-122"></a> --userAgentSuffix Append suffix to existing browser us
|
|
<a id="__codelineno-0-123" name="__codelineno-0-123" href="#__codelineno-0-123"></a> er-agent (ex: +MyCrawler, info@examp
|
|
<a id="__codelineno-0-124" name="__codelineno-0-124" href="#__codelineno-0-124"></a> le.com) [string]
|
|
<a id="__codelineno-0-125" name="__codelineno-0-125" href="#__codelineno-0-125"></a> --useSitemap, --sitemap If enabled, check for sitemaps at /s
|
|
<a id="__codelineno-0-126" name="__codelineno-0-126" href="#__codelineno-0-126"></a> itemap.xml, or custom URL if URL is
|
|
<a id="__codelineno-0-127" name="__codelineno-0-127" href="#__codelineno-0-127"></a> specified
|
|
<a id="__codelineno-0-128" name="__codelineno-0-128" href="#__codelineno-0-128"></a> --sitemapFromDate, --sitemapFrom If set, filter URLs from sitemaps to
|
|
<a id="__codelineno-0-129" name="__codelineno-0-129" href="#__codelineno-0-129"></a> those greater than or equal to (>=)
|
|
<a id="__codelineno-0-130" name="__codelineno-0-130" href="#__codelineno-0-130"></a> provided ISO Date string (YYYY-MM-D
|
|
<a id="__codelineno-0-131" name="__codelineno-0-131" href="#__codelineno-0-131"></a> D or YYYY-MM-DDTHH:MM:SS or partial
|
|
<a id="__codelineno-0-132" name="__codelineno-0-132" href="#__codelineno-0-132"></a> date) [string]
|
|
<a id="__codelineno-0-133" name="__codelineno-0-133" href="#__codelineno-0-133"></a> --sitemapToDate, --sitemapTo If set, filter URLs from sitemaps to
|
|
<a id="__codelineno-0-134" name="__codelineno-0-134" href="#__codelineno-0-134"></a> those less than or equal to (&lt;=) pr
|
|
<a id="__codelineno-0-135" name="__codelineno-0-135" href="#__codelineno-0-135"></a> ovided ISO Date string (YYYY-MM-DD o
|
|
<a id="__codelineno-0-136" name="__codelineno-0-136" href="#__codelineno-0-136"></a> r YYYY-MM-DDTHH:MM:SS or partial dat
|
|
<a id="__codelineno-0-137" name="__codelineno-0-137" href="#__codelineno-0-137"></a> e) [string]
|
|
<a id="__codelineno-0-138" name="__codelineno-0-138" href="#__codelineno-0-138"></a> --statsFilename If set, output stats as JSON to this
|
|
<a id="__codelineno-0-139" name="__codelineno-0-139" href="#__codelineno-0-139"></a> file. (Relative filename resolves t
|
|
<a id="__codelineno-0-140" name="__codelineno-0-140" href="#__codelineno-0-140"></a> o crawl working directory) [string]
|
|
<a id="__codelineno-0-141" name="__codelineno-0-141" href="#__codelineno-0-141"></a> --behaviors Which background behaviors to enable
|
|
<a id="__codelineno-0-142" name="__codelineno-0-142" href="#__codelineno-0-142"></a> on each page
|
|
<a id="__codelineno-0-143" name="__codelineno-0-143" href="#__codelineno-0-143"></a> [array] [default: ["autoplay","autofetch","autoscroll","siteSpecific"]]
|
|
<a id="__codelineno-0-144" name="__codelineno-0-144" href="#__codelineno-0-144"></a> --behaviorTimeout If >0, timeout (in seconds) for in-p
|
|
<a id="__codelineno-0-145" name="__codelineno-0-145" href="#__codelineno-0-145"></a> age behavior will run on each page.
|
|
<a id="__codelineno-0-146" name="__codelineno-0-146" href="#__codelineno-0-146"></a> If 0, a behavior can run until finis
|
|
<a id="__codelineno-0-147" name="__codelineno-0-147" href="#__codelineno-0-147"></a> h. [number] [default: 90]
|
|
<a id="__codelineno-0-148" name="__codelineno-0-148" href="#__codelineno-0-148"></a> --postLoadDelay If >0, amount of time to sleep (in s
|
|
<a id="__codelineno-0-149" name="__codelineno-0-149" href="#__codelineno-0-149"></a> econds) after page has loaded, befor
|
|
<a id="__codelineno-0-150" name="__codelineno-0-150" href="#__codelineno-0-150"></a> e taking screenshots / getting text
|
|
<a id="__codelineno-0-151" name="__codelineno-0-151" href="#__codelineno-0-151"></a> / running behaviors
|
|
<a id="__codelineno-0-152" name="__codelineno-0-152" href="#__codelineno-0-152"></a> [number] [default: 0]
|
|
<a id="__codelineno-0-153" name="__codelineno-0-153" href="#__codelineno-0-153"></a> --pageExtraDelay, --delay If >0, amount of time to sleep (in s
|
|
<a id="__codelineno-0-154" name="__codelineno-0-154" href="#__codelineno-0-154"></a> econds) after behaviors before movin
|
|
<a id="__codelineno-0-155" name="__codelineno-0-155" href="#__codelineno-0-155"></a> g on to next page
|
|
<a id="__codelineno-0-156" name="__codelineno-0-156" href="#__codelineno-0-156"></a> [number] [default: 0]
|
|
<a id="__codelineno-0-157" name="__codelineno-0-157" href="#__codelineno-0-157"></a> --profile, --loadProfile Path or HTTP(S) URL to tar.gz file w
|
|
<a id="__codelineno-0-158" name="__codelineno-0-158" href="#__codelineno-0-158"></a> hich contains the browser profile di
|
|
<a id="__codelineno-0-159" name="__codelineno-0-159" href="#__codelineno-0-159"></a> rectory [string]
|
|
<a id="__codelineno-0-160" name="__codelineno-0-160" href="#__codelineno-0-160"></a> --saveProfile If set, save profile if crawl succee
|
|
<a id="__codelineno-0-161" name="__codelineno-0-161" href="#__codelineno-0-161"></a> ded successfully. If no value provid
|
|
<a id="__codelineno-0-162" name="__codelineno-0-162" href="#__codelineno-0-162"></a> ed, save back to same location as sp
|
|
<a id="__codelineno-0-163" name="__codelineno-0-163" href="#__codelineno-0-163"></a> ecified in --profile
|
|
<a id="__codelineno-0-164" name="__codelineno-0-164" href="#__codelineno-0-164"></a> --screenshot Screenshot options for crawler, can
|
|
<a id="__codelineno-0-165" name="__codelineno-0-165" href="#__codelineno-0-165"></a> include: view, thumbnail, fullPage,
|
|
<a id="__codelineno-0-166" name="__codelineno-0-166" href="#__codelineno-0-166"></a> fullPageFinal
|
|
<a id="__codelineno-0-167" name="__codelineno-0-167" href="#__codelineno-0-167"></a> [array] [choices: "view", "thumbnail", "fullPage", "fullPageFinal"] [default:
|
|
<a id="__codelineno-0-168" name="__codelineno-0-168" href="#__codelineno-0-168"></a> []]
|
|
<a id="__codelineno-0-169" name="__codelineno-0-169" href="#__codelineno-0-169"></a> --screencastPort If set to a non-zero value, starts a
|
|
<a id="__codelineno-0-170" name="__codelineno-0-170" href="#__codelineno-0-170"></a> n HTTP server with screencast access
|
|
<a id="__codelineno-0-171" name="__codelineno-0-171" href="#__codelineno-0-171"></a> ible on this port
|
|
<a id="__codelineno-0-172" name="__codelineno-0-172" href="#__codelineno-0-172"></a> [number] [default: 0]
|
|
<a id="__codelineno-0-173" name="__codelineno-0-173" href="#__codelineno-0-173"></a> --screencastRedis If set, will use the state store red
|
|
<a id="__codelineno-0-174" name="__codelineno-0-174" href="#__codelineno-0-174"></a> is pubsub for screencasting. Require
|
|
<a id="__codelineno-0-175" name="__codelineno-0-175" href="#__codelineno-0-175"></a> s --redisStoreUrl to be set
|
|
<a id="__codelineno-0-176" name="__codelineno-0-176" href="#__codelineno-0-176"></a> [boolean] [default: false]
|
|
<a id="__codelineno-0-177" name="__codelineno-0-177" href="#__codelineno-0-177"></a> --warcInfo, --warcinfo Optional fields added to the warcinf
|
|
<a id="__codelineno-0-178" name="__codelineno-0-178" href="#__codelineno-0-178"></a> o record in combined WARCs
|
|
<a id="__codelineno-0-179" name="__codelineno-0-179" href="#__codelineno-0-179"></a> --redisStoreUrl If set, url for remote redis server
|
|
<a id="__codelineno-0-180" name="__codelineno-0-180" href="#__codelineno-0-180"></a> to store state. Otherwise, using loc
|
|
<a id="__codelineno-0-181" name="__codelineno-0-181" href="#__codelineno-0-181"></a> al redis instance
|
|
<a id="__codelineno-0-182" name="__codelineno-0-182" href="#__codelineno-0-182"></a> [string] [default: "redis://localhost:6379/0"]
|
|
<a id="__codelineno-0-183" name="__codelineno-0-183" href="#__codelineno-0-183"></a> --saveState If the crawl state should be seriali
|
|
<a id="__codelineno-0-184" name="__codelineno-0-184" href="#__codelineno-0-184"></a> zed to the crawls/ directory. Defaul
|
|
<a id="__codelineno-0-185" name="__codelineno-0-185" href="#__codelineno-0-185"></a> ts to 'partial', only saved when cra
|
|
<a id="__codelineno-0-186" name="__codelineno-0-186" href="#__codelineno-0-186"></a> wl is interrupted
|
|
<a id="__codelineno-0-187" name="__codelineno-0-187" href="#__codelineno-0-187"></a> [string] [choices: "never", "partial", "always"] [default: "partial"]
|
|
<a id="__codelineno-0-188" name="__codelineno-0-188" href="#__codelineno-0-188"></a> --saveStateInterval If save state is set to 'always', al
|
|
<a id="__codelineno-0-189" name="__codelineno-0-189" href="#__codelineno-0-189"></a> so save state during the crawl at th
|
|
<a id="__codelineno-0-190" name="__codelineno-0-190" href="#__codelineno-0-190"></a> is interval (in seconds)
|
|
<a id="__codelineno-0-191" name="__codelineno-0-191" href="#__codelineno-0-191"></a> [number] [default: 300]
|
|
<a id="__codelineno-0-192" name="__codelineno-0-192" href="#__codelineno-0-192"></a> --saveStateHistory Number of save states to keep during
|
|
<a id="__codelineno-0-193" name="__codelineno-0-193" href="#__codelineno-0-193"></a> the duration of a crawl
|
|
<a id="__codelineno-0-194" name="__codelineno-0-194" href="#__codelineno-0-194"></a> [number] [default: 5]
|
|
<a id="__codelineno-0-195" name="__codelineno-0-195" href="#__codelineno-0-195"></a> --sizeLimit If set, save state and exit if size
|
|
<a id="__codelineno-0-196" name="__codelineno-0-196" href="#__codelineno-0-196"></a> limit exceeds this value
|
|
<a id="__codelineno-0-197" name="__codelineno-0-197" href="#__codelineno-0-197"></a> [number] [default: 0]
|
|
<a id="__codelineno-0-198" name="__codelineno-0-198" href="#__codelineno-0-198"></a> --diskUtilization If set, save state and exit if disk
|
|
<a id="__codelineno-0-199" name="__codelineno-0-199" href="#__codelineno-0-199"></a> utilization exceeds this percentage
|
|
<a id="__codelineno-0-200" name="__codelineno-0-200" href="#__codelineno-0-200"></a> value [number] [default: 0]
|
|
<a id="__codelineno-0-201" name="__codelineno-0-201" href="#__codelineno-0-201"></a> --timeLimit If set, save state and exit after ti
|
|
<a id="__codelineno-0-202" name="__codelineno-0-202" href="#__codelineno-0-202"></a> me limit, in seconds
|
|
<a id="__codelineno-0-203" name="__codelineno-0-203" href="#__codelineno-0-203"></a> [number] [default: 0]
|
|
<a id="__codelineno-0-204" name="__codelineno-0-204" href="#__codelineno-0-204"></a> --healthCheckPort port to run healthcheck on
|
|
<a id="__codelineno-0-205" name="__codelineno-0-205" href="#__codelineno-0-205"></a> [number] [default: 0]
|
|
<a id="__codelineno-0-206" name="__codelineno-0-206" href="#__codelineno-0-206"></a> --overwrite overwrite current crawl data: if set
|
|
<a id="__codelineno-0-207" name="__codelineno-0-207" href="#__codelineno-0-207"></a> , existing collection directory will
|
|
<a id="__codelineno-0-208" name="__codelineno-0-208" href="#__codelineno-0-208"></a> be deleted before crawl is started
|
|
<a id="__codelineno-0-209" name="__codelineno-0-209" href="#__codelineno-0-209"></a> [boolean] [default: false]
|
|
<a id="__codelineno-0-210" name="__codelineno-0-210" href="#__codelineno-0-210"></a> --waitOnDone if set, wait for interrupt signal wh
|
|
<a id="__codelineno-0-211" name="__codelineno-0-211" href="#__codelineno-0-211"></a> en finished instead of exiting
|
|
<a id="__codelineno-0-212" name="__codelineno-0-212" href="#__codelineno-0-212"></a> [boolean] [default: false]
|
|
<a id="__codelineno-0-213" name="__codelineno-0-213" href="#__codelineno-0-213"></a> --restartsOnError if set, assume will be restarted if
|
|
<a id="__codelineno-0-214" name="__codelineno-0-214" href="#__codelineno-0-214"></a> interrupted, don't run post-crawl pr
|
|
<a id="__codelineno-0-215" name="__codelineno-0-215" href="#__codelineno-0-215"></a> ocesses on interrupt
|
|
<a id="__codelineno-0-216" name="__codelineno-0-216" href="#__codelineno-0-216"></a> [boolean] [default: false]
|
|
<a id="__codelineno-0-217" name="__codelineno-0-217" href="#__codelineno-0-217"></a> --netIdleWait number of seconds to wait for networ
|
|
<a id="__codelineno-0-218" name="__codelineno-0-218" href="#__codelineno-0-218"></a> k idle after page load and after beh
|
|
<a id="__codelineno-0-219" name="__codelineno-0-219" href="#__codelineno-0-219"></a> aviors are done (default: 2)
|
|
<a id="__codelineno-0-220" name="__codelineno-0-220" href="#__codelineno-0-220"></a> [number] [default: 2]
|
|
<a id="__codelineno-0-221" name="__codelineno-0-221" href="#__codelineno-0-221"></a> --netIdleMaxRequests max active requests allowed for netw
|
|
<a id="__codelineno-0-222" name="__codelineno-0-222" href="#__codelineno-0-222"></a> ork to be considered idle
|
|
<a id="__codelineno-0-223" name="__codelineno-0-223" href="#__codelineno-0-223"></a> [default: 1]
|
|
<a id="__codelineno-0-224" name="__codelineno-0-224" href="#__codelineno-0-224"></a> --lang if set, sets the language used by th
|
|
<a id="__codelineno-0-225" name="__codelineno-0-225" href="#__codelineno-0-225"></a> e browser, should be ISO 639 languag
|
|
<a id="__codelineno-0-226" name="__codelineno-0-226" href="#__codelineno-0-226"></a> e[-country] code [string]
|
|
<a id="__codelineno-0-227" name="__codelineno-0-227" href="#__codelineno-0-227"></a> --title If set, write supplied title into WA
|
|
<a id="__codelineno-0-228" name="__codelineno-0-228" href="#__codelineno-0-228"></a> CZ datapackage.json metadata[string]
|
|
<a id="__codelineno-0-229" name="__codelineno-0-229" href="#__codelineno-0-229"></a> --description, --desc If set, write supplied description i
|
|
<a id="__codelineno-0-230" name="__codelineno-0-230" href="#__codelineno-0-230"></a> nto WACZ datapackage.json metadata
|
|
<a id="__codelineno-0-231" name="__codelineno-0-231" href="#__codelineno-0-231"></a> [string]
|
|
<a id="__codelineno-0-232" name="__codelineno-0-232" href="#__codelineno-0-232"></a> --originOverride if set, will redirect requests from
|
|
<a id="__codelineno-0-233" name="__codelineno-0-233" href="#__codelineno-0-233"></a> each origin in key to origin in the
|
|
<a id="__codelineno-0-234" name="__codelineno-0-234" href="#__codelineno-0-234"></a> value, eg. --originOverride https://
|
|
<a id="__codelineno-0-235" name="__codelineno-0-235" href="#__codelineno-0-235"></a> host:port=http://alt-host:alt-port
|
|
<a id="__codelineno-0-236" name="__codelineno-0-236" href="#__codelineno-0-236"></a> [array] [default: []]
|
|
<a id="__codelineno-0-237" name="__codelineno-0-237" href="#__codelineno-0-237"></a> --logErrorsToRedis If set, write error messages to redi
|
|
<a id="__codelineno-0-238" name="__codelineno-0-238" href="#__codelineno-0-238"></a> s [boolean] [default: false]
|
|
<a id="__codelineno-0-239" name="__codelineno-0-239" href="#__codelineno-0-239"></a> --logBehaviorsToRedis If set, write behavior script messag
|
|
<a id="__codelineno-0-240" name="__codelineno-0-240" href="#__codelineno-0-240"></a> es to redis
|
|
<a id="__codelineno-0-241" name="__codelineno-0-241" href="#__codelineno-0-241"></a> [boolean] [default: false]
|
|
<a id="__codelineno-0-242" name="__codelineno-0-242" href="#__codelineno-0-242"></a> --writePagesToRedis If set, write page objects to redis
|
|
<a id="__codelineno-0-243" name="__codelineno-0-243" href="#__codelineno-0-243"></a> [boolean] [default: false]
|
|
<a id="__codelineno-0-244" name="__codelineno-0-244" href="#__codelineno-0-244"></a> --maxPageRetries, --retries If set, number of times to retry a p
|
|
<a id="__codelineno-0-245" name="__codelineno-0-245" href="#__codelineno-0-245"></a> age that failed to load before page
|
|
<a id="__codelineno-0-246" name="__codelineno-0-246" href="#__codelineno-0-246"></a> is considered to have failed
|
|
<a id="__codelineno-0-247" name="__codelineno-0-247" href="#__codelineno-0-247"></a> [number] [default: 2]
|
|
<a id="__codelineno-0-248" name="__codelineno-0-248" href="#__codelineno-0-248"></a> --failOnFailedSeed If set, crawler will fail with exit
|
|
<a id="__codelineno-0-249" name="__codelineno-0-249" href="#__codelineno-0-249"></a> code 1 if any seed fails. When combi
|
|
<a id="__codelineno-0-250" name="__codelineno-0-250" href="#__codelineno-0-250"></a> ned with --failOnInvalidStatus, will
|
|
<a id="__codelineno-0-251" name="__codelineno-0-251" href="#__codelineno-0-251"></a> result in crawl failing with exit co
|
|
<a id="__codelineno-0-252" name="__codelineno-0-252" href="#__codelineno-0-252"></a> de 1 if any seed has a 4xx/5xx respo
|
|
<a id="__codelineno-0-253" name="__codelineno-0-253" href="#__codelineno-0-253"></a> nse [boolean] [default: false]
|
|
<a id="__codelineno-0-254" name="__codelineno-0-254" href="#__codelineno-0-254"></a> --failOnFailedLimit If set, save state and exit if numbe
|
|
<a id="__codelineno-0-255" name="__codelineno-0-255" href="#__codelineno-0-255"></a> r of failed pages exceeds this value
|
|
<a id="__codelineno-0-256" name="__codelineno-0-256" href="#__codelineno-0-256"></a> [number] [default: 0]
|
|
<a id="__codelineno-0-257" name="__codelineno-0-257" href="#__codelineno-0-257"></a> --failOnInvalidStatus If set, will treat pages with 4xx or
|
|
<a id="__codelineno-0-258" name="__codelineno-0-258" href="#__codelineno-0-258"></a> 5xx response as failures. When comb
|
|
<a id="__codelineno-0-259" name="__codelineno-0-259" href="#__codelineno-0-259"></a> ined with --failOnFailedLimit or --f
|
|
<a id="__codelineno-0-260" name="__codelineno-0-260" href="#__codelineno-0-260"></a> ailOnFailedSeed may result in crawl
|
|
<a id="__codelineno-0-261" name="__codelineno-0-261" href="#__codelineno-0-261"></a> failing due to non-200 responses
|
|
<a id="__codelineno-0-262" name="__codelineno-0-262" href="#__codelineno-0-262"></a> [boolean] [default: false]
|
|
<a id="__codelineno-0-263" name="__codelineno-0-263" href="#__codelineno-0-263"></a> --failOnContentCheck If set, allows for behaviors to fail
|
|
<a id="__codelineno-0-264" name="__codelineno-0-264" href="#__codelineno-0-264"></a> a crawl with custom reason based on
|
|
<a id="__codelineno-0-265" name="__codelineno-0-265" href="#__codelineno-0-265"></a> content (e.g. logged out)
|
|
<a id="__codelineno-0-266" name="__codelineno-0-266" href="#__codelineno-0-266"></a> [boolean] [default: false]
|
|
<a id="__codelineno-0-267" name="__codelineno-0-267" href="#__codelineno-0-267"></a> --customBehaviors Custom behavior files to inject. Val
|
|
<a id="__codelineno-0-268" name="__codelineno-0-268" href="#__codelineno-0-268"></a> id values: URL to file, path to file
|
|
<a id="__codelineno-0-269" name="__codelineno-0-269" href="#__codelineno-0-269"></a> , path to directory of behaviors, UR
|
|
<a id="__codelineno-0-270" name="__codelineno-0-270" href="#__codelineno-0-270"></a> L to Git repo of behaviors (prefixed
|
|
<a id="__codelineno-0-271" name="__codelineno-0-271" href="#__codelineno-0-271"></a> with git+, optionally specify branc
|
|
<a id="__codelineno-0-272" name="__codelineno-0-272" href="#__codelineno-0-272"></a> h and relative path to a directory w
|
|
<a id="__codelineno-0-273" name="__codelineno-0-273" href="#__codelineno-0-273"></a> ithin repo as branch and path query
|
|
<a id="__codelineno-0-274" name="__codelineno-0-274" href="#__codelineno-0-274"></a> parameters, e.g. --customBehaviors "
|
|
<a id="__codelineno-0-275" name="__codelineno-0-275" href="#__codelineno-0-275"></a> git+https://git.example.com/repo.git
|
|
<a id="__codelineno-0-276" name="__codelineno-0-276" href="#__codelineno-0-276"></a> ?branch=dev&path=some/dir"
|
|
<a id="__codelineno-0-277" name="__codelineno-0-277" href="#__codelineno-0-277"></a> [array] [default: []]
|
|
<a id="__codelineno-0-278" name="__codelineno-0-278" href="#__codelineno-0-278"></a> --saveStorage if set, will store the localStorage/
|
|
<a id="__codelineno-0-279" name="__codelineno-0-279" href="#__codelineno-0-279"></a> sessionStorage data for each page as
|
|
<a id="__codelineno-0-280" name="__codelineno-0-280" href="#__codelineno-0-280"></a> part of WARC-JSON-Metadata field
|
|
<a id="__codelineno-0-281" name="__codelineno-0-281" href="#__codelineno-0-281"></a> [boolean]
|
|
<a id="__codelineno-0-282" name="__codelineno-0-282" href="#__codelineno-0-282"></a> --debugAccessRedis if set, runs internal redis without
|
|
<a id="__codelineno-0-283" name="__codelineno-0-283" href="#__codelineno-0-283"></a> protected mode to allow external acc
|
|
<a id="__codelineno-0-284" name="__codelineno-0-284" href="#__codelineno-0-284"></a> ess (for debugging) [boolean]
|
|
<a id="__codelineno-0-285" name="__codelineno-0-285" href="#__codelineno-0-285"></a> --debugAccessBrowser if set, allow debugging browser on p
|
|
<a id="__codelineno-0-286" name="__codelineno-0-286" href="#__codelineno-0-286"></a> ort 9222 via CDP [boolean]
|
|
<a id="__codelineno-0-287" name="__codelineno-0-287" href="#__codelineno-0-287"></a> --warcPrefix prefix for WARC files generated, inc
|
|
<a id="__codelineno-0-288" name="__codelineno-0-288" href="#__codelineno-0-288"></a> luding WARCs added to WACZ [string]
|
|
<a id="__codelineno-0-289" name="__codelineno-0-289" href="#__codelineno-0-289"></a> --serviceWorker, --sw service worker handling: disabled, e
|
|
<a id="__codelineno-0-290" name="__codelineno-0-290" href="#__codelineno-0-290"></a> nabled, or disabled with custom prof
|
|
<a id="__codelineno-0-291" name="__codelineno-0-291" href="#__codelineno-0-291"></a> ile
|
|
<a id="__codelineno-0-292" name="__codelineno-0-292" href="#__codelineno-0-292"></a> [choices: "disabled", "disabled-if-profile", "enabled"] [default: "disabled"]
|
|
<a id="__codelineno-0-293" name="__codelineno-0-293" href="#__codelineno-0-293"></a> --proxyServer if set, will use specified proxy ser
|
|
<a id="__codelineno-0-294" name="__codelineno-0-294" href="#__codelineno-0-294"></a> ver. Takes precedence over any env v
|
|
<a id="__codelineno-0-295" name="__codelineno-0-295" href="#__codelineno-0-295"></a> ar proxy settings [string]
|
|
<a id="__codelineno-0-296" name="__codelineno-0-296" href="#__codelineno-0-296"></a> --proxyServerPreferSingleProxy if set, and both proxyServer and pro
|
|
<a id="__codelineno-0-297" name="__codelineno-0-297" href="#__codelineno-0-297"></a> xyServerConfig are provided, the pro
|
|
<a id="__codelineno-0-298" name="__codelineno-0-298" href="#__codelineno-0-298"></a> xyServer value will be preferred
|
|
<a id="__codelineno-0-299" name="__codelineno-0-299" href="#__codelineno-0-299"></a> [boolean] [default: false]
|
|
<a id="__codelineno-0-300" name="__codelineno-0-300" href="#__codelineno-0-300"></a> --proxyServerConfig if set, path to yaml/json file that
|
|
<a id="__codelineno-0-301" name="__codelineno-0-301" href="#__codelineno-0-301"></a> configures multiple proxy servers per
|
|
<a id="__codelineno-0-302" name="__codelineno-0-302" href="#__codelineno-0-302"></a> URL regex [string]
|
|
<a id="__codelineno-0-303" name="__codelineno-0-303" href="#__codelineno-0-303"></a> --dryRun If true, no archive data is written
|
|
<a id="__codelineno-0-304" name="__codelineno-0-304" href="#__codelineno-0-304"></a> to disk, only pages and logs (and op
|
|
<a id="__codelineno-0-305" name="__codelineno-0-305" href="#__codelineno-0-305"></a> tionally saved state). [boolean]
|
|
<a id="__codelineno-0-306" name="__codelineno-0-306" href="#__codelineno-0-306"></a> --qaSource Required for QA mode. Source (WACZ o
|
|
<a id="__codelineno-0-307" name="__codelineno-0-307" href="#__codelineno-0-307"></a> r multi WACZ) for QA [string]
|
|
<a id="__codelineno-0-308" name="__codelineno-0-308" href="#__codelineno-0-308"></a> --qaDebugImageDiff if specified, will write crawl.png,
|
|
<a id="__codelineno-0-309" name="__codelineno-0-309" href="#__codelineno-0-309"></a> replay.png and diff.png for each pag
|
|
<a id="__codelineno-0-310" name="__codelineno-0-310" href="#__codelineno-0-310"></a> e where they're different [boolean]
|
|
<a id="__codelineno-0-311" name="__codelineno-0-311" href="#__codelineno-0-311"></a> --sshProxyPrivateKeyFile path to SSH private key for SOCKS5 o
|
|
<a id="__codelineno-0-312" name="__codelineno-0-312" href="#__codelineno-0-312"></a> ver SSH proxy connection [string]
|
|
<a id="__codelineno-0-313" name="__codelineno-0-313" href="#__codelineno-0-313"></a> --sshProxyKnownHostsFile path to SSH known hosts file for SOC
|
|
<a id="__codelineno-0-314" name="__codelineno-0-314" href="#__codelineno-0-314"></a> KS5 over SSH proxy connection
|
|
<a id="__codelineno-0-315" name="__codelineno-0-315" href="#__codelineno-0-315"></a> [string]
|
|
<a id="__codelineno-0-316" name="__codelineno-0-316" href="#__codelineno-0-316"></a> --extraChromeArgs Extra arguments to pass directly to
|
|
<a id="__codelineno-0-317" name="__codelineno-0-317" href="#__codelineno-0-317"></a> the Chrome instance (space-separated
|
|
<a id="__codelineno-0-318" name="__codelineno-0-318" href="#__codelineno-0-318"></a> or multiple --extraChromeArgs)
|
|
<a id="__codelineno-0-319" name="__codelineno-0-319" href="#__codelineno-0-319"></a> [array] [default: []]
|
|
<a id="__codelineno-0-320" name="__codelineno-0-320" href="#__codelineno-0-320"></a> --useRobots, --robots If set, fetch and respect page disal
|
|
<a id="__codelineno-0-321" name="__codelineno-0-321" href="#__codelineno-0-321"></a> lows specified in per-host robots.tx
|
|
<a id="__codelineno-0-322" name="__codelineno-0-322" href="#__codelineno-0-322"></a> t [boolean] [default: false]
|
|
<a id="__codelineno-0-323" name="__codelineno-0-323" href="#__codelineno-0-323"></a> --robotsAgent Agent to check in addition to '*' fo
|
|
<a id="__codelineno-0-324" name="__codelineno-0-324" href="#__codelineno-0-324"></a> r robots rules
|
|
<a id="__codelineno-0-325" name="__codelineno-0-325" href="#__codelineno-0-325"></a> [string] [default: "Browsertrix/1.x"]
|
|
<a id="__codelineno-0-326" name="__codelineno-0-326" href="#__codelineno-0-326"></a> --config Path to YAML config file
|
|
</code></pre></div>
|
|
<h2 id="create-login-profile">create-login-profile<a class="headerlink" href="#create-login-profile" title="Permanent link">¶</a></h2>
|
|
<div class="highlight"><pre><span></span><code><a id="__codelineno-1-1" name="__codelineno-1-1" href="#__codelineno-1-1"></a>Options:
|
|
<a id="__codelineno-1-2" name="__codelineno-1-2" href="#__codelineno-1-2"></a> --help Show help [boolean]
|
|
<a id="__codelineno-1-3" name="__codelineno-1-3" href="#__codelineno-1-3"></a> --version Show version number [boolean]
|
|
<a id="__codelineno-1-4" name="__codelineno-1-4" href="#__codelineno-1-4"></a> --url The URL of the login page [string] [required]
|
|
<a id="__codelineno-1-5" name="__codelineno-1-5" href="#__codelineno-1-5"></a> --user The username for the login. If not specified, will b
|
|
<a id="__codelineno-1-6" name="__codelineno-1-6" href="#__codelineno-1-6"></a> e prompted [string]
|
|
<a id="__codelineno-1-7" name="__codelineno-1-7" href="#__codelineno-1-7"></a> --password The password for the login. If not specified, will b
|
|
<a id="__codelineno-1-8" name="__codelineno-1-8" href="#__codelineno-1-8"></a> e prompted (recommended) [string]
|
|
<a id="__codelineno-1-9" name="__codelineno-1-9" href="#__codelineno-1-9"></a> --filename The filename for the profile tarball, stored within
|
|
<a id="__codelineno-1-10" name="__codelineno-1-10" href="#__codelineno-1-10"></a> /crawls/profiles if absolute path not provided
|
|
<a id="__codelineno-1-11" name="__codelineno-1-11" href="#__codelineno-1-11"></a> [string] [default: "/crawls/profiles/profile.tar.gz"]
|
|
<a id="__codelineno-1-12" name="__codelineno-1-12" href="#__codelineno-1-12"></a> --debugScreenshot If specified, take a screenshot after login and save
|
|
<a id="__codelineno-1-13" name="__codelineno-1-13" href="#__codelineno-1-13"></a> as this filename [boolean] [default: false]
|
|
<a id="__codelineno-1-14" name="__codelineno-1-14" href="#__codelineno-1-14"></a> --headless Run in headless mode, otherwise start xvfb
|
|
<a id="__codelineno-1-15" name="__codelineno-1-15" href="#__codelineno-1-15"></a> [boolean] [default: false]
|
|
<a id="__codelineno-1-16" name="__codelineno-1-16" href="#__codelineno-1-16"></a> --automated Start in automated mode, no interactive browser
|
|
<a id="__codelineno-1-17" name="__codelineno-1-17" href="#__codelineno-1-17"></a> [boolean] [default: false]
|
|
<a id="__codelineno-1-18" name="__codelineno-1-18" href="#__codelineno-1-18"></a> --interactive Deprecated. Now the default option!
|
|
<a id="__codelineno-1-19" name="__codelineno-1-19" href="#__codelineno-1-19"></a> [boolean] [default: false]
|
|
<a id="__codelineno-1-20" name="__codelineno-1-20" href="#__codelineno-1-20"></a> --shutdownWait Shutdown browser in interactive after this many seco
|
|
<a id="__codelineno-1-21" name="__codelineno-1-21" href="#__codelineno-1-21"></a> nds, if no pings received [number] [default: 0]
|
|
<a id="__codelineno-1-22" name="__codelineno-1-22" href="#__codelineno-1-22"></a> --profile Path or HTTP(S) URL to tar.gz file which contains th
|
|
<a id="__codelineno-1-23" name="__codelineno-1-23" href="#__codelineno-1-23"></a> e browser profile directory [string] [default: ""]
|
|
<a id="__codelineno-1-24" name="__codelineno-1-24" href="#__codelineno-1-24"></a> --windowSize Browser window dimensions, specified as: width,heigh
|
|
<a id="__codelineno-1-25" name="__codelineno-1-25" href="#__codelineno-1-25"></a> t [string] [default: "1360,1020"]
|
|
<a id="__codelineno-1-26" name="__codelineno-1-26" href="#__codelineno-1-26"></a> --cookieDays If >0, set all cookies, including session cookies, t
|
|
<a id="__codelineno-1-27" name="__codelineno-1-27" href="#__codelineno-1-27"></a> o have this duration in days before saving profile
|
|
<a id="__codelineno-1-28" name="__codelineno-1-28" href="#__codelineno-1-28"></a> [number] [default: 7]
|
|
<a id="__codelineno-1-29" name="__codelineno-1-29" href="#__codelineno-1-29"></a> --proxyServer if set, will use specified proxy server. Takes prece
|
|
<a id="__codelineno-1-30" name="__codelineno-1-30" href="#__codelineno-1-30"></a> dence over any env var proxy settings [string]
|
|
<a id="__codelineno-1-31" name="__codelineno-1-31" href="#__codelineno-1-31"></a> --proxyServerConfig if set, path to yaml/json file that configures multi
|
|
<a id="__codelineno-1-32" name="__codelineno-1-32" href="#__codelineno-1-32"></a> ple proxy servers per URL regex [string]
|
|
<a id="__codelineno-1-33" name="__codelineno-1-33" href="#__codelineno-1-33"></a> --sshProxyPrivateKeyFile path to SSH private key for SOCKS5 over SSH proxy co
|
|
<a id="__codelineno-1-34" name="__codelineno-1-34" href="#__codelineno-1-34"></a> nnection [string]
|
|
<a id="__codelineno-1-35" name="__codelineno-1-35" href="#__codelineno-1-35"></a> --sshProxyKnownHostsFile path to SSH known hosts file for SOCKS5 over SSH pro
|
|
<a id="__codelineno-1-36" name="__codelineno-1-36" href="#__codelineno-1-36"></a> xy connection [string]
|
|
</code></pre></div>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
</article>
|
|
</div>
|
|
|
|
|
|
<script>
  // Look up the element whose id matches the URL fragment (without the leading "#").
  // If such an element exists and has a non-empty `name`, set its `checked` property
  // to whether that name starts with "__tabbed_" (presumably the inputs backing
  // content tabs, so a deep link selects the tab it points at).
  var target = document.getElementById(location.hash.slice(1));
  if (target && target.name) {
    target.checked = target.name.startsWith("__tabbed_");
  }
</script>
|
|
</div>
|
|
|
|
</main>
|
|
|
|
<footer class="md-footer">
|
|
|
|
|
|
|
|
<nav class="md-footer__inner md-grid" aria-label="Footer" >
|
|
|
|
|
|
<a href="../qa/" class="md-footer__link md-footer__link--prev" aria-label="Previous: Quality Assurance">
|
|
<div class="md-footer__button md-icon">
|
|
|
|
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M20 11v2H8l5.5 5.5-1.42 1.42L4.16 12l7.92-7.92L13.5 5.5 8 11z"/></svg>
|
|
</div>
|
|
<div class="md-footer__title">
|
|
<span class="md-footer__direction">
|
|
Previous
|
|
</span>
|
|
<div class="md-ellipsis">
|
|
Quality Assurance
|
|
</div>
|
|
</div>
|
|
</a>
|
|
|
|
|
|
</nav>
|
|
|
|
|
|
<div class="md-footer-meta md-typeset">
|
|
<div class="md-footer-meta__inner md-grid">
|
|
<div class="md-copyright">
|
|
|
|
<div class="md-copyright__highlight">
|
|
Creative Commons Attribution 4.0 International (CC BY 4.0)
|
|
</div>
|
|
|
|
|
|
</div>
|
|
|
|
|
|
<div class="md-social">
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<a href="https://webrecorder.net" target="_blank" rel="noopener" title="webrecorder.net" class="md-social__link">
|
|
<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-globe" viewBox="0 0 16 16">
|
|
<path d="M0 8a8 8 0 1 1 16 0A8 8 0 0 1 0 8zm7.5-6.923c-.67.204-1.335.82-1.887 1.855A7.97 7.97 0 0 0 5.145 4H7.5V1.077zM4.09 4a9.267 9.267 0 0 1 .64-1.539 6.7 6.7 0 0 1 .597-.933A7.025 7.025 0 0 0 2.255 4H4.09zm-.582 3.5c.03-.877.138-1.718.312-2.5H1.674a6.958 6.958 0 0 0-.656 2.5h2.49zM4.847 5a12.5 12.5 0 0 0-.338 2.5H7.5V5H4.847zM8.5 5v2.5h2.99a12.495 12.495 0 0 0-.337-2.5H8.5zM4.51 8.5a12.5 12.5 0 0 0 .337 2.5H7.5V8.5H4.51zm3.99 0V11h2.653c.187-.765.306-1.608.338-2.5H8.5zM5.145 12c.138.386.295.744.468 1.068.552 1.035 1.218 1.65 1.887 1.855V12H5.145zm.182 2.472a6.696 6.696 0 0 1-.597-.933A9.268 9.268 0 0 1 4.09 12H2.255a7.024 7.024 0 0 0 3.072 2.472zM3.82 11a13.652 13.652 0 0 1-.312-2.5h-2.49c.062.89.291 1.733.656 2.5H3.82zm6.853 3.472A7.024 7.024 0 0 0 13.745 12H11.91a9.27 9.27 0 0 1-.64 1.539 6.688 6.688 0 0 1-.597.933zM8.5 12v2.923c.67-.204 1.335-.82 1.887-1.855.173-.324.33-.682.468-1.068H8.5zm3.68-1h2.146c.365-.767.594-1.61.656-2.5h-2.49a13.65 13.65 0 0 1-.312 2.5zm2.802-3.5a6.959 6.959 0 0 0-.656-2.5H12.18c.174.782.282 1.623.312 2.5h2.49zM11.27 2.461c.247.464.462.98.64 1.539h1.835a7.024 7.024 0 0 0-3.072-2.472c.218.284.418.598.597.933zM10.855 4a7.966 7.966 0 0 0-.468-1.068C9.835 1.897 9.17 1.282 8.5 1.077V4h2.355z"/>
|
|
</svg>
|
|
</a>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<a href="https://forum.webrecorder.net/" target="_blank" rel="noopener" title="forum.webrecorder.net" class="md-social__link">
|
|
<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-chat-left-text-fill" viewBox="0 0 16 16">
|
|
<path d="M0 2a2 2 0 0 1 2-2h12a2 2 0 0 1 2 2v8a2 2 0 0 1-2 2H4.414a1 1 0 0 0-.707.293L.854 15.146A.5.5 0 0 1 0 14.793V2zm3.5 1a.5.5 0 0 0 0 1h9a.5.5 0 0 0 0-1h-9zm0 2.5a.5.5 0 0 0 0 1h9a.5.5 0 0 0 0-1h-9zm0 2.5a.5.5 0 0 0 0 1h5a.5.5 0 0 0 0-1h-5z"/>
|
|
</svg>
|
|
</a>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<a href="https://digipres.club/@webrecorder" target="_blank" rel="noopener me" title="digipres.club" class="md-social__link">
|
|
<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-mastodon" viewBox="0 0 16 16">
|
|
<path d="M11.19 12.195c2.016-.24 3.77-1.475 3.99-2.603.348-1.778.32-4.339.32-4.339 0-3.47-2.286-4.488-2.286-4.488C12.062.238 10.083.017 8.027 0h-.05C5.92.017 3.942.238 2.79.765c0 0-2.285 1.017-2.285 4.488l-.002.662c-.004.64-.007 1.35.011 2.091.083 3.394.626 6.74 3.78 7.57 1.454.383 2.703.463 3.709.408 1.823-.1 2.847-.647 2.847-.647l-.06-1.317s-1.303.41-2.767.36c-1.45-.05-2.98-.156-3.215-1.928a3.614 3.614 0 0 1-.033-.496s1.424.346 3.228.428c1.103.05 2.137-.064 3.188-.189zm1.613-2.47H11.13v-4.08c0-.859-.364-1.295-1.091-1.295-.804 0-1.207.517-1.207 1.541v2.233H7.168V5.89c0-1.024-.403-1.541-1.207-1.541-.727 0-1.091.436-1.091 1.296v4.079H3.197V5.522c0-.859.22-1.541.66-2.046.456-.505 1.052-.764 1.793-.764.856 0 1.504.328 1.933.983L8 4.39l.417-.695c.429-.655 1.077-.983 1.934-.983.74 0 1.336.259 1.791.764.442.505.661 1.187.661 2.046v4.203z"/>
|
|
</svg>
|
|
</a>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<a href="https://www.youtube.com/@webrecorder" target="_blank" rel="noopener" title="www.youtube.com" class="md-social__link">
|
|
<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-youtube" viewBox="0 0 16 16">
|
|
<path d="M8.051 1.999h.089c.822.003 4.987.033 6.11.335a2.01 2.01 0 0 1 1.415 1.42c.101.38.172.883.22 1.402l.01.104.022.26.008.104c.065.914.073 1.77.074 1.957v.075c-.001.194-.01 1.108-.082 2.06l-.008.105-.009.104c-.05.572-.124 1.14-.235 1.558a2.007 2.007 0 0 1-1.415 1.42c-1.16.312-5.569.334-6.18.335h-.142c-.309 0-1.587-.006-2.927-.052l-.17-.006-.087-.004-.171-.007-.171-.007c-1.11-.049-2.167-.128-2.654-.26a2.007 2.007 0 0 1-1.415-1.419c-.111-.417-.185-.986-.235-1.558L.09 9.82l-.008-.104A31.4 31.4 0 0 1 0 7.68v-.123c.002-.215.01-.958.064-1.778l.007-.103.003-.052.008-.104.022-.26.01-.104c.048-.519.119-1.023.22-1.402a2.007 2.007 0 0 1 1.415-1.42c.487-.13 1.544-.21 2.654-.26l.17-.007.172-.006.086-.003.171-.007A99.788 99.788 0 0 1 7.858 2h.193zM6.4 5.209v4.818l4.157-2.408L6.4 5.209z"/>
|
|
</svg>
|
|
</a>
|
|
|
|
</div>
|
|
|
|
</div>
|
|
</div>
|
|
</footer>
|
|
|
|
</div>
|
|
<div class="md-dialog" data-md-component="dialog">
|
|
<div class="md-dialog__inner md-typeset"></div>
|
|
</div>
|
|
|
|
|
|
|
|
|
|
|
|
<script id="__config" type="application/json">{"annotate": null, "base": "../..", "features": ["navigation.sections", "navigation.tabs", "navigation.tabs.sticky", "navigation.instant", "navigation.tracking", "navigation.indexes", "navigation.footer", "content.code.copy", "content.action.edit", "content.tooltips", "search.suggest"], "search": "../../assets/javascripts/workers/search.7a47a382.min.js", "tags": null, "translations": {"clipboard.copied": "Copied to clipboard", "clipboard.copy": "Copy to clipboard", "search.result.more.one": "1 more on this page", "search.result.more.other": "# more on this page", "search.result.none": "No matching documents", "search.result.one": "1 matching document", "search.result.other": "# matching documents", "search.result.placeholder": "Type to start searching", "search.result.term.missing": "Missing", "select.version": "Select version"}, "version": null}</script>
|
|
|
|
|
|
<script src="../../assets/javascripts/bundle.e71a0d61.min.js"></script>
|
|
|
|
|
|
</body>
|
|
</html> |