2023-11-09 19:11:11 -05:00
|
|
|
/**
 * Content-type strings grouped under the "HTML" label: plain HTML plus two
 * XHTML spellings.
 *
 * NOTE(review): presumably compared against a response's MIME type to decide
 * whether a resource is an HTML page — confirm at the call sites.
 */
export const HTML_TYPES = [
  "text/html",
  "application/xhtml",
  "application/xhtml+xml",
];
|
|
|
|
/**
 * Recognized "wait until" option values.
 *
 * The four strings match the lifecycle event names accepted by Puppeteer's
 * `waitUntil` navigation option.
 *
 * NOTE(review): presumably used to validate a user-supplied wait-until
 * setting — confirm at the call sites.
 */
export const WAIT_UNTIL_OPTS = [
  "load",
  "domcontentloaded",
  "networkidle0",
  "networkidle2",
];
|
2023-10-31 23:05:30 -07:00
|
|
|
/**
 * Recognized text-extraction mode names.
 *
 * NOTE(review): the names suggest where extracted text is written (pages
 * output vs. WARC) — confirm against the code that consumes these values.
 */
export const EXTRACT_TEXT_TYPES = [
  "to-pages",
  "to-warc",
  "final-to-warc",
];
|
|
|
|
|
2022-10-24 15:30:10 +02:00
|
|
|
/**
 * Identifier string `"__bx_log"`.
 *
 * NOTE(review): presumably the name of a function exposed to in-page
 * behaviors for logging — confirm where this constant is consumed.
 */
export const BEHAVIOR_LOG_FUNC = "__bx_log";
|
2023-09-15 10:12:08 -07:00
|
|
|
/**
 * Identifier string `"__bx_addLink"`.
 *
 * NOTE(review): presumably the name of a function exposed to the page for
 * reporting discovered links — confirm where this constant is consumed.
 */
export const ADD_LINK_FUNC = "__bx_addLink";
|
2023-03-17 14:24:44 -07:00
|
|
|
/**
 * Depth ceiling of one million.
 *
 * NOTE(review): presumably the effective "unlimited" value used when no
 * explicit depth limit is configured — confirm at the call sites.
 */
export const MAX_DEPTH = 1_000_000;
|
2021-06-23 19:36:32 -07:00
|
|
|
|
2023-11-09 19:11:11 -05:00
|
|
|
/**
 * Default selector rules: a single rule that targets every anchor element
 * carrying an `href` (`a[href]`) and names `href` as the value to extract.
 *
 * NOTE(review): `isAttribute: false` presumably means the value is read as a
 * DOM property rather than through `getAttribute()` — confirm against the
 * code that consumes these rules.
 */
export const DEFAULT_SELECTORS = [
  {
    selector: "a[href]",
    extract: "href",
    isAttribute: false,
  },
];
|