summary refs log tree commit diff
path: root/template.js
diff options
context:
space:
mode:
Diffstat (limited to 'template.js')
-rw-r--r-- template.js 130
1 files changed, 65 insertions, 65 deletions
diff --git a/template.js b/template.js
index b466a4e..36bb909 100644
--- a/template.js
+++ b/template.js
@@ -1,76 +1,76 @@
export const config = {
- // Specify the URL to start scraping from.
- url: "https://example.com/",
+ // Specify the URL to start scraping from.
+ url: "https://example.com/",
- // Enable rendering with headless browser. (default = false)
- // browser: true,
+ // Enable rendering with headless browser. (default = false)
+ // browser: true,
- // Specify if browser should be headless or not. (default = true)
- // headless: false,
+ // Specify if browser should be headless or not. (default = true)
+ // headless: false,
- // Specify the multiple URLs to start scraping from. (default = [])
- // urls: [
- // "https://anothersite.com/",
- // "https://yetanother.com/",
- // ],
+ // Specify the multiple URLs to start scraping from. (default = [])
+ // urls: [
+ // "https://anothersite.com/",
+ // "https://yetanother.com/",
+ // ],
- // Specify how deep links should be followed. (default = 0, no follow)
- // depth: 5,
+ // Specify how deep links should be followed. (default = 0, no follow)
+ // depth: 5,
- // Speficy the css selectors to follow. (default = ["a[href]"])
- // follow: [".next > a", ".related a"],
-
- // Specify the allowed domains. ['*'] for all. (default = domain from url)
- // allowedDomains: ["example.com", "anothersite.com"],
-
- // Specify the blocked domains. (default = none)
- // blockedDomains: ["somesite.com"],
+ // Specify the CSS selectors to follow. (default = ["a[href]"])
+ // follow: [".next > a", ".related a"],
+
+ // Specify the allowed domains. ['*'] for all. (default = domain from url)
+ // allowedDomains: ["example.com", "anothersite.com"],
- // Specify the allowed URLs as regex. (default = all allowed)
- // allowedURLs: ["/posts", "/articles/\d+"],
+ // Specify the blocked domains. (default = none)
+ // blockedDomains: ["somesite.com"],
+
+ // Specify the allowed URLs as regex. (default = all allowed)
+ // allowedURLs: ["/posts", "/articles/\\d+"],
+
+ // Specify the blocked URLs as regex. (default = none)
+ // blockedURLs: ["/admin"],
- // Specify the blocked URLs as regex. (default = none)
- // blockedURLs: ["/admin"],
-
- // Specify the rate in requests per minute. (default = no rate limit)
- // rate: 60,
-
- // Specify the number of concurrent requests. (default = no limit)
- // concurrency: 1,
-
- // Specify a single HTTP(S) proxy URL. (default = no proxy)
- // Note: Not compatible with browser mode.
- // proxy: "http://someproxy.com:8043",
-
- // Specify multiple HTTP(S) proxy URLs. (default = no proxy)
- // Note: Not compatible with browser mode.
- // proxies: [
- // "http://someproxy.com:8043",
- // "http://someotherproxy.com:8043",
- // ],
-
- // Enable file-based request caching. (default = no cache)
- // cache: "file",
-
- // Specify the HTTP request header. (default = none)
- // headers: {
- // "Authorization": "Bearer ...",
- // "User-Agent": "Mozilla ...",
- // },
-
- // Use the cookie store of your local browser. (default = off)
- // Options: "chrome" | "edge" | "firefox"
- // cookies: "chrome",
-
- // Specify the output options.
- // output: {
- // // Specify the output file. (default = stdout)
- // file: "results.json",
- //
- // // Specify the output format. (default = json)
- // // Options: "json" | "ndjson"
- // format: "json",
- // },
+ // Specify the rate in requests per minute. (default = no rate limit)
+ // rate: 60,
+
+ // Specify the number of concurrent requests. (default = no limit)
+ // concurrency: 1,
+
+ // Specify a single HTTP(S) proxy URL. (default = no proxy)
+ // Note: Not compatible with browser mode.
+ // proxy: "http://someproxy.com:8043",
+
+ // Specify multiple HTTP(S) proxy URLs. (default = no proxy)
+ // Note: Not compatible with browser mode.
+ // proxies: [
+ // "http://someproxy.com:8043",
+ // "http://someotherproxy.com:8043",
+ // ],
+
+ // Enable file-based request caching. (default = no cache)
+ // cache: "file",
+
+ // Specify the HTTP request header. (default = none)
+ // headers: {
+ // "Authorization": "Bearer ...",
+ // "User-Agent": "Mozilla ...",
+ // },
+
+ // Use the cookie store of your local browser. (default = off)
+ // Options: "chrome" | "edge" | "firefox"
+ // cookies: "chrome",
+
+ // Specify the output options.
+ // output: {
+ // // Specify the output file. (default = stdout)
+ // file: "results.json",
+ //
+ // // Specify the output format. (default = json)
+ // // Options: "json" | "ndjson"
+ // format: "json",
+ // },
};
export default function({ doc, absoluteURL }) {