From b1e2c8fd5cb5dfa46bc440a12eafaf56cd844b1c Mon Sep 17 00:00:00 2001 From: Philipp Tanlak Date: Mon, 24 Nov 2025 20:54:57 +0100 Subject: Docs --- public/docs/configuration/domain-filter/index.html | 616 +++++++++++++++++++++ 1 file changed, 616 insertions(+) create mode 100644 public/docs/configuration/domain-filter/index.html (limited to 'public/docs/configuration/domain-filter') diff --git a/public/docs/configuration/domain-filter/index.html b/public/docs/configuration/domain-filter/index.html new file mode 100644 index 0000000..482211f --- /dev/null +++ b/public/docs/configuration/domain-filter/index.html @@ -0,0 +1,616 @@ + + + + + + + + + + + + + + + Domain Filter – Flyscrape + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + +
+
+
+ +
Domain Filter
+
+ +
+

Domain Filter

+

The allowedDomains and blockedDomains config options let you specify lists of domains that are allowed or blocked during scraping.

+
Configuration
export const options = {
+  url: "http://example.com/",
+  allowedDomains: ["subdomain.example.com"],
+  // ...
+};
+ +
+
+

Allowed Domains +

This config option controls which additional domains are allowed to be visited during scraping. The domain of the initial URL is always allowed.

+

You can also make all domains accessible by setting allowedDomains to ["*"]. To restrict access further, you can then specify blockedDomains.

+
Configuration
export const options = {
+  url: "http://example.com/",
+  allowedDomains: ["*"],
+  // ...
+};
+ +
+
+

Blocked Domains +

This config option controls which additional domains are blocked from being accessed. By default, all domains other than the domain of the initial URL or those specified in allowedDomains are blocked.

+

blockedDomains is best used in conjunction with allowedDomains: ["*"], allowing the scraping process to access all domains except those specified in blockedDomains.

+
Configuration
export const options = {
+  url: "http://example.com/",
+  allowedDomains: ["*"],
+  blockedDomains: ["google.com", "bing.com"],
+  // ...
+};
+ +
+
+ +
+
+ + +
+
+
+ + + + + + + + + + -- cgit v1.2.3