From b1e2c8fd5cb5dfa46bc440a12eafaf56cd844b1c Mon Sep 17 00:00:00 2001 From: Philipp Tanlak Date: Mon, 24 Nov 2025 20:54:57 +0100 Subject: Docs --- .../docs/configuration/link-following/index.html | 593 +++++++++++++++++++++ 1 file changed, 593 insertions(+) create mode 100644 public/docs/configuration/link-following/index.html (limited to 'public/docs/configuration/link-following') diff --git a/public/docs/configuration/link-following/index.html b/public/docs/configuration/link-following/index.html new file mode 100644 index 0000000..46434c3 --- /dev/null +++ b/public/docs/configuration/link-following/index.html @@ -0,0 +1,593 @@ + + + + + + + + + + + + + + + Link Following – Flyscrape + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + +
+
+
+ +
Link Following
+
+ +
+

Link Following

+

The follow config option allows you to specify a list of CSS selectors that determine which links the scraper should follow.

+

When no value is provided, the scraper will follow all links matched by the a[href] selector.

+
Configuration
export const config = {
+  url: "http://example.com/",
+  follow: [
+    ".pagination > a[href]",
+    ".nav a[href]",
+  ],
+  // ...
+};
+ +
+
+

Following non-href attributes +

For special cases where the link is not found in the href attribute, you can specify a selector that ends with a different attribute.

+
Configuration
export const config = {
+  url: "http://example.com/",
+  follow: [
+    ".articles > div[data-url]",
+  ],
+  // ...
+};
+ +
+
+ +
+
+ + +
+
+
+ + + + + + + + + + -- cgit v1.2.3