From b0c320e436ff5cdc70ad38a980a2af2a7f3e5dfd Mon Sep 17 00:00:00 2001 From: Shulhan Date: Thu, 29 May 2025 14:04:51 +0700 Subject: all: ignore HTML page from external domain Any HTML link that is from a domain other than the scanned domain should not get parsed. It is only checked for whether the link is valid or not. --- testdata/web/index.html | 1 + testdata/web/page2/index.html | 1 + 2 files changed, 2 insertions(+) (limited to 'testdata/web') diff --git a/testdata/web/index.html b/testdata/web/index.html index e4d8bd0..f4f86d8 100644 --- a/testdata/web/index.html +++ b/testdata/web/index.html @@ -9,5 +9,6 @@ SPDX-License-Identifier: GPL-3.0-only Page 2 Broken HTML + External URL diff --git a/testdata/web/page2/index.html b/testdata/web/page2/index.html index 0fc7601..ae6b4ea 100644 --- a/testdata/web/page2/index.html +++ b/testdata/web/page2/index.html @@ -9,5 +9,6 @@ SPDX-License-Identifier: GPL-3.0-only broken relative link Back with absolute path Back with relative path + External URL page2 -- cgit v1.3