From 71a3e7dd0e60314e08362d68eb546ed2d108b0bb Mon Sep 17 00:00:00 2001 From: ghost Date: Sat, 8 Apr 2023 19:11:12 +0300 Subject: [PATCH] skip x-raw-image links crawl --- crontab/crawler.php | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/crontab/crawler.php b/crontab/crawler.php index 394692f..fe8ffb9 100644 --- a/crontab/crawler.php +++ b/crontab/crawler.php @@ -112,6 +112,12 @@ foreach ($db->getCrawlQueue(CRAWL_PAGE_LIMIT, time() - CRAWL_PAGE_SECONDS_OFFSET continue; } + // Skip x-raw-image links + if (false !== strpos($href, 'x-raw-image:')) { + + continue; + } + // @TODO skip other apps // Add absolute URL prefixes to the relative links found