From e09440b44ab8cf7fc700aca47928ad2ea349b427 Mon Sep 17 00:00:00 2001 From: yggverse Date: Thu, 21 Mar 2024 00:38:24 +0200 Subject: [PATCH] strip code content --- src/cli/document/crawl.php | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/cli/document/crawl.php b/src/cli/document/crawl.php index 829f25a..5537e79 100644 --- a/src/cli/document/crawl.php +++ b/src/cli/document/crawl.php @@ -364,6 +364,8 @@ foreach($index->search('') [ '/<script([^>]*)>([^<]*)<\/script>/is', // strip js content '/<style([^>]*)>([^<]*)<\/style>/is', // strip css content + '/<pre([^>]*)>([^<]*)<\/pre>/is', // strip code content + '/<code([^>]*)>([^<]*)<\/code>/is', ], '', html_entity_decode(