diff --git a/src/cli/document/clean.php b/src/cli/document/clean.php index 4b123ee..d76c347 100644 --- a/src/cli/document/clean.php +++ b/src/cli/document/clean.php @@ -83,12 +83,20 @@ foreach ($config->cli->document->crawl->skip->stripos->url as $condition) $index->search( sprintf( '@url "%s"', - $condition + @\Manticoresearch\Utils::escape( + $condition + ) ) )->limit( isset($argv[1]) ? (int) $argv[1] : 10 )->get() as $document) { + // Make sure the document contains the exact substring in its URL + if (false === mb_strpos($document->get('url'), $condition)) + { + continue; + } + // Delete found document by it ID $result = $index->deleteDocument( $document->getId()