Browse Source

make sure document contains exact substring in URL

main
yggverse 8 months ago
parent
commit
be7c63e68a
  1. 10
      src/cli/document/clean.php

10
src/cli/document/clean.php

@@ -83,12 +83,20 @@ foreach ($config->cli->document->crawl->skip->stripos->url as $condition)
$index->search(
sprintf(
'@url "%s"',
$condition
@\Manticoresearch\Utils::escape(
$condition
)
)
)->limit(
isset($argv[1]) ? (int) $argv[1] : 10
)->get() as $document)
{
// Make sure the document contains the exact substring in its URL
if (false === mb_strpos($document->get('url'), $condition))
{
continue;
}
// Delete the found document by its ID
$result = $index->deleteDocument(
$document->getId()

Loading…
Cancel
Save