Browse Source

Add optional [selectors] argument to the hostPageDom generate command

main
ghost 2 years ago
parent
commit
6702c3f402
  1. 16
      cli/yggo.php

16
cli/yggo.php

@@ -39,7 +39,17 @@ switch ($argv[1]) {
case 'generate':
if (CRAWL_HOST_PAGE_DOM_SELECTORS) {
$selectors = [];
foreach ((array) explode(';', !empty($argv[3]) ? $argv[3] : (string) CRAWL_HOST_PAGE_DOM_SELECTORS) as $selector) {
if (!empty($selector)) {
$selectors[] = trim($selector);
}
}
if ($selectors) {
// Init variables
$hostPagesProcessedTotal = 0;
@@ -58,7 +68,7 @@ switch ($argv[1]) {
$html = str_get_html(base64_decode($hostPageDescription->data));
foreach ((array) explode(',', CRAWL_HOST_PAGE_DOM_SELECTORS) as $selector) {
foreach ($selectors as $selector) {
foreach($html->find($selector) as $element) {
@@ -118,7 +128,7 @@ echo '/_/\____/\____/\____(_)' . PHP_EOL;
echo PHP_EOL . _('available options:') . PHP_EOL . PHP_EOL;
echo _(' help - this message') . PHP_EOL;
echo _(' hostPageDom generate - make hostPageDom index based on related hostPage.data field') . PHP_EOL;
echo _(' hostPageDom generate [selectors] - make hostPageDom index based on related hostPage.data field') . PHP_EOL;
echo _(' hostPageDom truncate - flush hostPageDom table') . PHP_EOL . PHP_EOL;
echo _('get support: https://github.com/YGGverse/YGGo/issues') . PHP_EOL . PHP_EOL;

Loading…
Cancel
Save