mirror of https://github.com/YGGverse/YGGo.git
phpyggdrasilmysqlcrawlerjs-lessalt-websphinxspiderdistributedwebsearch-engineopen-sourceweb-archivepdocurlparserfts5privacy-orientedsphinxsearchfederative
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
56 lines
1.4 KiB
56 lines
1.4 KiB
<?php

/*
 * Application configuration.
 *
 * Sets the PHP error-reporting mode and defines the global constants for the
 * website, database, Sphinx, crawler and cleaner sections below.
 * The code that consumes these constants is not part of this file.
 */

// Debug
// Show every error, including startup errors.
// NOTE(review): presumably meant for development; consider disabling display_errors in production.
ini_set('display_errors', '1');
ini_set('display_startup_errors', '1');
error_reporting(E_ALL);

// Website
// Base URL built from the request's Host header; empty string when HTTP_HOST
// is not set (for example when the script is not run through a web server).
define('WEBSITE_DOMAIN', (isset($_SERVER['HTTP_HOST']) ? 'http://' . $_SERVER['HTTP_HOST'] : ''));
define('WEBSITE_PAGINATION_SEARCH_RESULTS_LIMIT', 100);
define('WEBSITE_IDENTICON_IMAGE_CACHE', true);

// Database
// DB_NAME, DB_USERNAME and DB_PASSWORD are intentionally empty here and must be filled in per installation.
define('DB_HOST', 'localhost');
define('DB_PORT', 3306);
define('DB_NAME', '');
define('DB_USERNAME', '');
define('DB_PASSWORD', '');

// Sphinx
define('SPHINX_HOST', '127.0.0.1');
define('SPHINX_PORT', 9306);

// Crawler settings
// NOTE(review): the *_LIMIT / *_SECONDS_OFFSET pairs presumably bound the batch size
// and the minimum re-visit interval per run; confirm against the crawler script.
define('CRAWL_PAGE_LIMIT', 10);
define('CRAWL_PAGE_SECONDS_OFFSET', 3600);

// The default pattern matches any URL.
// IPv6-only alternative: '/^http:\/\/\[[\w:]+\].*$/ui'
define('CRAWL_URL_REGEXP', '/^.*$/ui');

// Defaults for hosts; names suggest they apply to newly registered hosts (TODO confirm).
define('CRAWL_HOST_DEFAULT_PAGES_LIMIT', 1000);
define('CRAWL_HOST_DEFAULT_STATUS', true);
define('CRAWL_HOST_DEFAULT_META_ONLY', false);

/*
 * Default robots.txt rules, used when the remote robots.txt file does not exist.
 * The crawler is able to overwrite these rules.
 *
 * Presets
 * yggdrasil: /database/yggdrasil/host.robots.md
 *
 */
define('CRAWL_ROBOTS_DEFAULT_RULES', null); // string|null

/*
 * Permanent rules appended to the remote robots.txt if it exists,
 * otherwise to CRAWL_ROBOTS_DEFAULT_RULES.
 * The crawler does not overwrite these rules.
 *
 * Presets
 * yggdrasil: /database/yggdrasil/host.robotsPostfix.md
 *
 */
define('CRAWL_ROBOTS_POSTFIX_RULES', null); // string|null

// Cleaner settings
// NOTE(review): presumably the cleaner's counterparts of the crawler limit/offset pair; confirm against the cleaner script.
define('CLEAN_HOST_LIMIT', 20);
define('CLEAN_HOST_SECONDS_OFFSET', 3600);