2023-04-01 16:29:39 +00:00
|
|
|
<?php
|
|
|
|
|
|
|
|
// Load system dependencies
|
|
|
|
require_once('../config/app.php');
|
2023-04-07 01:04:24 +00:00
|
|
|
require_once('../library/curl.php');
|
|
|
|
require_once('../library/robots.php');
|
2023-04-01 16:29:39 +00:00
|
|
|
require_once('../library/filter.php');
|
2023-04-07 01:04:24 +00:00
|
|
|
require_once('../library/parser.php');
|
|
|
|
require_once('../library/mysql.php');
|
|
|
|
require_once('../library/sphinxql.php');
|
|
|
|
|
|
|
|
// Connect Sphinx search server
|
|
|
|
$sphinx = new SphinxQL(SPHINX_HOST, SPHINX_PORT);
|
2023-04-01 16:29:39 +00:00
|
|
|
|
|
|
|
// Connect database
|
2023-04-07 01:04:24 +00:00
|
|
|
$db = new MySQL(DB_HOST, DB_PORT, DB_NAME, DB_USERNAME, DB_PASSWORD);
|
2023-04-01 16:29:39 +00:00
|
|
|
|
|
|
|
// Filter request data
|
2023-05-04 00:48:57 +00:00
|
|
|
$t = !empty($_GET['t']) ? Filter::url($_GET['t']) : 'page';
|
2023-05-01 17:09:28 +00:00
|
|
|
$m = !empty($_GET['m']) ? Filter::url($_GET['m']) : 'default';
|
2023-04-01 16:29:39 +00:00
|
|
|
$q = !empty($_GET['q']) ? Filter::url($_GET['q']) : '';
|
2023-04-02 20:36:35 +00:00
|
|
|
$p = !empty($_GET['p']) ? (int) $_GET['p'] : 1;
|
2023-04-01 16:29:39 +00:00
|
|
|
|
2023-05-04 22:42:44 +00:00
|
|
|
// Define page basics
|
|
|
|
switch ($t) {
|
|
|
|
|
|
|
|
case 'image':
|
|
|
|
|
2023-05-08 09:28:49 +00:00
|
|
|
$totalPages = $sphinx->getHostImagesTotal();
|
2023-05-04 22:42:44 +00:00
|
|
|
|
|
|
|
$placeholder = Filter::plural($totalPages, [sprintf(_('Over %s image or enter the new one...'), $totalPages),
|
|
|
|
sprintf(_('Over %s images or enter the new one...'), $totalPages),
|
|
|
|
sprintf(_('Over %s images or enter the new one...'), $totalPages),
|
|
|
|
]);
|
|
|
|
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
|
2023-05-08 09:28:49 +00:00
|
|
|
$totalPages = $sphinx->getHostPagesTotal();
|
2023-05-04 22:42:44 +00:00
|
|
|
|
|
|
|
$placeholder = Filter::plural($totalPages, [sprintf(_('Over %s page or enter the new one...'), $totalPages),
|
|
|
|
sprintf(_('Over %s pages or enter the new one...'), $totalPages),
|
|
|
|
sprintf(_('Over %s pages or enter the new one...'), $totalPages),
|
|
|
|
]);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2023-04-01 16:29:39 +00:00
|
|
|
// Crawl request
|
|
|
|
if (filter_var($q, FILTER_VALIDATE_URL) && preg_match(CRAWL_URL_REGEXP, $q)) {
|
|
|
|
|
2023-04-07 01:04:24 +00:00
|
|
|
$db->beginTransaction();
|
|
|
|
|
|
|
|
try {
|
|
|
|
|
|
|
|
// Parse host info
|
|
|
|
if ($hostURL = Parser::hostURL($q)) {
|
|
|
|
|
|
|
|
// Host exists
|
|
|
|
if ($host = $db->getHost(crc32($hostURL->string))) {
|
|
|
|
|
2023-04-08 19:28:31 +00:00
|
|
|
$hostStatus = $host->status;
|
2023-05-09 10:26:19 +00:00
|
|
|
$hostNsfw = $host->nsfw;
|
2023-04-08 19:28:31 +00:00
|
|
|
$hostPageLimit = $host->crawlPageLimit;
|
|
|
|
$hostId = $host->hostId;
|
|
|
|
$hostRobots = $host->robots;
|
|
|
|
$hostRobotsPostfix = $host->robotsPostfix;
|
2023-04-07 01:04:24 +00:00
|
|
|
|
|
|
|
// Register new host
|
|
|
|
} else {
|
|
|
|
|
2023-04-23 01:05:00 +00:00
|
|
|
// Disk quota not reached
|
|
|
|
if (CRAWL_STOP_DISK_QUOTA_MB_LEFT < disk_free_space('/') / 1000000) {
|
|
|
|
|
|
|
|
// Get robots.txt if exists
|
2023-05-04 04:38:22 +00:00
|
|
|
$curl = new Curl($hostURL->string . '/robots.txt', CRAWL_CURLOPT_USERAGENT);
|
2023-04-23 01:05:00 +00:00
|
|
|
|
|
|
|
if (200 == $curl->getCode() && false !== stripos($curl->getContent(), 'user-agent:')) {
|
|
|
|
$hostRobots = $curl->getContent();
|
|
|
|
} else {
|
|
|
|
$hostRobots = null;
|
|
|
|
}
|
|
|
|
|
|
|
|
$hostRobotsPostfix = CRAWL_ROBOTS_POSTFIX_RULES;
|
|
|
|
|
|
|
|
$hostStatus = CRAWL_HOST_DEFAULT_STATUS;
|
2023-05-09 10:26:19 +00:00
|
|
|
$hostNsfw = CRAWL_HOST_DEFAULT_NSFW;
|
2023-04-23 01:05:00 +00:00
|
|
|
$hostPageLimit = CRAWL_HOST_DEFAULT_PAGES_LIMIT;
|
|
|
|
$hostId = $db->addHost($hostURL->scheme,
|
|
|
|
$hostURL->name,
|
|
|
|
$hostURL->port,
|
|
|
|
crc32($hostURL->string),
|
|
|
|
time(),
|
|
|
|
null,
|
|
|
|
$hostPageLimit,
|
|
|
|
(string) CRAWL_HOST_DEFAULT_META_ONLY,
|
|
|
|
(string) $hostStatus,
|
2023-05-09 10:26:19 +00:00
|
|
|
(string) $hostNsfw,
|
2023-04-23 01:05:00 +00:00
|
|
|
$hostRobots,
|
|
|
|
$hostRobotsPostfix);
|
2023-04-07 01:04:24 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Parse page URI
|
|
|
|
$hostPageURI = Parser::uri($q);
|
|
|
|
|
|
|
|
// Init robots parser
|
2023-04-08 19:28:31 +00:00
|
|
|
$robots = new Robots((!$hostRobots ? (string) $hostRobots : (string) CRAWL_ROBOTS_DEFAULT_RULES) . PHP_EOL . (string) $hostRobotsPostfix);
|
2023-04-07 01:04:24 +00:00
|
|
|
|
|
|
|
// Save page info
|
|
|
|
if ($hostStatus && // host enabled
|
|
|
|
$robots->uriAllowed($hostPageURI->string) && // page allowed by robots.txt rules
|
|
|
|
$hostPageLimit > $db->getTotalHostPages($hostId) && // pages quantity not reached host limit
|
|
|
|
!$db->getHostPage($hostId, crc32($hostPageURI->string))) { // page not exists
|
|
|
|
|
|
|
|
$db->addHostPage($hostId, crc32($hostPageURI->string), $hostPageURI->string, time());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
$db->commit();
|
|
|
|
|
|
|
|
} catch(Exception $e){
|
|
|
|
|
|
|
|
$db->rollBack();
|
|
|
|
}
|
2023-04-01 16:29:39 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Search request
|
|
|
|
if (!empty($q)) {
|
|
|
|
|
2023-05-04 06:20:34 +00:00
|
|
|
if ($t == 'image') {
|
2023-05-04 00:48:57 +00:00
|
|
|
|
|
|
|
$resultsTotal = $sphinx->searchHostImagesTotal(Filter::searchQuery($q, $m));
|
2023-05-04 06:20:34 +00:00
|
|
|
$results = $sphinx->searchHostImages(Filter::searchQuery($q, $m), $p * WEBSITE_PAGINATION_SEARCH_IMAGE_RESULTS_LIMIT - WEBSITE_PAGINATION_SEARCH_IMAGE_RESULTS_LIMIT, WEBSITE_PAGINATION_SEARCH_IMAGE_RESULTS_LIMIT, $resultsTotal);
|
2023-05-04 00:48:57 +00:00
|
|
|
|
|
|
|
} else {
|
|
|
|
|
|
|
|
$resultsTotal = $sphinx->searchHostPagesTotal(Filter::searchQuery($q, $m));
|
2023-05-04 06:20:34 +00:00
|
|
|
$results = $sphinx->searchHostPages(Filter::searchQuery($q, $m), $p * WEBSITE_PAGINATION_SEARCH_PAGE_RESULTS_LIMIT - WEBSITE_PAGINATION_SEARCH_PAGE_RESULTS_LIMIT, WEBSITE_PAGINATION_SEARCH_PAGE_RESULTS_LIMIT, $resultsTotal);
|
2023-05-04 00:48:57 +00:00
|
|
|
}
|
2023-04-01 16:29:39 +00:00
|
|
|
|
|
|
|
} else {
|
|
|
|
|
|
|
|
$resultsTotal = 0;
|
2023-04-23 06:29:24 +00:00
|
|
|
$results = [];
|
2023-04-01 16:29:39 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
?>
|
|
|
|
|
|
|
|
<!DOCTYPE html>
|
|
|
|
<html lang="<?php echo _('en-US'); ?>">
|
|
|
|
<head>
|
2023-04-02 20:49:04 +00:00
|
|
|
<title><?php echo (empty($q) ? _('Empty request - YGGo!') : ($p > 1 ? sprintf(_('%s - #%s - YGGo!'), htmlentities($q), $p) : sprintf(_('%s - YGGo!'), htmlentities($q)))) ?></title>
|
2023-04-01 16:29:39 +00:00
|
|
|
<meta charset="utf-8" />
|
|
|
|
<meta name="viewport" content="width=device-width, initial-scale=1" />
|
2023-04-02 13:07:57 +00:00
|
|
|
<meta name="description" content="<?php echo _('Javascript-less Open Source Web Search Engine') ?>" />
|
2023-04-08 22:22:36 +00:00
|
|
|
<meta name="keywords" content="<?php echo _('web, search, engine, crawler, php, pdo, mysql, sphinx, yggdrasil, js-less, open source') ?>" />
|
2023-04-01 16:29:39 +00:00
|
|
|
<style>
|
|
|
|
|
|
|
|
* {
|
|
|
|
border: 0;
|
|
|
|
margin: 0;
|
|
|
|
padding: 0;
|
|
|
|
font-family: Sans-serif;
|
|
|
|
}
|
|
|
|
|
|
|
|
body {
|
|
|
|
background-color: #2e3436;
|
|
|
|
}
|
|
|
|
|
|
|
|
header {
|
|
|
|
background-color: #34393b;
|
|
|
|
position: fixed;
|
|
|
|
top: 0;
|
|
|
|
left: 0;
|
|
|
|
right: 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
main {
|
2023-05-04 06:52:08 +00:00
|
|
|
margin-top: 110px;
|
2023-04-01 16:29:39 +00:00
|
|
|
margin-bottom: 76px;
|
2023-05-04 06:55:52 +00:00
|
|
|
padding: 0 20px;
|
2023-04-01 16:29:39 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
h1 {
|
2023-04-02 22:55:26 +00:00
|
|
|
position: fixed;
|
|
|
|
top: 8px;
|
|
|
|
left: 24px;
|
|
|
|
}
|
|
|
|
|
|
|
|
h1 > a,
|
|
|
|
h1 > a:visited,
|
|
|
|
h1 > a:active,
|
|
|
|
h1 > a:hover {
|
2023-04-01 16:29:39 +00:00
|
|
|
color: #fff;
|
|
|
|
font-weight: normal;
|
2023-05-04 06:52:08 +00:00
|
|
|
font-size: 24px;
|
|
|
|
margin: 10px 0;
|
2023-04-02 22:55:26 +00:00
|
|
|
text-decoration: none;
|
2023-04-01 16:29:39 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
h2 {
|
|
|
|
display: block;
|
|
|
|
font-size: 16px;
|
|
|
|
font-weight: normal;
|
|
|
|
margin: 4px 0;
|
|
|
|
color: #fff;
|
|
|
|
}
|
|
|
|
|
2023-05-04 00:48:57 +00:00
|
|
|
h3 {
|
|
|
|
display: block;
|
|
|
|
font-size: 16px;
|
|
|
|
font-weight: normal;
|
2023-05-04 05:53:41 +00:00
|
|
|
margin: 12px 0;
|
2023-05-04 00:48:57 +00:00
|
|
|
color: #fff;
|
|
|
|
}
|
|
|
|
|
2023-04-01 16:29:39 +00:00
|
|
|
form {
|
|
|
|
display: block;
|
2023-04-02 22:55:26 +00:00
|
|
|
max-width: 678px;
|
2023-04-01 16:29:39 +00:00
|
|
|
margin: 0 auto;
|
|
|
|
text-align: center;
|
|
|
|
}
|
|
|
|
|
|
|
|
input {
|
|
|
|
width: 100%;
|
2023-05-04 06:52:08 +00:00
|
|
|
margin: 12px 0;
|
|
|
|
padding: 10px 0;
|
2023-04-01 16:29:39 +00:00
|
|
|
border-radius: 32px;
|
|
|
|
background-color: #000;
|
|
|
|
color: #fff;
|
|
|
|
font-size: 16px;
|
|
|
|
text-align: center;
|
|
|
|
}
|
|
|
|
|
|
|
|
input:hover {
|
|
|
|
background-color: #111
|
|
|
|
}
|
|
|
|
|
|
|
|
input:focus {
|
|
|
|
outline: none;
|
|
|
|
background-color: #111
|
|
|
|
}
|
|
|
|
|
|
|
|
input:focus::placeholder {
|
|
|
|
color: #090808
|
|
|
|
}
|
|
|
|
|
2023-05-04 00:48:57 +00:00
|
|
|
label {
|
|
|
|
font-size: 14px;
|
2023-05-04 06:52:08 +00:00
|
|
|
color: #fff;
|
|
|
|
float: left;
|
|
|
|
margin-left: 16px;
|
|
|
|
margin-bottom: 14px;
|
2023-05-04 00:48:57 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
label > input {
|
|
|
|
width: auto;
|
|
|
|
margin: 0 4px;
|
|
|
|
}
|
|
|
|
|
2023-04-01 16:29:39 +00:00
|
|
|
button {
|
2023-05-04 06:52:08 +00:00
|
|
|
padding: 8px 16px;
|
2023-04-01 16:29:39 +00:00
|
|
|
border-radius: 4px;
|
|
|
|
cursor: pointer;
|
|
|
|
background-color: #3394fb;
|
|
|
|
color: #fff;
|
|
|
|
font-size: 14px;
|
|
|
|
position: fixed;
|
2023-05-04 06:52:08 +00:00
|
|
|
top: 15px;
|
2023-04-01 16:29:39 +00:00
|
|
|
right: 24px;
|
|
|
|
}
|
|
|
|
|
|
|
|
button:hover {
|
|
|
|
background-color: #4b9df4;
|
|
|
|
}
|
|
|
|
|
|
|
|
a, a:visited, a:active {
|
2023-04-02 22:55:26 +00:00
|
|
|
color: #9ba2ac;
|
2023-05-04 03:12:51 +00:00
|
|
|
display: inline-block;
|
2023-04-02 22:30:09 +00:00
|
|
|
font-size: 12px;
|
2023-04-02 22:55:26 +00:00
|
|
|
margin-top: 8px;
|
2023-04-01 16:29:39 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
a:hover {
|
|
|
|
color: #54a3f7;
|
|
|
|
}
|
|
|
|
|
2023-05-04 00:48:57 +00:00
|
|
|
img.icon {
|
2023-04-02 22:30:09 +00:00
|
|
|
float: left;
|
|
|
|
border-radius: 50%;
|
|
|
|
margin-right: 8px;
|
|
|
|
}
|
|
|
|
|
2023-05-04 00:48:57 +00:00
|
|
|
img.image {
|
|
|
|
max-width: 100%;
|
|
|
|
border-radius: 3px;
|
|
|
|
}
|
|
|
|
|
2023-04-01 16:29:39 +00:00
|
|
|
div {
|
|
|
|
max-width: 640px;
|
|
|
|
margin: 0 auto;
|
|
|
|
padding: 16px 0;
|
|
|
|
border-top: 1px #000 dashed;
|
|
|
|
font-size: 14px
|
|
|
|
}
|
|
|
|
|
|
|
|
span {
|
2023-04-02 19:02:53 +00:00
|
|
|
color: #ccc;
|
2023-04-01 16:29:39 +00:00
|
|
|
display: block;
|
|
|
|
margin: 8px 0;
|
|
|
|
}
|
|
|
|
|
2023-05-04 07:53:37 +00:00
|
|
|
p {
|
|
|
|
margin: 16px 0;
|
|
|
|
text-align: right;
|
|
|
|
}
|
|
|
|
|
2023-04-01 16:29:39 +00:00
|
|
|
</style>
|
|
|
|
</head>
|
|
|
|
<body>
|
|
|
|
<header>
|
|
|
|
<form name="search" method="GET" action="<?php echo WEBSITE_DOMAIN; ?>/search.php">
|
2023-04-02 22:55:26 +00:00
|
|
|
<h1><a href="<?php echo WEBSITE_DOMAIN; ?>"><?php echo _('YGGo!') ?></a></h1>
|
2023-04-01 16:29:39 +00:00
|
|
|
<input type="text" name="q" placeholder="<?php echo $placeholder ?>" value="<?php echo htmlentities($q) ?>" />
|
2023-05-04 06:52:08 +00:00
|
|
|
<label><input type="radio" name="t" value="page" <?php echo ($t == 'page' ? 'checked="checked"' : false) ?>/> <?php echo _('Pages') ?></label>
|
|
|
|
<label><input type="radio" name="t" value="image" <?php echo ($t == 'image' ? 'checked="checked"' : false) ?>/> <?php echo _('Images') ?></label>
|
2023-04-01 16:29:39 +00:00
|
|
|
<button type="submit"><?php echo _('Search'); ?></button>
|
|
|
|
</form>
|
|
|
|
</header>
|
|
|
|
<main>
|
|
|
|
<?php if ($results) { ?>
|
|
|
|
<div>
|
2023-04-02 19:02:53 +00:00
|
|
|
<span><?php echo sprintf(_('Total found: %s'), $resultsTotal) ?></span>
|
2023-04-01 22:30:50 +00:00
|
|
|
<?php if ($queueTotal = $db->getTotalPagesByHttpCode(null)) { ?>
|
2023-04-02 19:02:53 +00:00
|
|
|
<span><?php echo sprintf(_('* Please wait for all pages crawl to complete (%s in queue).'), $queueTotal) ?></span>
|
2023-04-01 22:30:50 +00:00
|
|
|
<?php } ?>
|
2023-04-01 16:29:39 +00:00
|
|
|
</div>
|
|
|
|
<?php foreach ($results as $result) { ?>
|
2023-05-04 06:20:34 +00:00
|
|
|
<?php if ($t == 'image' && $hostImage = $db->getFoundHostImage($result->id)) { ?>
|
2023-05-04 00:48:57 +00:00
|
|
|
<?php
|
|
|
|
|
|
|
|
// Built image url
|
|
|
|
$hostImageURL = $hostImage->scheme . '://' .
|
|
|
|
$hostImage->name .
|
|
|
|
($hostImage->port ? ':' . $hostImage->port : false) .
|
|
|
|
$hostImage->uri;
|
|
|
|
|
2023-05-09 05:53:33 +00:00
|
|
|
// Get local image data
|
2023-05-09 13:30:36 +00:00
|
|
|
$lastHostImageDescription = $db->getLastHostImageDescription($result->id);
|
|
|
|
|
|
|
|
if (!empty($lastHostImageDescription->data)) {
|
2023-05-09 05:53:33 +00:00
|
|
|
|
|
|
|
$hostImageURLencoded = $lastHostImageDescription->data;
|
|
|
|
|
|
|
|
// Get remote if local index not found or CRAWL_HOST_DEFAULT_META_ONLY enabled
|
|
|
|
} else {
|
2023-05-04 01:42:07 +00:00
|
|
|
|
2023-05-06 05:45:37 +00:00
|
|
|
// Init image request
|
2023-05-04 04:38:22 +00:00
|
|
|
$hostImageCurl = new Curl($hostImageURL, PROXY_CURLOPT_USERAGENT);
|
2023-05-04 01:42:07 +00:00
|
|
|
|
2023-05-04 02:19:29 +00:00
|
|
|
// Skip item render on timeout
|
2023-05-04 03:12:51 +00:00
|
|
|
$hostImageHttpCode = $hostImageCurl->getCode();
|
|
|
|
|
2023-05-09 12:23:32 +00:00
|
|
|
$db->updateHostImageHttpCode($result->id, (int) $hostImageHttpCode, time());
|
2023-05-04 03:12:51 +00:00
|
|
|
|
2023-05-06 05:45:37 +00:00
|
|
|
if (200 != $hostImageHttpCode) {
|
|
|
|
|
2023-05-09 12:23:32 +00:00
|
|
|
$db->updateHostImageHttpCode($result->id, $hostImageHttpCode, time());
|
2023-05-08 11:13:53 +00:00
|
|
|
|
2023-05-09 12:23:32 +00:00
|
|
|
$db->updateHostImageTimeBanned($result->id, time());
|
2023-05-06 05:45:37 +00:00
|
|
|
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Skip image processing on MIME type not provided
|
|
|
|
if (!$hostImageContentType = $hostImageCurl->getContentType()) {
|
|
|
|
|
2023-05-09 12:23:32 +00:00
|
|
|
$db->updateHostImageTimeBanned($result->id, time());
|
2023-05-06 05:45:37 +00:00
|
|
|
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Skip image processing on MIME type not allowed in settings
|
2023-05-08 10:00:02 +00:00
|
|
|
$hostImageBanned = true;
|
|
|
|
foreach ((array) explode(',', CRAWL_IMAGE_MIME) as $mime) {
|
2023-05-06 05:45:37 +00:00
|
|
|
|
2023-05-08 10:00:02 +00:00
|
|
|
if (false !== strpos($hostImageContentType, trim($mime))) {
|
2023-05-06 05:45:37 +00:00
|
|
|
|
2023-05-08 10:00:02 +00:00
|
|
|
$hostImageBanned = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if ($hostImageBanned) {
|
|
|
|
|
2023-05-09 12:23:32 +00:00
|
|
|
$db->updateHostImageMime($result->id, $hostImageContentType, time());
|
2023-05-08 11:13:53 +00:00
|
|
|
|
2023-05-09 12:23:32 +00:00
|
|
|
$hostImagesBanned += $db->updateHostImageTimeBanned($result->id, time());
|
2023-05-08 10:12:16 +00:00
|
|
|
|
|
|
|
continue;
|
2023-05-06 05:45:37 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Skip image processing without returned content
|
|
|
|
if (!$hostImageContent = $hostImageCurl->getContent()) {
|
|
|
|
|
2023-05-09 12:23:32 +00:00
|
|
|
$db->updateHostImageTimeBanned($result->id, time());
|
2023-05-06 05:45:37 +00:00
|
|
|
|
|
|
|
continue;
|
|
|
|
}
|
2023-05-04 00:48:57 +00:00
|
|
|
|
2023-05-04 02:19:29 +00:00
|
|
|
// Convert remote image data to base64 string to prevent direct URL call
|
2023-05-06 05:45:37 +00:00
|
|
|
if (!$hostImageExtension = @pathinfo($hostImageURL, PATHINFO_EXTENSION)) {
|
|
|
|
|
2023-05-09 12:23:32 +00:00
|
|
|
$db->updateHostImageTimeBanned($result->id, time());
|
2023-05-06 05:45:37 +00:00
|
|
|
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!$hostImageBase64 = @base64_encode($hostImageContent)) {
|
|
|
|
|
2023-05-09 12:23:32 +00:00
|
|
|
$db->updateHostImageTimeBanned($result->id, time());
|
2023-05-06 05:45:37 +00:00
|
|
|
|
|
|
|
continue;
|
|
|
|
}
|
2023-05-04 02:19:29 +00:00
|
|
|
|
2023-05-08 10:12:16 +00:00
|
|
|
$hostImageURLencoded = 'data:image/' . str_replace(['svg'], ['svg+xml'], $hostImageExtension) . ';base64,' . $hostImageBase64;
|
2023-05-04 02:19:29 +00:00
|
|
|
|
2023-05-04 03:12:51 +00:00
|
|
|
// Save image content on data settings enabled
|
2023-05-09 12:23:32 +00:00
|
|
|
$db->updateHostImage($result->id,
|
2023-05-06 05:45:37 +00:00
|
|
|
Filter::mime($hostImageContentType),
|
2023-05-08 10:00:02 +00:00
|
|
|
time());
|
2023-05-04 03:12:51 +00:00
|
|
|
|
2023-05-09 12:23:32 +00:00
|
|
|
$db->setHostImageDescriptionData($result->id,
|
2023-05-09 05:53:33 +00:00
|
|
|
crc32($hostImageURLencoded),
|
|
|
|
$hostImage->crawlMetaOnly ? null : $hostImageURLencoded,
|
2023-05-09 12:53:21 +00:00
|
|
|
time(),
|
|
|
|
null);
|
2023-05-04 02:19:29 +00:00
|
|
|
}
|
2023-05-04 00:48:57 +00:00
|
|
|
?>
|
|
|
|
<div>
|
|
|
|
<a href="<?php echo $hostImageURL ?>">
|
2023-05-09 05:53:33 +00:00
|
|
|
<img src="<?php echo $hostImageURLencoded ?>" alt="<?php echo htmlentities($hostImageURL) ?>" title="<?php echo htmlentities($hostImageURL) ?>" class="image" />
|
2023-05-04 00:48:57 +00:00
|
|
|
</a>
|
2023-05-09 13:34:33 +00:00
|
|
|
<br />
|
2023-05-04 07:53:37 +00:00
|
|
|
<?php $hostImageHostPagesTotal = $db->getHostImageHostPagesTotal($result->id) ?>
|
|
|
|
<?php foreach ((array) $db->getHostImageHostPages($result->id, WEBSITE_SEARCH_IMAGE_RELATED_PAGE_RESULTS_LIMIT) as $hostPage) { ?>
|
2023-05-04 00:48:57 +00:00
|
|
|
<?php if ($hostPage = $db->getFoundHostPage($hostPage->hostPageId)) { ?>
|
|
|
|
<?php $hostPageURL = $hostPage->scheme . '://' . $hostPage->name . ($hostPage->port ? ':' . $hostPage->port : false) . $hostPage->uri ?>
|
2023-05-08 22:29:32 +00:00
|
|
|
<?php if ($hostPageDescription = $db->getLastPageDescription($result->id)) { ?>
|
|
|
|
<h3><?php echo $hostPageDescription->metaTitle ?></h3>
|
|
|
|
<?php } ?>
|
2023-05-09 13:30:36 +00:00
|
|
|
<?php if ($lastHostImageDescription) { ?>
|
2023-05-09 05:19:49 +00:00
|
|
|
<span><?php echo $lastHostImageDescription->title ?> <?php echo $lastHostImageDescription->alt ?></span>
|
2023-05-04 00:48:57 +00:00
|
|
|
<?php } ?>
|
|
|
|
<a href="<?php echo $hostPageURL ?>">
|
|
|
|
<img src="<?php echo WEBSITE_DOMAIN ?>/image.php?q=<?php echo urlencode($hostPage->name) ?>" alt="favicon" width="16" height="16" class="icon" />
|
2023-05-05 17:09:15 +00:00
|
|
|
<?php echo htmlentities(urldecode($hostPageURL)) ?>
|
2023-05-04 00:48:57 +00:00
|
|
|
</a>
|
|
|
|
<?php } ?>
|
|
|
|
<?php } ?>
|
2023-05-04 07:53:37 +00:00
|
|
|
<?php if ($hostImageHostPagesTotal - WEBSITE_SEARCH_IMAGE_RELATED_PAGE_RESULTS_LIMIT > 0) { ?>
|
|
|
|
<p>
|
|
|
|
<small>
|
|
|
|
<?php echo Filter::plural($hostImageHostPagesTotal - WEBSITE_SEARCH_IMAGE_RELATED_PAGE_RESULTS_LIMIT,
|
|
|
|
[
|
|
|
|
sprintf(_('+%s other page'), $hostImageHostPagesTotal - WEBSITE_SEARCH_IMAGE_RELATED_PAGE_RESULTS_LIMIT),
|
|
|
|
sprintf(_('+%s other pages'), $hostImageHostPagesTotal - WEBSITE_SEARCH_IMAGE_RELATED_PAGE_RESULTS_LIMIT),
|
|
|
|
sprintf(_('+%s other pages'), $hostImageHostPagesTotal - WEBSITE_SEARCH_IMAGE_RELATED_PAGE_RESULTS_LIMIT),
|
|
|
|
]); ?>
|
|
|
|
</small>
|
|
|
|
</p>
|
|
|
|
<?php } ?>
|
2023-05-04 00:48:57 +00:00
|
|
|
</div>
|
|
|
|
<?php } else if ($hostPage = $db->getFoundHostPage($result->id)) { ?>
|
|
|
|
<?php
|
|
|
|
|
|
|
|
$hostPageURL = $hostPage->scheme . '://' .
|
|
|
|
$hostPage->name .
|
|
|
|
($hostPage->port ? ':' . $hostPage->port : false) .
|
|
|
|
$hostPage->uri;
|
|
|
|
|
|
|
|
?>
|
2023-04-07 01:04:24 +00:00
|
|
|
<div>
|
2023-05-08 22:29:32 +00:00
|
|
|
<?php if ($hostPageDescription = $db->getLastPageDescription($result->id)) { ?>
|
|
|
|
<h2><?php echo $hostPageDescription->metaTitle ?></h2>
|
|
|
|
<?php if (!empty($hostPageDescription->metaDescription)) { ?>
|
|
|
|
<span><?php echo $hostPageDescription->metaDescription ?></span>
|
|
|
|
<?php } ?>
|
2023-04-07 01:04:24 +00:00
|
|
|
<?php } ?>
|
|
|
|
<a href="<?php echo $hostPageURL ?>">
|
2023-05-04 00:48:57 +00:00
|
|
|
<img src="<?php echo WEBSITE_DOMAIN; ?>/image.php?q=<?php echo urlencode($hostPage->name) ?>" alt="favicon" width="16" height="16" class="icon" />
|
2023-05-05 17:09:15 +00:00
|
|
|
<?php echo htmlentities(urldecode($hostPageURL)) ?>
|
2023-04-07 01:04:24 +00:00
|
|
|
</a>
|
|
|
|
</div>
|
|
|
|
<?php } ?>
|
2023-04-01 16:29:39 +00:00
|
|
|
<?php } ?>
|
2023-05-04 06:20:34 +00:00
|
|
|
<?php if ($p * ($t == 'image' ? WEBSITE_PAGINATION_SEARCH_IMAGE_RESULTS_LIMIT : WEBSITE_PAGINATION_SEARCH_PAGE_RESULTS_LIMIT) <= $resultsTotal) { ?>
|
2023-04-02 20:36:35 +00:00
|
|
|
<div>
|
2023-05-04 06:20:34 +00:00
|
|
|
<a href="<?php echo WEBSITE_DOMAIN; ?>/search.php?q=<?php echo urlencode(htmlentities($q)) ?>&t=<?php echo $t ?>&p=<?php echo $p + 1 ?>"><?php echo _('Next page') ?></a>
|
2023-04-02 20:36:35 +00:00
|
|
|
</div>
|
|
|
|
<?php } ?>
|
2023-04-01 16:29:39 +00:00
|
|
|
<?php } else { ?>
|
|
|
|
<div style="text-align:center">
|
2023-04-02 19:02:53 +00:00
|
|
|
<span><?php echo sprintf(_('Total found: %s'), $resultsTotal) ?></span>
|
2023-04-01 22:30:50 +00:00
|
|
|
<?php if ($q && $queueTotal = $db->getTotalPagesByHttpCode(null)) { ?>
|
2023-04-02 19:02:53 +00:00
|
|
|
<span><?php echo sprintf(_('* Please wait for all pages crawl to complete (%s in queue).'), $queueTotal) ?></span>
|
2023-04-01 22:30:50 +00:00
|
|
|
<?php } ?>
|
2023-04-01 16:29:39 +00:00
|
|
|
</div>
|
|
|
|
<?php } ?>
|
|
|
|
</main>
|
|
|
|
</body>
|
|
|
|
</html>
|