2023-04-07 01:04:24 +00:00
|
|
|
<?php
|
|
|
|
|
|
|
|
/**
 * Thin PDO wrapper exposing one method per SQL statement used against the
 * `manifest`, `host`, `hostPage`, `hostImage`, `hostImageDescription`,
 * `hostImageToHostPage`, `logCleaner` and `logCrawler` tables.
 *
 * Conventions shared by the methods below:
 *  - rows are fetched as objects (PDO::FETCH_OBJ is the default fetch mode);
 *  - single-row getters return the row object, or false when nothing matched;
 *  - list getters return an array of row objects (possibly empty);
 *  - add* methods return PDO::lastInsertId();
 *  - update* / delete* / reset* methods return PDOStatement::rowCount();
 *  - failures surface as PDOException (PDO::ERRMODE_EXCEPTION is enabled).
 */
class MySQL {

  /** PDO handle used by every query method of this class. */
  private PDO $_db;

  /**
   * Connects to the MySQL server and configures the PDO handle.
   *
   * @param string $host     server host name placed into the DSN
   * @param int    $port     server port placed into the DSN
   * @param string $database schema name placed into the DSN
   * @param string $username login user
   * @param string $password login password
   */
  public function __construct(string $host, int $port, string $database, string $username, string $password) {

    $dsn = 'mysql:dbname=' . $database . ';host=' . $host . ';port=' . $port . ';charset=utf8';

    $this->_db = new PDO($dsn, $username, $password, [PDO::MYSQL_ATTR_INIT_COMMAND => 'SET NAMES utf8']);

    // Raise exceptions on SQL errors and hand rows back as objects
    $this->_db->setAttribute(PDO::ATTR_ERRMODE, PDO::ERRMODE_EXCEPTION);
    $this->_db->setAttribute(PDO::ATTR_DEFAULT_FETCH_MODE, PDO::FETCH_OBJ);

    // NOTE(review): pdo_mysql appears to read ATTR_TIMEOUT only from the constructor
    // options (as the connect timeout), so this call may have no effect - confirm.
    $this->_db->setAttribute(PDO::ATTR_TIMEOUT, 600);
  }

  // System

  /**
   * Starts a transaction on the underlying connection.
   */
  public function beginTransaction() {

    $this->_db->beginTransaction();
  }

  /**
   * Commits the current transaction.
   */
  public function commit() {

    $this->_db->commit();
  }

  /**
   * Rolls the current transaction back.
   */
  public function rollBack() {

    $this->_db->rollBack();
  }

  // Manifest

  /**
   * Counts all rows of `manifest`.
   *
   * @return int|string the COUNT(*) value as delivered by the driver
   */
  public function getTotalManifests() {

    $query = $this->_db->prepare('SELECT COUNT(*) AS `total` FROM `manifest`');

    $query->execute();

    return $query->fetch()->total;
  }

  /**
   * Returns every row of `manifest`.
   *
   * @return array list of row objects
   */
  public function getManifests() {

    $query = $this->_db->prepare('SELECT * FROM `manifest`');

    $query->execute();

    return $query->fetchAll();
  }

  /**
   * Looks up a single manifest by its `crc32url` value.
   *
   * @param int $crc32url value matched against `manifest`.`crc32url`
   * @return object|false the row, or false when nothing matched
   */
  public function getManifest(int $crc32url) {

    $query = $this->_db->prepare('SELECT * FROM `manifest` WHERE `crc32url` = ? LIMIT 1');

    $query->execute([$crc32url]);

    return $query->fetch();
  }

  /**
   * Inserts a manifest row; every argument is stored in the column of the same name.
   *
   * @return string|false PDO::lastInsertId() after the insert
   */
  public function addManifest(int $crc32url, string $url, string $status, int $timeAdded, mixed $timeUpdated = null) {

    $query = $this->_db->prepare('INSERT INTO `manifest` (`crc32url`, `url`, `status`, `timeAdded`, `timeUpdated`) VALUES (?, ?, ?, ?, ?)');

    $query->execute([$crc32url, $url, $status, $timeAdded, $timeUpdated]);

    return $this->_db->lastInsertId();
  }

  /**
   * Deletes the manifest with the given id.
   *
   * @param int $manifestId value matched against `manifest`.`manifestId`
   * @return int number of deleted rows
   */
  public function deleteManifest(int $manifestId) {

    $query = $this->_db->prepare('DELETE FROM `manifest` WHERE `manifestId` = ? LIMIT 1');

    $query->execute([$manifestId]);

    return $query->rowCount();
  }

  // Host

  /**
   * Selects the given column list from every row of `host`.
   *
   * NOTE(review): $apiHostFields is concatenated into the statement verbatim,
   * so it must only ever come from trusted configuration, never from request input.
   *
   * @param string $apiHostFields SQL column list placed between SELECT and FROM
   * @return array list of row objects
   */
  public function getAPIHosts(string $apiHostFields) {

    $query = $this->_db->prepare('SELECT ' . $apiHostFields . ' FROM `host`');

    $query->execute();

    return $query->fetchAll();
  }

  /**
   * Looks up a single host by its `crc32url` value.
   *
   * @param int $crc32url value matched against `host`.`crc32url`
   * @return object|false the row, or false when nothing matched
   */
  public function getHost(int $crc32url) {

    $query = $this->_db->prepare('SELECT * FROM `host` WHERE `crc32url` = ? LIMIT 1');

    $query->execute([$crc32url]);

    return $query->fetch();
  }

  /**
   * Counts all rows of `host`.
   *
   * @return int|string the COUNT(*) value as delivered by the driver
   */
  public function getTotalHosts() {

    $query = $this->_db->prepare('SELECT COUNT(*) AS `total` FROM `host`');

    $query->execute();

    return $query->fetch()->total;
  }

  /**
   * Inserts a host row; every argument is stored in the column of the same name.
   *
   * @return string|false PDO::lastInsertId() after the insert
   */
  public function addHost(string $scheme, string $name, mixed $port, int $crc32url, int $timeAdded, mixed $timeUpdated, int $crawlPageLimit, int $crawlImageLimit, string $crawlPageMetaOnly, string $status, mixed $robots, mixed $robotsPostfix) {

    $query = $this->_db->prepare('INSERT INTO `host` (`scheme`, `name`, `port`, `crc32url`, `timeAdded`, `timeUpdated`, `crawlPageLimit`, `crawlImageLimit`, `crawlPageMetaOnly`, `status`, `robots`, `robotsPostfix`) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)');

    $query->execute([$scheme, $name, $port, $crc32url, $timeAdded, $timeUpdated, $crawlPageLimit, $crawlImageLimit, $crawlPageMetaOnly, $status, $robots, $robotsPostfix]);

    return $this->_db->lastInsertId();
  }

  /**
   * Stores new `robots` content and `timeUpdated` for one host.
   *
   * @param int   $hostId      value matched against `host`.`hostId`
   * @param mixed $robots      new value of `robots`
   * @param int   $timeUpdated new value of `timeUpdated`
   * @return int number of affected rows
   */
  public function updateHostRobots(int $hostId, mixed $robots, int $timeUpdated) {

    $query = $this->_db->prepare('UPDATE `host` SET `robots` = ?, `timeUpdated` = ? WHERE `hostId` = ? LIMIT 1');

    $query->execute([$robots, $timeUpdated, $hostId]);

    return $query->rowCount();
  }

  // Images

  /**
   * Counts the `hostImage` rows belonging to one host.
   *
   * @param int $hostId value matched against `hostImage`.`hostId`
   * @return int|string the COUNT(*) value as delivered by the driver
   */
  public function getTotalHostImages(int $hostId) {

    $query = $this->_db->prepare('SELECT COUNT(*) AS `total` FROM `hostImage` WHERE `hostId` = ?');

    $query->execute([$hostId]);

    return $query->fetch()->total;
  }

  /**
   * Resolves the id of the image identified by host and `crc32uri`.
   *
   * @param int $hostId   value matched against `hostImage`.`hostId`
   * @param int $crc32uri value matched against `hostImage`.`crc32uri`
   * @return int|string the `hostImageId`, or 0 when no such image exists
   */
  public function getHostImageId(int $hostId, int $crc32uri) {

    $query = $this->_db->prepare('SELECT `hostImageId` FROM `hostImage` WHERE `hostId` = ? AND `crc32uri` = ? LIMIT 1');

    $query->execute([$hostId, $crc32uri]);

    // Decide on the fetched row itself: rowCount() is not guaranteed to be
    // meaningful for SELECT statements, fetch() returning false always is.
    $row = $query->fetch();

    return $row ? $row->hostImageId : 0;
  }

  /**
   * Returns every `hostImage` row of one host.
   *
   * @param int $hostId value matched against `hostImage`.`hostId`
   * @return array list of row objects
   */
  public function getHostImages(int $hostId) {

    $query = $this->_db->prepare('SELECT * FROM `hostImage` WHERE `hostId` = ?');

    $query->execute([$hostId]);

    return $query->fetchAll();
  }

  /**
   * Returns the `hostImage` rows that have no entry in `hostImageToHostPage`.
   *
   * @return array list of row objects
   */
  public function getUnrelatedHostImages() {

    $query = $this->_db->prepare('SELECT * FROM `hostImage`
                                  WHERE `hostImage`.`hostImageId` NOT IN (SELECT `hostImageToHostPage`.`hostImageId`
                                                                          FROM `hostImageToHostPage`
                                                                          WHERE `hostImageToHostPage`.`hostImageId` = `hostImage`.`hostImageId`)');

    $query->execute();

    return $query->fetchAll();
  }

  /**
   * Returns up to $limit `hostImage` rows of one host, highest `hostImageId` first.
   *
   * @param int $hostId value matched against `hostImage`.`hostId`
   * @param int $limit  maximum number of rows (cast to int and inlined into LIMIT)
   * @return array list of row objects
   */
  public function getHostImagesByLimit(int $hostId, int $limit) {

    $query = $this->_db->prepare('SELECT * FROM `hostImage` WHERE `hostId` = ? ORDER BY hostImageId DESC LIMIT ' . (int) $limit);

    $query->execute([$hostId]);

    return $query->fetchAll();
  }

  /**
   * Inserts a `hostImage` row; every argument is stored in the column of the same name.
   *
   * @return string|false PDO::lastInsertId() after the insert
   */
  public function addHostImage(int $hostId,
                               int $crc32uri,
                               string $uri,
                               int $timeAdded,
                               mixed $timeUpdated = null,
                               mixed $timeBanned = null,
                               mixed $httpCode = null,
                               mixed $mime = null,
                               mixed $rank = null,
                               mixed $data = null) {

    $query = $this->_db->prepare('INSERT INTO `hostImage` ( `hostId`,
                                                            `crc32uri`,
                                                            `uri`,
                                                            `timeAdded`,
                                                            `timeUpdated`,
                                                            `timeBanned`,
                                                            `httpCode`,
                                                            `mime`,
                                                            `rank`,
                                                            `data`) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?)');

    $query->execute([$hostId, $crc32uri, $uri, $timeAdded, $timeUpdated, $timeBanned, $httpCode, $mime, $rank, $data]);

    return $this->_db->lastInsertId();
  }

  /**
   * Adds $increment to the `rank` of the image identified by host and `crc32uri`.
   *
   * @param int $hostId    value matched against `hostImage`.`hostId`
   * @param int $crc32uri  value matched against `hostImage`.`crc32uri`
   * @param int $increment amount added to `rank` (cast to int and inlined into the SQL)
   * @return int number of affected rows
   */
  public function updateHostImageRank(int $hostId,
                                      int $crc32uri,
                                      int $increment) {

    $query = $this->_db->prepare('UPDATE `hostImage` SET `rank` = `rank` + ' . (int) $increment . ' WHERE `hostId` = ? AND `crc32uri` = ? LIMIT 1');

    $query->execute([$hostId, $crc32uri]);

    return $query->rowCount();
  }

  /**
   * Sets `timeBanned` of one image.
   *
   * @param int $hostImageId value matched against `hostImage`.`hostImageId`
   * @param int $timeBanned  new value of `timeBanned`
   * @return int number of affected rows
   */
  public function updateHostImageTimeBanned(int $hostImageId, int $timeBanned) {

    $query = $this->_db->prepare('UPDATE `hostImage` SET `timeBanned` = ? WHERE `hostImageId` = ? LIMIT 1');

    $query->execute([$timeBanned, $hostImageId]);

    return $query->rowCount();
  }

  /**
   * Sets `httpCode` and `timeUpdated` of one image.
   *
   * @param int $hostImageId value matched against `hostImage`.`hostImageId`
   * @param int $httpCode    new value of `httpCode`
   * @param int $timeUpdated new value of `timeUpdated`
   * @return int number of affected rows
   */
  public function updateHostImageHttpCode(int $hostImageId,
                                          int $httpCode,
                                          int $timeUpdated) {

    $query = $this->_db->prepare('UPDATE `hostImage` SET `httpCode` = ?, `timeUpdated` = ? WHERE `hostImageId` = ? LIMIT 1');

    $query->execute([$httpCode, $timeUpdated, $hostImageId]);

    return $query->rowCount();
  }

  /**
   * Sets `mime`, `data`, `timeUpdated` and `timeBanned` of one image.
   *
   * @param int   $hostImageId value matched against `hostImage`.`hostImageId`
   * @param mixed $timeBanned  new value of `timeBanned`; the default null stores NULL
   * @return int number of affected rows
   */
  public function updateHostImage(int $hostImageId,
                                  string $mime,
                                  mixed $data,
                                  int $timeUpdated,
                                  mixed $timeBanned = null) {

    $query = $this->_db->prepare('UPDATE `hostImage` SET `mime` = ?, `data` = ?, `timeUpdated` = ?, `timeBanned` = ? WHERE `hostImageId` = ? LIMIT 1');

    $query->execute([$mime, $data, $timeUpdated, $timeBanned, $hostImageId]);

    return $query->rowCount();
  }

  /**
   * Deletes one image row.
   *
   * @param int $hostImageId value matched against `hostImage`.`hostImageId`
   * @return int number of deleted rows
   */
  public function deleteHostImage(int $hostImageId) {

    $query = $this->_db->prepare('DELETE FROM `hostImage` WHERE `hostImageId` = ? LIMIT 1');

    $query->execute([$hostImageId]);

    return $query->rowCount();
  }

  /**
   * Inserts an image description or, on a duplicate key, refreshes the existing one.
   *
   * A fresh row receives $hostImageId, $crc32id, $alt, $title and $timeAdded;
   * on a duplicate key only `alt`, `title` and `timeUpdated` are overwritten.
   *
   * @return string|false PDO::lastInsertId() after the statement
   */
  public function setHostImageDescription(int $hostImageId, int $crc32id, string $alt, string $title, int $timeAdded, int $timeUpdated) {

    $query = $this->_db->prepare('INSERT INTO `hostImageDescription` (`hostImageId`,
                                                                      `crc32id`,
                                                                      `alt`,
                                                                      `title`,
                                                                      `timeAdded`) VALUES (?, ?, ?, ?, ?)

                                                                      ON DUPLICATE KEY UPDATE `alt` = ?,
                                                                                              `title` = ?,
                                                                                              `timeUpdated` = ?');

    // $alt and $title are bound twice: once for the insert, once for the update branch
    $query->execute([$hostImageId, $crc32id, $alt, $title, $timeAdded, $alt, $title, $timeUpdated]);

    return $this->_db->lastInsertId();
  }

  /**
   * Deletes every description of one image.
   *
   * @param int $hostImageId value matched against `hostImageDescription`.`hostImageId`
   * @return int number of deleted rows
   */
  public function deleteHostImageDescription(int $hostImageId) {

    $query = $this->_db->prepare('DELETE FROM `hostImageDescription` WHERE `hostImageId` = ?');

    $query->execute([$hostImageId]);

    return $query->rowCount();
  }

  /**
   * Returns up to $limit pages linked to an image, joined with their `hostPage` rows.
   *
   * Rows are ordered by `hostPage`.`rank` descending, then by RAND() seeded with
   * the page's `hostId`.
   *
   * @param int $hostImageId value matched against `hostImageId`
   * @param int $limit       maximum number of rows (cast to int and inlined into LIMIT)
   * @return array list of row objects
   */
  public function getHostImageHostPages(int $hostImageId, int $limit = 5) {

    $query = $this->_db->prepare('SELECT * FROM `hostImageToHostPage`
                                           JOIN `hostPage` ON (`hostPage`.`hostPageId` = `hostImageToHostPage`.`hostPageId`)

                                           WHERE `hostImageId` = ?

                                           ORDER BY `hostPage`.`rank` DESC, RAND(`hostPage`.`hostId`)

                                           LIMIT ' . (int) $limit);

    $query->execute([$hostImageId]);

    return $query->fetchAll();
  }

  /**
   * Counts the `hostImageToHostPage` rows of one image.
   *
   * @param int $hostImageId value matched against `hostImageToHostPage`.`hostImageId`
   * @return int|string the COUNT(*) value as delivered by the driver
   */
  public function getHostImageHostPagesTotal(int $hostImageId) {

    $query = $this->_db->prepare('SELECT COUNT(*) AS `total` FROM `hostImageToHostPage` WHERE `hostImageId` = ?');

    $query->execute([$hostImageId]);

    return $query->fetch()->total;
  }

  /**
   * Links an image to a page or, on a duplicate key, bumps the existing link.
   *
   * A fresh row gets $quantity and a NULL `timeUpdated`; on a duplicate key
   * `timeUpdated` is set to $timeUpdated and $quantity is added to `quantity`.
   *
   * @param int $quantity initial quantity, and the increment on duplicate key
   *                      (cast to int and inlined into the SQL for the increment)
   * @return int PDOStatement::rowCount() of the statement
   */
  public function setHostImageToHostPage(int $hostImageId, int $hostPageId, int $timeAdded, mixed $timeUpdated, int $quantity) {

    $query = $this->_db->prepare('INSERT INTO `hostImageToHostPage` (`hostImageId`,
                                                                     `hostPageId`,
                                                                     `timeAdded`,
                                                                     `timeUpdated`,
                                                                     `quantity`) VALUES (?, ?, ?, ?, ?)

                                                                     ON DUPLICATE KEY UPDATE `timeUpdated` = ?,
                                                                                             `quantity` = `quantity` + ' . (int) $quantity);

    // Fourth value is the insert-time `timeUpdated`, deliberately bound as null here;
    // $timeUpdated feeds the ON DUPLICATE KEY placeholder only.
    $query->execute([$hostImageId, $hostPageId, $timeAdded, null, $quantity, $timeUpdated]);

    return $query->rowCount(); // no primary key
  }

  /**
   * Deletes every page link of one image.
   *
   * @param int $hostImageId value matched against `hostImageToHostPage`.`hostImageId`
   * @return int number of deleted rows
   */
  public function deleteHostImageToHostPage(int $hostImageId) {

    $query = $this->_db->prepare('DELETE FROM `hostImageToHostPage` WHERE `hostImageId` = ?');

    $query->execute([$hostImageId]);

    return $query->rowCount();
  }

  // Pages

  /**
   * Counts the `hostPage` rows belonging to one host.
   *
   * @param int $hostId value matched against `hostPage`.`hostId`
   * @return int|string the COUNT(*) value as delivered by the driver
   */
  public function getTotalHostPages(int $hostId) {

    $query = $this->_db->prepare('SELECT COUNT(*) AS `total` FROM `hostPage` WHERE `hostId` = ?');

    $query->execute([$hostId]);

    return $query->fetch()->total;
  }

  /**
   * Counts the `hostPage` rows having the given `httpCode`.
   *
   * @param mixed $httpCode code to match; null counts the rows whose `httpCode` IS NULL
   * @return int|string the COUNT(*) value as delivered by the driver
   */
  public function getTotalPagesByHttpCode(mixed $httpCode) {

    if (is_null($httpCode)) {

      // "= ?" never matches NULL in SQL, hence the dedicated IS NULL statement
      $query = $this->_db->query('SELECT COUNT(*) AS `total` FROM `hostPage` WHERE `httpCode` IS NULL');

    } else {

      $query = $this->_db->prepare('SELECT COUNT(*) AS `total` FROM `hostPage` WHERE `httpCode` = ?');

      $query->execute([$httpCode]);
    }

    return $query->fetch()->total;
  }

  /**
   * Looks up a single page by host and `crc32uri`.
   *
   * @param int $hostId   value matched against `hostPage`.`hostId`
   * @param int $crc32uri value matched against `hostPage`.`crc32uri`
   * @return object|false the row, or false when nothing matched
   */
  public function getHostPage(int $hostId, int $crc32uri) {

    $query = $this->_db->prepare('SELECT * FROM `hostPage` WHERE `hostId` = ? AND `crc32uri` = ? LIMIT 1');

    $query->execute([$hostId, $crc32uri]);

    return $query->fetch();
  }

  /**
   * Returns every `hostPage` row of one host.
   *
   * @param int $hostId value matched against `hostPage`.`hostId`
   * @return array list of row objects
   */
  public function getHostPages(int $hostId) {

    $query = $this->_db->prepare('SELECT * FROM `hostPage` WHERE `hostId` = ?');

    $query->execute([$hostId]);

    return $query->fetchAll();
  }

  /**
   * Returns up to $limit `hostPage` rows of one host, highest `hostPageId` first.
   *
   * @param int $hostId value matched against `hostPage`.`hostId`
   * @param int $limit  maximum number of rows (cast to int and inlined into LIMIT)
   * @return array list of row objects
   */
  public function getHostPagesByLimit(int $hostId, int $limit) {

    $query = $this->_db->prepare('SELECT * FROM `hostPage` WHERE `hostId` = ? ORDER BY hostPageId DESC LIMIT ' . (int) $limit);

    $query->execute([$hostId]);

    return $query->fetchAll();
  }

  /**
   * Loads selected columns of one page together with its host's scheme, name and port.
   *
   * @param int $hostPageId value matched against `hostPage`.`hostPageId`
   * @return object|false the joined row, or false when nothing matched
   */
  public function getFoundHostPage(int $hostPageId) {

    $query = $this->_db->prepare('SELECT `hostPage`.`metaTitle`,
                                         `hostPage`.`metaDescription`,
                                         `hostPage`.`data`,
                                         `hostPage`.`uri`,
                                         `hostPage`.`rank`,
                                         `host`.`scheme`,
                                         `host`.`name`,
                                         `host`.`port`

                                         FROM `hostPage`
                                         JOIN `host` ON (`host`.`hostId` = `hostPage`.`hostId`)

                                         WHERE `hostPage`.`hostPageId` = ?

                                         LIMIT 1');

    $query->execute([$hostPageId]);

    return $query->fetch();
  }

  /**
   * Loads selected columns of one image together with its host's scheme, name and
   * port, plus a `description` column that GROUP_CONCATs the alt/title pairs of
   * the image's `hostImageDescription` rows.
   *
   * @param int $hostImageId value matched against `hostImage`.`hostImageId`
   * @return object|false the joined row, or false when nothing matched
   */
  public function getFoundHostImage(int $hostImageId) {

    $query = $this->_db->prepare('SELECT `hostImage`.`hostImageId`,
                                         `hostImage`.`uri`,
                                         `hostImage`.`data`,
                                         `hostImage`.`rank`,
                                         `host`.`scheme`,
                                         `host`.`name`,
                                         `host`.`port`,

                                         (SELECT GROUP_CONCAT(CONCAT_WS(" ", `hostImageDescription`.`alt`, `hostImageDescription`.`title`))

                                                 FROM `hostImageDescription`
                                                 WHERE `hostImageDescription`.`hostImageId` = `hostImage`.`hostImageId`) AS `description`

                                         FROM `hostImage`
                                         JOIN `host` ON (`host`.`hostId` = `hostImage`.`hostId`)

                                         WHERE `hostImage`.`hostImageId` = ?

                                         LIMIT 1');

    $query->execute([$hostImageId]);

    return $query->fetch();
  }

  /**
   * Inserts a `hostPage` row; every argument is stored in the column of the same name.
   *
   * @return string|false PDO::lastInsertId() after the insert
   */
  public function addHostPage(int $hostId,
                              int $crc32uri,
                              string $uri,
                              int $timeAdded,
                              mixed $timeUpdated = null,
                              mixed $timeBanned = null,
                              mixed $httpCode = null,
                              mixed $mime = null,
                              mixed $rank = null,
                              mixed $metaTitle = null,
                              mixed $metaDescription = null,
                              mixed $metaKeywords = null,
                              mixed $data = null) {

    $query = $this->_db->prepare('INSERT INTO `hostPage` (`hostId`,
                                                          `crc32uri`,
                                                          `uri`,
                                                          `timeAdded`,
                                                          `timeUpdated`,
                                                          `timeBanned`,
                                                          `httpCode`,
                                                          `mime`,
                                                          `rank`,
                                                          `metaTitle`,
                                                          `metaDescription`,
                                                          `metaKeywords`,
                                                          `data`) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)');

    $query->execute([$hostId, $crc32uri, $uri, $timeAdded, $timeUpdated, $timeBanned, $httpCode, $mime, $rank, $metaTitle, $metaDescription, $metaKeywords, $data]);

    return $this->_db->lastInsertId();
  }

  /**
   * Overwrites the meta fields, `mime`, `data`, `timeUpdated` and `timeBanned` of one page.
   *
   * @param int   $hostPageId value matched against `hostPage`.`hostPageId`
   * @param mixed $timeBanned new value of `timeBanned`; the default null stores NULL
   * @return int number of affected rows
   */
  public function updateHostPage( int $hostPageId,
                                  mixed $metaTitle,
                                  mixed $metaDescription,
                                  mixed $metaKeywords,
                                  string $mime,
                                  mixed $data,
                                  int $timeUpdated,
                                  mixed $timeBanned = null) {

    $query = $this->_db->prepare('UPDATE `hostPage` SET `metaTitle` = ?,
                                                        `metaDescription` = ?,
                                                        `metaKeywords` = ?,
                                                        `mime` = ?,
                                                        `data` = ?,
                                                        `timeUpdated` = ?,
                                                        `timeBanned` = ? WHERE `hostPageId` = ? LIMIT 1');

    $query->execute([$metaTitle, $metaDescription, $metaKeywords, $mime, $data, $timeUpdated, $timeBanned, $hostPageId]);

    return $query->rowCount();
  }

  /**
   * Adds $increment to the `rank` of the page identified by host and `crc32uri`.
   *
   * @param int $hostId    value matched against `hostPage`.`hostId`
   * @param int $crc32uri  value matched against `hostPage`.`crc32uri`
   * @param int $increment amount added to `rank` (cast to int and inlined into the SQL)
   * @return int number of affected rows
   */
  public function updateHostPageRank(int $hostId,
                                     int $crc32uri,
                                     int $increment) {

    $query = $this->_db->prepare('UPDATE `hostPage` SET `rank` = `rank` + ' . (int) $increment . '

                                                    WHERE `hostId` = ?
                                                    AND `crc32uri` = ?

                                                    LIMIT 1');

    $query->execute([$hostId, $crc32uri]);

    return $query->rowCount();
  }

  /**
   * Sets `timeBanned` of one page.
   *
   * @param int $hostPageId value matched against `hostPage`.`hostPageId`
   * @param int $timeBanned new value of `timeBanned`
   * @return int number of affected rows
   */
  public function updateHostPageTimeBanned(int $hostPageId, int $timeBanned) {

    $query = $this->_db->prepare('UPDATE `hostPage` SET `timeBanned` = ? WHERE `hostPageId` = ? LIMIT 1');

    $query->execute([$timeBanned, $hostPageId]);

    return $query->rowCount();
  }

  /**
   * Deletes one page row.
   *
   * @param int $hostPageId value matched against `hostPage`.`hostPageId`
   * @return int number of deleted rows
   */
  public function deleteHostPage(int $hostPageId) {

    $query = $this->_db->prepare('DELETE FROM `hostPage` WHERE `hostPageId` = ? LIMIT 1');

    $query->execute([$hostPageId]);

    return $query->rowCount();
  }

  /**
   * Deletes every image link of one page.
   *
   * @param int $hostPageId value matched against `hostImageToHostPage`.`hostPageId`
   * @return int number of deleted rows
   */
  public function deleteHostPageToHostImage(int $hostPageId) {

    $query = $this->_db->prepare('DELETE FROM `hostImageToHostPage` WHERE `hostPageId` = ?');

    $query->execute([$hostPageId]);

    return $query->rowCount();
  }

  // Cleaner tools

  /**
   * Returns up to $limit hosts with a non-zero `status` whose `timeUpdated`
   * is NULL or lower than $timeFrom, ordered by `hostId`.
   *
   * @param int $limit    maximum number of rows (cast to int and inlined into LIMIT)
   * @param int $timeFrom upper bound compared against `timeUpdated`
   * @return array list of row objects
   */
  public function getCleanerQueue(int $limit, int $timeFrom) {

    $query = $this->_db->prepare('SELECT * FROM `host`

                                           WHERE (`timeUpdated` IS NULL OR `timeUpdated` < ? ) AND `host`.`status` <> 0

                                           ORDER BY `hostId`

                                           LIMIT ' . (int) $limit);

    $query->execute([$timeFrom]);

    return $query->fetchAll();
  }

  /**
   * Clears `timeBanned` on every page whose ban value is lower than $timeOffset.
   *
   * @param int $timeOffset threshold compared against `timeBanned` (cast to int and inlined)
   * @return int number of affected rows
   */
  public function resetBannedHostPages(int $timeOffset) {

    $query = $this->_db->prepare('UPDATE `hostPage` SET `timeBanned` = NULL WHERE `timeBanned` IS NOT NULL AND `timeBanned` < ' . (int) $timeOffset);

    $query->execute();

    return $query->rowCount();
  }

  /**
   * Clears `timeBanned` on every image whose ban value is lower than $timeOffset.
   *
   * @param int $timeOffset threshold compared against `timeBanned` (cast to int and inlined)
   * @return int number of affected rows
   */
  public function resetBannedHostImages(int $timeOffset) {

    $query = $this->_db->prepare('UPDATE `hostImage` SET `timeBanned` = NULL WHERE `timeBanned` IS NOT NULL AND `timeBanned` < ' . (int) $timeOffset);

    $query->execute();

    return $query->rowCount();
  }

  /**
   * Inserts a `logCleaner` row; every argument is stored in the column of the same name.
   *
   * @return string|false PDO::lastInsertId() after the insert
   */
  public function addCleanerLog(int $timeAdded,
                                int $hostsTotal,
                                int $hostsUpdated,
                                int $hostPagesDeleted,
                                int $hostPagesBansRemoved,
                                int $hostImagesDeleted,
                                int $hostImagesBansRemoved,
                                int $manifestsTotal,
                                int $manifestsDeleted,
                                int $logsCleanerDeleted,
                                int $logsCrawlerDeleted,
                                int $httpRequestsTotal,
                                int $httpRequestsSizeTotal,
                                int $httpDownloadSizeTotal,
                                float $httpRequestsTimeTotal,
                                float $executionTimeTotal) {

    $query = $this->_db->prepare('INSERT INTO `logCleaner` (`timeAdded`,
                                                            `hostsTotal`,
                                                            `hostsUpdated`,
                                                            `hostPagesDeleted`,
                                                            `hostPagesBansRemoved`,
                                                            `hostImagesDeleted`,
                                                            `hostImagesBansRemoved`,
                                                            `manifestsTotal`,
                                                            `manifestsDeleted`,
                                                            `logsCleanerDeleted`,
                                                            `logsCrawlerDeleted`,
                                                            `httpRequestsTotal`,
                                                            `httpRequestsSizeTotal`,
                                                            `httpDownloadSizeTotal`,
                                                            `httpRequestsTimeTotal`,
                                                            `executionTimeTotal`) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)');

    // Values are bound positionally, in the same order as the column list above
    $query->execute([
      $timeAdded,
      $hostsTotal,
      $hostsUpdated,
      $hostPagesDeleted,
      $hostPagesBansRemoved,
      $hostImagesDeleted,
      $hostImagesBansRemoved,
      $manifestsTotal,
      $manifestsDeleted,
      $logsCleanerDeleted,
      $logsCrawlerDeleted,
      $httpRequestsTotal,
      $httpRequestsSizeTotal,
      $httpDownloadSizeTotal,
      $httpRequestsTimeTotal,
      $executionTimeTotal
    ]);

    return $this->_db->lastInsertId();
  }

  /**
   * Deletes the `logCleaner` rows whose `timeAdded` is lower than $timeOffset.
   *
   * @param int $timeOffset threshold compared against `timeAdded` (cast to int and inlined)
   * @return int number of deleted rows
   */
  public function deleteLogCleaner(int $timeOffset) {

    $query = $this->_db->prepare('DELETE FROM `logCleaner` WHERE `timeAdded` < ' . (int) $timeOffset);

    $query->execute();

    return $query->rowCount();
  }

  // Crawl tools

  /**
   * Returns up to $limit pages to crawl, joined with the crawl settings of their host.
   *
   * A page qualifies when its `timeUpdated` is NULL or lower than $timeFrom, its
   * `timeBanned` is NULL and its host has a non-zero `status`. Rows are ordered by
   * page `rank` descending, then randomly.
   *
   * @param int $limit    maximum number of rows (cast to int and inlined into LIMIT)
   * @param int $timeFrom upper bound compared against `hostPage`.`timeUpdated`
   * @return array list of row objects
   */
  public function getHostPageCrawlQueue(int $limit, int $timeFrom) {

    $query = $this->_db->prepare('SELECT `hostPage`.`hostId`,
                                         `hostPage`.`hostPageId`,
                                         `hostPage`.`uri`,
                                         `host`.`scheme`,
                                         `host`.`name`,
                                         `host`.`port`,
                                         `host`.`crawlPageLimit`,
                                         `host`.`crawlImageLimit`,
                                         `host`.`crawlPageMetaOnly`,
                                         `host`.`robots`,
                                         `host`.`robotsPostfix`

                                         FROM `hostPage`
                                         JOIN `host` ON (`host`.`hostId` = `hostPage`.`hostId`)

                                         WHERE (`hostPage`.`timeUpdated` IS NULL OR `hostPage`.`timeUpdated` < ? ) AND `host`.`status` <> 0
                                                                                                                   AND `hostPage`.`timeBanned` IS NULL

                                         ORDER BY `hostPage`.`rank` DESC, RAND()

                                         LIMIT ' . (int) $limit);

    $query->execute([$timeFrom]);

    return $query->fetchAll();
  }

  /**
   * Stores `timeUpdated` and `httpCode` for one page.
   *
   * @param int $hostPageId  value matched against `hostPage`.`hostPageId`
   * @param int $timeUpdated new value of `timeUpdated`
   * @param int $httpCode    new value of `httpCode`
   * @return int number of affected rows
   */
  public function updateHostPageCrawlQueue(int $hostPageId, int $timeUpdated, int $httpCode) {

    $query = $this->_db->prepare('UPDATE `hostPage` SET `timeUpdated` = ?, `httpCode` = ? WHERE `hostPageId` = ? LIMIT 1');

    $query->execute([$timeUpdated, $httpCode, $hostPageId]);

    return $query->rowCount();
  }

  /**
   * Returns up to $limit images to crawl, joined with scheme, name and port of their host.
   *
   * An image qualifies when its `timeUpdated` is NULL or lower than $timeFrom, its
   * `timeBanned` is NULL and its host has a non-zero `status`. Rows are ordered by
   * image `rank` descending, then randomly.
   *
   * @param int $limit    maximum number of rows (cast to int and inlined into LIMIT)
   * @param int $timeFrom upper bound compared against `hostImage`.`timeUpdated`
   * @return array list of row objects
   */
  public function getHostImageCrawlQueue(int $limit, int $timeFrom) {

    $query = $this->_db->prepare('SELECT `hostImage`.`hostId`,
                                         `hostImage`.`hostImageId`,
                                         `hostImage`.`uri`,
                                         `host`.`scheme`,
                                         `host`.`name`,
                                         `host`.`port`

                                         FROM `hostImage`
                                         JOIN `host` ON (`host`.`hostId` = `hostImage`.`hostId`)

                                         WHERE (`hostImage`.`timeUpdated` IS NULL OR `hostImage`.`timeUpdated` < ? ) AND `host`.`status` <> 0
                                                                                                                     AND `hostImage`.`timeBanned` IS NULL

                                         ORDER BY `hostImage`.`rank` DESC, RAND()

                                         LIMIT ' . (int) $limit);

    $query->execute([$timeFrom]);

    return $query->fetchAll();
  }

  /**
   * Stores `timeUpdated` and `httpCode` for one image.
   *
   * @param int $hostImageId value matched against `hostImage`.`hostImageId`
   * @param int $timeUpdated new value of `timeUpdated`
   * @param int $httpCode    new value of `httpCode`
   * @return int number of affected rows
   */
  public function updateHostImageCrawlQueue(int $hostImageId, int $timeUpdated, int $httpCode) {

    $query = $this->_db->prepare('UPDATE `hostImage` SET `timeUpdated` = ?, `httpCode` = ? WHERE `hostImageId` = ? LIMIT 1');

    $query->execute([$timeUpdated, $httpCode, $hostImageId]);

    return $query->rowCount();
  }

  /**
   * Returns up to $limit manifests with a non-zero `status` whose `timeUpdated`
   * is NULL or lower than $timeFrom, in random order.
   *
   * @param int $limit    maximum number of rows (cast to int and inlined into LIMIT)
   * @param int $timeFrom upper bound compared against `timeUpdated`
   * @return array list of row objects
   */
  public function getManifestCrawlQueue(int $limit, int $timeFrom) {

    $query = $this->_db->prepare('SELECT * FROM `manifest`

                                           WHERE (`timeUpdated` IS NULL OR `timeUpdated` < ? ) AND `status` <> 0

                                           ORDER BY RAND()

                                           LIMIT ' . (int) $limit);

    $query->execute([$timeFrom]);

    return $query->fetchAll();
  }

  /**
   * Stores `timeUpdated` and `httpCode` for one manifest.
   *
   * @param int $manifestId  value matched against `manifest`.`manifestId`
   * @param int $timeUpdated new value of `timeUpdated`
   * @param int $httpCode    new value of `httpCode`
   * @return int number of affected rows
   */
  public function updateManifestCrawlQueue(int $manifestId, int $timeUpdated, int $httpCode) {

    $query = $this->_db->prepare('UPDATE `manifest` SET `timeUpdated` = ?, `httpCode` = ? WHERE `manifestId` = ? LIMIT 1');

    $query->execute([$timeUpdated, $httpCode, $manifestId]);

    return $query->rowCount();
  }

  /**
   * Inserts a `logCrawler` row; every argument is stored in the column of the same name.
   *
   * @return string|false PDO::lastInsertId() after the insert
   */
  public function addCrawlerLog(int $timeAdded,
                                int $hostsAdded,
                                int $hostPagesProcessed,
                                int $hostPagesIndexed,
                                int $hostPagesAdded,
                                int $hostPagesBanned,
                                int $hostImagesIndexed,
                                int $hostImagesProcessed,
                                int $hostImagesAdded,
                                int $hostImagesBanned,
                                int $manifestsProcessed,
                                int $manifestsAdded,
                                int $httpRequestsTotal,
                                int $httpRequestsSizeTotal,
                                int $httpDownloadSizeTotal,
                                float $httpRequestsTimeTotal,
                                float $executionTimeTotal) {

    $query = $this->_db->prepare('INSERT INTO `logCrawler` (`timeAdded`,
                                                            `hostsAdded`,
                                                            `hostPagesProcessed`,
                                                            `hostPagesIndexed`,
                                                            `hostPagesAdded`,
                                                            `hostPagesBanned`,
                                                            `hostImagesIndexed`,
                                                            `hostImagesProcessed`,
                                                            `hostImagesAdded`,
                                                            `hostImagesBanned`,
                                                            `manifestsProcessed`,
                                                            `manifestsAdded`,
                                                            `httpRequestsTotal`,
                                                            `httpRequestsSizeTotal`,
                                                            `httpDownloadSizeTotal`,
                                                            `httpRequestsTimeTotal`,
                                                            `executionTimeTotal`) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)');

    // Values are bound positionally, in the same order as the column list above
    $query->execute([
      $timeAdded,
      $hostsAdded,
      $hostPagesProcessed,
      $hostPagesIndexed,
      $hostPagesAdded,
      $hostPagesBanned,
      $hostImagesIndexed,
      $hostImagesProcessed,
      $hostImagesAdded,
      $hostImagesBanned,
      $manifestsProcessed,
      $manifestsAdded,
      $httpRequestsTotal,
      $httpRequestsSizeTotal,
      $httpDownloadSizeTotal,
      $httpRequestsTimeTotal,
      $executionTimeTotal
    ]);

    return $this->_db->lastInsertId();
  }

  /**
   * Deletes the `logCrawler` rows whose `timeAdded` is lower than $timeOffset.
   *
   * @param int $timeOffset threshold compared against `timeAdded` (cast to int and inlined)
   * @return int number of deleted rows
   */
  public function deleteLogCrawler(int $timeOffset) {

    $query = $this->_db->prepare('DELETE FROM `logCrawler` WHERE `timeAdded` < ' . (int) $timeOffset);

    $query->execute();

    return $query->rowCount();
  }
}
|