2023-04-01 19:29:39 +03:00
|
|
|
<?php
|
|
|
|
|
|
|
|
class Filter {
|
|
|
|
|
2023-05-09 12:52:07 +03:00
|
|
|
static public function string(mixed $data) {
|
|
|
|
|
|
|
|
return (string) $data;
|
|
|
|
}
|
|
|
|
|
2023-05-04 07:58:07 +03:00
|
|
|
static public function url(mixed $url) {
|
|
|
|
|
|
|
|
$url = (string) $url;
|
2023-04-01 19:29:39 +03:00
|
|
|
|
2023-04-07 04:04:24 +03:00
|
|
|
return trim(urldecode($url));
|
2023-04-01 19:29:39 +03:00
|
|
|
}
|
|
|
|
|
2023-05-06 07:25:54 +03:00
|
|
|
static public function mime(mixed $mime) {
|
|
|
|
|
|
|
|
$mime = (string) $mime;
|
|
|
|
|
2023-05-10 18:35:18 +03:00
|
|
|
return trim(strtolower($mime));
|
2023-05-06 07:25:54 +03:00
|
|
|
}
|
|
|
|
|
2023-05-04 07:58:07 +03:00
|
|
|
static public function pageTitle(mixed $title) {
|
|
|
|
|
|
|
|
$title = (string) $title;
|
2023-04-01 19:29:39 +03:00
|
|
|
|
|
|
|
$title = preg_replace('/[\s]+/', ' ', $title);
|
|
|
|
|
|
|
|
$title = trim($title);
|
|
|
|
|
|
|
|
return $title;
|
|
|
|
}
|
|
|
|
|
2023-05-04 07:58:07 +03:00
|
|
|
static public function pageDescription(mixed $description) {
|
|
|
|
|
|
|
|
$description = (string) $description;
|
2023-04-01 19:29:39 +03:00
|
|
|
|
|
|
|
$description = preg_replace('/[\s]+/', ' ', $description);
|
|
|
|
|
|
|
|
$description = trim($description);
|
|
|
|
|
|
|
|
return $description;
|
|
|
|
}
|
|
|
|
|
2023-05-04 07:58:07 +03:00
|
|
|
static public function pageKeywords(mixed $keywords) {
|
|
|
|
|
|
|
|
$keywords = (string) $keywords;
|
2023-04-01 19:29:39 +03:00
|
|
|
|
|
|
|
$keywords = preg_replace('/[\s]+/', ' ', $keywords);
|
|
|
|
|
|
|
|
$keywords = trim($keywords);
|
|
|
|
|
|
|
|
return $keywords;
|
|
|
|
}
|
|
|
|
|
2023-05-04 07:58:07 +03:00
|
|
|
static public function pageData(mixed $data) {
|
|
|
|
|
|
|
|
$data = (string) $data;
|
2023-04-01 19:29:39 +03:00
|
|
|
|
|
|
|
$filterDataPre = [
|
|
|
|
'/<script.*?\/script>/s',
|
|
|
|
'/<style.*?\/style>/s'
|
|
|
|
];
|
|
|
|
|
|
|
|
$filterDataPost = [
|
|
|
|
'/[\s]{2,}/',
|
|
|
|
];
|
|
|
|
|
|
|
|
$data = preg_replace($filterDataPre, ' ', $data);
|
|
|
|
|
|
|
|
$data = html_entity_decode($data);
|
|
|
|
$data = strip_tags($data);
|
|
|
|
|
|
|
|
$data = preg_replace($filterDataPost, ' ', $data);
|
|
|
|
|
|
|
|
return $data;
|
|
|
|
}
|
|
|
|
|
2023-05-01 20:09:28 +03:00
|
|
|
static public function searchQuery(string $query, string $mode = 'default') {
|
2023-05-01 18:39:46 +03:00
|
|
|
|
2023-08-01 13:50:07 +03:00
|
|
|
// Create query CRC32
|
|
|
|
$crc32query = crc32($query);
|
|
|
|
|
2023-07-31 22:07:59 +03:00
|
|
|
// Prepare user-friendly search request (default mode)
|
|
|
|
// https://sphinxsearch.com/docs/current.html#extended-syntax
|
2023-05-01 20:09:28 +03:00
|
|
|
if ($mode == 'default') {
|
2023-06-05 23:33:07 +03:00
|
|
|
|
2023-07-31 22:07:59 +03:00
|
|
|
// Remove extra separators
|
|
|
|
$query = preg_replace('/[\s]+/', ' ', $query);
|
2023-06-22 13:37:12 +03:00
|
|
|
|
2023-07-31 22:07:59 +03:00
|
|
|
$query = trim($query);
|
2023-06-22 13:37:12 +03:00
|
|
|
|
2023-08-01 17:20:42 +03:00
|
|
|
// Return short or empty queries
|
|
|
|
if (mb_strlen($query) <= 1) {
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Lowercase query to deactivate reserved operators
|
|
|
|
$query = mb_strtolower($query);
|
|
|
|
|
|
|
|
// Quote other operators
|
2023-07-31 22:07:59 +03:00
|
|
|
$operators = [
|
2023-08-01 17:20:42 +03:00
|
|
|
/* lowercased
|
2023-07-31 22:07:59 +03:00
|
|
|
'MAYBE',
|
|
|
|
'AND',
|
|
|
|
'OR',
|
|
|
|
'NOT',
|
|
|
|
'SENTENCE',
|
|
|
|
'NEAR',
|
|
|
|
'ZONE',
|
|
|
|
'ZONESPAN',
|
|
|
|
'PARAGRAPH',
|
2023-08-01 17:20:42 +03:00
|
|
|
*/
|
|
|
|
'\\', '/', '~', '@', '!', '"', "'", '(', ')', '[', ']', '|', '?', '%', '-', '>', '<', ':', ';', '^', '$'
|
2023-07-31 22:07:59 +03:00
|
|
|
];
|
|
|
|
|
|
|
|
foreach ($operators as $operator) {
|
|
|
|
$query = str_ireplace($operator, '\\' . $operator, $query);
|
|
|
|
}
|
2023-05-01 18:39:46 +03:00
|
|
|
|
2023-08-01 13:50:07 +03:00
|
|
|
// Apply separators
|
|
|
|
$query = str_replace(['-', '_', '/'], ' ', $query);
|
|
|
|
|
|
|
|
// Apply query MATCH rules
|
2023-08-01 14:15:14 +03:00
|
|
|
if (false !== strpos($query, '\:\ \ ')) { // URL request
|
2023-07-31 23:33:06 +03:00
|
|
|
|
2023-08-01 13:50:07 +03:00
|
|
|
$query = sprintf('"%s"', $crc32query);
|
2023-07-31 23:33:06 +03:00
|
|
|
|
2023-08-01 14:15:14 +03:00
|
|
|
} else if (mb_strlen($query) > 68) { // @TODO Queries longer than 68 chars unreachable in search index
|
2023-07-31 23:33:06 +03:00
|
|
|
|
2023-08-01 13:50:07 +03:00
|
|
|
$query = sprintf('"%s" | (%s*)', $crc32query, substr($query, 0, 67));
|
|
|
|
|
2023-08-01 14:15:14 +03:00
|
|
|
} else { // Default condition
|
|
|
|
|
|
|
|
$words = [];
|
2023-08-01 13:50:07 +03:00
|
|
|
|
|
|
|
// Remove single char words
|
|
|
|
foreach ((array) explode(' ', $query) as $word) {
|
|
|
|
|
|
|
|
if (mb_strlen($word) > 1) {
|
|
|
|
|
2023-08-01 17:20:42 +03:00
|
|
|
$words[] = sprintf('(%s*)', $word);
|
2023-08-01 13:50:07 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-01 17:20:42 +03:00
|
|
|
$query = sprintf('@title %s | "%s" | (%s)', $query,
|
|
|
|
$crc32query,
|
|
|
|
implode(' | ', $words));
|
2023-08-01 13:50:07 +03:00
|
|
|
}
|
2023-07-31 23:33:06 +03:00
|
|
|
}
|
2023-05-01 18:39:46 +03:00
|
|
|
|
2023-07-31 22:07:59 +03:00
|
|
|
return trim($query);
|
2023-05-01 18:39:46 +03:00
|
|
|
}
|
|
|
|
|
2023-04-01 19:29:39 +03:00
|
|
|
static public function plural(int $number, array $texts) {
|
|
|
|
|
|
|
|
$cases = array (2, 0, 1, 1, 1, 2);
|
|
|
|
|
|
|
|
return $texts[(($number % 100) > 4 && ($number % 100) < 20) ? 2 : $cases[min($number % 10, 5)]];
|
|
|
|
}
|
|
|
|
}
|