YGGo/library/filter.php

163 lines
3.6 KiB
PHP
Raw Normal View History

2023-04-01 19:29:39 +03:00
<?php
class Filter {
2023-05-09 12:52:07 +03:00
static public function string(mixed $data) {
return (string) $data;
}
2023-05-04 07:58:07 +03:00
static public function url(mixed $url) {
$url = (string) $url;
2023-04-01 19:29:39 +03:00
return trim(urldecode($url));
2023-04-01 19:29:39 +03:00
}
2023-05-06 07:25:54 +03:00
static public function mime(mixed $mime) {
$mime = (string) $mime;
2023-05-10 18:35:18 +03:00
return trim(strtolower($mime));
2023-05-06 07:25:54 +03:00
}
2023-05-04 07:58:07 +03:00
static public function pageTitle(mixed $title) {
$title = (string) $title;
2023-04-01 19:29:39 +03:00
$title = preg_replace('/[\s]+/', ' ', $title);
$title = trim($title);
return $title;
}
2023-05-04 07:58:07 +03:00
static public function pageDescription(mixed $description) {
$description = (string) $description;
2023-04-01 19:29:39 +03:00
$description = preg_replace('/[\s]+/', ' ', $description);
$description = trim($description);
return $description;
}
2023-05-04 07:58:07 +03:00
static public function pageKeywords(mixed $keywords) {
$keywords = (string) $keywords;
2023-04-01 19:29:39 +03:00
$keywords = preg_replace('/[\s]+/', ' ', $keywords);
$keywords = trim($keywords);
return $keywords;
}
2023-05-04 07:58:07 +03:00
static public function pageData(mixed $data) {
$data = (string) $data;
2023-04-01 19:29:39 +03:00
$filterDataPre = [
'/<script.*?\/script>/s',
'/<style.*?\/style>/s'
];
$filterDataPost = [
'/[\s]{2,}/',
];
$data = preg_replace($filterDataPre, ' ', $data);
$data = html_entity_decode($data);
$data = strip_tags($data);
$data = preg_replace($filterDataPost, ' ', $data);
return $data;
}
static public function searchQuery(string $query, string $mode = 'default') {
// Create query CRC32
$crc32query = crc32($query);
2023-07-31 22:07:59 +03:00
// Prepare user-friendly search request (default mode)
// https://sphinxsearch.com/docs/current.html#extended-syntax
if ($mode == 'default') {
2023-07-31 22:07:59 +03:00
// Remove extra separators
$query = preg_replace('/[\s]+/', ' ', $query);
2023-06-22 13:37:12 +03:00
2023-07-31 22:07:59 +03:00
$query = trim($query);
2023-06-22 13:37:12 +03:00
2023-08-01 17:20:42 +03:00
// Return short or empty queries
if (mb_strlen($query) <= 1) {
return false;
}
// Lowercase query to deactivate reserved operators
$query = mb_strtolower($query);
// Quote other operators
2023-07-31 22:07:59 +03:00
$operators = [
2023-08-01 17:20:42 +03:00
/* lowercased
2023-07-31 22:07:59 +03:00
'MAYBE',
'AND',
'OR',
'NOT',
'SENTENCE',
'NEAR',
'ZONE',
'ZONESPAN',
'PARAGRAPH',
2023-08-01 17:20:42 +03:00
*/
'\\', '/', '~', '@', '!', '"', "'", '(', ')', '[', ']', '|', '?', '%', '-', '>', '<', ':', ';', '^', '$'
2023-07-31 22:07:59 +03:00
];
foreach ($operators as $operator) {
$query = str_ireplace($operator, '\\' . $operator, $query);
}
// Apply separators
$query = str_replace(['-', '_', '/'], ' ', $query);
// Apply query MATCH rules
if (false !== strpos($query, '\:\ \ ')) { // URL request
2023-07-31 23:33:06 +03:00
$query = sprintf('"%s"', $crc32query);
2023-07-31 23:33:06 +03:00
} else if (mb_strlen($query) > 68) { // @TODO Queries longer than 68 chars unreachable in search index
2023-07-31 23:33:06 +03:00
$query = sprintf('"%s" | (%s*)', $crc32query, substr($query, 0, 67));
} else { // Default condition
$words = [];
// Remove single char words
foreach ((array) explode(' ', $query) as $word) {
if (mb_strlen($word) > 1) {
2023-08-01 17:20:42 +03:00
$words[] = sprintf('(%s*)', $word);
}
}
2023-08-01 17:20:42 +03:00
$query = sprintf('@title %s | "%s" | (%s)', $query,
$crc32query,
implode(' | ', $words));
}
2023-07-31 23:33:06 +03:00
}
2023-07-31 22:07:59 +03:00
return trim($query);
}
2023-04-01 19:29:39 +03:00
static public function plural(int $number, array $texts) {
$cases = array (2, 0, 1, 1, 1, 2);
return $texts[(($number % 100) > 4 && ($number % 100) < 20) ? 2 : $cases[min($number % 10, 5)]];
}
}