yggverse
|
5e4494c9e8
|
use PHP 8 str_starts_with function
|
2024-03-21 18:47:11 +02:00 |
|
yggverse
|
79b82d46e1
|
add cleanup limit argument
|
2024-03-21 18:41:33 +02:00 |
|
yggverse
|
e635ec6dc9
|
enable cleanup on configuration update, delete snap match cleanup conditions
|
2024-03-21 18:23:07 +02:00 |
|
yggverse
|
573d249e1f
|
fix snap filesize
|
2024-03-21 15:30:28 +02:00 |
|
yggverse
|
1b12153183
|
add body cache decoration
|
2024-03-21 04:23:02 +02:00 |
|
yggverse
|
eac2734b9f
|
display document body cache
|
2024-03-21 04:13:35 +02:00 |
|
yggverse
|
900e3a453f
|
Disable keywords collection from headers as body index enabled
|
2024-03-21 03:46:58 +02:00 |
|
yggverse
|
1f3ee435e9
|
fix custom encoding conversion
|
2024-03-21 03:38:46 +02:00 |
|
yggverse
|
e09440b44a
|
strip code content
|
2024-03-21 00:38:24 +02:00 |
|
yggverse
|
b5cd219f47
|
strip css content from index
|
2024-03-21 00:34:25 +02:00 |
|
yggverse
|
b440e6edff
|
disable configuration changes cleanup
|
2024-03-20 22:41:12 +02:00 |
|
yggverse
|
ad3fd31f67
|
update cleanup condition
|
2024-03-20 22:35:33 +02:00 |
|
yggverse
|
dd914e0e1b
|
fix cleanup query
|
2024-03-20 22:33:11 +02:00 |
|
yggverse
|
36972cab19
|
implement alter index tool
|
2024-03-20 21:06:18 +02:00 |
|
yggverse
|
2257ce771f
|
apply cleaner to the current url configuration
|
2024-03-20 20:18:55 +02:00 |
|
yggverse
|
3884f375d4
|
save document body text to index
|
2024-03-20 19:31:56 +02:00 |
|
ghost
|
1f27a7e105
|
trim extra spaces before query escape
|
2024-02-25 09:11:12 +02:00 |
|
ghost
|
d6b5f8b210
|
build combined search query
|
2024-02-25 09:07:57 +02:00 |
|
ghost
|
1c2e8dafb2
|
collect keywords from document headers
|
2024-01-23 02:49:52 +02:00 |
|
ghost
|
cfbc84cbaf
|
sort queue by rank asc
|
2024-01-23 02:19:35 +02:00 |
|
ghost
|
db9dc8d4ba
|
force results to string
|
2024-01-23 01:55:28 +02:00 |
|
ghost
|
ff8461835d
|
calculate initial rank
|
2024-01-22 23:03:33 +02:00 |
|
ghost
|
50dc9d315a
|
add rank field
|
2024-01-22 22:56:36 +02:00 |
|
ghost
|
6f4abe4729
|
set crc32url as document id
|
2024-01-22 22:52:37 +02:00 |
|
ghost
|
93baed4b90
|
delete deprecated documents with HTTP code not 200 on second scan
|
2023-12-20 08:44:35 +02:00 |
|
ghost
|
17d6171d95
|
fix directory existion check #2
|
2023-12-13 00:36:50 +02:00 |
|
ghost
|
100806af02
|
complete local snaps feature #2
|
2023-12-13 00:29:34 +02:00 |
|
ghost
|
33cc778999
|
crawl newest pages by rand in queue
|
2023-12-10 00:29:18 +02:00 |
|
ghost
|
811c700049
|
add http code notice
|
2023-12-03 01:14:06 +02:00 |
|
ghost
|
35ad144a9e
|
add stripos url rules for crawl snaps
|
2023-12-02 22:15:44 +02:00 |
|
ghost
|
0e06ff3c0f
|
fix debug message
|
2023-12-02 21:18:57 +02:00 |
|
ghost
|
e066223bd2
|
fix link container
|
2023-12-02 20:59:40 +02:00 |
|
ghost
|
51d52dea7d
|
fix destination name
|
2023-12-02 20:12:03 +02:00 |
|
ghost
|
87ca594860
|
add debug levels
|
2023-12-02 16:04:22 +02:00 |
|
ghost
|
33d657cb72
|
apply sleep on timeout value provided only
|
2023-12-02 15:03:51 +02:00 |
|
ghost
|
bc00f0c851
|
make tmp subfolders storage optimization
|
2023-12-02 14:39:11 +02:00 |
|
ghost
|
f613b44d3f
|
disable sort by RAND() in crawler queue
|
2023-12-02 14:22:50 +02:00 |
|
ghost
|
fa3c0491e2
|
fix chromium -webkit-autofill input colors
|
2023-12-01 23:56:57 +02:00 |
|
ghost
|
9087c4b0d7
|
add footer links settings, implement nodes registry with database download list
|
2023-12-01 23:47:15 +02:00 |
|
ghost
|
4cec81c893
|
make extended search mode disabled by default #7
|
2023-12-01 21:26:12 +02:00 |
|
ghost
|
f0da3caaf5
|
add extended search mode option
|
2023-12-01 20:05:38 +02:00 |
|
ghost
|
d3f8d1c0e3
|
fix result output
|
2023-11-30 02:59:07 +02:00 |
|
ghost
|
86b20cbc51
|
add debug output on skip condition
|
2023-11-30 02:36:25 +02:00 |
|
ghost
|
3306dc1961
|
add skip url filter by stripos condition
|
2023-11-30 02:24:02 +02:00 |
|
ghost
|
ee074b684a
|
add semaphore namespace prefix
|
2023-11-30 00:51:42 +02:00 |
|
ghost
|
880764aa49
|
make paths relative
|
2023-11-29 23:13:16 +02:00 |
|
ghost
|
24904f667e
|
add Utils::escape note
|
2023-11-29 22:51:14 +02:00 |
|
ghost
|
27946ff27c
|
define missed crc32url field value
|
2023-11-27 21:03:38 +02:00 |
|
ghost
|
38fbc32151
|
fix document fields update
|
2023-11-27 20:55:10 +02:00 |
|
ghost
|
08995e6199
|
randomize new pages queue
|
2023-11-27 20:24:46 +02:00 |
|