1
0
mirror of git://erdgeist.org/opentracker synced 2025-01-12 16:00:06 +00:00
opentracker/ot_fullscrape.c

458 lines
14 KiB
C
Raw Normal View History

2007-11-12 01:38:08 +00:00
/* This software was written by Dirk Engling <erdgeist@erdgeist.org>
2007-12-20 05:59:34 +00:00
It is considered beerware. Prost. Skol. Cheers or whatever.
2008-10-28 01:27:22 +00:00
2007-12-20 05:59:34 +00:00
$id$ */
2007-11-12 01:38:08 +00:00
#ifdef WANT_FULLSCRAPE
2007-11-12 01:38:08 +00:00
/* System */
2024-04-14 22:39:02 +00:00
#include <arpa/inet.h>
#include <pthread.h>
2007-11-12 01:38:08 +00:00
#include <stdio.h>
#include <string.h>
2024-04-14 22:39:02 +00:00
#include <sys/param.h>
#ifdef WANT_COMPRESSION_GZIP
#include <zlib.h>
#endif
2024-04-18 12:54:34 +00:00
#ifdef WANT_COMPRESSION_ZSTD
#include <zstd.h>
#endif
2007-11-12 01:38:08 +00:00
/* Libowfat */
#include "byte.h"
#include "io.h"
#include "textcode.h"
2007-11-12 01:38:08 +00:00
/* Opentracker */
#include "ot_fullscrape.h"
2024-04-14 22:39:02 +00:00
#include "ot_iovec.h"
#include "ot_mutex.h"
#include "trackerlogic.h"
2007-11-12 01:38:08 +00:00
/* Fetch full scrape info for all torrents
   Full scrapes usually are huge and one does not want to
   allocate more memory. So lets get them in 1 MiB units
   (see OT_SCRAPE_CHUNK_SIZE)
*/
2024-04-14 22:39:02 +00:00
#define OT_SCRAPE_CHUNK_SIZE (1024 * 1024)
2007-11-12 01:38:08 +00:00
/* "d8:completei%zde10:downloadedi%zde10:incompletei%zdee" */
#define OT_SCRAPE_MAXENTRYLEN 256
/* Forward declaration */
2024-04-14 22:39:02 +00:00
static void fullscrape_make(int taskid, ot_tasktype mode);
#ifdef WANT_COMPRESSION_GZIP
2024-04-14 22:39:02 +00:00
static void fullscrape_make_gzip(int taskid, ot_tasktype mode);
#endif
2024-04-18 12:54:34 +00:00
#ifdef WANT_COMPRESSION_ZSTD
static void fullscrape_make_zstd(int taskid, ot_tasktype mode);
#endif
/* Converter function from memory to human readable hex strings
XXX - Duplicated from ot_stats. Needs fix. */
2024-04-14 22:39:02 +00:00
static char *to_hex(char *d, uint8_t *s) {
  /* Reads 20 bytes from s and writes them to d as 40 upper-case hex digits
     followed by a terminating NUL (d needs room for 41 bytes).
     Returns d, i.e. the start of the produced string. */
  static const char digits[] = "0123456789ABCDEF";
  char             *out      = d;
  int               i;

  for (i = 0; i < 20; ++i) {
    uint8_t octet = s[i];
    /* high nibble first, then low nibble */
    *out++ = digits[octet >> 4];
    *out++ = digits[octet & 15];
  }
  *out = 0;

  return d;
}
/* This is the entry point into this worker thread
It grabs tasks from mutex_tasklist and delivers results back
*/
2024-04-14 22:39:02 +00:00
static void *fullscrape_worker(void *args) {
(void)args;
2024-04-14 22:39:02 +00:00
while (g_opentracker_running) {
ot_tasktype tasktype = TASK_FULLSCRAPE;
2024-04-14 22:39:02 +00:00
ot_taskid taskid = mutex_workqueue_poptask(&tasktype);
2024-04-18 12:54:34 +00:00
#ifdef WANT_COMPRESSION_ZSTD
if (tasktype & TASK_FLAG_ZSTD)
fullscrape_make_zstd(taskid, tasktype);
else
#endif
#ifdef WANT_COMPRESSION_GZIP
if (tasktype & TASK_FLAG_GZIP)
2024-04-14 22:39:02 +00:00
fullscrape_make_gzip(taskid, tasktype);
else
#endif
2024-04-14 22:39:02 +00:00
fullscrape_make(taskid, tasktype);
mutex_workqueue_pushchunked(taskid, NULL);
}
return NULL;
}
/* Handle of the worker thread started by fullscrape_init() */
static pthread_t thread_id;

/* Starts the fullscrape worker thread with default attributes.
   The result of pthread_create() is not inspected. */
void fullscrape_init() {
  pthread_create(&thread_id, NULL, fullscrape_worker, NULL);
}
/* Requests cancellation of the worker thread recorded in thread_id.
   It does not join the thread. */
void fullscrape_deinit() {
  pthread_cancel(thread_id);
}
/* Queues a fullscrape request: hands the socket and the requested task
   type (format plus compression flags) to the work queue, from which the
   worker thread picks it up. */
void fullscrape_deliver(int64 sock, ot_tasktype tasktype) {
  mutex_workqueue_pushtask(sock, tasktype);
}
/* Serialises the scrape record of one torrent into the buffer at r.

   mode    - task type; only the bits in TASK_TASK_MASK select the format
   r       - write position; the caller must guarantee enough room for one
             entry (callers in this file reserve OT_SCRAPE_MAXENTRYLEN)
   torrent - torrent whose peer_list4/peer_list6 counters are summed
   hash    - info hash of that torrent

   Returns the position just past the last byte written.

   Formats:
     TASK_FULLSCRAPE (and any unknown mode): bencoded
       "20:<raw hash>d8:completei<S>e10:downloadedi<D>e10:incompletei<L>ee"
     TASK_FULLSCRAPE_TPB_ASCII:       "<hex hash>:<S>:<L>\n"
     TASK_FULLSCRAPE_TPB_ASCII_PLUS:  "<hex hash>:<S>:<L>:<D>\n"
     TASK_FULLSCRAPE_TPB_BINARY:      raw hash, then S and L as two 32 bit
                                      integers in network byte order
     TASK_FULLSCRAPE_TPB_URLENCODED:  "<urlencoded hash>:<S>:<L>\n"
     TASK_FULLSCRAPE_TRACKERSTATE:    "<hex hash>:<peer_list6->base>:<D>\n"
   with S = seeders, L = peers minus seeders, D = downloads.
*/
static char *fullscrape_write_one(ot_tasktype mode, char *r, ot_torrent *torrent, ot_hash *hash) {
  size_t seed_count = torrent->peer_list6->seed_count + torrent->peer_list4->seed_count;
  size_t peer_count = torrent->peer_list6->peer_count + torrent->peer_list4->peer_count;
  size_t down_count = torrent->peer_list6->down_count + torrent->peer_list4->down_count;

  switch (mode & TASK_TASK_MASK) {
  case TASK_FULLSCRAPE:
  default:
    /* push hash as bencoded string */
    *r++ = '2';
    *r++ = '0';
    *r++ = ':';
    memcpy(r, hash, sizeof(ot_hash));
    r += sizeof(ot_hash);
    /* push rest of the scrape string */
    r += sprintf(r, "d8:completei%zde10:downloadedi%zde10:incompletei%zdee", seed_count, down_count, peer_count - seed_count);
    break;
  case TASK_FULLSCRAPE_TPB_ASCII:
    to_hex(r, *hash);
    r += 2 * sizeof(ot_hash);
    r += sprintf(r, ":%zd:%zd\n", seed_count, peer_count - seed_count);
    break;
  case TASK_FULLSCRAPE_TPB_ASCII_PLUS:
    to_hex(r, *hash);
    r += 2 * sizeof(ot_hash);
    r += sprintf(r, ":%zd:%zd:%zd\n", seed_count, peer_count - seed_count, down_count);
    break;
  case TASK_FULLSCRAPE_TPB_BINARY: {
    uint32_t be_seeders  = htonl((uint32_t)seed_count);
    uint32_t be_leechers = htonl((uint32_t)(peer_count - seed_count));

    memcpy(r, *hash, sizeof(ot_hash));
    r += sizeof(ot_hash);
    /* r is a byte pointer with no alignment guarantee (it may point into a
       stack char array at offset 20), so the counters are copied bytewise
       instead of being stored through a casted uint32_t pointer */
    memcpy(r, &be_seeders, sizeof(be_seeders));
    memcpy(r + sizeof(be_seeders), &be_leechers, sizeof(be_leechers));
    r += sizeof(be_seeders) + sizeof(be_leechers);
    break;
  }
  case TASK_FULLSCRAPE_TPB_URLENCODED:
    r += fmt_urlencoded(r, (char *)*hash, 20);
    r += sprintf(r, ":%zd:%zd\n", seed_count, peer_count - seed_count);
    break;
  case TASK_FULLSCRAPE_TRACKERSTATE:
    to_hex(r, *hash);
    r += 2 * sizeof(ot_hash);
    /* NOTE(review): base is printed with %zd; confirm its type matches */
    r += sprintf(r, ":%zd:%zd\n", torrent->peer_list6->base, down_count);
    break;
  }
  return r;
}
2024-04-14 22:39:02 +00:00
/* Produces an uncompressed full scrape for task taskid in the format
   selected by mode and hands it to the work queue in chunks.

   Output is assembled in heap buffers of OT_SCRAPE_CHUNK_SIZE bytes. As soon
   as the write position passes the low watermark (less than
   OT_SCRAPE_MAXENTRYLEN bytes left) the buffer is pushed with
   mutex_workqueue_pushchunked() and a fresh one is allocated.

   Buffer ownership: a buffer is freed here only when pushchunked returns
   non-zero, so a zero return is taken to mean the queue now owns it.
   Every early exit releases the bucket lock and any buffer still owned by
   this function.
*/
static void fullscrape_make(int taskid, ot_tasktype mode) {
  int          bucket;
  char        *r, *re;
  struct iovec iovector = {NULL, 0};

  /* Setup return vector... */
  r = iovector.iov_base = malloc(OT_SCRAPE_CHUNK_SIZE);
  if (!r)
    return;

  /* re points to low watermark */
  re = r + OT_SCRAPE_CHUNK_SIZE - OT_SCRAPE_MAXENTRYLEN;

  /* Only the bencoded format has an enclosing dictionary */
  if ((mode & TASK_TASK_MASK) == TASK_FULLSCRAPE)
    r += sprintf(r, "d5:filesd");

  /* For each bucket... */
  for (bucket = 0; bucket < OT_BUCKET_COUNT; ++bucket) {
    /* Get exclusive access to that bucket */
    ot_vector  *torrents_list = mutex_bucket_lock(bucket);
    ot_torrent *torrents      = (ot_torrent *)(torrents_list->data);
    size_t      i;

    /* For each torrent in this bucket.. */
    for (i = 0; i < torrents_list->size; ++i) {
      r = fullscrape_write_one(mode, r, torrents + i, &torrents[i].hash);

      if (r > re) {
        iovector.iov_len = r - (char *)iovector.iov_base;

        if (mutex_workqueue_pushchunked(taskid, &iovector)) {
          free(iovector.iov_base);
          mutex_bucket_unlock(bucket, 0);
          return;
        }

        /* Allocate a fresh output buffer */
        r = iovector.iov_base = malloc(OT_SCRAPE_CHUNK_SIZE);
        if (!r) {
          mutex_bucket_unlock(bucket, 0);
          return;
        }

        /* re points to low watermark */
        re = r + OT_SCRAPE_CHUNK_SIZE - OT_SCRAPE_MAXENTRYLEN;
      }
    }

    /* All torrents done: release lock on current bucket */
    mutex_bucket_unlock(bucket, 0);

    /* Parent thread died? The current buffer was never pushed, so it is
       still ours and must be released */
    if (!g_opentracker_running) {
      free(iovector.iov_base);
      return;
    }
  }

  if ((mode & TASK_TASK_MASK) == TASK_FULLSCRAPE)
    r += sprintf(r, "ee");

  /* Send rest of data */
  iovector.iov_len = r - (char *)iovector.iov_base;
  if (mutex_workqueue_pushchunked(taskid, &iovector))
    free(iovector.iov_base);
}
2007-11-12 01:38:08 +00:00
#ifdef WANT_COMPRESSION_GZIP
2024-04-14 22:39:02 +00:00
/* Produces a gzip-compressed full scrape for task taskid in the format
   selected by mode and hands it to the work queue in chunks.

   Every torrent entry is first rendered into a small staging buffer and
   then fed to deflate(). Compressed output lands in heap buffers of
   OT_SCRAPE_CHUNK_SIZE bytes; whenever deflate() has filled one completely
   it is pushed with mutex_workqueue_pushchunked() and replaced.

   Buffer ownership: a buffer is freed here only when pushchunked returns
   non-zero, so a zero return is taken to mean the queue now owns it.
   Every exit path releases the zlib stream, the bucket lock (if held) and
   any output buffer still owned by this function.
*/
static void fullscrape_make_gzip(int taskid, ot_tasktype mode) {
  int          bucket;
  char        *r;
  /* Lives at function scope because strm.next_in may still refer to it when
     the final deflate(Z_FINISH) runs after the loops */
  char         compress_buffer[OT_SCRAPE_MAXENTRYLEN];
  struct iovec iovector = {NULL, 0};
  int          zres;
  z_stream     strm;

  /* Setup return vector... */
  iovector.iov_base = malloc(OT_SCRAPE_CHUNK_SIZE);
  if (!iovector.iov_base)
    return;

  byte_zero(&strm, sizeof(strm));
  strm.next_out  = (uint8_t *)iovector.iov_base;
  strm.avail_out = OT_SCRAPE_CHUNK_SIZE;

  /* windowBits 31 = 15 + 16 selects a gzip wrapper, memLevel 9 is maximum */
  if (deflateInit2(&strm, 7, Z_DEFLATED, 31, 9, Z_DEFAULT_STRATEGY) != Z_OK) {
    fprintf(stderr, "not ok.\n");
    /* Without a working stream nothing useful can be produced */
    free(iovector.iov_base);
    return;
  }

  /* Only the bencoded format has an enclosing dictionary */
  if ((mode & TASK_TASK_MASK) == TASK_FULLSCRAPE) {
    strm.next_in  = (uint8_t *)"d5:filesd";
    strm.avail_in = strlen("d5:filesd");
    zres          = deflate(&strm, Z_NO_FLUSH);
  }

  /* For each bucket... */
  for (bucket = 0; bucket < OT_BUCKET_COUNT; ++bucket) {
    /* Get exclusive access to that bucket */
    ot_vector  *torrents_list = mutex_bucket_lock(bucket);
    ot_torrent *torrents      = (ot_torrent *)(torrents_list->data);
    size_t      i;

    /* For each torrent in this bucket.. */
    for (i = 0; i < torrents_list->size; ++i) {
      r             = fullscrape_write_one(mode, compress_buffer, torrents + i, &torrents[i].hash);
      strm.next_in  = (uint8_t *)compress_buffer;
      strm.avail_in = r - compress_buffer;
      zres          = deflate(&strm, Z_NO_FLUSH);
      if ((zres < Z_OK) && (zres != Z_BUF_ERROR))
        fprintf(stderr, "deflate() failed while in fullscrape_make().\n");

      /* Output buffer completely filled: ship it and continue in a new one */
      while (!strm.avail_out) {
        iovector.iov_len = (char *)strm.next_out - (char *)iovector.iov_base;

        if (mutex_workqueue_pushchunked(taskid, &iovector)) {
          free(iovector.iov_base);
          deflateEnd(&strm);
          mutex_bucket_unlock(bucket, 0);
          return;
        }

        /* Allocate a fresh output buffer */
        iovector.iov_base = malloc(OT_SCRAPE_CHUNK_SIZE);
        if (!iovector.iov_base) {
          fprintf(stderr, "Out of memory trying to claim ouput buffer\n");
          deflateEnd(&strm);
          mutex_bucket_unlock(bucket, 0);
          return;
        }
        strm.next_out  = (uint8_t *)iovector.iov_base;
        strm.avail_out = OT_SCRAPE_CHUNK_SIZE;

        /* Let zlib drain whatever did not fit into the previous buffer */
        zres = deflate(&strm, Z_NO_FLUSH);
        if ((zres < Z_OK) && (zres != Z_BUF_ERROR))
          fprintf(stderr, "deflate() failed while in fullscrape_make().\n");
      }
    }

    /* All torrents done: release lock on current bucket */
    mutex_bucket_unlock(bucket, 0);

    /* Parent thread died? The current buffer was never pushed, so it is
       still ours and must be released together with the stream */
    if (!g_opentracker_running) {
      free(iovector.iov_base);
      deflateEnd(&strm);
      return;
    }
  }

  if ((mode & TASK_TASK_MASK) == TASK_FULLSCRAPE) {
    strm.next_in  = (uint8_t *)"ee";
    strm.avail_in = strlen("ee");
  }

  if (deflate(&strm, Z_FINISH) < Z_OK)
    fprintf(stderr, "deflate() failed while in fullscrape_make()'s endgame.\n");

  iovector.iov_len = (char *)strm.next_out - (char *)iovector.iov_base;
  if (mutex_workqueue_pushchunked(taskid, &iovector)) {
    free(iovector.iov_base);
    deflateEnd(&strm);
    return;
  }

  /* Check if there's a last batch of data in the zlib buffer */
  if (!strm.avail_out) {
    /* Allocate a fresh output buffer */
    iovector.iov_base = malloc(OT_SCRAPE_CHUNK_SIZE);
    if (!iovector.iov_base) {
      fprintf(stderr, "Problem with iovec_fix_increase_or_free\n");
      deflateEnd(&strm);
      return;
    }
    strm.next_out  = iovector.iov_base;
    strm.avail_out = OT_SCRAPE_CHUNK_SIZE;
    if (deflate(&strm, Z_FINISH) < Z_OK)
      fprintf(stderr, "deflate() failed while in fullscrape_make()'s endgame.\n");

    /* Only pass the new buffer if there actually was some data left in the buffer */
    iovector.iov_len = (char *)strm.next_out - (char *)iovector.iov_base;
    if (!iovector.iov_len || mutex_workqueue_pushchunked(taskid, &iovector))
      free(iovector.iov_base);
  }

  deflateEnd(&strm);
}
/* WANT_COMPRESSION_GZIP */
#endif
2007-12-20 05:59:34 +00:00
2024-04-18 12:54:34 +00:00
#ifdef WANT_COMPRESSION_ZSTD
/* Produces a zstd-compressed full scrape for task taskid in the format
   selected by mode and hands it to the work queue in chunks.

   Every torrent entry is first rendered into a small staging buffer and
   then fed to ZSTD_compressStream2(). Compressed output lands in heap
   buffers of OT_SCRAPE_CHUNK_SIZE bytes; once fewer than
   OT_SCRAPE_MAXENTRYLEN bytes are free in the current one, the bytes
   produced so far (outbuf.pos) are pushed with mutex_workqueue_pushchunked()
   and a new buffer is started.

   Buffer ownership: a buffer is freed here only when pushchunked returns
   non-zero, so a zero return is taken to mean the queue now owns it.
   Every exit path releases the compression context, the bucket lock (if
   held) and any output buffer still owned by this function.
*/
static void fullscrape_make_zstd(int taskid, ot_tasktype mode) {
  int            bucket;
  char          *r;
  /* Lives at function scope because inbuf.src may still refer to it when
     the final ZSTD_e_end call runs after the loops */
  char           compress_buffer[OT_SCRAPE_MAXENTRYLEN];
  struct iovec   iovector = {NULL, 0};
  ZSTD_CCtx     *zstream  = ZSTD_createCCtx();
  /* Starts out as valid empty input so the final call never reads an
     uninitialised descriptor when no entry was written */
  ZSTD_inBuffer  inbuf    = {"", 0, 0};
  ZSTD_outBuffer outbuf;
  size_t         more_bytes;

  if (!zstream)
    return;

  /* Setup return vector... */
  iovector.iov_base = malloc(OT_SCRAPE_CHUNK_SIZE);
  if (!iovector.iov_base) {
    ZSTD_freeCCtx(zstream);
    return;
  }

  /* Working with a compression level 6 is half as fast as level 3, but
     seems to be the last reasonable bump that's worth extra cpu */
  ZSTD_CCtx_setParameter(zstream, ZSTD_c_compressionLevel, 6);

  outbuf.dst  = iovector.iov_base;
  outbuf.size = OT_SCRAPE_CHUNK_SIZE;
  outbuf.pos  = 0;

  /* Only the bencoded format has an enclosing dictionary */
  if ((mode & TASK_TASK_MASK) == TASK_FULLSCRAPE) {
    inbuf.src  = (const void *)"d5:filesd";
    inbuf.size = strlen("d5:filesd");
    inbuf.pos  = 0;
    ZSTD_compressStream2(zstream, &outbuf, &inbuf, ZSTD_e_continue);
  }

  /* For each bucket... */
  for (bucket = 0; bucket < OT_BUCKET_COUNT; ++bucket) {
    /* Get exclusive access to that bucket */
    ot_vector  *torrents_list = mutex_bucket_lock(bucket);
    ot_torrent *torrents      = (ot_torrent *)(torrents_list->data);
    size_t      i;

    /* For each torrent in this bucket.. */
    for (i = 0; i < torrents_list->size; ++i) {
      r          = fullscrape_write_one(mode, compress_buffer, torrents + i, &torrents[i].hash);
      inbuf.src  = compress_buffer;
      inbuf.size = r - compress_buffer;
      inbuf.pos  = 0;
      ZSTD_compressStream2(zstream, &outbuf, &inbuf, ZSTD_e_continue);

      /* Check if there still is enough buffer left */
      while (outbuf.pos + OT_SCRAPE_MAXENTRYLEN > outbuf.size) {
        /* Only the first outbuf.pos bytes hold compressed data; the rest
           of the buffer is uninitialised and must not be sent */
        iovector.iov_len = outbuf.pos;

        if (mutex_workqueue_pushchunked(taskid, &iovector)) {
          free(iovector.iov_base);
          ZSTD_freeCCtx(zstream);
          mutex_bucket_unlock(bucket, 0);
          return;
        }

        /* Allocate a fresh output buffer */
        iovector.iov_base = malloc(OT_SCRAPE_CHUNK_SIZE);
        if (!iovector.iov_base) {
          fprintf(stderr, "Out of memory trying to claim ouput buffer\n");
          ZSTD_freeCCtx(zstream);
          mutex_bucket_unlock(bucket, 0);
          return;
        }

        outbuf.dst  = iovector.iov_base;
        outbuf.size = OT_SCRAPE_CHUNK_SIZE;
        outbuf.pos  = 0;

        /* Let zstd continue with input/output that did not fit before */
        ZSTD_compressStream2(zstream, &outbuf, &inbuf, ZSTD_e_continue);
      }
    }

    /* All torrents done: release lock on current bucket */
    mutex_bucket_unlock(bucket, 0);

    /* Parent thread died? The current buffer was never pushed, so it is
       still ours and must be released together with the context */
    if (!g_opentracker_running) {
      free(iovector.iov_base);
      ZSTD_freeCCtx(zstream);
      return;
    }
  }

  if ((mode & TASK_TASK_MASK) == TASK_FULLSCRAPE) {
    inbuf.src  = (const void *)"ee";
    inbuf.size = strlen("ee");
    inbuf.pos  = 0;
  }

  /* Close the frame; a non-zero result means output is still pending */
  more_bytes = ZSTD_compressStream2(zstream, &outbuf, &inbuf, ZSTD_e_end);

  iovector.iov_len = outbuf.pos;
  if (mutex_workqueue_pushchunked(taskid, &iovector)) {
    free(iovector.iov_base);
    ZSTD_freeCCtx(zstream);
    return;
  }

  /* Check if there's a last batch of data in the zstd buffer */
  if (more_bytes) {
    /* Allocate a fresh output buffer */
    iovector.iov_base = malloc(OT_SCRAPE_CHUNK_SIZE);
    if (!iovector.iov_base) {
      fprintf(stderr, "Problem with iovec_fix_increase_or_free\n");
      ZSTD_freeCCtx(zstream);
      return;
    }

    outbuf.dst  = iovector.iov_base;
    outbuf.size = OT_SCRAPE_CHUNK_SIZE;
    outbuf.pos  = 0;

    ZSTD_compressStream2(zstream, &outbuf, &inbuf, ZSTD_e_end);

    /* Only pass the new buffer if there actually was some data left in the buffer */
    iovector.iov_len = outbuf.pos;
    if (!iovector.iov_len || mutex_workqueue_pushchunked(taskid, &iovector))
      free(iovector.iov_base);
  }

  ZSTD_freeCCtx(zstream);
}
/* WANT_COMPRESSION_ZSTD */
#endif
/* WANT_FULLSCRAPE */
#endif