2018-04-17 03:57:04 +03:00

751 lines
19 KiB
C

/*
frame.c - compact version of famous library mpg123
Copyright (C) 2017 Uncle Mike
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
*/
#include "mpg123.h"
#include <math.h>
// round `base` up to the next multiple of `alignment` bytes.
// returns `base` unchanged when it is already aligned.
// the address is inspected as a size_t only, so big addresses never pass
// through a signed type, and no arithmetic is done on void* itself.
static void *aligned_pointer( void *base, uint alignment )
{
	size_t	misalign = (size_t)(char *)base % alignment;

	if( misalign == 0 )
		return base;

	return (char *)base + alignment - misalign;
}
// fill a parameter block with the built-in defaults.
static void frame_default_parm( mpg123_parm_t *mp )
{
	// scaling and behaviour flags
	mp->outscale = 1.0;
	mp->flags = MPG123_GAPLESS | MPG123_AUTO_RESAMPLE;

	// everything optional starts switched off
	mp->rva = 0;
	mp->down_sample = 0;
	mp->halfspeed = 0;
	mp->doublespeed = 0;
	mp->verbose = 0;
	mp->timeout = 0;

	// stream parsing limits
	mp->resync_limit = 1024;
	mp->index_size = INDEX_SIZE;
	mp->preframes = 4;	// that's good for layer 3 ISO compliance bitstream.

	mpg123_fmt_all( mp );

	// keep some 4K buffers at hand, which should cover the "usual" use case
	// (16K pipe buffers served as the role model).
	mp->feedpool = 5;
	mp->feedbuffer = 4096;
}
// reset everything except dynamic memory.
// the reader is switched to the "bad" one via open_bad() first, then every
// fixed-size per-track field goes back to its start value.
static void frame_fixed_reset( mpg123_handle_t *fr )
{
	int	i;

	open_bad( fr );

	// decoder state
	fr->to_decode = FALSE;
	fr->to_ignore = FALSE;
	fr->metaflags = 0;
	fr->state_flags = FRAME_ACCURATE;
	fr->silent_resync = 0;
	fr->header_change = 0;
	fr->fresh = 1;
	fr->new_format = 0;
	fr->clip = 0;
	fr->outblock = 0;	// this will be set before decoding!

	// stream position
	fr->num = -1;
	fr->playnum = -1;
	fr->input_offset = -1;
	fr->audio_start = 0;

	// header and frame size bookkeeping
	fr->oldhead = 0;
	fr->firsthead = 0;
	fr->vbr = MPG123_CBR;
	fr->abr_rate = 0;
	fr->framesize = 0;
	fr->fsizeold = 0;
	fr->freesize = 0;
	fr->mean_frames = 0;
	fr->mean_framesize = 0;
	fr->track_frames = 0;
	fr->track_samples = -1;

	// volume adjustment: a negative lastscale forces the first rva setting in do_rva()
	fr->lastscale = -1;
	for( i = 0; i < 2; i++ )
	{
		fr->rva.level[i] = -1;
		fr->rva.gain[i] = 0;
		fr->rva.peak[i] = 0;
	}

	// frame window
	fr->firstframe = 0;
	fr->ignoreframe = fr->firstframe - fr->p.preframes;
	fr->lastframe = -1;

	frame_gapless_init( fr, -1, 0, 0 );

	fr->firstoff = 0;
	fr->lastoff = 0;
	fr->bo = 1;		// the usual bo
	fr->halfphase = 0;	// here or indeed only on first-time init?
	fr->error_protection = 0;
	fr->freeformat_framesize = -1;
}
// apply the index_size parameter to the frame index.
// index_size >= 0 selects a fixed index of exactly that size;
// a negative value selects a growing index with -index_size as grow step.
// returns what fi_resize() reports, or MPG123_OK when no resize was needed.
int frame_index_setup( mpg123_handle_t *fr )
{
	if( fr->p.index_size < 0 )
	{
		// a growing index. we give it a start, though.
		fr->index.grow_size = (size_t)(-fr->p.index_size );

		// we have minimal size already... and since growing is OK...
		if( fr->index.size >= fr->index.grow_size )
			return MPG123_OK;

		return fi_resize( &fr->index, fr->index.grow_size );
	}

	// simple fixed index.
	fr->index.grow_size = 0;
	return fi_resize( &fr->index, (size_t)fr->p.index_size );
}
// bring a handle into a defined initial state.
// mp == NULL selects the built-in defaults, otherwise the given parameters are copied.
// no decoding memory is allocated here: frame_outbuffer() and frame_buffers()
// (the latter needs the cpu opt setting) still have to follow, and frame_reset()
// is needed before starting a full decode.
void frame_init_par( mpg123_handle_t *fr, mpg123_parm_t *mp )
{
	// output buffer: nothing there yet
	fr->own_buffer = TRUE;
	fr->buffer.rdata = NULL;
	fr->buffer.data = NULL;
	fr->buffer.size = 0;
	fr->buffer.fill = 0;

	// dynamic decoder memory: not allocated yet
	fr->rawbuffs = NULL;
	fr->rawbuffss = 0;
	fr->rawdecwin = NULL;
	fr->rawdecwins = 0;
	fr->layerscratch = NULL;
	fr->xing_toc = NULL;

	invalidate_format( &fr->af );

	// no reader callbacks or handles installed
	fr->rdat.r_read = NULL;
	fr->rdat.r_lseek = NULL;
	fr->rdat.r_read_handle = NULL;
	fr->rdat.r_lseek_handle = NULL;
	fr->rdat.cleanup_handle = NULL;
	fr->rdat.iohandle = NULL;
	fr->wrapperdata = NULL;
	fr->wrapperclean = NULL;

	fr->decoder_change = 1;
	fr->err = MPG123_OK;

	if( mp != NULL )
		memcpy( &fr->p, mp, sizeof( mpg123_parm_t ));
	else
		frame_default_parm( &fr->p );

	bc_prepare( &fr->rdat.buffer, fr->p.feedpool, fr->p.feedbuffer );

	fr->down_sample = 0;	// initialize to silence harmless errors when debugging.
	frame_fixed_reset( fr );	// reset only the fixed data, dynamic buffers are not there yet!

	fr->synth = NULL;
	fr->synth_mono = NULL;
	fr->make_decode_tables = NULL;

	fi_init( &fr->index );
	frame_index_setup( fr );	// apply the size setting.
}
// zero the raw memory block that backs short_buffs / float_buffs.
// this may run before frame_buffers() has allocated anything (or after an
// allocation failure), so a NULL rawbuffs is skipped: handing a null pointer
// to memset() is undefined behaviour, even with a length of zero.
static void frame_decode_buffers_reset( mpg123_handle_t *fr )
{
	if( fr->rawbuffs == NULL )
		return;

	memset( fr->rawbuffs, 0, fr->rawbuffss );
}
// allocate (or re-use) the decoder work memory: the synth buffers, the decode
// window and the layer 3 scratch space. returns 0 on success, -1 when out of memory.
// the synth buffers are zeroed on every successful call.
int frame_buffers( mpg123_handle_t *fr )
{
	int	buffssize = 4352 + 15;	// payload plus slack for 16-byte alignment
	int	decwin_size = (512 + 32) * sizeof( float );
	int	i;

	// synth buffers: drop a block of the wrong size, then allocate if needed
	if( fr->rawbuffs != NULL && fr->rawbuffss != buffssize )
	{
		free( fr->rawbuffs );
		fr->rawbuffs = NULL;
	}

	if( fr->rawbuffs == NULL )
	{
		fr->rawbuffs = (byte *)malloc( buffssize );
		if( fr->rawbuffs == NULL )
			return -1;
	}

	fr->rawbuffss = buffssize;

	// the short and float views share the same aligned memory,
	// each one split into four consecutive chunks of 0x110 elements.
	fr->short_buffs[0][0] = aligned_pointer( fr->rawbuffs, 16 );
	fr->float_buffs[0][0] = aligned_pointer( fr->rawbuffs, 16 );

	for( i = 1; i < 4; i++ )
	{
		fr->short_buffs[i / 2][i % 2] = fr->short_buffs[0][0] + i * 0x110;
		fr->float_buffs[i / 2][i % 2] = fr->float_buffs[0][0] + i * 0x110;
	}

	// decode window: same free-then-allocate scheme (basically realloc)
	if( fr->rawdecwin != NULL && fr->rawdecwins != decwin_size )
	{
		free( fr->rawdecwin );
		fr->rawdecwin = NULL;
	}

	if( fr->rawdecwin == NULL )
	{
		fr->rawdecwin = (byte *)malloc( decwin_size );
		if( fr->rawdecwin == NULL )
			return -1;
	}

	fr->rawdecwins = decwin_size;
	fr->decwin = (float *)fr->rawdecwin;

	// layer scratch buffers are of compile-time fixed size, so allocate only once.
	if( fr->layerscratch == NULL )
	{
		size_t	hybrid_in_bytes = sizeof( float ) * 2 * SBLIMIT * SSLIMIT;
		size_t	hybrid_out_bytes = sizeof( float ) * 2 * SSLIMIT * SBLIMIT;
		float	*scratcher;

		// 63 spare bytes leave room for the 64-byte alignment below
		fr->layerscratch = malloc( hybrid_in_bytes + hybrid_out_bytes + 63 );
		if( fr->layerscratch == NULL )
			return -1;

		// get the aligned part of the memory, then divide it up.
		// the pointer casts are only there to keep compilers quiet.
		scratcher = aligned_pointer( fr->layerscratch, 64 );
		fr->layer3.hybrid_in = (float(*)[SBLIMIT][SSLIMIT])scratcher;
		fr->layer3.hybrid_out = (float(*)[SSLIMIT][SBLIMIT])( scratcher + 2 * SBLIMIT * SSLIMIT );
		// note: these buffers don't need resetting here.
	}

	// only the synth buffers get cleared.
	frame_decode_buffers_reset( fr );

	return 0;
}
// clear all buffered decoder data: output fill, bitstream buffers,
// bit reservoir, synth buffers and the hybrid overlap state. always returns 0.
int frame_buffers_reset( mpg123_handle_t *fr )
{
	// output buffer is considered empty again (hm... did we do a flush?)
	fr->buffer.fill = 0;

	// bitstream buffers: start over in the second slot.
	// wondering: could it be actually _wanted_ to retain buffer contents
	// over different files? (special gapless / cut stuff)
	fr->bsnum = 0;
	fr->bsbuf = fr->bsspace[1];
	fr->bsbufold = fr->bsbuf;
	fr->bitreservoir = 0;
	memset( fr->bsspace, 0, 2 * ( MAXFRAMESIZE + 512 ));
	memset( fr->ssave, 0, 34 );

	// synth buffers
	frame_decode_buffers_reset( fr );

	// hybrid overlap state
	fr->hybrid_blc[1] = 0;
	fr->hybrid_blc[0] = fr->hybrid_blc[1];
	memset( fr->hybrid_block, 0, sizeof( float ) * 2 * 2 * SBLIMIT * SSLIMIT );

	return 0;
}
// initialise a handle without a caller-supplied parameter block:
// forwards to frame_init_par() with NULL, which makes it fall back to frame_default_parm().
void frame_init( mpg123_handle_t *fr )
{
frame_init_par( fr, NULL );
}
// make sure there is an output buffer of fr->outblock bytes.
// a buffer that is not our own must already be big enough, else MPG123_BAD_BUFFER is set.
// returns MPG123_OK, or MPG123_ERR with fr->err set (MPG123_BAD_BUFFER / MPG123_OUT_OF_MEM).
int frame_outbuffer( mpg123_handle_t *fr )
{
	size_t	wanted = fr->outblock;

	if( !fr->own_buffer && fr->buffer.size < wanted )
	{
		fr->err = MPG123_BAD_BUFFER;
		return MPG123_ERR;
	}

	// an existing allocation of a different size is of no use
	if( fr->buffer.rdata != NULL && fr->buffer.size != wanted )
	{
		free( fr->buffer.rdata );
		fr->buffer.rdata = NULL;
	}

	fr->buffer.size = wanted;
	fr->buffer.data = NULL;

	if( fr->buffer.rdata == NULL )
	{
		// be generous: 15 extra bytes allow for 16 byte alignment
		fr->buffer.rdata = (byte *)malloc( fr->buffer.size + 15 );
		if( fr->buffer.rdata == NULL )
		{
			fr->err = MPG123_OUT_OF_MEM;
			return MPG123_ERR;
		}
	}

	fr->buffer.data = aligned_pointer( fr->buffer.rdata, 16 );
	fr->buffer.fill = 0;
	fr->own_buffer = TRUE;

	return MPG123_OK;
}
// release the stored Xing TOC, if any, and forget the pointer.
static void frame_free_toc( mpg123_handle_t *fr )
{
	// free() accepts NULL, so no check is needed
	free( fr->xing_toc );
	fr->xing_toc = NULL;
}
// store a copy of the 100-byte Xing TOC found at `in`.
// the storage is allocated on first use and re-used afterwards.
// returns TRUE on success, FALSE when the allocation failed.
int frame_fill_toc( mpg123_handle_t *fr, byte *in )
{
	if( fr->xing_toc == NULL )
	{
		fr->xing_toc = malloc( 100 );
		if( fr->xing_toc == NULL )
			return FALSE;
	}

	memcpy( fr->xing_toc, in, 100 );
	return TRUE;
}
// prepare the handle for a new track.
// clears the buffered decoder data (frame_buffers_reset), puts the fixed
// per-track fields back to their start values (frame_fixed_reset),
// drops a stored Xing TOC and calls fi_reset() on the frame index.
// always returns 0.
int frame_reset( mpg123_handle_t *fr )
{
frame_buffers_reset( fr );
frame_fixed_reset( fr );
frame_free_toc( fr );
fi_reset( &fr->index );
return 0;
}
// release all decoder work memory created by frame_buffers().
// every pointer is cleared after its free(): frame_buffers() only allocates
// the layer scratch space when fr->layerscratch is NULL, so a stale pointer
// there would lead to use of freed memory (and a double free on the next cleanup).
static void frame_free_buffers( mpg123_handle_t *fr )
{
	// free() accepts NULL, so no checks are needed
	free( fr->rawbuffs );
	fr->rawbuffs = NULL;
	fr->rawbuffss = 0;

	free( fr->rawdecwin );
	fr->rawdecwin = NULL;
	fr->rawdecwins = 0;

	free( fr->layerscratch );
	fr->layerscratch = NULL;
}
// tear down a handle: output buffer, decoder memory, Xing TOC, frame index,
// wrapper data and finally the reader's buffer chain.
void frame_exit( mpg123_handle_t *fr )
{
	// output buffer (free() copes with NULL)
	free( fr->buffer.rdata );
	fr->buffer.rdata = NULL;

	frame_free_buffers( fr );
	frame_free_toc( fr );
	fi_exit( &fr->index );

	// clean up possible mess from LFS wrapper.
	if( fr->wrapperclean != NULL )
	{
		fr->wrapperclean( fr->wrapperdata );
		fr->wrapperdata = NULL;
	}

	bc_cleanup( &fr->rdat.buffer );
}
// hand out the current frame's header word, body pointer and body size.
// each output pointer may be NULL when the caller is not interested in it.
// returns MPG123_BAD_HANDLE for a NULL handle, MPG123_ERR when no frame is
// waiting to be decoded, MPG123_OK otherwise.
int mpg123_framedata( mpg123_handle_t *mh, ulong *header, byte **bodydata, size_t *bodybytes )
{
	if( !mh )
		return MPG123_BAD_HANDLE;

	if( !mh->to_decode )
		return MPG123_ERR;

	if( header )
		*header = mh->oldhead;

	if( bodydata )
		*bodydata = mh->bsbuf;

	if( bodybytes )
		*bodybytes = mh->framesize;

	return MPG123_OK;
}
// fuzzy frame offset searching (guessing).
// when we don't have an accurate position, we may use an inaccurate one:
// - approximate positions from the Xing TOC, if one was stored
// - a wild guess from mean framesize and the offset of the first frame
// returns the byte offset to go to and stores the frame expected there in *get_frame.
// without any basis for a guess this is fr->audio_start and frame 0.
static mpg_off_t frame_fuzzy_find( mpg123_handle_t *fr, mpg_off_t want_frame, mpg_off_t *get_frame )
{
	*get_frame = 0;

	// the Xing VBR TOC works with relative positions, both in terms of audio
	// frames and stream bytes, so it only helps when we know the length of things.
	// the offsets are assumed to be relative to the _total_ file length.
	if( fr->xing_toc != NULL && fr->track_frames > 0 && fr->rdat.filelen > 0 )
	{
		// index into the 100-entry table (one could round...)
		int	slot = (int)((double)want_frame * 100.0 / fr->track_frames );

		if( slot < 0 )
			slot = 0;
		else if( slot > 99 )
			slot = 99;

		// now estimate back what frame we get.
		*get_frame = (mpg_off_t)((double)slot / 100.0 * fr->track_frames );
		fr->state_flags &= ~FRAME_ACCURATE;
		fr->silent_resync = 1;

		// open question: is the TOC for the whole file size (with/without ID3)
		// or the "real" audio data only? ID3v1 info could also matter.
		return (mpg_off_t)((double)fr->xing_toc[slot] / 256.0 * fr->rdat.filelen);
	}

	if( fr->mean_framesize > 0 )
	{
		// just guess with mean framesize (may be exact with CBR files).
		fr->state_flags &= ~FRAME_ACCURATE;	// fuzzy!
		fr->silent_resync = 1;
		*get_frame = want_frame;

		return (mpg_off_t)(fr->audio_start + fr->mean_framesize * want_frame);
	}

	// nothing better known: go to the beginning.
	return fr->audio_start;
}
// find the best frame in the index just before the wanted one.
// returns the byte offset to seek to and stores the frame found there in
// *get_frame; the caller then steps up to the wanted frame with read_frame.
// we do not care about the stuff that was in buffer but not played back:
// everything that left the decoder is counted as played.
mpg_off_t frame_index_find( mpg123_handle_t *fr, mpg_off_t want_frame, mpg_off_t* get_frame )
{
	size_t	slot;	// position in index; slot i describes frame step*i

	*get_frame = 0;

	// possibly use VBRI index, too? an example would be needed for this...
	if( !fr->index.fill )
	{
		if( fr->p.flags & MPG123_FUZZY )
			return frame_fuzzy_find( fr, want_frame, get_frame );

		// a bit hackish here... but we need to be fresh when looking for the first header again.
		fr->firsthead = 0;
		fr->oldhead = 0;

		// default is file start if there is no index position
		return 0;
	}

	slot = want_frame / fr->index.step;

	if( slot >= fr->index.fill )
	{
		// we are beyond the end of the frame index...
		// when fuzzy seek is allowed, there is some limited tolerance for the
		// frames we want to read rather than jump over.
		if( fr->p.flags & MPG123_FUZZY && want_frame - (fr->index.fill- 1) * fr->index.step > 10 )
		{
			mpg_off_t	guess = frame_fuzzy_find( fr, want_frame, get_frame );

			// only in that case, we have a useful guess.
			if( guess > fr->audio_start )
				return guess;
			// else... just continue, fuzzyness didn't help.
		}

		// use the last available position, slowly advancing from that one.
		slot = fr->index.fill - 1;
	}

	// the index position yields frame and byte offsets.
	*get_frame = slot * fr->index.step;
	fr->state_flags |= FRAME_ACCURATE;	// when using the frame index, we are accurate.

	return fr->index.data[slot];
}
// convert a count of input samples into output samples.
// only down_sample == 0 is handled; any other setting yields 0.
mpg_off_t frame_ins2outs( mpg123_handle_t *fr, mpg_off_t ins )
{
	if( fr->down_sample == 0 )
		return ins >> fr->down_sample;

	return 0;
}
// number of output samples produced by `num` whole frames.
// only down_sample == 0 is handled; any other setting yields 0.
mpg_off_t frame_outs( mpg123_handle_t *fr, mpg_off_t num )
{
	if( fr->down_sample == 0 )
		return (fr->spf >> fr->down_sample) * num;

	return 0;
}
// compute the number of output samples we expect from this frame.
// with down_sample == 0 that is simply the samples per frame (spf);
// any other setting is not handled and yields 0.
mpg_off_t frame_expect_outsamples( mpg123_handle_t *fr )
{
	if( fr->down_sample == 0 )
		return fr->spf >> fr->down_sample;

	return 0;
}
// frame number that contains output sample offset `outs`.
// only down_sample == 0 is handled; any other setting yields 0.
mpg_off_t frame_offset( mpg123_handle_t *fr, mpg_off_t outs )
{
	if( fr->down_sample == 0 )
		return outs / (fr->spf >> fr->down_sample);

	return 0;
}
// set up gapless decoding from a frame count plus the number of samples to
// skip at the beginning and at the end (all given in _input_ samples).
// a non-positive frame count or a negative skip value leaves both
// input sample bounds at 0.
void frame_gapless_init( mpg123_handle_t *fr, mpg_off_t framecount, mpg_off_t bskip, mpg_off_t eskip )
{
	fr->gapless_frames = framecount;

	fr->end_s = 0;
	fr->begin_s = fr->end_s;

	if( fr->gapless_frames > 0 && bskip >= 0 && eskip >= 0 )
	{
		fr->begin_s = bskip + GAPLESS_DELAY;
		fr->end_s = framecount * fr->spf - eskip + GAPLESS_DELAY;
	}

	// the output sample bounds get proper values later, from above plus resampling info.
	fr->begin_os = 0;
	fr->end_os = 0;
	fr->fullend_os = 0;
}
// translate the gapless bounds from input samples into output samples.
// fullend_os is the output length of all gapless frames, or 0 when no
// gapless frame count is known.
void frame_gapless_realinit( mpg123_handle_t *fr )
{
	fr->begin_os = frame_ins2outs( fr, fr->begin_s );
	fr->end_os = frame_ins2outs( fr, fr->end_s );

	if( fr->gapless_frames <= 0 )
	{
		fr->fullend_os = 0;
		return;
	}

	fr->fullend_os = frame_ins2outs( fr, fr->gapless_frames * fr->spf );
}
// check the gapless info against the real stream length.
// when the gapless frame count claims more samples than the stream has,
// the gapless info is dropped altogether.
void frame_gapless_update( mpg123_handle_t *fr, mpg_off_t total_samples )
{
	// no gapless info, nothing to check
	if( fr->gapless_frames < 1 )
		return;

	// the claimed length fits, all is well
	if( fr->gapless_frames * fr->spf <= total_samples )
		return;

	// this invalidates the current position... but what else could be done?
	frame_gapless_init( fr, -1, 0, 0 );
	frame_gapless_realinit( fr );
	fr->lastframe = -1;
	fr->lastoff = 0;
}
// compute the frame to start ignoring output from, so that the intended
// firstframe gets accurate/consistent output.
static mpg_off_t ignoreframe( mpg123_handle_t *fr )
{
	mpg_off_t	lead = fr->p.preframes;

	if( fr->lay == 3 )
	{
		// layer 3 _really_ needs at least one frame before.
		if( lead < 1 )
			lead = 1;
	}
	else if( lead > 2 )
	{
		// layer 1 & 2 really do not need more than 2.
		lead = 2;
	}

	return fr->firstframe - lead;
}
// the frame seek... this is not simply a seek to fe * fr->spf samples in
// output, because we think of _input_ frames here.
// a seek to frame offset 1 may be just a seek to 200 samples offset in output,
// since the beginning of the first frame is delay/padding.
// with gapless decoding active, the frame position may even be advanced
// further than requested, up to the frame that holds the first real sample.
void frame_set_frameseek( mpg123_handle_t *fr, mpg_off_t fe )
{
	int	gapless = ( fr->p.flags & MPG123_GAPLESS ) && ( fr->gapless_frames > 0 );

	// start from the plain, non-gapless answer...
	fr->firstframe = fe;
	fr->lastoff = 0;
	fr->firstoff = fr->lastoff;
	fr->lastframe = -1;

	// ...and refine it where gapless info applies.
	if( gapless )
	{
		// take care of the beginning...
		mpg_off_t	beg_f = frame_offset( fr, fr->begin_os );

		if( fe <= beg_f )
		{
			fr->firstframe = beg_f;
			fr->firstoff = fr->begin_os - frame_outs( fr, beg_f );
		}

		// the end is set once for a track at least, on the frame_set_frameseek called in get_next_frame()
		if( fr->end_os > 0 )
		{
			fr->lastframe = frame_offset( fr, fr->end_os );
			fr->lastoff = fr->end_os - frame_outs( fr, fr->lastframe );
		}
	}

	fr->ignoreframe = ignoreframe( fr );
}
// skip a frame: for layer 3 this calls set_pointer() with 512,
// other layers need nothing.
void frame_skip( mpg123_handle_t *fr )
{
	if( fr->lay != 3 )
		return;

	set_pointer( fr, 512 );
}
// sample accurate seek preparation for the decoder.
// `sp` is an unadjusted output sample position; it gets split into the frame
// to start at and the sample offset inside that frame.
void frame_set_seek( mpg123_handle_t *fr, mpg_off_t sp )
{
	fr->firstframe = frame_offset( fr, sp );
	fr->firstoff = sp - frame_outs( fr, fr->firstframe );

	// depends on firstframe, which is settled by now
	fr->ignoreframe = ignoreframe( fr );
}
// look up the RVA values selected by fr->p.rva.
// rva mode 2 prefers slot 1 when it holds a level, otherwise slot 0 is used.
// *peak / *gain (each may be NULL) receive the found values, or -1 / 0 when
// nothing is available. returns 1 when values were found, 0 otherwise.
static int get_rva( mpg123_handle_t *fr, double *peak, double *gain )
{
	double	found_peak = -1;
	double	found_gain = 0;
	int	found = 0;

	if( fr->p.rva )
	{
		// should one assume a zero RVA as no RVA?
		int	slot = ( fr->p.rva == 2 && fr->rva.level[1] != -1 ) ? 1 : 0;

		if( fr->rva.level[slot] != -1 )
		{
			found_peak = fr->rva.peak[slot];
			found_gain = fr->rva.gain[slot];
			found = 1;	// success.
		}
	}

	if( peak != NULL )
		*peak = found_peak;

	if( gain != NULL )
		*gain = found_gain;

	return found;
}
// adjust the volume, taking both fr->p.outscale and the rva values into account.
// the decode tables are rebuilt only when the resulting scale differs from the
// last one used or a decoder change is pending.
void do_rva( mpg123_handle_t *fr )
{
	double	peak = 0;
	double	gain = 0;
	double	rvafact;
	double	newscale;

	// the gain is turned into a linear factor
	rvafact = get_rva( fr, &peak, &gain ) ? pow( 10, gain / 20 ) : 1;
	newscale = fr->p.outscale * rvafact;

	// limit the scale so that the peak does not exceed 1.0;
	// when get_rva() found nothing, peak is -1 and this never triggers
	if(( peak * newscale ) > 1.0 )
		newscale = 1.0 / peak;

	// nothing changed? (the first rva setting is forced with fr->lastscale < 0)
	if( newscale == fr->lastscale && !fr->decoder_change )
		return;

	fr->lastscale = newscale;

	// it may be too early, actually.
	if( fr->make_decode_tables != NULL )
		fr->make_decode_tables( fr );	// the actual work
}