123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958 |
- #include <stdlib.h>
- #include <string.h>
- #define _USE_MATH_DEFINES
- #include <math.h>
- #if (defined(_M_IX86) || defined(__i386__) || defined(_M_X64) || defined(__amd64__))
- #include <xmmintrin.h>
- #define RESAMPLER_SSE
- #endif
- #ifdef _MSC_VER
- #define ALIGNED _declspec(align(16))
- #else
- #define ALIGNED __attribute__((aligned(16)))
- #endif
- #ifndef M_PI
- #define M_PI 3.14159265358979323846
- #endif
- #include "resampler.h"
- enum { RESAMPLER_SHIFT = 10 };
- enum { RESAMPLER_RESOLUTION = 1 << RESAMPLER_SHIFT };
- enum { SINC_WIDTH = 16 };
- enum { SINC_SAMPLES = RESAMPLER_RESOLUTION * SINC_WIDTH };
- enum { CUBIC_SAMPLES = RESAMPLER_RESOLUTION * 4 };
- ALIGNED static float cubic_lut[CUBIC_SAMPLES];
- static float sinc_lut[SINC_SAMPLES + 1];
- static float window_lut[SINC_SAMPLES + 1];
- enum { resampler_buffer_size = SINC_WIDTH * 4 };
- static int fEqual(const float b, const float a)
- {
- return fabs(a - b) < 1.0e-6;
- }
- static float sinc(float x)
- {
- return fEqual(x, 0.0f) ? 1.0f : (float)(sin(x * M_PI) / (x * M_PI));
- }
- #ifdef RESAMPLER_SSE
- #ifdef _MSC_VER
- #include <intrin.h>
- #elif defined(__clang__) || defined(__GNUC__)
- static inline void
- __cpuid(int *data, int selector)
- {
- #if defined(__PIC__) && defined(__i386__)
- asm("xchgl %%ebx, %%esi; cpuid; xchgl %%ebx, %%esi"
- : "=a" (data[0]),
- "=S" (data[1]),
- "=c" (data[2]),
- "=d" (data[3])
- : "0" (selector));
- #elif defined(__PIC__) && defined(__amd64__)
- asm("xchg{q} {%%}rbx, %q1; cpuid; xchg{q} {%%}rbx, %q1"
- : "=a" (data[0]),
- "=&r" (data[1]),
- "=c" (data[2]),
- "=d" (data[3])
- : "0" (selector));
- #else
- asm("cpuid"
- : "=a" (data[0]),
- "=b" (data[1]),
- "=c" (data[2]),
- "=d" (data[3])
- : "0" (selector));
- #endif
- }
- #else
- #define __cpuid(a,b) memset((a), 0, sizeof(int) * 4)
- #endif
- static int query_cpu_feature_sse() {
- int buffer[4];
- __cpuid(buffer,1);
- if ((buffer[3]&(1<<25)) == 0) return 0;
- return 1;
- }
- static int resampler_has_sse = 0;
- #endif
- void resampler_init(void)
- {
- unsigned i;
- double dx = (float)(SINC_WIDTH) / SINC_SAMPLES, x = 0.0;
- for (i = 0; i < SINC_SAMPLES + 1; ++i, x += dx)
- {
- float y = x / SINC_WIDTH;
- #if 0
- // Blackman
- float window = 0.42659 - 0.49656 * cos(M_PI + M_PI * y) + 0.076849 * cos(2.0 * M_PI * y);
- #elif 1
- // Nuttal 3 term
- float window = 0.40897 + 0.5 * cos(M_PI * y) + 0.09103 * cos(2.0 * M_PI * y);
- #elif 0
- // C.R.Helmrich's 2 term window
- float window = 0.79445 * cos(0.5 * M_PI * y) + 0.20555 * cos(1.5 * M_PI * y);
- #elif 0
- // Lanczos
- float window = sinc(y);
- #endif
- sinc_lut[i] = fabs(x) < SINC_WIDTH ? sinc(x) : 0.0;
- window_lut[i] = window;
- }
- dx = 1.0 / (float)(RESAMPLER_RESOLUTION);
- x = 0.0;
- for (i = 0; i < RESAMPLER_RESOLUTION; ++i, x += dx)
- {
- cubic_lut[i*4] = (float)(-0.5 * x * x * x + x * x - 0.5 * x);
- cubic_lut[i*4+1] = (float)( 1.5 * x * x * x - 2.5 * x * x + 1.0);
- cubic_lut[i*4+2] = (float)(-1.5 * x * x * x + 2.0 * x * x + 0.5 * x);
- cubic_lut[i*4+3] = (float)( 0.5 * x * x * x - 0.5 * x * x);
- }
- #ifdef RESAMPLER_SSE
- resampler_has_sse = query_cpu_feature_sse();
- #endif
- }
- typedef struct resampler
- {
- int write_pos, write_filled;
- int read_pos, read_filled;
- unsigned int phase;
- unsigned int phase_inc;
- unsigned int inv_phase;
- unsigned int inv_phase_inc;
- unsigned char quality;
- signed char delay_added;
- signed char delay_removed;
- float last_amp;
- float accumulator;
- float buffer_in[resampler_buffer_size * 2];
- float buffer_out[resampler_buffer_size + SINC_WIDTH * 2 - 1];
- } resampler;
- void * resampler_create(void)
- {
- resampler * r = ( resampler * ) malloc( sizeof(resampler) );
- if ( !r ) return 0;
- r->write_pos = SINC_WIDTH - 1;
- r->write_filled = 0;
- r->read_pos = 0;
- r->read_filled = 0;
- r->phase = 0;
- r->phase_inc = 0;
- r->inv_phase = 0;
- r->inv_phase_inc = 0;
- r->quality = RESAMPLER_QUALITY_MAX;
- r->delay_added = -1;
- r->delay_removed = -1;
- r->last_amp = 0;
- r->accumulator = 0;
- memset( r->buffer_in, 0, sizeof(r->buffer_in) );
- memset( r->buffer_out, 0, sizeof(r->buffer_out) );
- return r;
- }
- void resampler_delete(void * _r)
- {
- free( _r );
- }
- void * resampler_dup(const void * _r)
- {
- const resampler * r_in = ( const resampler * ) _r;
- resampler * r_out = ( resampler * ) malloc( sizeof(resampler) );
- if ( !r_out ) return 0;
- r_out->write_pos = r_in->write_pos;
- r_out->write_filled = r_in->write_filled;
- r_out->read_pos = r_in->read_pos;
- r_out->read_filled = r_in->read_filled;
- r_out->phase = r_in->phase;
- r_out->phase_inc = r_in->phase_inc;
- r_out->inv_phase = r_in->inv_phase;
- r_out->inv_phase_inc = r_in->inv_phase_inc;
- r_out->quality = r_in->quality;
- r_out->delay_added = r_in->delay_added;
- r_out->delay_removed = r_in->delay_removed;
- r_out->last_amp = r_in->last_amp;
- r_out->accumulator = r_in->accumulator;
- memcpy( r_out->buffer_in, r_in->buffer_in, sizeof(r_in->buffer_in) );
- memcpy( r_out->buffer_out, r_in->buffer_out, sizeof(r_in->buffer_out) );
- return r_out;
- }
- void resampler_dup_inplace(void *_d, const void *_s)
- {
- const resampler * r_in = ( const resampler * ) _s;
- resampler * r_out = ( resampler * ) _d;
- r_out->write_pos = r_in->write_pos;
- r_out->write_filled = r_in->write_filled;
- r_out->read_pos = r_in->read_pos;
- r_out->read_filled = r_in->read_filled;
- r_out->phase = r_in->phase;
- r_out->phase_inc = r_in->phase_inc;
- r_out->inv_phase = r_in->inv_phase;
- r_out->inv_phase_inc = r_in->inv_phase_inc;
- r_out->quality = r_in->quality;
- r_out->delay_added = r_in->delay_added;
- r_out->delay_removed = r_in->delay_removed;
- r_out->last_amp = r_in->last_amp;
- r_out->accumulator = r_in->accumulator;
- memcpy( r_out->buffer_in, r_in->buffer_in, sizeof(r_in->buffer_in) );
- memcpy( r_out->buffer_out, r_in->buffer_out, sizeof(r_in->buffer_out) );
- }
- void resampler_set_quality(void *_r, int quality)
- {
- resampler * r = ( resampler * ) _r;
- if (quality < RESAMPLER_QUALITY_MIN)
- quality = RESAMPLER_QUALITY_MIN;
- else if (quality > RESAMPLER_QUALITY_MAX)
- quality = RESAMPLER_QUALITY_MAX;
- if ( r->quality != quality )
- {
- if ( quality == RESAMPLER_QUALITY_BLEP || r->quality == RESAMPLER_QUALITY_BLEP )
- {
- r->read_pos = 0;
- r->read_filled = 0;
- r->last_amp = 0;
- r->accumulator = 0;
- memset( r->buffer_out, 0, sizeof(r->buffer_out) );
- }
- r->delay_added = -1;
- r->delay_removed = -1;
- }
- r->quality = (unsigned char)quality;
- }
- int resampler_get_free_count(void *_r)
- {
- resampler * r = ( resampler * ) _r;
- return resampler_buffer_size - r->write_filled;
- }
- static int resampler_min_filled(resampler *r)
- {
- switch (r->quality)
- {
- default:
- case RESAMPLER_QUALITY_ZOH:
- case RESAMPLER_QUALITY_BLEP:
- return 1;
-
- case RESAMPLER_QUALITY_LINEAR:
- return 2;
-
- case RESAMPLER_QUALITY_CUBIC:
- return 4;
-
- case RESAMPLER_QUALITY_SINC:
- return SINC_WIDTH * 2;
- }
- }
- static int resampler_input_delay(resampler *r)
- {
- switch (r->quality)
- {
- default:
- case RESAMPLER_QUALITY_ZOH:
- case RESAMPLER_QUALITY_BLEP:
- case RESAMPLER_QUALITY_LINEAR:
- return 0;
-
- case RESAMPLER_QUALITY_CUBIC:
- return 1;
-
- case RESAMPLER_QUALITY_SINC:
- return SINC_WIDTH - 1;
- }
- }
- static int resampler_output_delay(resampler *r)
- {
- switch (r->quality)
- {
- default:
- case RESAMPLER_QUALITY_ZOH:
- case RESAMPLER_QUALITY_LINEAR:
- case RESAMPLER_QUALITY_CUBIC:
- case RESAMPLER_QUALITY_SINC:
- return 0;
-
- case RESAMPLER_QUALITY_BLEP:
- return SINC_WIDTH - 1;
- }
- }
- int resampler_ready(void *_r)
- {
- resampler * r = ( resampler * ) _r;
- return r->write_filled > resampler_min_filled(r);
- }
- void resampler_clear(void *_r)
- {
- resampler * r = ( resampler * ) _r;
- r->write_pos = SINC_WIDTH - 1;
- r->write_filled = 0;
- r->read_pos = 0;
- r->read_filled = 0;
- r->phase = 0;
- r->delay_added = -1;
- r->delay_removed = -1;
- memset(r->buffer_in, 0, (SINC_WIDTH - 1) * sizeof(r->buffer_in[0]));
- memset(r->buffer_in + resampler_buffer_size, 0, (SINC_WIDTH - 1) * sizeof(r->buffer_in[0]));
- if (r->quality == RESAMPLER_QUALITY_BLEP)
- memset(r->buffer_out, 0, sizeof(r->buffer_out));
- }
- void resampler_set_rate(void *_r, double new_factor)
- {
- resampler * r = ( resampler * ) _r;
- r->phase_inc = (int)( new_factor * RESAMPLER_RESOLUTION );
- new_factor = 1.0 / new_factor;
- r->inv_phase_inc = (int)( new_factor * RESAMPLER_RESOLUTION );
- }
- void resampler_write_sample(void *_r, short s)
- {
- resampler * r = ( resampler * ) _r;
- if ( r->delay_added < 0 )
- {
- r->delay_added = 0;
- r->write_filled = resampler_input_delay( r );
- }
-
- if ( r->write_filled < resampler_buffer_size )
- {
- float s32 = s;
- s32 *= 256.0;
- r->buffer_in[ r->write_pos ] = s32;
- r->buffer_in[ r->write_pos + resampler_buffer_size ] = s32;
- ++r->write_filled;
- r->write_pos = ( r->write_pos + 1 ) % resampler_buffer_size;
- }
- }
- void resampler_write_sample_fixed(void *_r, int s, unsigned char depth)
- {
- resampler * r = ( resampler * ) _r;
-
- if ( r->delay_added < 0 )
- {
- r->delay_added = 0;
- r->write_filled = resampler_input_delay( r );
- }
-
- if ( r->write_filled < resampler_buffer_size )
- {
- float s32 = s;
- s32 /= (double)(1 << (depth - 1));
-
- r->buffer_in[ r->write_pos ] = s32;
- r->buffer_in[ r->write_pos + resampler_buffer_size ] = s32;
-
- ++r->write_filled;
-
- r->write_pos = ( r->write_pos + 1 ) % resampler_buffer_size;
- }
- }
- static int resampler_run_zoh(resampler * r, float ** out_, float * out_end)
- {
- int in_size = r->write_filled;
- float const* in_ = r->buffer_in + resampler_buffer_size + r->write_pos - r->write_filled;
- int used = 0;
- in_size -= 1;
- if ( in_size > 0 )
- {
- float* out = *out_;
- float const* in = in_;
- float const* const in_end = in + in_size;
- int phase = r->phase;
- int phase_inc = r->phase_inc;
-
- do
- {
- float sample;
-
- if ( out >= out_end )
- break;
- sample = *in;
- *out++ = sample;
-
- phase += phase_inc;
-
- in += phase >> RESAMPLER_SHIFT;
-
- phase &= RESAMPLER_RESOLUTION-1;
- }
- while ( in < in_end );
-
- r->phase = (unsigned short) phase;
- *out_ = out;
-
- used = (int)(in - in_);
-
- r->write_filled -= used;
- }
-
- return used;
- }
- static int resampler_run_blep(resampler * r, float ** out_, float * out_end)
- {
- int in_size = r->write_filled;
- float const* in_ = r->buffer_in + resampler_buffer_size + r->write_pos - r->write_filled;
- int used = 0;
- in_size -= 1;
- if ( in_size > 0 )
- {
- float* out = *out_;
- float const* in = in_;
- float const* const in_end = in + in_size;
- float last_amp = r->last_amp;
- int inv_phase = r->inv_phase;
- int inv_phase_inc = r->inv_phase_inc;
-
- const int step = RESAMPLER_RESOLUTION;
-
- do
- {
- float kernel[SINC_WIDTH * 2], kernel_sum = 0.0;
- int i = SINC_WIDTH;
- float sample;
-
- if ( out + SINC_WIDTH * 2 > out_end )
- break;
-
- for (; i >= -SINC_WIDTH + 1; --i)
- {
- int pos = i * step;
- int abs_pos = abs(inv_phase - pos);
- kernel_sum += kernel[i + SINC_WIDTH - 1] = sinc_lut[abs_pos] * window_lut[abs_pos];
- }
- sample = *in++ - last_amp;
- last_amp += sample;
- sample /= kernel_sum;
- for (sample = 0, i = 0; i < SINC_WIDTH * 2; ++i)
- out[i] += sample * kernel[i];
-
- inv_phase += inv_phase_inc;
-
- out += inv_phase >> RESAMPLER_SHIFT;
-
- inv_phase &= RESAMPLER_RESOLUTION-1;
- }
- while ( in < in_end );
-
- r->inv_phase = inv_phase;
- r->last_amp = last_amp;
- *out_ = out;
-
- used = (int)(in - in_);
-
- r->write_filled -= used;
- }
-
- return used;
- }
- #ifdef RESAMPLER_SSE
- static int resampler_run_blep_sse(resampler * r, float ** out_, float * out_end)
- {
- int in_size = r->write_filled;
- float const* in_ = r->buffer_in + resampler_buffer_size + r->write_pos - r->write_filled;
- int used = 0;
- in_size -= 1;
- if ( in_size > 0 )
- {
- float* out = *out_;
- float const* in = in_;
- float const* const in_end = in + in_size;
- float last_amp = r->last_amp;
- int inv_phase = r->inv_phase;
- int inv_phase_inc = r->inv_phase_inc;
-
- const int step = RESAMPLER_RESOLUTION;
-
- do
- {
- // accumulate in extended precision
- float kernel_sum = 0.0;
- __m128 kernel[SINC_WIDTH / 2];
- __m128 temp1, temp2;
- __m128 samplex;
- float sample;
- float *kernelf = (float*)(&kernel);
- int i = SINC_WIDTH;
-
- if ( out + SINC_WIDTH * 2 > out_end )
- break;
-
- for (; i >= -SINC_WIDTH + 1; --i)
- {
- int pos = i * step;
- int abs_pos = abs(inv_phase - pos);
- kernel_sum += kernelf[i + SINC_WIDTH - 1] = sinc_lut[abs_pos] * window_lut[abs_pos];
- }
- sample = *in++ - last_amp;
- last_amp += sample;
- sample /= kernel_sum;
- samplex = _mm_set1_ps( sample );
- for (i = 0; i < SINC_WIDTH / 2; ++i)
- {
- temp1 = _mm_load_ps( (const float *)( kernel + i ) );
- temp1 = _mm_mul_ps( temp1, samplex );
- temp2 = _mm_loadu_ps( (const float *) out + i * 4 );
- temp1 = _mm_add_ps( temp1, temp2 );
- _mm_storeu_ps( (float *) out + i * 4, temp1 );
- }
-
- inv_phase += inv_phase_inc;
-
- out += inv_phase >> RESAMPLER_SHIFT;
-
- inv_phase &= RESAMPLER_RESOLUTION - 1;
- }
- while ( in < in_end );
-
- r->inv_phase = inv_phase;
- r->last_amp = last_amp;
- *out_ = out;
-
- used = (int)(in - in_);
-
- r->write_filled -= used;
- }
-
- return used;
- }
- #endif
- static int resampler_run_linear(resampler * r, float ** out_, float * out_end)
- {
- int in_size = r->write_filled;
- float const* in_ = r->buffer_in + resampler_buffer_size + r->write_pos - r->write_filled;
- int used = 0;
- in_size -= 2;
- if ( in_size > 0 )
- {
- float* out = *out_;
- float const* in = in_;
- float const* const in_end = in + in_size;
- int phase = r->phase;
- int phase_inc = r->phase_inc;
-
- do
- {
- float sample;
-
- if ( out >= out_end )
- break;
-
- sample = in[0] + (in[1] - in[0]) * ((float)phase / RESAMPLER_RESOLUTION);
- *out++ = sample;
-
- phase += phase_inc;
-
- in += phase >> RESAMPLER_SHIFT;
-
- phase &= RESAMPLER_RESOLUTION-1;
- }
- while ( in < in_end );
-
- r->phase = phase;
- *out_ = out;
-
- used = (int)(in - in_);
-
- r->write_filled -= used;
- }
-
- return used;
- }
- static int resampler_run_cubic(resampler * r, float ** out_, float * out_end)
- {
- int in_size = r->write_filled;
- float const* in_ = r->buffer_in + resampler_buffer_size + r->write_pos - r->write_filled;
- int used = 0;
- in_size -= 4;
- if ( in_size > 0 )
- {
- float* out = *out_;
- float const* in = in_;
- float const* const in_end = in + in_size;
- int phase = r->phase;
- int phase_inc = r->phase_inc;
-
- do
- {
- float * kernel;
- int i;
- float sample;
-
- if ( out >= out_end )
- break;
-
- kernel = cubic_lut + phase * 4;
-
- for (sample = 0, i = 0; i < 4; ++i)
- sample += in[i] * kernel[i];
- *out++ = sample;
-
- phase += phase_inc;
-
- in += phase >> RESAMPLER_SHIFT;
-
- phase &= RESAMPLER_RESOLUTION-1;
- }
- while ( in < in_end );
-
- r->phase = phase;
- *out_ = out;
-
- used = (int)(in - in_);
-
- r->write_filled -= used;
- }
-
- return used;
- }
- #ifdef RESAMPLER_SSE
- static int resampler_run_cubic_sse(resampler * r, float ** out_, float * out_end)
- {
- int in_size = r->write_filled;
- float const* in_ = r->buffer_in + resampler_buffer_size + r->write_pos - r->write_filled;
- int used = 0;
- in_size -= 4;
- if ( in_size > 0 )
- {
- float* out = *out_;
- float const* in = in_;
- float const* const in_end = in + in_size;
- int phase = r->phase;
- int phase_inc = r->phase_inc;
-
- do
- {
- __m128 temp1, temp2;
- __m128 samplex = _mm_setzero_ps();
-
- if ( out >= out_end )
- break;
-
- temp1 = _mm_loadu_ps( (const float *)( in ) );
- temp2 = _mm_load_ps( (const float *)( cubic_lut + phase * 4 ) );
- temp1 = _mm_mul_ps( temp1, temp2 );
- samplex = _mm_add_ps( samplex, temp1 );
- temp1 = _mm_movehl_ps( temp1, samplex );
- samplex = _mm_add_ps( samplex, temp1 );
- temp1 = samplex;
- temp1 = _mm_shuffle_ps( temp1, samplex, _MM_SHUFFLE(0, 0, 0, 1) );
- samplex = _mm_add_ps( samplex, temp1 );
- _mm_store_ss( out, samplex );
- ++out;
-
- phase += phase_inc;
-
- in += phase >> RESAMPLER_SHIFT;
-
- phase &= RESAMPLER_RESOLUTION - 1;
- }
- while ( in < in_end );
-
- r->phase = phase;
- *out_ = out;
-
- used = (int)(in - in_);
-
- r->write_filled -= used;
- }
-
- return used;
- }
- #endif
- static int resampler_run_sinc(resampler * r, float ** out_, float * out_end)
- {
- int in_size = r->write_filled;
- float const* in_ = r->buffer_in + resampler_buffer_size + r->write_pos - r->write_filled;
- int used = 0;
- in_size -= SINC_WIDTH * 2;
- if ( in_size > 0 )
- {
- float* out = *out_;
- float const* in = in_;
- float const* const in_end = in + in_size;
- int phase = r->phase;
- int phase_inc = r->phase_inc;
- int step = phase_inc > RESAMPLER_RESOLUTION ? RESAMPLER_RESOLUTION * RESAMPLER_RESOLUTION / phase_inc : RESAMPLER_RESOLUTION;
- int window_step = RESAMPLER_RESOLUTION;
- do
- {
- float kernel[SINC_WIDTH * 2], kernel_sum = 0.0;
- int i = SINC_WIDTH;
- int phase_adj = phase * step / RESAMPLER_RESOLUTION;
- float sample;
- if ( out >= out_end )
- break;
- for (; i >= -SINC_WIDTH + 1; --i)
- {
- int pos = i * step;
- int window_pos = i * window_step;
- kernel_sum += kernel[i + SINC_WIDTH - 1] = sinc_lut[abs(phase_adj - pos)] * window_lut[abs(phase - window_pos)];
- }
- for (sample = 0, i = 0; i < SINC_WIDTH * 2; ++i)
- sample += in[i] * kernel[i];
- *out++ = (float)(sample / kernel_sum);
- phase += phase_inc;
- in += phase >> RESAMPLER_SHIFT;
- phase &= RESAMPLER_RESOLUTION-1;
- }
- while ( in < in_end );
- r->phase = phase;
- *out_ = out;
- used = (int)(in - in_);
- r->write_filled -= used;
- }
- return used;
- }
- #ifdef RESAMPLER_SSE
- static int resampler_run_sinc_sse(resampler * r, float ** out_, float * out_end)
- {
- int in_size = r->write_filled;
- float const* in_ = r->buffer_in + resampler_buffer_size + r->write_pos - r->write_filled;
- int used = 0;
- in_size -= SINC_WIDTH * 2;
- if ( in_size > 0 )
- {
- float* out = *out_;
- float const* in = in_;
- float const* const in_end = in + in_size;
- int phase = r->phase;
- int phase_inc = r->phase_inc;
-
- int step = phase_inc > RESAMPLER_RESOLUTION ? RESAMPLER_RESOLUTION * RESAMPLER_RESOLUTION / phase_inc : RESAMPLER_RESOLUTION;
- int window_step = RESAMPLER_RESOLUTION;
-
- do
- {
- // accumulate in extended precision
- float kernel_sum = 0.0;
- __m128 kernel[SINC_WIDTH / 2];
- __m128 temp1, temp2;
- __m128 samplex = _mm_setzero_ps();
- float *kernelf = (float*)(&kernel);
- int i = SINC_WIDTH;
- int phase_adj = phase * step / RESAMPLER_RESOLUTION;
-
- if ( out >= out_end )
- break;
-
- for (; i >= -SINC_WIDTH + 1; --i)
- {
- int pos = i * step;
- int window_pos = i * window_step;
- kernel_sum += kernelf[i + SINC_WIDTH - 1] = sinc_lut[abs(phase_adj - pos)] * window_lut[abs(phase - window_pos)];
- }
- for (i = 0; i < SINC_WIDTH / 2; ++i)
- {
- temp1 = _mm_loadu_ps( (const float *)( in + i * 4 ) );
- temp2 = _mm_load_ps( (const float *)( kernel + i ) );
- temp1 = _mm_mul_ps( temp1, temp2 );
- samplex = _mm_add_ps( samplex, temp1 );
- }
- kernel_sum = 1.0f / kernel_sum;
- temp1 = _mm_movehl_ps( temp1, samplex );
- samplex = _mm_add_ps( samplex, temp1 );
- temp1 = samplex;
- temp1 = _mm_shuffle_ps( temp1, samplex, _MM_SHUFFLE(0, 0, 0, 1) );
- samplex = _mm_add_ps( samplex, temp1 );
- temp1 = _mm_set_ss( kernel_sum );
- samplex = _mm_mul_ps( samplex, temp1 );
- _mm_store_ss( out, samplex );
- ++out;
-
- phase += phase_inc;
-
- in += phase >> RESAMPLER_SHIFT;
-
- phase &= RESAMPLER_RESOLUTION - 1;
- }
- while ( in < in_end );
-
- r->phase = phase;
- *out_ = out;
-
- used = (int)(in - in_);
-
- r->write_filled -= used;
- }
-
- return used;
- }
- #endif
- static void resampler_fill(resampler * r)
- {
- int min_filled = resampler_min_filled(r);
- int quality = r->quality;
- while ( r->write_filled > min_filled &&
- r->read_filled < resampler_buffer_size )
- {
- int write_pos = ( r->read_pos + r->read_filled ) % resampler_buffer_size;
- int write_size = resampler_buffer_size - write_pos;
- float * out = r->buffer_out + write_pos;
- if ( write_size > ( resampler_buffer_size - r->read_filled ) )
- write_size = resampler_buffer_size - r->read_filled;
- switch (quality)
- {
- case RESAMPLER_QUALITY_ZOH:
- resampler_run_zoh( r, &out, out + write_size );
- break;
-
- case RESAMPLER_QUALITY_BLEP:
- {
- int used;
- int write_extra = 0;
- if ( write_pos >= r->read_pos )
- write_extra = r->read_pos;
- if ( write_extra > SINC_WIDTH * 2 - 1 )
- write_extra = SINC_WIDTH * 2 - 1;
- memcpy( r->buffer_out + resampler_buffer_size, r->buffer_out, write_extra * sizeof(r->buffer_out[0]) );
- #ifdef RESAMPLER_SSE
- if ( resampler_has_sse )
- used = resampler_run_blep_sse( r, &out, out + write_size + write_extra );
- else
- #endif
- used = resampler_run_blep( r, &out, out + write_size + write_extra );
- memcpy( r->buffer_out, r->buffer_out + resampler_buffer_size, write_extra * sizeof(r->buffer_out[0]) );
- if (!used)
- return;
- break;
- }
-
- case RESAMPLER_QUALITY_LINEAR:
- resampler_run_linear( r, &out, out + write_size );
- break;
-
- case RESAMPLER_QUALITY_CUBIC:
- #ifdef RESAMPLER_SSE
- if ( resampler_has_sse )
- resampler_run_cubic_sse( r, &out, out + write_size );
- else
- #endif
- resampler_run_cubic( r, &out, out + write_size );
- break;
-
- case RESAMPLER_QUALITY_SINC:
- #ifdef RESAMPLER_SSE
- if ( resampler_has_sse )
- resampler_run_sinc_sse( r, &out, out + write_size );
- else
- #endif
- resampler_run_sinc( r, &out, out + write_size );
- break;
- }
- r->read_filled += out - r->buffer_out - write_pos;
- }
- }
- static void resampler_fill_and_remove_delay(resampler * r)
- {
- resampler_fill( r );
- if ( r->delay_removed < 0 )
- {
- int delay = resampler_output_delay( r );
- r->delay_removed = 0;
- while ( delay-- )
- resampler_remove_sample( r );
- }
- }
- int resampler_get_sample_count(void *_r)
- {
- resampler * r = ( resampler * ) _r;
- if ( r->read_filled < 1 && (r->quality != RESAMPLER_QUALITY_BLEP || r->inv_phase_inc))
- resampler_fill_and_remove_delay( r );
- return r->read_filled;
- }
- int resampler_get_sample(void *_r)
- {
- resampler * r = ( resampler * ) _r;
- if ( r->read_filled < 1 && r->phase_inc)
- resampler_fill_and_remove_delay( r );
- if ( r->read_filled < 1 )
- return 0;
- if ( r->quality == RESAMPLER_QUALITY_BLEP )
- return (int)(r->buffer_out[ r->read_pos ] + r->accumulator);
- else
- return (int)r->buffer_out[ r->read_pos ];
- }
- void resampler_remove_sample(void *_r)
- {
- resampler * r = ( resampler * ) _r;
- if ( r->read_filled > 0 )
- {
- if ( r->quality == RESAMPLER_QUALITY_BLEP )
- {
- r->accumulator += r->buffer_out[ r->read_pos ];
- r->buffer_out[ r->read_pos ] = 0;
- r->accumulator -= r->accumulator * (1.0 / 8192.0);
- if (fabs(r->accumulator) < 1e-20)
- r->accumulator = 0;
- }
- --r->read_filled;
- r->read_pos = ( r->read_pos + 1 ) % resampler_buffer_size;
- }
- }
- /* Get a 16-bit sample without overflow */
- short resampler_get_and_remove_sample(void *_r)
- {
- int sample = (int)round(resampler_get_sample(_r) / 256.0);
- resampler_remove_sample(_r);
- if (sample > 32767)
- return 32767;
- else if (sample < -32768)
- return -32768;
- else
- return (short)sample;
- }
|