4cc1c64646
Turns out the C version of the cubic resampler is just slightly faster than even the SSE3 version of the FIR4 resampler. This is likely due to not using a 64KB random-access lookup table along with unaligned loads, both offseting the gains from SSE.
120 lines
6.5 KiB
C
120 lines
6.5 KiB
C
#ifndef MIXER_DEFS_H
|
|
#define MIXER_DEFS_H
|
|
|
|
#include "AL/alc.h"
|
|
#include "AL/al.h"
|
|
#include "alMain.h"
|
|
#include "alu.h"
|
|
|
|
struct MixGains;
|
|
|
|
struct MixHrtfParams;
|
|
struct HrtfState;
|
|
|
|
/* C resamplers */
|
|
const ALfloat *Resample_copy_C(const InterpState *state, const ALfloat *restrict src, ALsizei frac, ALint increment, ALfloat *restrict dst, ALsizei dstlen);
|
|
const ALfloat *Resample_point_C(const InterpState *state, const ALfloat *restrict src, ALsizei frac, ALint increment, ALfloat *restrict dst, ALsizei dstlen);
|
|
const ALfloat *Resample_lerp_C(const InterpState *state, const ALfloat *restrict src, ALsizei frac, ALint increment, ALfloat *restrict dst, ALsizei dstlen);
|
|
const ALfloat *Resample_cubic_C(const InterpState *state, const ALfloat *restrict src, ALsizei frac, ALint increment, ALfloat *restrict dst, ALsizei dstlen);
|
|
const ALfloat *Resample_bsinc_C(const InterpState *state, const ALfloat *restrict src, ALsizei frac, ALint increment, ALfloat *restrict dst, ALsizei dstlen);
|
|
|
|
|
|
/* C mixers */
|
|
void MixHrtf_C(ALfloat *restrict LeftOut, ALfloat *restrict RightOut,
|
|
const ALfloat *data, ALsizei Offset, ALsizei OutPos,
|
|
const ALsizei IrSize, struct MixHrtfParams *hrtfparams,
|
|
struct HrtfState *hrtfstate, ALsizei BufferSize);
|
|
void MixHrtfBlend_C(ALfloat *restrict LeftOut, ALfloat *restrict RightOut,
|
|
const ALfloat *data, ALsizei Offset, ALsizei OutPos,
|
|
const ALsizei IrSize, const HrtfParams *oldparams,
|
|
MixHrtfParams *newparams, HrtfState *hrtfstate,
|
|
ALsizei BufferSize);
|
|
void MixDirectHrtf_C(ALfloat *restrict LeftOut, ALfloat *restrict RightOut,
|
|
const ALfloat *data, ALsizei Offset, const ALsizei IrSize,
|
|
const ALfloat (*restrict Coeffs)[2], ALfloat (*restrict Values)[2],
|
|
ALsizei BufferSize);
|
|
void Mix_C(const ALfloat *data, ALsizei OutChans, ALfloat (*restrict OutBuffer)[BUFFERSIZE],
|
|
ALfloat *CurrentGains, const ALfloat *TargetGains, ALsizei Counter, ALsizei OutPos,
|
|
ALsizei BufferSize);
|
|
void MixRow_C(ALfloat *OutBuffer, const ALfloat *Gains,
|
|
const ALfloat (*restrict data)[BUFFERSIZE], ALsizei InChans,
|
|
ALsizei InPos, ALsizei BufferSize);
|
|
|
|
/* SSE mixers */
|
|
void MixHrtf_SSE(ALfloat *restrict LeftOut, ALfloat *restrict RightOut,
|
|
const ALfloat *data, ALsizei Offset, ALsizei OutPos,
|
|
const ALsizei IrSize, struct MixHrtfParams *hrtfparams,
|
|
struct HrtfState *hrtfstate, ALsizei BufferSize);
|
|
void MixHrtfBlend_SSE(ALfloat *restrict LeftOut, ALfloat *restrict RightOut,
|
|
const ALfloat *data, ALsizei Offset, ALsizei OutPos,
|
|
const ALsizei IrSize, const HrtfParams *oldparams,
|
|
MixHrtfParams *newparams, HrtfState *hrtfstate,
|
|
ALsizei BufferSize);
|
|
void MixDirectHrtf_SSE(ALfloat *restrict LeftOut, ALfloat *restrict RightOut,
|
|
const ALfloat *data, ALsizei Offset, const ALsizei IrSize,
|
|
const ALfloat (*restrict Coeffs)[2], ALfloat (*restrict Values)[2],
|
|
ALsizei BufferSize);
|
|
void Mix_SSE(const ALfloat *data, ALsizei OutChans, ALfloat (*restrict OutBuffer)[BUFFERSIZE],
|
|
ALfloat *CurrentGains, const ALfloat *TargetGains, ALsizei Counter, ALsizei OutPos,
|
|
ALsizei BufferSize);
|
|
void MixRow_SSE(ALfloat *OutBuffer, const ALfloat *Gains,
|
|
const ALfloat (*restrict data)[BUFFERSIZE], ALsizei InChans,
|
|
ALsizei InPos, ALsizei BufferSize);
|
|
|
|
/* SSE resamplers */
|
|
inline void InitiatePositionArrays(ALsizei frac, ALint increment, ALsizei *restrict frac_arr, ALint *restrict pos_arr, ALsizei size)
|
|
{
|
|
ALsizei i;
|
|
|
|
pos_arr[0] = 0;
|
|
frac_arr[0] = frac;
|
|
for(i = 1;i < size;i++)
|
|
{
|
|
ALint frac_tmp = frac_arr[i-1] + increment;
|
|
pos_arr[i] = pos_arr[i-1] + (frac_tmp>>FRACTIONBITS);
|
|
frac_arr[i] = frac_tmp&FRACTIONMASK;
|
|
}
|
|
}
|
|
|
|
const ALfloat *Resample_lerp_SSE2(const InterpState *state, const ALfloat *restrict src,
|
|
ALsizei frac, ALint increment, ALfloat *restrict dst,
|
|
ALsizei numsamples);
|
|
const ALfloat *Resample_lerp_SSE41(const InterpState *state, const ALfloat *restrict src,
|
|
ALsizei frac, ALint increment, ALfloat *restrict dst,
|
|
ALsizei numsamples);
|
|
|
|
const ALfloat *Resample_bsinc_SSE(const InterpState *state, const ALfloat *restrict src,
|
|
ALsizei frac, ALint increment, ALfloat *restrict dst,
|
|
ALsizei dstlen);
|
|
|
|
/* Neon mixers */
|
|
void MixHrtf_Neon(ALfloat *restrict LeftOut, ALfloat *restrict RightOut,
|
|
const ALfloat *data, ALsizei Offset, ALsizei OutPos,
|
|
const ALsizei IrSize, struct MixHrtfParams *hrtfparams,
|
|
struct HrtfState *hrtfstate, ALsizei BufferSize);
|
|
void MixHrtfBlend_Neon(ALfloat *restrict LeftOut, ALfloat *restrict RightOut,
|
|
const ALfloat *data, ALsizei Offset, ALsizei OutPos,
|
|
const ALsizei IrSize, const HrtfParams *oldparams,
|
|
MixHrtfParams *newparams, HrtfState *hrtfstate,
|
|
ALsizei BufferSize);
|
|
void MixDirectHrtf_Neon(ALfloat *restrict LeftOut, ALfloat *restrict RightOut,
|
|
const ALfloat *data, ALsizei Offset, const ALsizei IrSize,
|
|
const ALfloat (*restrict Coeffs)[2], ALfloat (*restrict Values)[2],
|
|
ALsizei BufferSize);
|
|
void Mix_Neon(const ALfloat *data, ALsizei OutChans, ALfloat (*restrict OutBuffer)[BUFFERSIZE],
|
|
ALfloat *CurrentGains, const ALfloat *TargetGains, ALsizei Counter, ALsizei OutPos,
|
|
ALsizei BufferSize);
|
|
void MixRow_Neon(ALfloat *OutBuffer, const ALfloat *Gains,
|
|
const ALfloat (*restrict data)[BUFFERSIZE], ALsizei InChans,
|
|
ALsizei InPos, ALsizei BufferSize);
|
|
|
|
/* Neon resamplers */
|
|
const ALfloat *Resample_lerp_Neon(const InterpState *state, const ALfloat *restrict src,
|
|
ALsizei frac, ALint increment, ALfloat *restrict dst,
|
|
ALsizei numsamples);
|
|
const ALfloat *Resample_bsinc_Neon(const InterpState *state, const ALfloat *restrict src,
|
|
ALsizei frac, ALint increment, ALfloat *restrict dst,
|
|
ALsizei dstlen);
|
|
|
|
#endif /* MIXER_DEFS_H */
|