aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorChris Robinson <[email protected]>2018-12-26 13:20:59 -0800
committerChris Robinson <[email protected]>2018-12-26 13:20:59 -0800
commit5c449de73f491a73cbc948b3301b8305f20be648 (patch)
tree9f790202d0096f399820ff189615f58990eef74a
parent3b9defa4afcbfa96b47cb528d91abb65416d4330 (diff)
Improve UHJ2 encoding
-rw-r--r--Alc/alu.cpp7
-rw-r--r--Alc/uhjfilter.cpp79
-rw-r--r--Alc/uhjfilter.h18
3 files changed, 51 insertions, 53 deletions
diff --git a/Alc/alu.cpp b/Alc/alu.cpp
index 861932c9..2490f0cb 100644
--- a/Alc/alu.cpp
+++ b/Alc/alu.cpp
@@ -169,10 +169,9 @@ void ProcessUhj(ALCdevice *device, ALsizei SamplesToDo)
const int ridx{(device->RealOut.ChannelName[1]==FrontRight) ? 1 : 0};
/* Encode to stereo-compatible 2-channel UHJ output. */
- EncodeUhj2(device->Uhj_Encoder.get(),
- device->RealOut.Buffer[lidx], device->RealOut.Buffer[ridx],
- device->Dry.Buffer, SamplesToDo
- );
+ Uhj2Encoder *uhj2enc{device->Uhj_Encoder.get()};
+ uhj2enc->encode(device->RealOut.Buffer[lidx], device->RealOut.Buffer[ridx],
+ device->Dry.Buffer, SamplesToDo);
}
void ProcessBs2b(ALCdevice *device, ALsizei SamplesToDo)
diff --git a/Alc/uhjfilter.cpp b/Alc/uhjfilter.cpp
index 4fae721f..1c5c836c 100644
--- a/Alc/uhjfilter.cpp
+++ b/Alc/uhjfilter.cpp
@@ -22,16 +22,13 @@ void allpass_process(AllPassState *state, ALfloat *RESTRICT dst, const ALfloat *
{
ALfloat z1 = state->z[0];
ALfloat z2 = state->z[1];
- ALsizei i;
-
- for(i = 0;i < todo;i++)
+ for(ALsizei i{0};i < todo;i++)
{
ALfloat input = src[i];
ALfloat output = input*aa + z1;
z1 = z2; z2 = output*aa - input;
dst[i] = output;
}
-
state->z[0] = z1;
state->z[1] = z2;
}
@@ -59,65 +56,67 @@ void allpass_process(AllPassState *state, ALfloat *RESTRICT dst, const ALfloat *
* know which is the intended result.
*/
-void EncodeUhj2(Uhj2Encoder *enc, ALfloat *RESTRICT LeftOut, ALfloat *RESTRICT RightOut, ALfloat (*RESTRICT InSamples)[BUFFERSIZE], ALsizei SamplesToDo)
+void Uhj2Encoder::encode(ALfloat *LeftOut, ALfloat *RightOut, ALfloat (*InSamples)[BUFFERSIZE], const ALsizei SamplesToDo)
{
- ALfloat D[MAX_UPDATE_SAMPLES], S[MAX_UPDATE_SAMPLES];
- ALfloat temp[2][MAX_UPDATE_SAMPLES];
- ALsizei base, i;
+ alignas(16) ALfloat D[MAX_UPDATE_SAMPLES], S[MAX_UPDATE_SAMPLES];
+ alignas(16) ALfloat temp[2][MAX_UPDATE_SAMPLES];
ASSUME(SamplesToDo > 0);
- for(base = 0;base < SamplesToDo;)
+ for(ALsizei base{0};base < SamplesToDo;)
{
ALsizei todo = mini(SamplesToDo - base, MAX_UPDATE_SAMPLES);
ASSUME(todo > 0);
/* D = 0.6554516*Y */
- for(i = 0;i < todo;i++)
- temp[0][i] = 0.6554516f*InSamples[2][base+i];
- allpass_process(&enc->Filter1_Y[0], temp[1], temp[0], Filter1CoeffSqr[0], todo);
- allpass_process(&enc->Filter1_Y[1], temp[0], temp[1], Filter1CoeffSqr[1], todo);
- allpass_process(&enc->Filter1_Y[2], temp[1], temp[0], Filter1CoeffSqr[2], todo);
- allpass_process(&enc->Filter1_Y[3], temp[0], temp[1], Filter1CoeffSqr[3], todo);
+ const ALfloat *RESTRICT input{al::assume_aligned<16>(InSamples[2]+base)};
+ for(ALsizei i{0};i < todo;i++)
+ temp[0][i] = 0.6554516f*input[i];
+ allpass_process(&mFilter1_Y[0], temp[1], temp[0], Filter1CoeffSqr[0], todo);
+ allpass_process(&mFilter1_Y[1], temp[0], temp[1], Filter1CoeffSqr[1], todo);
+ allpass_process(&mFilter1_Y[2], temp[1], temp[0], Filter1CoeffSqr[2], todo);
+ allpass_process(&mFilter1_Y[3], temp[0], temp[1], Filter1CoeffSqr[3], todo);
/* NOTE: Filter1 requires a 1 sample delay for the final output, so
* take the last processed sample from the previous run as the first
* output sample.
*/
- D[0] = enc->LastY;
- for(i = 1;i < todo;i++)
+ D[0] = mLastY;
+ for(ALsizei i{1};i < todo;i++)
D[i] = temp[0][i-1];
- enc->LastY = temp[0][i-1];
+ mLastY = temp[0][todo-1];
/* D += j(-0.3420201*W + 0.5098604*X) */
- for(i = 0;i < todo;i++)
- temp[0][i] = -0.3420201f*InSamples[0][base+i] +
- 0.5098604f*InSamples[1][base+i];
- allpass_process(&enc->Filter2_WX[0], temp[1], temp[0], Filter2CoeffSqr[0], todo);
- allpass_process(&enc->Filter2_WX[1], temp[0], temp[1], Filter2CoeffSqr[1], todo);
- allpass_process(&enc->Filter2_WX[2], temp[1], temp[0], Filter2CoeffSqr[2], todo);
- allpass_process(&enc->Filter2_WX[3], temp[0], temp[1], Filter2CoeffSqr[3], todo);
- for(i = 0;i < todo;i++)
+ const ALfloat *RESTRICT input0{al::assume_aligned<16>(InSamples[0]+base)};
+ const ALfloat *RESTRICT input1{al::assume_aligned<16>(InSamples[1]+base)};
+ for(ALsizei i{0};i < todo;i++)
+ temp[0][i] = -0.3420201f*input0[i] + 0.5098604f*input1[i];
+ allpass_process(&mFilter2_WX[0], temp[1], temp[0], Filter2CoeffSqr[0], todo);
+ allpass_process(&mFilter2_WX[1], temp[0], temp[1], Filter2CoeffSqr[1], todo);
+ allpass_process(&mFilter2_WX[2], temp[1], temp[0], Filter2CoeffSqr[2], todo);
+ allpass_process(&mFilter2_WX[3], temp[0], temp[1], Filter2CoeffSqr[3], todo);
+ for(ALsizei i{0};i < todo;i++)
D[i] += temp[0][i];
/* S = 0.9396926*W + 0.1855740*X */
- for(i = 0;i < todo;i++)
- temp[0][i] = 0.9396926f*InSamples[0][base+i] +
- 0.1855740f*InSamples[1][base+i];
- allpass_process(&enc->Filter1_WX[0], temp[1], temp[0], Filter1CoeffSqr[0], todo);
- allpass_process(&enc->Filter1_WX[1], temp[0], temp[1], Filter1CoeffSqr[1], todo);
- allpass_process(&enc->Filter1_WX[2], temp[1], temp[0], Filter1CoeffSqr[2], todo);
- allpass_process(&enc->Filter1_WX[3], temp[0], temp[1], Filter1CoeffSqr[3], todo);
- S[0] = enc->LastWX;
- for(i = 1;i < todo;i++)
+ for(ALsizei i{0};i < todo;i++)
+ temp[0][i] = 0.9396926f*input0[i] + 0.1855740f*input1[i];
+ allpass_process(&mFilter1_WX[0], temp[1], temp[0], Filter1CoeffSqr[0], todo);
+ allpass_process(&mFilter1_WX[1], temp[0], temp[1], Filter1CoeffSqr[1], todo);
+ allpass_process(&mFilter1_WX[2], temp[1], temp[0], Filter1CoeffSqr[2], todo);
+ allpass_process(&mFilter1_WX[3], temp[0], temp[1], Filter1CoeffSqr[3], todo);
+ S[0] = mLastWX;
+ for(ALsizei i{1};i < todo;i++)
S[i] = temp[0][i-1];
- enc->LastWX = temp[0][i-1];
+ mLastWX = temp[0][todo-1];
/* Left = (S + D)/2.0 */
- for(i = 0;i < todo;i++)
- *(LeftOut++) += (S[i] + D[i]) * 0.5f;
+ ALfloat *RESTRICT left = al::assume_aligned<16>(LeftOut+base);
+ for(ALsizei i{0};i < todo;i++)
+ left[i] += (S[i] + D[i]) * 0.5f;
/* Right = (S - D)/2.0 */
- for(i = 0;i < todo;i++)
- *(RightOut++) += (S[i] - D[i]) * 0.5f;
+ ALfloat *RESTRICT right = al::assume_aligned<16>(RightOut+base);
+ for(ALsizei i{0};i < todo;i++)
+ right[i] += (S[i] - D[i]) * 0.5f;
base += todo;
}
diff --git a/Alc/uhjfilter.h b/Alc/uhjfilter.h
index c6335af3..1351491b 100644
--- a/Alc/uhjfilter.h
+++ b/Alc/uhjfilter.h
@@ -37,17 +37,17 @@ struct AllPassState {
*/
struct Uhj2Encoder {
- AllPassState Filter1_Y[4];
- AllPassState Filter2_WX[4];
- AllPassState Filter1_WX[4];
- ALfloat LastY{0.0f}, LastWX{0.0f};
+ AllPassState mFilter1_Y[4];
+ AllPassState mFilter2_WX[4];
+ AllPassState mFilter1_WX[4];
+ ALfloat mLastY{0.0f}, mLastWX{0.0f};
+
+ /* Encodes a 2-channel UHJ (stereo-compatible) signal from a B-Format input
+ * signal. The input must use FuMa channel ordering and scaling.
+ */
+ void encode(ALfloat *LeftOut, ALfloat *RightOut, ALfloat (*InSamples)[BUFFERSIZE], const ALsizei SamplesToDo);
DEF_NEWDEL(Uhj2Encoder)
};
-/* Encodes a 2-channel UHJ (stereo-compatible) signal from a B-Format input
- * signal. The input must use FuMa channel ordering and scaling.
- */
-void EncodeUhj2(Uhj2Encoder *enc, ALfloat *RESTRICT LeftOut, ALfloat *RESTRICT RightOut, ALfloat (*RESTRICT InSamples)[BUFFERSIZE], ALsizei SamplesToDo);
-
#endif /* UHJFILTER_H */