Use a decode-encode method for ambisonic upsampling

This should allow for clearer and less diffuse responses. While a cube is in the blindspots for second-order, resulting in an identify transform for first- to-second-order, they do start contributing to third-order channels, which should make for sharper virtual points. The fixed HF scales should also play nicer with larger order upmixes.
2022-08-15 08:20:20 -07:00 · 2022-08-15 08:20:20 -07:00 · 6d5580805e
commit 6d5580805e
parent fbfa8a2686
3 changed files with 284 additions and 23 deletions
--- a/alc/alu.cpp
+++ b/alc/alu.cpp
@ -341,6 +341,101 @@ inline uint dither_rng(uint *seed) noexcept
 }


+/* Ambisonic upsampler functions. These are effectively matrix multiply
+ * operations. They take the 'coeffs' as the input matrix, and combine it with
+ * an "upsampler" matrix, resulting in a coefficient matrix that behaves as if
+ * the initial coefficients were applied to the B-Format input, which was then
+ * decoded to a speaker array at its input order, and finally encoded back into
+ * the higher order mix.
+ */
+void UpsampleFirstOrder(const al::span<std::array<float,MaxAmbiChannels>,MaxAmbiChannels> coeffs)
+{
+    auto transpose = [coeffs]() noexcept
+    {
+        std::array<std::array<float,4>,4> res{};
+        for(size_t i{0};i < 4;++i)
+        {
+            for(size_t j{0};j < 4;++j)
+                res[i][j] = coeffs[j][i];
+        }
+        return res;
+    };
+    const auto input = transpose();
+
+    static_assert(input[0].size() == AmbiScale::FirstOrderUp.size(),
+        "Mismatched first-order input and upsampler size");
+
+    for(size_t i{0};i < input.size();++i)
+    {
+        for(size_t j{0};j < AmbiScale::FirstOrderUp[0].size();++j)
+        {
+            double sum{0.0};
+            for(size_t k{0};k < input[0].size();++k)
+                sum += double{input[i][k]} * AmbiScale::FirstOrderUp[k][j];
+            coeffs[j][i] = static_cast<float>(sum);
+        }
+    }
+}
+
+void UpsampleSecondOrder(const al::span<std::array<float,MaxAmbiChannels>,MaxAmbiChannels> coeffs)
+{
+    auto transpose = [coeffs]() noexcept
+    {
+        std::array<std::array<float,9>,9> res{};
+        for(size_t i{0};i < 9;++i)
+        {
+            for(size_t j{0};j < 9;++j)
+                res[i][j] = coeffs[j][i];
+        }
+        return res;
+    };
+    const auto input = transpose();
+
+    static_assert(input[0].size() == AmbiScale::SecondOrderUp.size(),
+        "Mismatched second-order input and upsampler size");
+
+    for(size_t i{0};i < input.size();++i)
+    {
+        for(size_t j{0};j < AmbiScale::SecondOrderUp[0].size();++j)
+        {
+            double sum{0.0};
+            for(size_t k{0};k < input[0].size();++k)
+                sum += double{input[i][k]} * AmbiScale::SecondOrderUp[k][j];
+            coeffs[j][i] = static_cast<float>(sum);
+        }
+    }
+}
+
+void UpsampleThirdOrder(const al::span<std::array<float,MaxAmbiChannels>,MaxAmbiChannels> coeffs)
+{
+    auto transpose = [coeffs]() noexcept
+    {
+        std::array<std::array<float,16>,16> res{};
+        for(size_t i{0};i < 16;++i)
+        {
+            for(size_t j{0};j < 16;++j)
+                res[i][j] = coeffs[j][i];
+        }
+        return res;
+    };
+    const auto input = transpose();
+
+    static_assert(input[0].size() == AmbiScale::ThirdOrderUp.size(),
+        "Mismatched third-order input and upsampler size");
+
+    for(size_t i{0};i < input.size();++i)
+    {
+        for(size_t j{0};j < AmbiScale::ThirdOrderUp[0].size();++j)
+        {
+            double sum{0.0};
+            for(size_t k{0};k < input[0].size();++k)
+                sum += double{input[i][k]} * AmbiScale::ThirdOrderUp[k][j];
+            coeffs[j][i] = static_cast<float>(sum);
+        }
+    }
+}
+
+
 inline auto& GetAmbiScales(AmbiScaling scaletype) noexcept
 {
    switch(scaletype)
@ -872,6 +967,16 @@ void CalcPanningAndFilters(Voice *voice, const float xpos, const float ypos, con
            shrot[2][1] = -U[1]; shrot[2][2] =  V[1]; shrot[2][3] =  N[1];
            shrot[3][1] =  U[2]; shrot[3][2] = -V[2]; shrot[3][3] = -N[2];
            AmbiRotator(shrot, static_cast<int>(minu(voice->mAmbiOrder, Device->mAmbiOrder)));
+            /* If the device is higher order than the voice, "upsample" the matrix */
+            if(Device->mAmbiOrder > voice->mAmbiOrder)
+            {
+                if(voice->mAmbiOrder == 1)
+                    UpsampleFirstOrder(shrot);
+                else if(voice->mAmbiOrder == 2)
+                    UpsampleSecondOrder(shrot);
+                else if(voice->mAmbiOrder == 3)
+                    UpsampleThirdOrder(shrot);
+            }

            /* Convert the rotation matrix for input ordering and scaling, and
             * whether input is 2D or 3D.
@ -880,20 +985,16 @@ void CalcPanningAndFilters(Voice *voice, const float xpos, const float ypos, con
                GetAmbi2DLayout(voice->mAmbiLayout).data() :
                GetAmbiLayout(voice->mAmbiLayout).data()};

-            static const uint8_t ChansPerOrder[MaxAmbiOrder+1]{1, 3, 5, 7,};
            static const uint8_t OrderOffset[MaxAmbiOrder+1]{0, 1, 4, 9,};
            for(size_t c{1};c < num_channels;c++)
            {
                const size_t acn{index_map[c]};
                const size_t order{AmbiIndex::OrderFromChannel()[acn]};
-                const size_t tocopy{ChansPerOrder[order]};
-                const size_t offset{OrderOffset[order]};
                const float scale{scales[acn] * coverage};
-                auto in = shrot.cbegin() + offset;

                coeffs = std::array<float,MaxAmbiChannels>{};
-                for(size_t x{0};x < tocopy;++x)
-                    coeffs[offset+x] = in[x][acn] * scale;
+                for(size_t x{OrderOffset[order]};x < MaxAmbiChannels;++x)
+                    coeffs[x] = shrot[x][acn] * scale;

                ComputePanGains(&Device->Dry, coeffs.data(), DryGain.Base,
                    voice->mChans[c].mDryParams.Gains.Target);
--- a/core/ambidefs.cpp
+++ b/core/ambidefs.cpp
@ -5,21 +5,22 @@

 #include <cassert>

+#include "alnumbers.h"
+#include "opthelpers.h"
+

 namespace {

 constexpr std::array<float,MaxAmbiOrder+1> Ambi3DDecoderHFScale10{{
-    1.000000000e+00f, 5.773502692e-01f
+    2.000000000e+00f, 1.154700538e+00f
 }};
 constexpr std::array<float,MaxAmbiOrder+1> Ambi3DDecoderHFScale2O{{
-    9.128709292e-01f, 7.071067812e-01f, 3.651483717e-01f
+    1.972026594e+00f, 1.527525232e+00f, 7.888106377e-01f
 }};
+/* TODO: Set properly when making the third-order upsampler decoder. */
 constexpr std::array<float,MaxAmbiOrder+1> Ambi3DDecoderHFScale3O{{
-    8.340921354e-01f, 7.182670250e-01f, 5.107426573e-01f, 2.541870634e-01f
+    1.000000000e+00f, 1.000000000e+00f, 1.000000000e+00f, 1.000000000e+00f
 }};
-/*constexpr std::array<float,MaxAmbiOrder+1> Ambi3DDecoderHFScale4O{{
-    1.727324867e-02f, 3.238734126e-02f, 8.245277297e-02f, 2.360733547e-01f, 7.127761153e-01f
-}};*/

 inline auto& GetDecoderHFScales(uint order) noexcept
 {
@ -28,20 +29,175 @@ inline auto& GetDecoderHFScales(uint order) noexcept
    return Ambi3DDecoderHFScale10;
 }

+
+/* Copied from mixer.cpp. */
+constexpr auto CalcAmbiCoeffs(const float y, const float z, const float x)
+{
+    const float xx{x*x}, yy{y*y}, zz{z*z}, xy{x*y}, yz{y*z}, xz{x*z};
+
+    return std::array<float,MaxAmbiChannels>{{
+        /* Zeroth-order */
+        1.0f, /* ACN 0 = 1 */
+        /* First-order */
+        al::numbers::sqrt3_v<float> * y, /* ACN 1 = sqrt(3) * Y */
+        al::numbers::sqrt3_v<float> * z, /* ACN 2 = sqrt(3) * Z */
+        al::numbers::sqrt3_v<float> * x, /* ACN 3 = sqrt(3) * X */
+        /* Second-order */
+        3.872983346e+00f * xy,               /* ACN 4 = sqrt(15) * X * Y */
+        3.872983346e+00f * yz,               /* ACN 5 = sqrt(15) * Y * Z */
+        1.118033989e+00f * (3.0f*zz - 1.0f), /* ACN 6 = sqrt(5)/2 * (3*Z*Z - 1) */
+        3.872983346e+00f * xz,               /* ACN 7 = sqrt(15) * X * Z */
+        1.936491673e+00f * (xx - yy),        /* ACN 8 = sqrt(15)/2 * (X*X - Y*Y) */
+        /* Third-order */
+        2.091650066e+00f * (y*(3.0f*xx - yy)),   /* ACN  9 = sqrt(35/8) * Y * (3*X*X - Y*Y) */
+        1.024695076e+01f * (z*xy),               /* ACN 10 = sqrt(105) * Z * X * Y */
+        1.620185175e+00f * (y*(5.0f*zz - 1.0f)), /* ACN 11 = sqrt(21/8) * Y * (5*Z*Z - 1) */
+        1.322875656e+00f * (z*(5.0f*zz - 3.0f)), /* ACN 12 = sqrt(7)/2 * Z * (5*Z*Z - 3) */
+        1.620185175e+00f * (x*(5.0f*zz - 1.0f)), /* ACN 13 = sqrt(21/8) * X * (5*Z*Z - 1) */
+        5.123475383e+00f * (z*(xx - yy)),        /* ACN 14 = sqrt(105)/2 * Z * (X*X - Y*Y) */
+        2.091650066e+00f * (x*(xx - 3.0f*yy)),   /* ACN 15 = sqrt(35/8) * X * (X*X - 3*Y*Y) */
+        /* Fourth-order */
+        /* ACN 16 = sqrt(35)*3/2 * X * Y * (X*X - Y*Y) */
+        /* ACN 17 = sqrt(35/2)*3/2 * (3*X*X - Y*Y) * Y * Z */
+        /* ACN 18 = sqrt(5)*3/2 * X * Y * (7*Z*Z - 1) */
+        /* ACN 19 = sqrt(5/2)*3/2 * Y * Z * (7*Z*Z - 3)  */
+        /* ACN 20 = 3/8 * (35*Z*Z*Z*Z - 30*Z*Z + 3) */
+        /* ACN 21 = sqrt(5/2)*3/2 * X * Z * (7*Z*Z - 3) */
+        /* ACN 22 = sqrt(5)*3/4 * (X*X - Y*Y) * (7*Z*Z - 1) */
+        /* ACN 23 = sqrt(35/2)*3/2 * (X*X - 3*Y*Y) * X * Z */
+        /* ACN 24 = sqrt(35)*3/8 * (X*X*X*X - 6*X*X*Y*Y + Y*Y*Y*Y) */
+    }};
+}
+
+
+constexpr std::array<std::array<float,4>,8> FirstOrderDecoder{{
+    {{ 1.250000000e-01f,  1.250000000e-01f,  1.250000000e-01f,  1.250000000e-01f, }},
+    {{ 1.250000000e-01f,  1.250000000e-01f,  1.250000000e-01f, -1.250000000e-01f, }},
+    {{ 1.250000000e-01f, -1.250000000e-01f,  1.250000000e-01f,  1.250000000e-01f, }},
+    {{ 1.250000000e-01f, -1.250000000e-01f,  1.250000000e-01f, -1.250000000e-01f, }},
+    {{ 1.250000000e-01f,  1.250000000e-01f, -1.250000000e-01f,  1.250000000e-01f, }},
+    {{ 1.250000000e-01f,  1.250000000e-01f, -1.250000000e-01f, -1.250000000e-01f, }},
+    {{ 1.250000000e-01f, -1.250000000e-01f, -1.250000000e-01f,  1.250000000e-01f, }},
+    {{ 1.250000000e-01f, -1.250000000e-01f, -1.250000000e-01f, -1.250000000e-01f, }},
+}};
+
+constexpr std::array<std::array<float,MaxAmbiChannels>,8> FirstOrderEncoder{{
+    CalcAmbiCoeffs( 0.57735026919f,  0.57735026919f,  0.57735026919f),
+    CalcAmbiCoeffs( 0.57735026919f,  0.57735026919f, -0.57735026919f),
+    CalcAmbiCoeffs(-0.57735026919f,  0.57735026919f,  0.57735026919f),
+    CalcAmbiCoeffs(-0.57735026919f,  0.57735026919f, -0.57735026919f),
+    CalcAmbiCoeffs( 0.57735026919f, -0.57735026919f,  0.57735026919f),
+    CalcAmbiCoeffs( 0.57735026919f, -0.57735026919f, -0.57735026919f),
+    CalcAmbiCoeffs(-0.57735026919f, -0.57735026919f,  0.57735026919f),
+    CalcAmbiCoeffs(-0.57735026919f, -0.57735026919f, -0.57735026919f),
+}};
+static_assert(FirstOrderDecoder.size() == FirstOrderEncoder.size(), "First-order mismatch");
+
+/* This calculates a first-order "upsampler" matrix. It combines a first-order
+ * decoder matrix with a max-order encoder matrix, creating a matrix that
+ * behaves as if the B-Format input signal is first decoded to a speaker array
+ * at first-order, then those speaker feeds are encoded to a higher-order
+ * signal. While not perfect, this should accurately encode a lower-order
+ * signal into a higher-order signal.
+ */
+auto CalcFirstOrderUp()
+{
+    std::array<std::array<float,MaxAmbiChannels>,4> res{};
+
+    for(size_t i{0};i < FirstOrderDecoder[0].size();++i)
+    {
+        for(size_t j{0};j < FirstOrderEncoder[0].size();++j)
+        {
+            double sum{0.0};
+            for(size_t k{0};k < FirstOrderDecoder.size();++k)
+                sum += double{FirstOrderDecoder[k][i]} * FirstOrderEncoder[k][j];
+            res[i][j] = static_cast<float>(sum);
+        }
+    }
+
+    return res;
+}
+
+
+constexpr std::array<std::array<float,9>,14> SecondOrderDecoder{{
+    {{ 7.142857143e-02f,  0.000000000e+00f,  0.000000000e+00f,  1.237179148e-01f,  0.000000000e+00f,  0.000000000e+00f, -7.453559925e-02f,  0.000000000e+00f,  1.290994449e-01f, }},
+    {{ 7.142857143e-02f,  0.000000000e+00f,  0.000000000e+00f, -1.237179148e-01f,  0.000000000e+00f,  0.000000000e+00f, -7.453559925e-02f,  0.000000000e+00f,  1.290994449e-01f, }},
+    {{ 7.142857143e-02f,  1.237179148e-01f,  0.000000000e+00f,  0.000000000e+00f,  0.000000000e+00f,  0.000000000e+00f, -7.453559925e-02f,  0.000000000e+00f, -1.290994449e-01f, }},
+    {{ 7.142857143e-02f, -1.237179148e-01f,  0.000000000e+00f,  0.000000000e+00f,  0.000000000e+00f,  0.000000000e+00f, -7.453559925e-02f,  0.000000000e+00f, -1.290994449e-01f, }},
+    {{ 7.142857143e-02f,  0.000000000e+00f,  1.237179148e-01f,  0.000000000e+00f,  0.000000000e+00f,  0.000000000e+00f,  1.490711985e-01f,  0.000000000e+00f,  0.000000000e+00f, }},
+    {{ 7.142857143e-02f,  0.000000000e+00f, -1.237179148e-01f,  0.000000000e+00f,  0.000000000e+00f,  0.000000000e+00f,  1.490711985e-01f,  0.000000000e+00f,  0.000000000e+00f, }},
+    {{ 7.142857143e-02f,  7.142857143e-02f,  7.142857143e-02f,  7.142857143e-02f,  9.682458366e-02f,  9.682458366e-02f,  0.000000000e+00f,  9.682458366e-02f,  0.000000000e+00f, }},
+    {{ 7.142857143e-02f,  7.142857143e-02f,  7.142857143e-02f, -7.142857143e-02f, -9.682458366e-02f,  9.682458366e-02f,  0.000000000e+00f, -9.682458366e-02f,  0.000000000e+00f, }},
+    {{ 7.142857143e-02f, -7.142857143e-02f,  7.142857143e-02f,  7.142857143e-02f, -9.682458366e-02f, -9.682458366e-02f,  0.000000000e+00f,  9.682458366e-02f,  0.000000000e+00f, }},
+    {{ 7.142857143e-02f, -7.142857143e-02f,  7.142857143e-02f, -7.142857143e-02f,  9.682458366e-02f, -9.682458366e-02f,  0.000000000e+00f, -9.682458366e-02f,  0.000000000e+00f, }},
+    {{ 7.142857143e-02f,  7.142857143e-02f, -7.142857143e-02f,  7.142857143e-02f,  9.682458366e-02f, -9.682458366e-02f,  0.000000000e+00f, -9.682458366e-02f,  0.000000000e+00f, }},
+    {{ 7.142857143e-02f,  7.142857143e-02f, -7.142857143e-02f, -7.142857143e-02f, -9.682458366e-02f, -9.682458366e-02f,  0.000000000e+00f,  9.682458366e-02f,  0.000000000e+00f, }},
+    {{ 7.142857143e-02f, -7.142857143e-02f, -7.142857143e-02f,  7.142857143e-02f, -9.682458366e-02f,  9.682458366e-02f,  0.000000000e+00f, -9.682458366e-02f,  0.000000000e+00f, }},
+    {{ 7.142857143e-02f, -7.142857143e-02f, -7.142857143e-02f, -7.142857143e-02f,  9.682458366e-02f,  9.682458366e-02f,  0.000000000e+00f,  9.682458366e-02f,  0.000000000e+00f, }},
+}};
+
+constexpr std::array<std::array<float,MaxAmbiChannels>,14> SecondOrderEncoder{{
+    CalcAmbiCoeffs( 0.00000000000f,  0.00000000000f,  1.00000000000f),
+    CalcAmbiCoeffs( 0.00000000000f,  0.00000000000f, -1.00000000000f),
+    CalcAmbiCoeffs( 1.00000000000f,  0.00000000000f,  0.00000000000f),
+    CalcAmbiCoeffs(-1.00000000000f,  0.00000000000f,  0.00000000000f),
+    CalcAmbiCoeffs( 0.00000000000f,  1.00000000000f,  0.00000000000f),
+    CalcAmbiCoeffs( 0.00000000000f, -1.00000000000f,  0.00000000000f),
+    CalcAmbiCoeffs( 0.57735026919f,  0.57735026919f,  0.57735026919f),
+    CalcAmbiCoeffs( 0.57735026919f,  0.57735026919f, -0.57735026919f),
+    CalcAmbiCoeffs(-0.57735026919f,  0.57735026919f,  0.57735026919f),
+    CalcAmbiCoeffs(-0.57735026919f,  0.57735026919f, -0.57735026919f),
+    CalcAmbiCoeffs( 0.57735026919f, -0.57735026919f,  0.57735026919f),
+    CalcAmbiCoeffs( 0.57735026919f, -0.57735026919f, -0.57735026919f),
+    CalcAmbiCoeffs(-0.57735026919f, -0.57735026919f,  0.57735026919f),
+    CalcAmbiCoeffs(-0.57735026919f, -0.57735026919f, -0.57735026919f),
+}};
+static_assert(SecondOrderDecoder.size() == SecondOrderEncoder.size(), "Second-order mismatch");
+
+/* This calculates a second-order "upsampler" matrix. Same as the first-order
+ * matrix, just using a slightly more dense speaker array suitable for second-
+ * order content.
+ */
+auto CalcSecondOrderUp()
+{
+    std::array<std::array<float,MaxAmbiChannels>,9> res{};
+
+    for(size_t i{0};i < SecondOrderDecoder[0].size();++i)
+    {
+        for(size_t j{0};j < SecondOrderEncoder[0].size();++j)
+        {
+            double sum{0.0};
+            for(size_t k{0};k < SecondOrderDecoder.size();++k)
+                sum += double{SecondOrderDecoder[k][i]} * SecondOrderEncoder[k][j];
+            res[i][j] = static_cast<float>(sum);
+        }
+    }
+
+    return res;
+}
+
+/* TODO: When fourth-order is properly supported, fill this out. */
+auto CalcThirdOrderUp()
+{
+    std::array<std::array<float,MaxAmbiChannels>,16> res{};
+
+    for(size_t i{0};i < res.size();++i)
+        res[i][i] = 1.0f;
+
+    return res;
+}
+
 } // namespace

+const auto AmbiScale::FirstOrderUp{CalcFirstOrderUp()};
+const auto AmbiScale::SecondOrderUp{CalcSecondOrderUp()};
+const auto AmbiScale::ThirdOrderUp{CalcThirdOrderUp()};
+
+
 auto AmbiScale::GetHFOrderScales(const uint in_order, const uint out_order) noexcept
    -> std::array<float,MaxAmbiOrder+1>
 {
-    std::array<float,MaxAmbiOrder+1> ret{};
-
-    assert(out_order >= in_order);
-
-    const auto &target = GetDecoderHFScales(out_order);
-    const auto &input = GetDecoderHFScales(in_order);
-
-    for(size_t i{0};i < in_order+1;++i)
-        ret[i] = input[i] / target[i];
-
-    return ret;
+    if(unlikely(in_order >= out_order))
+        return {1.0f, 1.0f, 1.0f, 1.0f};
+    return GetDecoderHFScales(in_order);
 }
--- a/core/ambidefs.h
+++ b/core/ambidefs.h
@ -113,6 +113,10 @@ struct AmbiScale {
    /* Retrieves per-order HF scaling factors for "upsampling" ambisonic data. */
    static std::array<float,MaxAmbiOrder+1> GetHFOrderScales(const uint in_order,
        const uint out_order) noexcept;
+
+    static const std::array<std::array<float,MaxAmbiChannels>,4> FirstOrderUp;
+    static const std::array<std::array<float,MaxAmbiChannels>,9> SecondOrderUp;
+    static const std::array<std::array<float,MaxAmbiChannels>,16> ThirdOrderUp;
 };

 struct AmbiIndex {