alc/alu.cpp

   1 /**
   2  * OpenAL cross platform audio library
   3  * Copyright (C) 1999-2007 by authors.
   4  * This library is free software; you can redistribute it and/or
   5  *  modify it under the terms of the GNU Library General Public
   6  *  License as published by the Free Software Foundation; either
   7  *  version 2 of the License, or (at your option) any later version.
   8  *
   9  * This library is distributed in the hope that it will be useful,
  10  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  11  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  12  *  Library General Public License for more details.
  13  *
  14  * You should have received a copy of the GNU Library General Public
  15  *  License along with this library; if not, write to the
  16  *  Free Software Foundation, Inc.,
  17  *  51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
  18  * Or go to http://www.gnu.org/copyleft/lgpl.html
  19  */
  20
  21 #include "config.h"
  22
  23 #include "alu.h"
  24
  25 #include <algorithm>
  26 #include <array>
  27 #include <atomic>
  28 #include <cassert>
  29 #include <chrono>
  30 #include <climits>
  31 #include <cstdarg>
  32 #include <cstdio>
  33 #include <cstdlib>
  34 #include <functional>
  35 #include <iterator>
  36 #include <limits>
  37 #include <memory>
  38 #include <new>
  39 #include <stdint.h>
  40 #include <utility>
  41
  42 #include "almalloc.h"
  43 #include "alnumbers.h"
  44 #include "alnumeric.h"
  45 #include "alspan.h"
  46 #include "alstring.h"
  47 #include "atomic.h"
  48 #include "core/ambidefs.h"
  49 #include "core/async_event.h"
  50 #include "core/bformatdec.h"
  51 #include "core/bs2b.h"
  52 #include "core/bsinc_defs.h"
  53 #include "core/bsinc_tables.h"
  54 #include "core/bufferline.h"
  55 #include "core/buffer_storage.h"
  56 #include "core/context.h"
  57 #include "core/cpu_caps.h"
  58 #include "core/devformat.h"
  59 #include "core/device.h"
  60 #include "core/effects/base.h"
  61 #include "core/effectslot.h"
  62 #include "core/filters/biquad.h"
  63 #include "core/filters/nfc.h"
  64 #include "core/fpu_ctrl.h"
  65 #include "core/hrtf.h"
  66 #include "core/mastering.h"
  67 #include "core/mixer.h"
  68 #include "core/mixer/defs.h"
  69 #include "core/mixer/hrtfdefs.h"
  70 #include "core/resampler_limits.h"
  71 #include "core/uhjfilter.h"
  72 #include "core/voice.h"
  73 #include "core/voice_change.h"
  74 #include "intrusive_ptr.h"
  75 #include "opthelpers.h"
  76 #include "ringbuffer.h"
  77 #include "strutils.h"
  78 #include "threads.h"
  79 #include "vecmat.h"
  80 #include "vector.h"
  81
/* Forward declarations of the tag types used purely as template arguments to
 * pick a mixer or resampler implementation (e.g. MixDirectHrtf_<CTag> and
 * Resample_<LerpTag,SSE2Tag> further down). The instruction-set tags are only
 * declared when the matching HAVE_* macro is defined.
 */
struct CTag;
#ifdef HAVE_SSE
struct SSETag;
#endif
#ifdef HAVE_SSE2
struct SSE2Tag;
#endif
#ifdef HAVE_SSE4_1
struct SSE4Tag;
#endif
#ifdef HAVE_NEON
struct NEONTag;
#endif
/* Tags naming the resampling method (first template argument of Resample_). */
struct PointTag;
struct LerpTag;
struct CubicTag;
struct BSincTag;
struct FastBSincTag;
 100
 101
 102 static_assert(!(MaxResamplerPadding&1), "MaxResamplerPadding is not a multiple of two");
 103
 104
 105 namespace {
 106
using uint = unsigned int;
using namespace std::chrono;

/* Pitch limit that the static_asserts below check against BufferLineSize and
 * the fixed-point fraction width. NOTE(review): the code consuming this
 * constant is outside the visible part of the file.
 */
constexpr uint MaxPitch{10};

/* Compile-time sanity checks tying MaxPitch to BufferLineSize and to the
 * range left in an int after MixerFracBits fractional bits.
 */
static_assert((BufferLineSize-1)/MaxPitch > 0, "MaxPitch is too large for BufferLineSize!");
static_assert((INT_MAX>>MixerFracBits)/MaxPitch > BufferLineSize,
    "MaxPitch and/or BufferLineSize are too large for MixerFracBits!");

/* Provides the _1 placeholder used with std::bind later in this file. */
using namespace std::placeholders;
 117
 118 float InitConeScale()
 119 {
 120     float ret{1.0f};
 121     if(auto optval = al::getenv("__ALSOFT_HALF_ANGLE_CONES"))
 122     {
 123         if(al::strcasecmp(optval->c_str(), "true") == 0
 124             || strtol(optval->c_str(), nullptr, 0) == 1)
 125             ret *= 0.5f;
 126     }
 127     return ret;
 128 }
 129 /* Cone scalar */
 130 const float ConeScale{InitConeScale()};
 131
/* Localized scalars for mono sources (initialized in aluInit, after
 * configuration is loaded). aluInit sets each one to -1 when the matching
 * CompatFlags::Reverse{X,Y,Z} flag is set, and to +1 otherwise.
 */
float XScale{1.0f};
float YScale{1.0f};
float ZScale{1.0f};

/* Source distance scale for NFC filters. aluInit stores the requested scale
 * here after clamping it to the range [0.0001, 10000].
 */
float NfcScale{1.0f};
 141
 142
 143 struct ChanMap {
 144     Channel channel;
 145     float angle;
 146     float elevation;
 147 };
 148
/* Signature shared by the MixDirectHrtf_<Tag> implementations. */
using HrtfDirectMixerFunc = void(*)(const FloatBufferSpan LeftOut, const FloatBufferSpan RightOut,
    const al::span<const FloatBufferLine> InSamples, float2 *AccumSamples, float *TempBuf,
    HrtfChannelState *ChanState, const size_t IrSize, const size_t BufferSize);

/* The direct HRTF mixer in use. It starts out as the plain C implementation
 * and is replaced in aluInit with whatever SelectHrtfMixer returns.
 */
HrtfDirectMixerFunc MixDirectHrtf{MixDirectHrtf_<CTag>};
 154
 155 inline HrtfDirectMixerFunc SelectHrtfMixer(void)
 156 {
 157 #ifdef HAVE_NEON
 158     if((CPUCapFlags&CPU_CAP_NEON))
 159         return MixDirectHrtf_<NEONTag>;
 160 #endif
 161 #ifdef HAVE_SSE
 162     if((CPUCapFlags&CPU_CAP_SSE))
 163         return MixDirectHrtf_<SSETag>;
 164 #endif
 165
 166     return MixDirectHrtf_<CTag>;
 167 }
 168
 169
 170 inline void BsincPrepare(const uint increment, BsincState *state, const BSincTable *table)
 171 {
 172     size_t si{BSincScaleCount - 1};
 173     float sf{0.0f};
 174
 175     if(increment > MixerFracOne)
 176     {
 177         sf = MixerFracOne/static_cast<float>(increment) - table->scaleBase;
 178         sf = maxf(0.0f, BSincScaleCount*sf*table->scaleRange - 1.0f);
 179         si = float2uint(sf);
 180         /* The interpolation factor is fit to this diagonally-symmetric curve
 181          * to reduce the transition ripple caused by interpolating different
 182          * scales of the sinc function.
 183          */
 184         sf = 1.0f - std::cos(std::asin(sf - static_cast<float>(si)));
 185     }
 186
 187     state->sf = sf;
 188     state->m = table->m[si];
 189     state->l = (state->m/2) - 1;
 190     state->filter = table->Tab + table->filterOffset[si];
 191 }
 192
 193 inline ResamplerFunc SelectResampler(Resampler resampler, uint increment)
 194 {
 195     switch(resampler)
 196     {
 197     case Resampler::Point:
 198         return Resample_<PointTag,CTag>;
 199     case Resampler::Linear:
 200 #ifdef HAVE_NEON
 201         if((CPUCapFlags&CPU_CAP_NEON))
 202             return Resample_<LerpTag,NEONTag>;
 203 #endif
 204 #ifdef HAVE_SSE4_1
 205         if((CPUCapFlags&CPU_CAP_SSE4_1))
 206             return Resample_<LerpTag,SSE4Tag>;
 207 #endif
 208 #ifdef HAVE_SSE2
 209         if((CPUCapFlags&CPU_CAP_SSE2))
 210             return Resample_<LerpTag,SSE2Tag>;
 211 #endif
 212         return Resample_<LerpTag,CTag>;
 213     case Resampler::Cubic:
 214         return Resample_<CubicTag,CTag>;
 215     case Resampler::BSinc12:
 216     case Resampler::BSinc24:
 217         if(increment > MixerFracOne)
 218         {
 219 #ifdef HAVE_NEON
 220             if((CPUCapFlags&CPU_CAP_NEON))
 221                 return Resample_<BSincTag,NEONTag>;
 222 #endif
 223 #ifdef HAVE_SSE
 224             if((CPUCapFlags&CPU_CAP_SSE))
 225                 return Resample_<BSincTag,SSETag>;
 226 #endif
 227             return Resample_<BSincTag,CTag>;
 228         }
 229         /* fall-through */
 230     case Resampler::FastBSinc12:
 231     case Resampler::FastBSinc24:
 232 #ifdef HAVE_NEON
 233         if((CPUCapFlags&CPU_CAP_NEON))
 234             return Resample_<FastBSincTag,NEONTag>;
 235 #endif
 236 #ifdef HAVE_SSE
 237         if((CPUCapFlags&CPU_CAP_SSE))
 238             return Resample_<FastBSincTag,SSETag>;
 239 #endif
 240         return Resample_<FastBSincTag,CTag>;
 241     }
 242
 243     return Resample_<PointTag,CTag>;
 244 }
 245
 246 } // namespace
 247
 248 void aluInit(CompatFlagBitset flags, const float nfcscale)
 249 {
 250     MixDirectHrtf = SelectHrtfMixer();
 251     XScale = flags.test(CompatFlags::ReverseX) ? -1.0f : 1.0f;
 252     YScale = flags.test(CompatFlags::ReverseY) ? -1.0f : 1.0f;
 253     ZScale = flags.test(CompatFlags::ReverseZ) ? -1.0f : 1.0f;
 254
 255     NfcScale = clampf(nfcscale, 0.0001f, 10000.0f);
 256 }
 257
 258
 259 ResamplerFunc PrepareResampler(Resampler resampler, uint increment, InterpState *state)
 260 {
 261     switch(resampler)
 262     {
 263     case Resampler::Point:
 264     case Resampler::Linear:
 265     case Resampler::Cubic:
 266         break;
 267     case Resampler::FastBSinc12:
 268     case Resampler::BSinc12:
 269         BsincPrepare(increment, &state->bsinc, &bsinc12);
 270         break;
 271     case Resampler::FastBSinc24:
 272     case Resampler::BSinc24:
 273         BsincPrepare(increment, &state->bsinc, &bsinc24);
 274         break;
 275     }
 276     return SelectResampler(resampler, increment);
 277 }
 278
 279
 280 void DeviceBase::ProcessHrtf(const size_t SamplesToDo)
 281 {
 282     /* HRTF is stereo output only. */
 283     const uint lidx{RealOut.ChannelIndex[FrontLeft]};
 284     const uint ridx{RealOut.ChannelIndex[FrontRight]};
 285
 286     MixDirectHrtf(RealOut.Buffer[lidx], RealOut.Buffer[ridx], Dry.Buffer, HrtfAccumData,
 287         mHrtfState->mTemp.data(), mHrtfState->mChannels.data(), mHrtfState->mIrSize, SamplesToDo);
 288 }
 289
 290 void DeviceBase::ProcessAmbiDec(const size_t SamplesToDo)
 291 {
 292     AmbiDecoder->process(RealOut.Buffer, Dry.Buffer.data(), SamplesToDo);
 293 }
 294
 295 void DeviceBase::ProcessAmbiDecStablized(const size_t SamplesToDo)
 296 {
 297     /* Decode with front image stablization. */
 298     const uint lidx{RealOut.ChannelIndex[FrontLeft]};
 299     const uint ridx{RealOut.ChannelIndex[FrontRight]};
 300     const uint cidx{RealOut.ChannelIndex[FrontCenter]};
 301
 302     AmbiDecoder->processStablize(RealOut.Buffer, Dry.Buffer.data(), lidx, ridx, cidx,
 303         SamplesToDo);
 304 }
 305
 306 void DeviceBase::ProcessUhj(const size_t SamplesToDo)
 307 {
 308     /* UHJ is stereo output only. */
 309     const uint lidx{RealOut.ChannelIndex[FrontLeft]};
 310     const uint ridx{RealOut.ChannelIndex[FrontRight]};
 311
 312     /* Encode to stereo-compatible 2-channel UHJ output. */
 313     mUhjEncoder->encode(RealOut.Buffer[lidx].data(), RealOut.Buffer[ridx].data(),
 314         {{Dry.Buffer[0].data(), Dry.Buffer[1].data(), Dry.Buffer[2].data()}}, SamplesToDo);
 315 }
 316
 317 void DeviceBase::ProcessBs2b(const size_t SamplesToDo)
 318 {
 319     /* First, decode the ambisonic mix to the "real" output. */
 320     AmbiDecoder->process(RealOut.Buffer, Dry.Buffer.data(), SamplesToDo);
 321
 322     /* BS2B is stereo output only. */
 323     const uint lidx{RealOut.ChannelIndex[FrontLeft]};
 324     const uint ridx{RealOut.ChannelIndex[FrontRight]};
 325
 326     /* Now apply the BS2B binaural/crossfeed filter. */
 327     bs2b_cross_feed(Bs2b.get(), RealOut.Buffer[lidx].data(), RealOut.Buffer[ridx].data(),
 328         SamplesToDo);
 329 }
 330
 331
 332 namespace {
 333
 334 /* This RNG method was created based on the math found in opusdec. It's quick,
 335  * and starting with a seed value of 22222, is suitable for generating
 336  * whitenoise.
 337  */
 338 inline uint dither_rng(uint *seed) noexcept
 339 {
 340     *seed = (*seed * 96314165) + 907633515;
 341     return *seed;
 342 }
 343
 344
 345 /* Ambisonic upsampler function. It's effectively a matrix multiply. It takes
 346  * an 'upsampler' and 'rotator' as the input matrices, resulting in a matrix
 347  * that behaves as if the B-Format input was first decoded to a speaker array
 348  * at its input order, encoded back into the higher order mix, then finally
 349  * rotated.
 350  */
 351 void UpsampleBFormatTransform(size_t coeffs_order,
 352     const al::span<const std::array<float,MaxAmbiChannels>> matrix1,
 353     const al::span<std::array<float,MaxAmbiChannels>,MaxAmbiChannels> coeffs)
 354 {
 355     auto copy_coeffs = [coeffs]() noexcept
 356     {
 357         std::array<std::array<float,MaxAmbiChannels>,MaxAmbiChannels> res{};
 358         for(size_t i{0};i < MaxAmbiChannels;++i)
 359             res[i] = coeffs[i];
 360         return res;
 361     };
 362     const auto matrix2 = copy_coeffs();
 363
 364     const size_t num_chans{AmbiChannelsFromOrder(coeffs_order)};
 365     for(size_t i{0};i < matrix1.size();++i)
 366     {
 367         for(size_t j{0};j < num_chans;++j)
 368         {
 369             double sum{0.0};
 370             for(size_t k{0};k < num_chans;++k)
 371                 sum += double{matrix1[i][k]} * matrix2[j][k];
 372             coeffs[j][i] = static_cast<float>(sum);
 373         }
 374     }
 375 }
 376
 377
 378 inline auto& GetAmbiScales(AmbiScaling scaletype) noexcept
 379 {
 380     switch(scaletype)
 381     {
 382     case AmbiScaling::FuMa: return AmbiScale::FromFuMa();
 383     case AmbiScaling::SN3D: return AmbiScale::FromSN3D();
 384     case AmbiScaling::UHJ: return AmbiScale::FromUHJ();
 385     case AmbiScaling::N3D: break;
 386     }
 387     return AmbiScale::FromN3D();
 388 }
 389
 390 inline auto& GetAmbiLayout(AmbiLayout layouttype) noexcept
 391 {
 392     if(layouttype == AmbiLayout::FuMa) return AmbiIndex::FromFuMa();
 393     return AmbiIndex::FromACN();
 394 }
 395
 396 inline auto& GetAmbi2DLayout(AmbiLayout layouttype) noexcept
 397 {
 398     if(layouttype == AmbiLayout::FuMa) return AmbiIndex::FromFuMa2D();
 399     return AmbiIndex::FromACN2D();
 400 }
 401
 402
 403 bool CalcContextParams(ContextBase *ctx)
 404 {
 405     ContextProps *props{ctx->mParams.ContextUpdate.exchange(nullptr, std::memory_order_acq_rel)};
 406     if(!props) return false;
 407
 408     const alu::Vector pos{props->Position[0], props->Position[1], props->Position[2], 1.0f};
 409     ctx->mParams.Position = pos;
 410
 411     /* AT then UP */
 412     alu::Vector N{props->OrientAt[0], props->OrientAt[1], props->OrientAt[2], 0.0f};
 413     N.normalize();
 414     alu::Vector V{props->OrientUp[0], props->OrientUp[1], props->OrientUp[2], 0.0f};
 415     V.normalize();
 416     /* Build and normalize right-vector */
 417     alu::Vector U{N.cross_product(V)};
 418     U.normalize();
 419
 420     const alu::Matrix rot{
 421         U[0], V[0], -N[0], 0.0,
 422         U[1], V[1], -N[1], 0.0,
 423         U[2], V[2], -N[2], 0.0,
 424          0.0,  0.0,   0.0, 1.0};
 425     const alu::Vector vel{props->Velocity[0], props->Velocity[1], props->Velocity[2], 0.0};
 426
 427     ctx->mParams.Matrix = rot;
 428     ctx->mParams.Velocity = rot * vel;
 429
 430     ctx->mParams.Gain = props->Gain * ctx->mGainBoost;
 431     ctx->mParams.MetersPerUnit = props->MetersPerUnit;
 432     ctx->mParams.AirAbsorptionGainHF = props->AirAbsorptionGainHF;
 433
 434     ctx->mParams.DopplerFactor = props->DopplerFactor;
 435     ctx->mParams.SpeedOfSound = props->SpeedOfSound * props->DopplerVelocity;
 436
 437     ctx->mParams.SourceDistanceModel = props->SourceDistanceModel;
 438     ctx->mParams.mDistanceModel = props->mDistanceModel;
 439
 440     AtomicReplaceHead(ctx->mFreeContextProps, props);
 441     return true;
 442 }
 443
 444 bool CalcEffectSlotParams(EffectSlot *slot, EffectSlot **sorted_slots, ContextBase *context)
 445 {
 446     EffectSlotProps *props{slot->Update.exchange(nullptr, std::memory_order_acq_rel)};
 447     if(!props) return false;
 448
 449     /* If the effect slot target changed, clear the first sorted entry to force
 450      * a re-sort.
 451      */
 452     if(slot->Target != props->Target)
 453         *sorted_slots = nullptr;
 454     slot->Gain = props->Gain;
 455     slot->AuxSendAuto = props->AuxSendAuto;
 456     slot->Target = props->Target;
 457     slot->EffectType = props->Type;
 458     slot->mEffectProps = props->Props;
 459     if(props->Type == EffectSlotType::Reverb || props->Type == EffectSlotType::EAXReverb)
 460     {
 461         slot->RoomRolloff = props->Props.Reverb.RoomRolloffFactor;
 462         slot->DecayTime = props->Props.Reverb.DecayTime;
 463         slot->DecayLFRatio = props->Props.Reverb.DecayLFRatio;
 464         slot->DecayHFRatio = props->Props.Reverb.DecayHFRatio;
 465         slot->DecayHFLimit = props->Props.Reverb.DecayHFLimit;
 466         slot->AirAbsorptionGainHF = props->Props.Reverb.AirAbsorptionGainHF;
 467     }
 468     else
 469     {
 470         slot->RoomRolloff = 0.0f;
 471         slot->DecayTime = 0.0f;
 472         slot->DecayLFRatio = 0.0f;
 473         slot->DecayHFRatio = 0.0f;
 474         slot->DecayHFLimit = false;
 475         slot->AirAbsorptionGainHF = 1.0f;
 476     }
 477
 478     EffectState *state{props->State.release()};
 479     EffectState *oldstate{slot->mEffectState.release()};
 480     slot->mEffectState.reset(state);
 481
 482     /* Only release the old state if it won't get deleted, since we can't be
 483      * deleting/freeing anything in the mixer.
 484      */
 485     if(!oldstate->releaseIfNoDelete())
 486     {
 487         /* Otherwise, if it would be deleted send it off with a release event. */
 488         RingBuffer *ring{context->mAsyncEvents.get()};
 489         auto evt_vec = ring->getWriteVector();
 490         if(evt_vec.first.len > 0) [[likely]]
 491         {
 492             AsyncEvent *evt{al::construct_at(reinterpret_cast<AsyncEvent*>(evt_vec.first.buf),
 493                 AsyncEvent::ReleaseEffectState)};
 494             evt->u.mEffectState = oldstate;
 495             ring->writeAdvance(1);
 496         }
 497         else
 498         {
 499             /* If writing the event failed, the queue was probably full. Store
 500              * the old state in the property object where it can eventually be
 501              * cleaned up sometime later (not ideal, but better than blocking
 502              * or leaking).
 503              */
 504             props->State.reset(oldstate);
 505         }
 506     }
 507
 508     AtomicReplaceHead(context->mFreeEffectslotProps, props);
 509
 510     EffectTarget output;
 511     if(EffectSlot *target{slot->Target})
 512         output = EffectTarget{&target->Wet, nullptr};
 513     else
 514     {
 515         DeviceBase *device{context->mDevice};
 516         output = EffectTarget{&device->Dry, &device->RealOut};
 517     }
 518     state->update(context, slot, &slot->mEffectProps, output);
 519     return true;
 520 }
 521
 522
 523 /* Scales the given azimuth toward the side (+/- pi/2 radians) for positions in
 524  * front.
 525  */
 526 inline float ScaleAzimuthFront(float azimuth, float scale)
 527 {
 528     const float abs_azi{std::fabs(azimuth)};
 529     if(!(abs_azi >= al::numbers::pi_v<float>*0.5f))
 530         return std::copysign(minf(abs_azi*scale, al::numbers::pi_v<float>*0.5f), azimuth);
 531     return azimuth;
 532 }
 533
 534 /* Wraps the given value in radians to stay between [-pi,+pi] */
 535 inline float WrapRadians(float r)
 536 {
 537     static constexpr float Pi{al::numbers::pi_v<float>};
 538     static constexpr float Pi2{Pi*2.0f};
 539     if(r >  Pi) return std::fmod(Pi+r, Pi2) - Pi;
 540     if(r < -Pi) return Pi - std::fmod(Pi-r, Pi2);
 541     return r;
 542 }
 543
 544 /* Begin ambisonic rotation helpers.
 545  *
 546  * Rotating first-order B-Format just needs a straight-forward X/Y/Z rotation
 547  * matrix. Higher orders, however, are more complicated. The method implemented
 548  * here is a recursive algorithm (the rotation for first-order is used to help
 549  * generate the second-order rotation, which helps generate the third-order
 550  * rotation, etc).
 551  *
 552  * Adapted from
 553  * <https://github.com/polarch/Spherical-Harmonic-Transform/blob/master/getSHrotMtx.m>,
 554  * provided under the BSD 3-Clause license.
 555  *
 556  * Copyright (c) 2015, Archontis Politis
 557  * Copyright (c) 2019, Christopher Robinson
 558  *
 559  * The u, v, and w coefficients used for generating higher-order rotations are
 560  * precomputed since they're constant. The second-order coefficients are
 561  * followed by the third-order coefficients, etc.
 562  */
 563 template<size_t L>
 564 constexpr size_t CalcRotatorSize()
 565 { return (L*2 + 1)*(L*2 + 1) + CalcRotatorSize<L-1>(); }
 566
 567 template<> constexpr size_t CalcRotatorSize<0>() = delete;
 568 template<> constexpr size_t CalcRotatorSize<1>() = delete;
 569 template<> constexpr size_t CalcRotatorSize<2>() { return 5*5; }
 570
 571 struct RotatorCoeffs {
 572     struct CoeffValues {
 573         float u, v, w;
 574     };
 575     std::array<CoeffValues,CalcRotatorSize<MaxAmbiOrder>()> mCoeffs{};
 576
 577     RotatorCoeffs()
 578     {
 579         auto coeffs = mCoeffs.begin();
 580
 581         for(int l=2;l <= MaxAmbiOrder;++l)
 582         {
 583             for(int m{-l};m <= l;++m)
 584             {
 585                 for(int n{-l};n <= l;++n)
 586                 {
 587                     // compute u,v,w terms of Eq.8.1 (Table I)
 588                     const bool d{m == 0}; // the delta function d_m0
 589                     const float denom{static_cast<float>((std::abs(n) == l) ?
 590                         (2*l) * (2*l - 1) : (l*l - n*n))};
 591
 592                     const int abs_m{std::abs(m)};
 593                     coeffs->u = std::sqrt(static_cast<float>(l*l - m*m)/denom);
 594                     coeffs->v = std::sqrt(static_cast<float>(l+abs_m-1) *
 595                         static_cast<float>(l+abs_m) / denom) * (1.0f+d) * (1.0f - 2.0f*d) * 0.5f;
 596                     coeffs->w = std::sqrt(static_cast<float>(l-abs_m-1) *
 597                         static_cast<float>(l-abs_m) / denom) * (1.0f-d) * -0.5f;
 598                     ++coeffs;
 599                 }
 600             }
 601         }
 602     }
 603 };
 604 const RotatorCoeffs RotatorCoeffArray{};
 605
 606 /**
 607  * Given the matrix, pre-filled with the (zeroth- and) first-order rotation
 608  * coefficients, this fills in the coefficients for the higher orders up to and
 609  * including the given order. The matrix is in ACN layout.
 610  */
 611 void AmbiRotator(AmbiRotateMatrix &matrix, const int order)
 612 {
 613     /* Don't do anything for < 2nd order. */
 614     if(order < 2) return;
 615
 616     auto P = [](const int i, const int l, const int a, const int n, const size_t last_band,
 617         const AmbiRotateMatrix &R)
 618     {
 619         const float ri1{ R[static_cast<uint>(i+2)][ 1+2]};
 620         const float rim1{R[static_cast<uint>(i+2)][-1+2]};
 621         const float ri0{ R[static_cast<uint>(i+2)][ 0+2]};
 622
 623         auto vec = R[static_cast<uint>(a+l-1) + last_band].cbegin() + last_band;
 624         if(n == -l)
 625             return ri1*vec[0] + rim1*vec[static_cast<uint>(l-1)*size_t{2}];
 626         if(n == l)
 627             return ri1*vec[static_cast<uint>(l-1)*size_t{2}] - rim1*vec[0];
 628         return ri0*vec[static_cast<uint>(n+l-1)];
 629     };
 630
 631     auto U = [P](const int l, const int m, const int n, const size_t last_band,
 632         const AmbiRotateMatrix &R)
 633     {
 634         return P(0, l, m, n, last_band, R);
 635     };
 636     auto V = [P](const int l, const int m, const int n, const size_t last_band,
 637         const AmbiRotateMatrix &R)
 638     {
 639         using namespace al::numbers;
 640         if(m > 0)
 641         {
 642             const bool d{m == 1};
 643             const float p0{P( 1, l,  m-1, n, last_band, R)};
 644             const float p1{P(-1, l, -m+1, n, last_band, R)};
 645             return d ? p0*sqrt2_v<float> : (p0 - p1);
 646         }
 647         const bool d{m == -1};
 648         const float p0{P( 1, l,  m+1, n, last_band, R)};
 649         const float p1{P(-1, l, -m-1, n, last_band, R)};
 650         return d ? p1*sqrt2_v<float> : (p0 + p1);
 651     };
 652     auto W = [P](const int l, const int m, const int n, const size_t last_band,
 653         const AmbiRotateMatrix &R)
 654     {
 655         assert(m != 0);
 656         if(m > 0)
 657         {
 658             const float p0{P( 1, l,  m+1, n, last_band, R)};
 659             const float p1{P(-1, l, -m-1, n, last_band, R)};
 660             return p0 + p1;
 661         }
 662         const float p0{P( 1, l,  m-1, n, last_band, R)};
 663         const float p1{P(-1, l, -m+1, n, last_band, R)};
 664         return p0 - p1;
 665     };
 666
 667     // compute rotation matrix of each subsequent band recursively
 668     auto coeffs = RotatorCoeffArray.mCoeffs.cbegin();
 669     size_t band_idx{4}, last_band{1};
 670     for(int l{2};l <= order;++l)
 671     {
 672         size_t y{band_idx};
 673         for(int m{-l};m <= l;++m,++y)
 674         {
 675             size_t x{band_idx};
 676             for(int n{-l};n <= l;++n,++x)
 677             {
 678                 float r{0.0f};
 679
 680                 // computes Eq.8.1
 681                 const float u{coeffs->u};
 682                 if(u != 0.0f) r += u * U(l, m, n, last_band, matrix);
 683                 const float v{coeffs->v};
 684                 if(v != 0.0f) r += v * V(l, m, n, last_band, matrix);
 685                 const float w{coeffs->w};
 686                 if(w != 0.0f) r += w * W(l, m, n, last_band, matrix);
 687
 688                 matrix[y][x] = r;
 689                 ++coeffs;
 690             }
 691         }
 692         last_band = band_idx;
 693         band_idx += static_cast<uint>(l)*size_t{2} + 1;
 694     }
 695 }
 696 /* End ambisonic rotation helpers. */
 697
 698
 699 constexpr float Deg2Rad(float x) noexcept
 700 { return static_cast<float>(al::numbers::pi / 180.0 * x); }
 701
 702 struct GainTriplet { float Base, HF, LF; };
 703
 704 void CalcPanningAndFilters(Voice *voice, const float xpos, const float ypos, const float zpos,
 705     const float Distance, const float Spread, const GainTriplet &DryGain,
 706     const al::span<const GainTriplet,MAX_SENDS> WetGain, EffectSlot *(&SendSlots)[MAX_SENDS],
 707     const VoiceProps *props, const ContextParams &Context, DeviceBase *Device)
 708 {
 709     static constexpr ChanMap MonoMap[1]{
 710         { FrontCenter, 0.0f, 0.0f }
 711     }, RearMap[2]{
 712         { BackLeft,  Deg2Rad(-150.0f), Deg2Rad(0.0f) },
 713         { BackRight, Deg2Rad( 150.0f), Deg2Rad(0.0f) }
 714     }, QuadMap[4]{
 715         { FrontLeft,  Deg2Rad( -45.0f), Deg2Rad(0.0f) },
 716         { FrontRight, Deg2Rad(  45.0f), Deg2Rad(0.0f) },
 717         { BackLeft,   Deg2Rad(-135.0f), Deg2Rad(0.0f) },
 718         { BackRight,  Deg2Rad( 135.0f), Deg2Rad(0.0f) }
 719     }, X51Map[6]{
 720         { FrontLeft,   Deg2Rad( -30.0f), Deg2Rad(0.0f) },
 721         { FrontRight,  Deg2Rad(  30.0f), Deg2Rad(0.0f) },
 722         { FrontCenter, Deg2Rad(   0.0f), Deg2Rad(0.0f) },
 723         { LFE, 0.0f, 0.0f },
 724         { SideLeft,    Deg2Rad(-110.0f), Deg2Rad(0.0f) },
 725         { SideRight,   Deg2Rad( 110.0f), Deg2Rad(0.0f) }
 726     }, X61Map[7]{
 727         { FrontLeft,   Deg2Rad(-30.0f), Deg2Rad(0.0f) },
 728         { FrontRight,  Deg2Rad( 30.0f), Deg2Rad(0.0f) },
 729         { FrontCenter, Deg2Rad(  0.0f), Deg2Rad(0.0f) },
 730         { LFE, 0.0f, 0.0f },
 731         { BackCenter,  Deg2Rad(180.0f), Deg2Rad(0.0f) },
 732         { SideLeft,    Deg2Rad(-90.0f), Deg2Rad(0.0f) },
 733         { SideRight,   Deg2Rad( 90.0f), Deg2Rad(0.0f) }
 734     }, X71Map[8]{
 735         { FrontLeft,   Deg2Rad( -30.0f), Deg2Rad(0.0f) },
 736         { FrontRight,  Deg2Rad(  30.0f), Deg2Rad(0.0f) },
 737         { FrontCenter, Deg2Rad(   0.0f), Deg2Rad(0.0f) },
 738         { LFE, 0.0f, 0.0f },
 739         { BackLeft,    Deg2Rad(-150.0f), Deg2Rad(0.0f) },
 740         { BackRight,   Deg2Rad( 150.0f), Deg2Rad(0.0f) },
 741         { SideLeft,    Deg2Rad( -90.0f), Deg2Rad(0.0f) },
 742         { SideRight,   Deg2Rad(  90.0f), Deg2Rad(0.0f) }
 743     };
 744
 745     ChanMap StereoMap[2]{
 746         { FrontLeft,  Deg2Rad(-30.0f), Deg2Rad(0.0f) },
 747         { FrontRight, Deg2Rad( 30.0f), Deg2Rad(0.0f) }
 748     };
 749
 750     const auto Frequency = static_cast<float>(Device->Frequency);
 751     const uint NumSends{Device->NumAuxSends};
 752
 753     const size_t num_channels{voice->mChans.size()};
 754     ASSUME(num_channels > 0);
 755
 756     for(auto &chandata : voice->mChans)
 757     {
 758         chandata.mDryParams.Hrtf.Target = HrtfFilter{};
 759         chandata.mDryParams.Gains.Target.fill(0.0f);
 760         std::for_each(chandata.mWetParams.begin(), chandata.mWetParams.begin()+NumSends,
 761             [](SendParams &params) -> void { params.Gains.Target.fill(0.0f); });
 762     }
 763
 764     DirectMode DirectChannels{props->DirectChannels};
 765     const ChanMap *chans{nullptr};
 766     switch(voice->mFmtChannels)
 767     {
 768     case FmtMono:
 769         chans = MonoMap;
 770         /* Mono buffers are never played direct. */
 771         DirectChannels = DirectMode::Off;
 772         break;
 773
 774     case FmtStereo:
 775         if(DirectChannels == DirectMode::Off)
 776         {
 777             /* Convert counter-clockwise to clock-wise, and wrap between
 778              * [-pi,+pi].
 779              */
 780             StereoMap[0].angle = WrapRadians(-props->StereoPan[0]);
 781             StereoMap[1].angle = WrapRadians(-props->StereoPan[1]);
 782         }
 783         chans = StereoMap;
 784         break;
 785
 786     case FmtRear: chans = RearMap; break;
 787     case FmtQuad: chans = QuadMap; break;
 788     case FmtX51: chans = X51Map; break;
 789     case FmtX61: chans = X61Map; break;
 790     case FmtX71: chans = X71Map; break;
 791
 792     case FmtBFormat2D:
 793     case FmtBFormat3D:
 794     case FmtUHJ2:
 795     case FmtUHJ3:
 796     case FmtUHJ4:
 797     case FmtSuperStereo:
 798         DirectChannels = DirectMode::Off;
 799         break;
 800     }
 801
 802     voice->mFlags.reset(VoiceHasHrtf).reset(VoiceHasNfc);
 803     if(auto *decoder{voice->mDecoder.get()})
 804         decoder->mWidthControl = minf(props->EnhWidth, 0.7f);
 805
 806     if(IsAmbisonic(voice->mFmtChannels))
 807     {
 808         /* Special handling for B-Format and UHJ sources. */
 809
 810         if(Device->AvgSpeakerDist > 0.0f && voice->mFmtChannels != FmtUHJ2
 811             && voice->mFmtChannels != FmtSuperStereo)
 812         {
 813             if(!(Distance > std::numeric_limits<float>::epsilon()))
 814             {
 815                 /* NOTE: The NFCtrlFilters were created with a w0 of 0, which
 816                  * is what we want for FOA input. The first channel may have
 817                  * been previously re-adjusted if panned, so reset it.
 818                  */
 819                 voice->mChans[0].mDryParams.NFCtrlFilter.adjust(0.0f);
 820             }
 821             else
 822             {
 823                 /* Clamp the distance for really close sources, to prevent
 824                  * excessive bass.
 825                  */
 826                 const float mdist{maxf(Distance*NfcScale, Device->AvgSpeakerDist/4.0f)};
 827                 const float w0{SpeedOfSoundMetersPerSec / (mdist * Frequency)};
 828
 829                 /* Only need to adjust the first channel of a B-Format source. */
 830                 voice->mChans[0].mDryParams.NFCtrlFilter.adjust(w0);
 831             }
 832
 833             voice->mFlags.set(VoiceHasNfc);
 834         }
 835
 836         /* Panning a B-Format sound toward some direction is easy. Just pan the
 837          * first (W) channel as a normal mono sound. The angular spread is used
 838          * as a directional scalar to blend between full coverage and full
 839          * panning.
 840          */
 841         const float coverage{!(Distance > std::numeric_limits<float>::epsilon()) ? 1.0f :
 842             (al::numbers::inv_pi_v<float>/2.0f * Spread)};
 843
 844         auto calc_coeffs = [xpos,ypos,zpos](RenderMode mode)
 845         {
 846             if(mode != RenderMode::Pairwise)
 847                 return CalcDirectionCoeffs({xpos, ypos, zpos});
 848
 849             /* Clamp Y, in case rounding errors caused it to end up outside
 850              * of -1...+1.
 851              */
 852             const float ev{std::asin(clampf(ypos, -1.0f, 1.0f))};
 853             /* Negate Z for right-handed coords with -Z in front. */
 854             const float az{std::atan2(xpos, -zpos)};
 855
 856             /* A scalar of 1.5 for plain stereo results in +/-60 degrees
 857              * being moved to +/-90 degrees for direct right and left
 858              * speaker responses.
 859              */
 860             return CalcAngleCoeffs(ScaleAzimuthFront(az, 1.5f), ev, 0.0f);
 861         };
 862         auto&& scales = GetAmbiScales(voice->mAmbiScaling);
 863         auto coeffs = calc_coeffs(Device->mRenderMode);
 864         /* Scale the panned W signal based on the coverage (full coverage means
 865          * no panned signal). Scale the panned W signal according to channel
 866          * scaling.
 867          */
 868         std::transform(coeffs.begin(), coeffs.end(), coeffs.begin(),
 869             std::bind(std::multiplies<float>{}, _1, (1.0f-coverage)*scales[0]));
 870
 871         if(!(coverage > 0.0f))
 872         {
 873             ComputePanGains(&Device->Dry, coeffs.data(), DryGain.Base,
 874                 voice->mChans[0].mDryParams.Gains.Target);
 875             for(uint i{0};i < NumSends;i++)
 876             {
 877                 if(const EffectSlot *Slot{SendSlots[i]})
 878                     ComputePanGains(&Slot->Wet, coeffs.data(), WetGain[i].Base*scales[0],
 879                         voice->mChans[0].mWetParams[i].Gains.Target);
 880             }
 881         }
 882         else
 883         {
 884             /* Local B-Format sources have their XYZ channels rotated according
 885              * to the orientation.
 886              */
 887             /* AT then UP */
 888             alu::Vector N{props->OrientAt[0], props->OrientAt[1], props->OrientAt[2], 0.0f};
 889             N.normalize();
 890             alu::Vector V{props->OrientUp[0], props->OrientUp[1], props->OrientUp[2], 0.0f};
 891             V.normalize();
 892             if(!props->HeadRelative)
 893             {
 894                 N = Context.Matrix * N;
 895                 V = Context.Matrix * V;
 896             }
 897             /* Build and normalize right-vector */
 898             alu::Vector U{N.cross_product(V)};
 899             U.normalize();
 900
 901             /* Build a rotation matrix. Manually fill the zeroth- and first-
 902              * order elements, then construct the rotation for the higher
 903              * orders.
 904              */
 905             AmbiRotateMatrix &shrot = Device->mAmbiRotateMatrix;
 906             shrot.fill({});
 907
 908             shrot[0][0] = 1.0f;
 909             shrot[1][1] =  U[0]; shrot[1][2] = -V[0]; shrot[1][3] = -N[0];
 910             shrot[2][1] = -U[1]; shrot[2][2] =  V[1]; shrot[2][3] =  N[1];
 911             shrot[3][1] =  U[2]; shrot[3][2] = -V[2]; shrot[3][3] = -N[2];
 912             AmbiRotator(shrot, static_cast<int>(Device->mAmbiOrder));
 913             /* If the device is higher order than the voice, "upsample" the
 914              * matrix.
 915              *
 916              * NOTE: Starting with second-order, a 2D upsample needs to be
 917              * applied with a 2D source and 3D output, even when they're the
 918              * same order. This is because higher orders have a height offset
 919              * on various channels (i.e. when elevation=0, those height-related
 920              * channels should be non-0).
 921              */
 922             if(Device->mAmbiOrder > voice->mAmbiOrder
 923                 || (Device->mAmbiOrder >= 2 && !Device->m2DMixing
 924                     && Is2DAmbisonic(voice->mFmtChannels)))
 925             {
 926                 if(voice->mAmbiOrder == 1)
 927                 {
 928                     auto&& upsampler = Is2DAmbisonic(voice->mFmtChannels) ?
 929                         AmbiScale::FirstOrder2DUp : AmbiScale::FirstOrderUp;
 930                     UpsampleBFormatTransform(Device->mAmbiOrder, upsampler, shrot);
 931                 }
 932                 else if(voice->mAmbiOrder == 2)
 933                 {
 934                     auto&& upsampler = Is2DAmbisonic(voice->mFmtChannels) ?
 935                         AmbiScale::SecondOrder2DUp : AmbiScale::SecondOrderUp;
 936                     UpsampleBFormatTransform(Device->mAmbiOrder, upsampler, shrot);
 937                 }
 938                 else if(voice->mAmbiOrder == 3)
 939                 {
 940                     auto&& upsampler = Is2DAmbisonic(voice->mFmtChannels) ?
 941                         AmbiScale::ThirdOrder2DUp : AmbiScale::ThirdOrderUp;
 942                     UpsampleBFormatTransform(Device->mAmbiOrder, upsampler, shrot);
 943                 }
 944                 else if(voice->mAmbiOrder == 4)
 945                 {
 946                     auto&& upsampler = AmbiScale::FourthOrder2DUp;
 947                     UpsampleBFormatTransform(Device->mAmbiOrder, upsampler, shrot);
 948                 }
 949             }
 950
 951             /* Convert the rotation matrix for input ordering and scaling, and
 952              * whether input is 2D or 3D.
 953              */
 954             const uint8_t *index_map{Is2DAmbisonic(voice->mFmtChannels) ?
 955                 GetAmbi2DLayout(voice->mAmbiLayout).data() :
 956                 GetAmbiLayout(voice->mAmbiLayout).data()};
 957
 958             static const uint8_t OrderOffset[MaxAmbiOrder+1]{0, 1, 4, 9,};
 959             for(size_t c{0};c < num_channels;c++)
 960             {
 961                 const size_t acn{index_map[c]};
 962                 const size_t order{AmbiIndex::OrderFromChannel()[acn]};
 963                 const float scale{scales[acn] * coverage};
 964
 965                 /* For channel 0, combine the B-Format signal (scaled according
 966                  * to the coverage amount) with the directional pan. For all
 967                  * other channels, use just the (scaled) B-Format signal.
 968                  */
 969                 for(size_t x{OrderOffset[order]};x < MaxAmbiChannels;++x)
 970                     coeffs[x] += shrot[x][acn] * scale;
 971
 972                 ComputePanGains(&Device->Dry, coeffs.data(), DryGain.Base,
 973                     voice->mChans[c].mDryParams.Gains.Target);
 974
 975                 for(uint i{0};i < NumSends;i++)
 976                 {
 977                     if(const EffectSlot *Slot{SendSlots[i]})
 978                         ComputePanGains(&Slot->Wet, coeffs.data(), WetGain[i].Base,
 979                             voice->mChans[c].mWetParams[i].Gains.Target);
 980                 }
 981
 982                 coeffs = std::array<float,MaxAmbiChannels>{};
 983             }
 984         }
 985     }
 986     else if(DirectChannels != DirectMode::Off && !Device->RealOut.RemixMap.empty())
 987     {
 988         /* Direct source channels always play local. Skip the virtual channels
 989          * and write inputs to the matching real outputs.
 990          */
 991         voice->mDirect.Buffer = Device->RealOut.Buffer;
 992
 993         for(size_t c{0};c < num_channels;c++)
 994         {
 995             uint idx{Device->channelIdxByName(chans[c].channel)};
 996             if(idx != INVALID_CHANNEL_INDEX)
 997                 voice->mChans[c].mDryParams.Gains.Target[idx] = DryGain.Base;
 998             else if(DirectChannels == DirectMode::RemixMismatch)
 999             {
1000                 auto match_channel = [chans,c](const InputRemixMap &map) noexcept -> bool
1001                 { return chans[c].channel == map.channel; };
1002                 auto remap = std::find_if(Device->RealOut.RemixMap.cbegin(),
1003                     Device->RealOut.RemixMap.cend(), match_channel);
1004                 if(remap != Device->RealOut.RemixMap.cend())
1005                 {
1006                     for(const auto &target : remap->targets)
1007                     {
1008                         idx = Device->channelIdxByName(target.channel);
1009                         if(idx != INVALID_CHANNEL_INDEX)
1010                             voice->mChans[c].mDryParams.Gains.Target[idx] = DryGain.Base *
1011                                 target.mix;
1012                     }
1013                 }
1014             }
1015         }
1016
1017         /* Auxiliary sends still use normal channel panning since they mix to
1018          * B-Format, which can't channel-match.
1019          */
1020         for(size_t c{0};c < num_channels;c++)
1021         {
1022             /* Skip LFE */
1023             if(chans[c].channel == LFE)
1024                 continue;
1025
1026             const auto coeffs = CalcAngleCoeffs(chans[c].angle, chans[c].elevation, 0.0f);
1027
1028             for(uint i{0};i < NumSends;i++)
1029             {
1030                 if(const EffectSlot *Slot{SendSlots[i]})
1031                     ComputePanGains(&Slot->Wet, coeffs.data(), WetGain[i].Base,
1032                         voice->mChans[c].mWetParams[i].Gains.Target);
1033             }
1034         }
1035     }
1036     else if(Device->mRenderMode == RenderMode::Hrtf)
1037     {
1038         /* Full HRTF rendering. Skip the virtual channels and render to the
1039          * real outputs.
1040          */
1041         voice->mDirect.Buffer = Device->RealOut.Buffer;
1042
1043         if(Distance > std::numeric_limits<float>::epsilon())
1044         {
1045             const float src_ev{std::asin(clampf(ypos, -1.0f, 1.0f))};
1046             const float src_az{std::atan2(xpos, -zpos)};
1047
1048             if(voice->mFmtChannels == FmtMono)
1049             {
1050                 Device->mHrtf->getCoeffs(src_ev, src_az, Distance*NfcScale, Spread,
1051                     voice->mChans[0].mDryParams.Hrtf.Target.Coeffs,
1052                     voice->mChans[0].mDryParams.Hrtf.Target.Delay);
1053                 voice->mChans[0].mDryParams.Hrtf.Target.Gain = DryGain.Base;
1054
1055                 const auto coeffs = CalcAngleCoeffs(src_az, src_ev, Spread);
1056                 for(uint i{0};i < NumSends;i++)
1057                 {
1058                     if(const EffectSlot *Slot{SendSlots[i]})
1059                         ComputePanGains(&Slot->Wet, coeffs.data(), WetGain[i].Base,
1060                             voice->mChans[0].mWetParams[i].Gains.Target);
1061                 }
1062             }
1063             else for(size_t c{0};c < num_channels;c++)
1064             {
1065                 using namespace al::numbers;
1066
1067                 /* Skip LFE */
1068                 if(chans[c].channel == LFE) continue;
1069
1070                 /* Warp the channel position toward the source position as the
1071                  * source spread decreases. With no spread, all channels are at
1072                  * the source position, at full spread (pi*2), each channel is
1073                  * left unchanged.
1074                  */
1075                 const float ev{lerpf(src_ev, chans[c].elevation, inv_pi_v<float>/2.0f * Spread)};
1076
1077                 float az{chans[c].angle - src_az};
1078                 if(az < -pi_v<float>) az += pi_v<float>*2.0f;
1079                 else if(az > pi_v<float>) az -= pi_v<float>*2.0f;
1080
1081                 az *= inv_pi_v<float>/2.0f * Spread;
1082
1083                 az += src_az;
1084                 if(az < -pi_v<float>) az += pi_v<float>*2.0f;
1085                 else if(az > pi_v<float>) az -= pi_v<float>*2.0f;
1086
1087                 Device->mHrtf->getCoeffs(ev, az, Distance*NfcScale, 0.0f,
1088                     voice->mChans[c].mDryParams.Hrtf.Target.Coeffs,
1089                     voice->mChans[c].mDryParams.Hrtf.Target.Delay);
1090                 voice->mChans[c].mDryParams.Hrtf.Target.Gain = DryGain.Base;
1091
1092                 const auto coeffs = CalcAngleCoeffs(az, ev, 0.0f);
1093                 for(uint i{0};i < NumSends;i++)
1094                 {
1095                     if(const EffectSlot *Slot{SendSlots[i]})
1096                         ComputePanGains(&Slot->Wet, coeffs.data(), WetGain[i].Base,
1097                             voice->mChans[c].mWetParams[i].Gains.Target);
1098                 }
1099             }
1100         }
1101         else
1102         {
1103             /* With no distance, spread is only meaningful for mono sources
1104              * where it can be 0 or full (non-mono sources are always full
1105              * spread here).
1106              */
1107             const float spread{Spread * (voice->mFmtChannels == FmtMono)};
1108
1109             /* Local sources on HRTF play with each channel panned to its
1110              * relative location around the listener, providing "virtual
1111              * speaker" responses.
1112              */
1113             for(size_t c{0};c < num_channels;c++)
1114             {
1115                 /* Skip LFE */
1116                 if(chans[c].channel == LFE)
1117                     continue;
1118
1119                 /* Get the HRIR coefficients and delays for this channel
1120                  * position.
1121                  */
1122                 Device->mHrtf->getCoeffs(chans[c].elevation, chans[c].angle,
1123                     std::numeric_limits<float>::infinity(), spread,
1124                     voice->mChans[c].mDryParams.Hrtf.Target.Coeffs,
1125                     voice->mChans[c].mDryParams.Hrtf.Target.Delay);
1126                 voice->mChans[c].mDryParams.Hrtf.Target.Gain = DryGain.Base;
1127
1128                 /* Normal panning for auxiliary sends. */
1129                 const auto coeffs = CalcAngleCoeffs(chans[c].angle, chans[c].elevation, spread);
1130
1131                 for(uint i{0};i < NumSends;i++)
1132                 {
1133                     if(const EffectSlot *Slot{SendSlots[i]})
1134                         ComputePanGains(&Slot->Wet, coeffs.data(), WetGain[i].Base,
1135                             voice->mChans[c].mWetParams[i].Gains.Target);
1136                 }
1137             }
1138         }
1139
1140         voice->mFlags.set(VoiceHasHrtf);
1141     }
1142     else
1143     {
1144         /* Non-HRTF rendering. Use normal panning to the output. */
1145
1146         if(Distance > std::numeric_limits<float>::epsilon())
1147         {
1148             /* Calculate NFC filter coefficient if needed. */
1149             if(Device->AvgSpeakerDist > 0.0f)
1150             {
1151                 /* Clamp the distance for really close sources, to prevent
1152                  * excessive bass.
1153                  */
1154                 const float mdist{maxf(Distance*NfcScale, Device->AvgSpeakerDist/4.0f)};
1155                 const float w0{SpeedOfSoundMetersPerSec / (mdist * Frequency)};
1156
1157                 /* Adjust NFC filters. */
1158                 for(size_t c{0};c < num_channels;c++)
1159                     voice->mChans[c].mDryParams.NFCtrlFilter.adjust(w0);
1160
1161                 voice->mFlags.set(VoiceHasNfc);
1162             }
1163
1164             if(voice->mFmtChannels == FmtMono)
1165             {
1166                 auto calc_coeffs = [xpos,ypos,zpos,Spread](RenderMode mode)
1167                 {
1168                     if(mode != RenderMode::Pairwise)
1169                         return CalcDirectionCoeffs({xpos, ypos, zpos}, Spread);
1170                     const float ev{std::asin(clampf(ypos, -1.0f, 1.0f))};
1171                     const float az{std::atan2(xpos, -zpos)};
1172                     return CalcAngleCoeffs(ScaleAzimuthFront(az, 1.5f), ev, Spread);
1173                 };
1174                 const auto coeffs = calc_coeffs(Device->mRenderMode);
1175
1176                 ComputePanGains(&Device->Dry, coeffs.data(), DryGain.Base,
1177                     voice->mChans[0].mDryParams.Gains.Target);
1178                 for(uint i{0};i < NumSends;i++)
1179                 {
1180                     if(const EffectSlot *Slot{SendSlots[i]})
1181                         ComputePanGains(&Slot->Wet, coeffs.data(), WetGain[i].Base,
1182                             voice->mChans[0].mWetParams[i].Gains.Target);
1183                 }
1184             }
1185             else
1186             {
1187                 using namespace al::numbers;
1188
1189                 const float src_ev{std::asin(clampf(ypos, -1.0f, 1.0f))};
1190                 const float src_az{std::atan2(xpos, -zpos)};
1191
1192                 for(size_t c{0};c < num_channels;c++)
1193                 {
1194                     /* Special-case LFE */
1195                     if(chans[c].channel == LFE)
1196                     {
1197                         if(Device->Dry.Buffer.data() == Device->RealOut.Buffer.data())
1198                         {
1199                             const uint idx{Device->channelIdxByName(chans[c].channel)};
1200                             if(idx != INVALID_CHANNEL_INDEX)
1201                                 voice->mChans[c].mDryParams.Gains.Target[idx] = DryGain.Base;
1202                         }
1203                         continue;
1204                     }
1205
1206                     /* Warp the channel position toward the source position as
1207                      * the spread decreases. With no spread, all channels are
1208                      * at the source position, at full spread (pi*2), each
1209                      * channel position is left unchanged.
1210                      */
1211                     const float ev{lerpf(src_ev, chans[c].elevation,
1212                         inv_pi_v<float>/2.0f * Spread)};
1213
1214                     float az{chans[c].angle - src_az};
1215                     if(az < -pi_v<float>) az += pi_v<float>*2.0f;
1216                     else if(az > pi_v<float>) az -= pi_v<float>*2.0f;
1217
1218                     az *= inv_pi_v<float>/2.0f * Spread;
1219
1220                     az += src_az;
1221                     if(az < -pi_v<float>) az += pi_v<float>*2.0f;
1222                     else if(az > pi_v<float>) az -= pi_v<float>*2.0f;
1223
1224                     if(Device->mRenderMode == RenderMode::Pairwise)
1225                         az = ScaleAzimuthFront(az, 3.0f);
1226                     const auto coeffs = CalcAngleCoeffs(az, ev, 0.0f);
1227
1228                     ComputePanGains(&Device->Dry, coeffs.data(), DryGain.Base,
1229                         voice->mChans[c].mDryParams.Gains.Target);
1230                     for(uint i{0};i < NumSends;i++)
1231                     {
1232                         if(const EffectSlot *Slot{SendSlots[i]})
1233                             ComputePanGains(&Slot->Wet, coeffs.data(), WetGain[i].Base,
1234                                 voice->mChans[c].mWetParams[i].Gains.Target);
1235                     }
1236                 }
1237             }
1238         }
1239         else
1240         {
1241             if(Device->AvgSpeakerDist > 0.0f)
1242             {
1243                 /* If the source distance is 0, simulate a plane-wave by using
1244                  * infinite distance, which results in a w0 of 0.
1245                  */
1246                 static constexpr float w0{0.0f};
1247                 for(size_t c{0};c < num_channels;c++)
1248                     voice->mChans[c].mDryParams.NFCtrlFilter.adjust(w0);
1249
1250                 voice->mFlags.set(VoiceHasNfc);
1251             }
1252
1253             /* With no distance, spread is only meaningful for mono sources
1254              * where it can be 0 or full (non-mono sources are always full
1255              * spread here).
1256              */
1257             const float spread{Spread * (voice->mFmtChannels == FmtMono)};
1258             for(size_t c{0};c < num_channels;c++)
1259             {
1260                 /* Special-case LFE */
1261                 if(chans[c].channel == LFE)
1262                 {
1263                     if(Device->Dry.Buffer.data() == Device->RealOut.Buffer.data())
1264                     {
1265                         const uint idx{Device->channelIdxByName(chans[c].channel)};
1266                         if(idx != INVALID_CHANNEL_INDEX)
1267                             voice->mChans[c].mDryParams.Gains.Target[idx] = DryGain.Base;
1268                     }
1269                     continue;
1270                 }
1271
1272                 const auto coeffs = CalcAngleCoeffs((Device->mRenderMode == RenderMode::Pairwise)
1273                     ? ScaleAzimuthFront(chans[c].angle, 3.0f) : chans[c].angle,
1274                     chans[c].elevation, spread);
1275
1276                 ComputePanGains(&Device->Dry, coeffs.data(), DryGain.Base,
1277                     voice->mChans[c].mDryParams.Gains.Target);
1278                 for(uint i{0};i < NumSends;i++)
1279                 {
1280                     if(const EffectSlot *Slot{SendSlots[i]})
1281                         ComputePanGains(&Slot->Wet, coeffs.data(), WetGain[i].Base,
1282                             voice->mChans[c].mWetParams[i].Gains.Target);
1283                 }
1284             }
1285         }
1286     }
1287
1288     {
1289         const float hfNorm{props->Direct.HFReference / Frequency};
1290         const float lfNorm{props->Direct.LFReference / Frequency};
1291
1292         voice->mDirect.FilterType = AF_None;
1293         if(DryGain.HF != 1.0f) voice->mDirect.FilterType |= AF_LowPass;
1294         if(DryGain.LF != 1.0f) voice->mDirect.FilterType |= AF_HighPass;
1295
1296         auto &lowpass = voice->mChans[0].mDryParams.LowPass;
1297         auto &highpass = voice->mChans[0].mDryParams.HighPass;
1298         lowpass.setParamsFromSlope(BiquadType::HighShelf, hfNorm, DryGain.HF, 1.0f);
1299         highpass.setParamsFromSlope(BiquadType::LowShelf, lfNorm, DryGain.LF, 1.0f);
1300         for(size_t c{1};c < num_channels;c++)
1301         {
1302             voice->mChans[c].mDryParams.LowPass.copyParamsFrom(lowpass);
1303             voice->mChans[c].mDryParams.HighPass.copyParamsFrom(highpass);
1304         }
1305     }
1306     for(uint i{0};i < NumSends;i++)
1307     {
1308         const float hfNorm{props->Send[i].HFReference / Frequency};
1309         const float lfNorm{props->Send[i].LFReference / Frequency};
1310
1311         voice->mSend[i].FilterType = AF_None;
1312         if(WetGain[i].HF != 1.0f) voice->mSend[i].FilterType |= AF_LowPass;
1313         if(WetGain[i].LF != 1.0f) voice->mSend[i].FilterType |= AF_HighPass;
1314
1315         auto &lowpass = voice->mChans[0].mWetParams[i].LowPass;
1316         auto &highpass = voice->mChans[0].mWetParams[i].HighPass;
1317         lowpass.setParamsFromSlope(BiquadType::HighShelf, hfNorm, WetGain[i].HF, 1.0f);
1318         highpass.setParamsFromSlope(BiquadType::LowShelf, lfNorm, WetGain[i].LF, 1.0f);
1319         for(size_t c{1};c < num_channels;c++)
1320         {
1321             voice->mChans[c].mWetParams[i].LowPass.copyParamsFrom(lowpass);
1322             voice->mChans[c].mWetParams[i].HighPass.copyParamsFrom(highpass);
1323         }
1324     }
1325 }
1326
1327 void CalcNonAttnSourceParams(Voice *voice, const VoiceProps *props, const ContextBase *context)
1328 {
1329     DeviceBase *Device{context->mDevice};
1330     EffectSlot *SendSlots[MAX_SENDS];
1331
1332     voice->mDirect.Buffer = Device->Dry.Buffer;
1333     for(uint i{0};i < Device->NumAuxSends;i++)
1334     {
1335         SendSlots[i] = props->Send[i].Slot;
1336         if(!SendSlots[i] || SendSlots[i]->EffectType == EffectSlotType::None)
1337         {
1338             SendSlots[i] = nullptr;
1339             voice->mSend[i].Buffer = {};
1340         }
1341         else
1342             voice->mSend[i].Buffer = SendSlots[i]->Wet.Buffer;
1343     }
1344
1345     /* Calculate the stepping value */
1346     const auto Pitch = static_cast<float>(voice->mFrequency) /
1347         static_cast<float>(Device->Frequency) * props->Pitch;
1348     if(Pitch > float{MaxPitch})
1349         voice->mStep = MaxPitch<<MixerFracBits;
1350     else
1351         voice->mStep = maxu(fastf2u(Pitch * MixerFracOne), 1);
1352     voice->mResampler = PrepareResampler(props->mResampler, voice->mStep, &voice->mResampleState);
1353
1354     /* Calculate gains */
1355     GainTriplet DryGain;
1356     DryGain.Base  = minf(clampf(props->Gain, props->MinGain, props->MaxGain) * props->Direct.Gain *
1357         context->mParams.Gain, GainMixMax);
1358     DryGain.HF = props->Direct.GainHF;
1359     DryGain.LF = props->Direct.GainLF;
1360     GainTriplet WetGain[MAX_SENDS];
1361     for(uint i{0};i < Device->NumAuxSends;i++)
1362     {
1363         WetGain[i].Base = minf(clampf(props->Gain, props->MinGain, props->MaxGain) *
1364             props->Send[i].Gain * context->mParams.Gain, GainMixMax);
1365         WetGain[i].HF = props->Send[i].GainHF;
1366         WetGain[i].LF = props->Send[i].GainLF;
1367     }
1368
1369     CalcPanningAndFilters(voice, 0.0f, 0.0f, -1.0f, 0.0f, 0.0f, DryGain, WetGain, SendSlots, props,
1370         context->mParams, Device);
1371 }
1372
1373 void CalcAttnSourceParams(Voice *voice, const VoiceProps *props, const ContextBase *context)
1374 {
1375     DeviceBase *Device{context->mDevice};
1376     const uint NumSends{Device->NumAuxSends};
1377
1378     /* Set mixing buffers and get send parameters. */
1379     voice->mDirect.Buffer = Device->Dry.Buffer;
1380     EffectSlot *SendSlots[MAX_SENDS];
1381     uint UseDryAttnForRoom{0};
1382     for(uint i{0};i < NumSends;i++)
1383     {
1384         SendSlots[i] = props->Send[i].Slot;
1385         if(!SendSlots[i] || SendSlots[i]->EffectType == EffectSlotType::None)
1386             SendSlots[i] = nullptr;
1387         else if(!SendSlots[i]->AuxSendAuto)
1388         {
1389             /* If the slot's auxiliary send auto is off, the data sent to the
1390              * effect slot is the same as the dry path, sans filter effects.
1391              */
1392             UseDryAttnForRoom |= 1u<<i;
1393         }
1394
1395         if(!SendSlots[i])
1396             voice->mSend[i].Buffer = {};
1397         else
1398             voice->mSend[i].Buffer = SendSlots[i]->Wet.Buffer;
1399     }
1400
1401     /* Transform source to listener space (convert to head relative) */
1402     alu::Vector Position{props->Position[0], props->Position[1], props->Position[2], 1.0f};
1403     alu::Vector Velocity{props->Velocity[0], props->Velocity[1], props->Velocity[2], 0.0f};
1404     alu::Vector Direction{props->Direction[0], props->Direction[1], props->Direction[2], 0.0f};
1405     if(!props->HeadRelative)
1406     {
1407         /* Transform source vectors */
1408         Position = context->mParams.Matrix * (Position - context->mParams.Position);
1409         Velocity = context->mParams.Matrix * Velocity;
1410         Direction = context->mParams.Matrix * Direction;
1411     }
1412     else
1413     {
1414         /* Offset the source velocity to be relative of the listener velocity */
1415         Velocity += context->mParams.Velocity;
1416     }
1417
1418     const bool directional{Direction.normalize() > 0.0f};
1419     alu::Vector ToSource{Position[0], Position[1], Position[2], 0.0f};
1420     const float Distance{ToSource.normalize()};
1421
1422     /* Calculate distance attenuation */
1423     float ClampedDist{Distance};
1424     float DryGainBase{props->Gain};
1425     float WetGainBase{props->Gain};
1426
1427     switch(context->mParams.SourceDistanceModel ? props->mDistanceModel
1428         : context->mParams.mDistanceModel)
1429     {
1430         case DistanceModel::InverseClamped:
1431             if(props->MaxDistance < props->RefDistance) break;
1432             ClampedDist = clampf(ClampedDist, props->RefDistance, props->MaxDistance);
1433             /*fall-through*/
1434         case DistanceModel::Inverse:
1435             if(props->RefDistance > 0.0f)
1436             {
1437                 float dist{lerpf(props->RefDistance, ClampedDist, props->RolloffFactor)};
1438                 if(dist > 0.0f) DryGainBase *= props->RefDistance / dist;
1439
1440                 dist = lerpf(props->RefDistance, ClampedDist, props->RoomRolloffFactor);
1441                 if(dist > 0.0f) WetGainBase *= props->RefDistance / dist;
1442             }
1443             break;
1444
1445         case DistanceModel::LinearClamped:
1446             if(props->MaxDistance < props->RefDistance) break;
1447             ClampedDist = clampf(ClampedDist, props->RefDistance, props->MaxDistance);
1448             /*fall-through*/
1449         case DistanceModel::Linear:
1450             if(props->MaxDistance != props->RefDistance)
1451             {
1452                 float attn{(ClampedDist-props->RefDistance) /
1453                     (props->MaxDistance-props->RefDistance) * props->RolloffFactor};
1454                 DryGainBase *= maxf(1.0f - attn, 0.0f);
1455
1456                 attn = (ClampedDist-props->RefDistance) /
1457                     (props->MaxDistance-props->RefDistance) * props->RoomRolloffFactor;
1458                 WetGainBase *= maxf(1.0f - attn, 0.0f);
1459             }
1460             break;
1461
1462         case DistanceModel::ExponentClamped:
1463             if(props->MaxDistance < props->RefDistance) break;
1464             ClampedDist = clampf(ClampedDist, props->RefDistance, props->MaxDistance);
1465             /*fall-through*/
1466         case DistanceModel::Exponent:
1467             if(ClampedDist > 0.0f && props->RefDistance > 0.0f)
1468             {
1469                 const float dist_ratio{ClampedDist/props->RefDistance};
1470                 DryGainBase *= std::pow(dist_ratio, -props->RolloffFactor);
1471                 WetGainBase *= std::pow(dist_ratio, -props->RoomRolloffFactor);
1472             }
1473             break;
1474
1475         case DistanceModel::Disable:
1476             break;
1477     }
1478
1479     /* Calculate directional soundcones */
1480     float ConeHF{1.0f}, WetConeHF{1.0f};
1481     if(directional && props->InnerAngle < 360.0f)
1482     {
1483         static constexpr float Rad2Deg{static_cast<float>(180.0 / al::numbers::pi)};
1484         const float Angle{Rad2Deg*2.0f * std::acos(-Direction.dot_product(ToSource)) * ConeScale};
1485
1486         float ConeGain{1.0f};
1487         if(Angle >= props->OuterAngle)
1488         {
1489             ConeGain = props->OuterGain;
1490             ConeHF = lerpf(1.0f, props->OuterGainHF, props->DryGainHFAuto);
1491         }
1492         else if(Angle >= props->InnerAngle)
1493         {
1494             const float scale{(Angle-props->InnerAngle) / (props->OuterAngle-props->InnerAngle)};
1495             ConeGain = lerpf(1.0f, props->OuterGain, scale);
1496             ConeHF = lerpf(1.0f, props->OuterGainHF, scale * props->DryGainHFAuto);
1497         }
1498
1499         DryGainBase *= ConeGain;
1500         WetGainBase *= lerpf(1.0f, ConeGain, props->WetGainAuto);
1501
1502         WetConeHF = lerpf(1.0f, ConeHF, props->WetGainHFAuto);
1503     }
1504
1505     /* Apply gain and frequency filters */
1506     DryGainBase = clampf(DryGainBase, props->MinGain, props->MaxGain) * context->mParams.Gain;
1507     WetGainBase = clampf(WetGainBase, props->MinGain, props->MaxGain) * context->mParams.Gain;
1508
1509     GainTriplet DryGain{};
1510     DryGain.Base = minf(DryGainBase * props->Direct.Gain, GainMixMax);
1511     DryGain.HF = ConeHF * props->Direct.GainHF;
1512     DryGain.LF = props->Direct.GainLF;
1513     GainTriplet WetGain[MAX_SENDS]{};
1514     for(uint i{0};i < NumSends;i++)
1515     {
1516         /* If this effect slot's Auxiliary Send Auto is off, then use the dry
1517          * path distance and cone attenuation, otherwise use the wet (room)
1518          * path distance and cone attenuation. The send filter is used instead
1519          * of the direct filter, regardless.
1520          */
1521         const bool use_room{!(UseDryAttnForRoom&(1u<<i))};
1522         const float gain{use_room ? WetGainBase : DryGainBase};
1523         WetGain[i].Base = minf(gain * props->Send[i].Gain, GainMixMax);
1524         WetGain[i].HF = (use_room ? WetConeHF : ConeHF) * props->Send[i].GainHF;
1525         WetGain[i].LF = props->Send[i].GainLF;
1526     }
1527
1528     /* Distance-based air absorption and initial send decay. */
1529     if(Distance > props->RefDistance) [[likely]]
1530     {
1531         const float distance_base{(Distance-props->RefDistance) * props->RolloffFactor};
1532         const float distance_meters{distance_base * context->mParams.MetersPerUnit};
1533         const float dryabsorb{distance_meters * props->AirAbsorptionFactor};
1534         if(dryabsorb > std::numeric_limits<float>::epsilon())
1535             DryGain.HF *= std::pow(context->mParams.AirAbsorptionGainHF, dryabsorb);
1536
1537         /* If the source's Auxiliary Send Filter Gain Auto is off, no extra
1538          * adjustment is applied to the send gains.
1539          */
1540         for(uint i{props->WetGainAuto ? 0u : NumSends};i < NumSends;++i)
1541         {
1542             if(!SendSlots[i] || !(SendSlots[i]->DecayTime > 0.0f))
1543                 continue;
1544
1545             auto calc_attenuation = [](float distance, float refdist, float rolloff) noexcept
1546             {
1547                 const float dist{lerpf(refdist, distance, rolloff)};
1548                 if(dist > refdist) return refdist / dist;
1549                 return 1.0f;
1550             };
1551
1552             /* The reverb effect's room rolloff factor always applies to an
1553              * inverse distance rolloff model.
1554              */
1555             WetGain[i].Base *= calc_attenuation(Distance, props->RefDistance,
1556                 SendSlots[i]->RoomRolloff);
1557
1558             if(distance_meters > std::numeric_limits<float>::epsilon())
1559                 WetGain[i].HF *= std::pow(SendSlots[i]->AirAbsorptionGainHF, distance_meters);
1560
1561             /* If this effect slot's Auxiliary Send Auto is off, don't apply
1562              * the automatic initial reverb decay (should the reverb's room
1563              * rolloff still apply?).
1564              */
1565             if(!SendSlots[i]->AuxSendAuto)
1566                 continue;
1567
1568             GainTriplet DecayDistance;
1569             /* Calculate the distances to where this effect's decay reaches
1570              * -60dB.
1571              */
1572             DecayDistance.Base = SendSlots[i]->DecayTime * SpeedOfSoundMetersPerSec;
1573             DecayDistance.LF = DecayDistance.Base * SendSlots[i]->DecayLFRatio;
1574             DecayDistance.HF = DecayDistance.Base * SendSlots[i]->DecayHFRatio;
1575             if(SendSlots[i]->DecayHFLimit)
1576             {
1577                 const float airAbsorption{SendSlots[i]->AirAbsorptionGainHF};
1578                 if(airAbsorption < 1.0f)
1579                 {
1580                     /* Calculate the distance to where this effect's air
1581                      * absorption reaches -60dB, and limit the effect's HF
1582                      * decay distance (so it doesn't take any longer to decay
1583                      * than the air would allow).
1584                      */
1585                     static constexpr float log10_decaygain{-3.0f/*std::log10(ReverbDecayGain)*/};
1586                     const float absorb_dist{log10_decaygain / std::log10(airAbsorption)};
1587                     DecayDistance.HF = minf(absorb_dist, DecayDistance.HF);
1588                 }
1589             }
1590
1591             const float baseAttn = calc_attenuation(Distance, props->RefDistance,
1592                 props->RolloffFactor);
1593
1594             /* Apply a decay-time transformation to the wet path, based on the
1595              * source distance. The initial decay of the reverb effect is
1596              * calculated and applied to the wet path.
1597              */
1598             const float fact{distance_base / DecayDistance.Base};
1599             const float gain{std::pow(ReverbDecayGain, fact)*(1.0f-baseAttn) + baseAttn};
1600             WetGain[i].Base *= gain;
1601
1602             if(gain > 0.0f)
1603             {
1604                 const float hffact{distance_base / DecayDistance.HF};
1605                 const float gainhf{std::pow(ReverbDecayGain, hffact)*(1.0f-baseAttn) + baseAttn};
1606                 WetGain[i].HF *= minf(gainhf/gain, 1.0f);
1607                 const float lffact{distance_base / DecayDistance.LF};
1608                 const float gainlf{std::pow(ReverbDecayGain, lffact)*(1.0f-baseAttn) + baseAttn};
1609                 WetGain[i].LF *= minf(gainlf/gain, 1.0f);
1610             }
1611         }
1612     }
1613
1614
1615     /* Initial source pitch */
1616     float Pitch{props->Pitch};
1617
1618     /* Calculate velocity-based doppler effect */
1619     float DopplerFactor{props->DopplerFactor * context->mParams.DopplerFactor};
1620     if(DopplerFactor > 0.0f)
1621     {
1622         const alu::Vector &lvelocity = context->mParams.Velocity;
1623         float vss{Velocity.dot_product(ToSource) * -DopplerFactor};
1624         float vls{lvelocity.dot_product(ToSource) * -DopplerFactor};
1625
1626         const float SpeedOfSound{context->mParams.SpeedOfSound};
1627         if(!(vls < SpeedOfSound))
1628         {
1629             /* Listener moving away from the source at the speed of sound.
1630              * Sound waves can't catch it.
1631              */
1632             Pitch = 0.0f;
1633         }
1634         else if(!(vss < SpeedOfSound))
1635         {
1636             /* Source moving toward the listener at the speed of sound. Sound
1637              * waves bunch up to extreme frequencies.
1638              */
1639             Pitch = std::numeric_limits<float>::infinity();
1640         }
1641         else
1642         {
1643             /* Source and listener movement is nominal. Calculate the proper
1644              * doppler shift.
1645              */
1646             Pitch *= (SpeedOfSound-vls) / (SpeedOfSound-vss);
1647         }
1648     }
1649
1650     /* Adjust pitch based on the buffer and output frequencies, and calculate
1651      * fixed-point stepping value.
1652      */
1653     Pitch *= static_cast<float>(voice->mFrequency) / static_cast<float>(Device->Frequency);
1654     if(Pitch > float{MaxPitch})
1655         voice->mStep = MaxPitch<<MixerFracBits;
1656     else
1657         voice->mStep = maxu(fastf2u(Pitch * MixerFracOne), 1);
1658     voice->mResampler = PrepareResampler(props->mResampler, voice->mStep, &voice->mResampleState);
1659
1660     float spread{0.0f};
1661     if(props->Radius > Distance)
1662         spread = al::numbers::pi_v<float>*2.0f - Distance/props->Radius*al::numbers::pi_v<float>;
1663     else if(Distance > 0.0f)
1664         spread = std::asin(props->Radius/Distance) * 2.0f;
1665
1666     CalcPanningAndFilters(voice, ToSource[0]*XScale, ToSource[1]*YScale, ToSource[2]*ZScale,
1667         Distance, spread, DryGain, WetGain, SendSlots, props, context->mParams, Device);
1668 }
1669
1670 void CalcSourceParams(Voice *voice, ContextBase *context, bool force)
1671 {
1672     VoicePropsItem *props{voice->mUpdate.exchange(nullptr, std::memory_order_acq_rel)};
1673     if(!props && !force) return;
1674
1675     if(props)
1676     {
1677         voice->mProps = *props;
1678
1679         AtomicReplaceHead(context->mFreeVoiceProps, props);
1680     }
1681
1682     if((voice->mProps.DirectChannels != DirectMode::Off && voice->mFmtChannels != FmtMono
1683             && !IsAmbisonic(voice->mFmtChannels))
1684         || voice->mProps.mSpatializeMode == SpatializeMode::Off
1685         || (voice->mProps.mSpatializeMode==SpatializeMode::Auto && voice->mFmtChannels != FmtMono))
1686         CalcNonAttnSourceParams(voice, &voice->mProps, context);
1687     else
1688         CalcAttnSourceParams(voice, &voice->mProps, context);
1689 }
1690
1691
1692 void SendSourceStateEvent(ContextBase *context, uint id, VChangeState state)
1693 {
1694     RingBuffer *ring{context->mAsyncEvents.get()};
1695     auto evt_vec = ring->getWriteVector();
1696     if(evt_vec.first.len < 1) return;
1697
1698     AsyncEvent *evt{al::construct_at(reinterpret_cast<AsyncEvent*>(evt_vec.first.buf),
1699         AsyncEvent::SourceStateChange)};
1700     evt->u.srcstate.id = id;
1701     switch(state)
1702     {
1703     case VChangeState::Reset:
1704         evt->u.srcstate.state = AsyncEvent::SrcState::Reset;
1705         break;
1706     case VChangeState::Stop:
1707         evt->u.srcstate.state = AsyncEvent::SrcState::Stop;
1708         break;
1709     case VChangeState::Play:
1710         evt->u.srcstate.state = AsyncEvent::SrcState::Play;
1711         break;
1712     case VChangeState::Pause:
1713         evt->u.srcstate.state = AsyncEvent::SrcState::Pause;
1714         break;
1715     /* Shouldn't happen. */
1716     case VChangeState::Restart:
1717         al::unreachable();
1718     }
1719
1720     ring->writeAdvance(1);
1721 }
1722
1723 void ProcessVoiceChanges(ContextBase *ctx)
1724 {
1725     VoiceChange *cur{ctx->mCurrentVoiceChange.load(std::memory_order_acquire)};
1726     VoiceChange *next{cur->mNext.load(std::memory_order_acquire)};
1727     if(!next) return;
1728
1729     const auto enabledevt = ctx->mEnabledEvts.load(std::memory_order_acquire);
1730     do {
1731         cur = next;
1732
1733         bool sendevt{false};
1734         if(cur->mState == VChangeState::Reset || cur->mState == VChangeState::Stop)
1735         {
1736             if(Voice *voice{cur->mVoice})
1737             {
1738                 voice->mCurrentBuffer.store(nullptr, std::memory_order_relaxed);
1739                 voice->mLoopBuffer.store(nullptr, std::memory_order_relaxed);
1740                 /* A source ID indicates the voice was playing or paused, which
1741                  * gets a reset/stop event.
1742                  */
1743                 sendevt = voice->mSourceID.exchange(0u, std::memory_order_relaxed) != 0u;
1744                 Voice::State oldvstate{Voice::Playing};
1745                 voice->mPlayState.compare_exchange_strong(oldvstate, Voice::Stopping,
1746                     std::memory_order_relaxed, std::memory_order_acquire);
1747                 voice->mPendingChange.store(false, std::memory_order_release);
1748             }
1749             /* Reset state change events are always sent, even if the voice is
1750              * already stopped or even if there is no voice.
1751              */
1752             sendevt |= (cur->mState == VChangeState::Reset);
1753         }
1754         else if(cur->mState == VChangeState::Pause)
1755         {
1756             Voice *voice{cur->mVoice};
1757             Voice::State oldvstate{Voice::Playing};
1758             sendevt = voice->mPlayState.compare_exchange_strong(oldvstate, Voice::Stopping,
1759                 std::memory_order_release, std::memory_order_acquire);
1760         }
1761         else if(cur->mState == VChangeState::Play)
1762         {
1763             /* NOTE: When playing a voice, sending a source state change event
1764              * depends if there's an old voice to stop and if that stop is
1765              * successful. If there is no old voice, a playing event is always
1766              * sent. If there is an old voice, an event is sent only if the
1767              * voice is already stopped.
1768              */
1769             if(Voice *oldvoice{cur->mOldVoice})
1770             {
1771                 oldvoice->mCurrentBuffer.store(nullptr, std::memory_order_relaxed);
1772                 oldvoice->mLoopBuffer.store(nullptr, std::memory_order_relaxed);
1773                 oldvoice->mSourceID.store(0u, std::memory_order_relaxed);
1774                 Voice::State oldvstate{Voice::Playing};
1775                 sendevt = !oldvoice->mPlayState.compare_exchange_strong(oldvstate, Voice::Stopping,
1776                     std::memory_order_relaxed, std::memory_order_acquire);
1777                 oldvoice->mPendingChange.store(false, std::memory_order_release);
1778             }
1779             else
1780                 sendevt = true;
1781
1782             Voice *voice{cur->mVoice};
1783             voice->mPlayState.store(Voice::Playing, std::memory_order_release);
1784         }
1785         else if(cur->mState == VChangeState::Restart)
1786         {
1787             /* Restarting a voice never sends a source change event. */
1788             Voice *oldvoice{cur->mOldVoice};
1789             oldvoice->mCurrentBuffer.store(nullptr, std::memory_order_relaxed);
1790             oldvoice->mLoopBuffer.store(nullptr, std::memory_order_relaxed);
1791             /* If there's no sourceID, the old voice finished so don't start
1792              * the new one at its new offset.
1793              */
1794             if(oldvoice->mSourceID.exchange(0u, std::memory_order_relaxed) != 0u)
1795             {
1796                 /* Otherwise, set the voice to stopping if it's not already (it
1797                  * might already be, if paused), and play the new voice as
1798                  * appropriate.
1799                  */
1800                 Voice::State oldvstate{Voice::Playing};
1801                 oldvoice->mPlayState.compare_exchange_strong(oldvstate, Voice::Stopping,
1802                     std::memory_order_relaxed, std::memory_order_acquire);
1803
1804                 Voice *voice{cur->mVoice};
1805                 voice->mPlayState.store((oldvstate == Voice::Playing) ? Voice::Playing
1806                     : Voice::Stopped, std::memory_order_release);
1807             }
1808             oldvoice->mPendingChange.store(false, std::memory_order_release);
1809         }
1810         if(sendevt && enabledevt.test(AsyncEvent::SourceStateChange))
1811             SendSourceStateEvent(ctx, cur->mSourceID, cur->mState);
1812
1813         next = cur->mNext.load(std::memory_order_acquire);
1814     } while(next);
1815     ctx->mCurrentVoiceChange.store(cur, std::memory_order_release);
1816 }
1817
1818 void ProcessParamUpdates(ContextBase *ctx, const EffectSlotArray &slots,
1819     const al::span<Voice*> voices)
1820 {
1821     ProcessVoiceChanges(ctx);
1822
1823     IncrementRef(ctx->mUpdateCount);
1824     if(!ctx->mHoldUpdates.load(std::memory_order_acquire)) [[likely]]
1825     {
1826         bool force{CalcContextParams(ctx)};
1827         auto sorted_slots = const_cast<EffectSlot**>(slots.data() + slots.size());
1828         for(EffectSlot *slot : slots)
1829             force |= CalcEffectSlotParams(slot, sorted_slots, ctx);
1830
1831         for(Voice *voice : voices)
1832         {
1833             /* Only update voices that have a source. */
1834             if(voice->mSourceID.load(std::memory_order_relaxed) != 0)
1835                 CalcSourceParams(voice, ctx, force);
1836         }
1837     }
1838     IncrementRef(ctx->mUpdateCount);
1839 }
1840
1841 void ProcessContexts(DeviceBase *device, const uint SamplesToDo)
1842 {
1843     ASSUME(SamplesToDo > 0);
1844
1845     const nanoseconds curtime{device->ClockBase +
1846         nanoseconds{seconds{device->SamplesDone}}/device->Frequency};
1847
1848     for(ContextBase *ctx : *device->mContexts.load(std::memory_order_acquire))
1849     {
1850         const EffectSlotArray &auxslots = *ctx->mActiveAuxSlots.load(std::memory_order_acquire);
1851         const al::span<Voice*> voices{ctx->getVoicesSpanAcquired()};
1852
1853         /* Process pending propery updates for objects on the context. */
1854         ProcessParamUpdates(ctx, auxslots, voices);
1855
1856         /* Clear auxiliary effect slot mixing buffers. */
1857         for(EffectSlot *slot : auxslots)
1858         {
1859             for(auto &buffer : slot->Wet.Buffer)
1860                 buffer.fill(0.0f);
1861         }
1862
1863         /* Process voices that have a playing source. */
1864         for(Voice *voice : voices)
1865         {
1866             const Voice::State vstate{voice->mPlayState.load(std::memory_order_acquire)};
1867             if(vstate != Voice::Stopped && vstate != Voice::Pending)
1868                 voice->mix(vstate, ctx, curtime, SamplesToDo);
1869         }
1870
1871         /* Process effects. */
1872         if(const size_t num_slots{auxslots.size()})
1873         {
1874             auto slots = auxslots.data();
1875             auto slots_end = slots + num_slots;
1876
1877             /* Sort the slots into extra storage, so that effect slots come
1878              * before their effect slot target (or their targets' target).
1879              */
1880             const al::span<EffectSlot*> sorted_slots{const_cast<EffectSlot**>(slots_end),
1881                 num_slots};
1882             /* Skip sorting if it has already been done. */
1883             if(!sorted_slots[0])
1884             {
1885                 /* First, copy the slots to the sorted list, then partition the
1886                  * sorted list so that all slots without a target slot go to
1887                  * the end.
1888                  */
1889                 std::copy(slots, slots_end, sorted_slots.begin());
1890                 auto split_point = std::partition(sorted_slots.begin(), sorted_slots.end(),
1891                     [](const EffectSlot *slot) noexcept -> bool
1892                     { return slot->Target != nullptr; });
1893                 /* There must be at least one slot without a slot target. */
1894                 assert(split_point != sorted_slots.end());
1895
1896                 /* Simple case: no more than 1 slot has a target slot. Either
1897                  * all slots go right to the output, or the remaining one must
1898                  * target an already-partitioned slot.
1899                  */
1900                 if(split_point - sorted_slots.begin() > 1)
1901                 {
1902                     /* At least two slots target other slots. Starting from the
1903                      * back of the sorted list, continue partitioning the front
1904                      * of the list given each target until all targets are
1905                      * accounted for. This ensures all slots without a target
1906                      * go last, all slots directly targeting those last slots
1907                      * go second-to-last, all slots directly targeting those
1908                      * second-last slots go third-to-last, etc.
1909                      */
1910                     auto next_target = sorted_slots.end();
1911                     do {
1912                         /* This shouldn't happen, but if there's unsorted slots
1913                          * left that don't target any sorted slots, they can't
1914                          * contribute to the output, so leave them.
1915                          */
1916                         if(next_target == split_point) [[unlikely]]
1917                             break;
1918
1919                         --next_target;
1920                         split_point = std::partition(sorted_slots.begin(), split_point,
1921                             [next_target](const EffectSlot *slot) noexcept -> bool
1922                             { return slot->Target != *next_target; });
1923                     } while(split_point - sorted_slots.begin() > 1);
1924                 }
1925             }
1926
1927             for(const EffectSlot *slot : sorted_slots)
1928             {
1929                 EffectState *state{slot->mEffectState.get()};
1930                 state->process(SamplesToDo, slot->Wet.Buffer, state->mOutTarget);
1931             }
1932         }
1933
1934         /* Signal the event handler if there are any events to read. */
1935         RingBuffer *ring{ctx->mAsyncEvents.get()};
1936         if(ring->readSpace() > 0)
1937             ctx->mEventSem.post();
1938     }
1939 }
1940
1941
1942 void ApplyDistanceComp(const al::span<FloatBufferLine> Samples, const size_t SamplesToDo,
1943     const DistanceComp::ChanData *distcomp)
1944 {
1945     ASSUME(SamplesToDo > 0);
1946
1947     for(auto &chanbuffer : Samples)
1948     {
1949         const float gain{distcomp->Gain};
1950         const size_t base{distcomp->Length};
1951         float *distbuf{al::assume_aligned<16>(distcomp->Buffer)};
1952         ++distcomp;
1953
1954         if(base < 1)
1955             continue;
1956
1957         float *inout{al::assume_aligned<16>(chanbuffer.data())};
1958         auto inout_end = inout + SamplesToDo;
1959         if(SamplesToDo >= base) [[likely]]
1960         {
1961             auto delay_end = std::rotate(inout, inout_end - base, inout_end);
1962             std::swap_ranges(inout, delay_end, distbuf);
1963         }
1964         else
1965         {
1966             auto delay_start = std::swap_ranges(inout, inout_end, distbuf);
1967             std::rotate(distbuf, delay_start, distbuf + base);
1968         }
1969         std::transform(inout, inout_end, inout, std::bind(std::multiplies<float>{}, _1, gain));
1970     }
1971 }
1972
1973 void ApplyDither(const al::span<FloatBufferLine> Samples, uint *dither_seed,
1974     const float quant_scale, const size_t SamplesToDo)
1975 {
1976     ASSUME(SamplesToDo > 0);
1977
1978     /* Dithering. Generate whitenoise (uniform distribution of random values
1979      * between -1 and +1) and add it to the sample values, after scaling up to
1980      * the desired quantization depth amd before rounding.
1981      */
1982     const float invscale{1.0f / quant_scale};
1983     uint seed{*dither_seed};
1984     auto dither_sample = [&seed,invscale,quant_scale](const float sample) noexcept -> float
1985     {
1986         float val{sample * quant_scale};
1987         uint rng0{dither_rng(&seed)};
1988         uint rng1{dither_rng(&seed)};
1989         val += static_cast<float>(rng0*(1.0/UINT_MAX) - rng1*(1.0/UINT_MAX));
1990         return fast_roundf(val) * invscale;
1991     };
1992     for(FloatBufferLine &inout : Samples)
1993         std::transform(inout.begin(), inout.begin()+SamplesToDo, inout.begin(), dither_sample);
1994     *dither_seed = seed;
1995 }
1996
1997
1998 /* Base template left undefined. Should be marked =delete, but Clang 3.8.1
1999  * chokes on that given the inline specializations.
2000  */
2001 template<typename T>
2002 inline T SampleConv(float) noexcept;
2003
2004 template<> inline float SampleConv(float val) noexcept
2005 { return val; }
2006 template<> inline int32_t SampleConv(float val) noexcept
2007 {
2008     /* Floats have a 23-bit mantissa, plus an implied 1 bit and a sign bit.
2009      * This means a normalized float has at most 25 bits of signed precision.
2010      * When scaling and clamping for a signed 32-bit integer, these following
2011      * values are the best a float can give.
2012      */
2013     return fastf2i(clampf(val*2147483648.0f, -2147483648.0f, 2147483520.0f));
2014 }
2015 template<> inline int16_t SampleConv(float val) noexcept
2016 { return static_cast<int16_t>(fastf2i(clampf(val*32768.0f, -32768.0f, 32767.0f))); }
2017 template<> inline int8_t SampleConv(float val) noexcept
2018 { return static_cast<int8_t>(fastf2i(clampf(val*128.0f, -128.0f, 127.0f))); }
2019
2020 /* Define unsigned output variations. */
2021 template<> inline uint32_t SampleConv(float val) noexcept
2022 { return static_cast<uint32_t>(SampleConv<int32_t>(val)) + 2147483648u; }
2023 template<> inline uint16_t SampleConv(float val) noexcept
2024 { return static_cast<uint16_t>(SampleConv<int16_t>(val) + 32768); }
2025 template<> inline uint8_t SampleConv(float val) noexcept
2026 { return static_cast<uint8_t>(SampleConv<int8_t>(val) + 128); }
2027
2028 template<DevFmtType T>
2029 void Write(const al::span<const FloatBufferLine> InBuffer, void *OutBuffer, const size_t Offset,
2030     const size_t SamplesToDo, const size_t FrameStep)
2031 {
2032     ASSUME(FrameStep > 0);
2033     ASSUME(SamplesToDo > 0);
2034
2035     DevFmtType_t<T> *outbase{static_cast<DevFmtType_t<T>*>(OutBuffer) + Offset*FrameStep};
2036     size_t c{0};
2037     for(const FloatBufferLine &inbuf : InBuffer)
2038     {
2039         DevFmtType_t<T> *out{outbase++};
2040         auto conv_sample = [FrameStep,&out](const float s) noexcept -> void
2041         {
2042             *out = SampleConv<DevFmtType_t<T>>(s);
2043             out += FrameStep;
2044         };
2045         std::for_each(inbuf.begin(), inbuf.begin()+SamplesToDo, conv_sample);
2046         ++c;
2047     }
2048     if(const size_t extra{FrameStep - c})
2049     {
2050         const auto silence = SampleConv<DevFmtType_t<T>>(0.0f);
2051         for(size_t i{0};i < SamplesToDo;++i)
2052         {
2053             std::fill_n(outbase, extra, silence);
2054             outbase += FrameStep;
2055         }
2056     }
2057 }
2058
2059 } // namespace
2060
2061 uint DeviceBase::renderSamples(const uint numSamples)
2062 {
2063     const uint samplesToDo{minu(numSamples, BufferLineSize)};
2064
2065     /* Clear main mixing buffers. */
2066     for(FloatBufferLine &buffer : MixBuffer)
2067         buffer.fill(0.0f);
2068
2069     /* Increment the mix count at the start (lsb should now be 1). */
2070     IncrementRef(MixCount);
2071
2072     /* Process and mix each context's sources and effects. */
2073     ProcessContexts(this, samplesToDo);
2074
2075     /* Increment the clock time. Every second's worth of samples is converted
2076      * and added to clock base so that large sample counts don't overflow
2077      * during conversion. This also guarantees a stable conversion.
2078      */
2079     SamplesDone += samplesToDo;
2080     ClockBase += std::chrono::seconds{SamplesDone / Frequency};
2081     SamplesDone %= Frequency;
2082
2083     /* Increment the mix count at the end (lsb should now be 0). */
2084     IncrementRef(MixCount);
2085
2086     /* Apply any needed post-process for finalizing the Dry mix to the RealOut
2087      * (Ambisonic decode, UHJ encode, etc).
2088      */
2089     postProcess(samplesToDo);
2090
2091     /* Apply compression, limiting sample amplitude if needed or desired. */
2092     if(Limiter) Limiter->process(samplesToDo, RealOut.Buffer.data());
2093
2094     /* Apply delays and attenuation for mismatched speaker distances. */
2095     if(ChannelDelays)
2096         ApplyDistanceComp(RealOut.Buffer, samplesToDo, ChannelDelays->mChannels.data());
2097
2098     /* Apply dithering. The compressor should have left enough headroom for the
2099      * dither noise to not saturate.
2100      */
2101     if(DitherDepth > 0.0f)
2102         ApplyDither(RealOut.Buffer, &DitherSeed, DitherDepth, samplesToDo);
2103
2104     return samplesToDo;
2105 }
2106
2107 void DeviceBase::renderSamples(const al::span<float*> outBuffers, const uint numSamples)
2108 {
2109     FPUCtl mixer_mode{};
2110     uint total{0};
2111     while(const uint todo{numSamples - total})
2112     {
2113         const uint samplesToDo{renderSamples(todo)};
2114
2115         auto *srcbuf = RealOut.Buffer.data();
2116         for(auto *dstbuf : outBuffers)
2117         {
2118             std::copy_n(srcbuf->data(), samplesToDo, dstbuf + total);
2119             ++srcbuf;
2120         }
2121
2122         total += samplesToDo;
2123     }
2124 }
2125
2126 void DeviceBase::renderSamples(void *outBuffer, const uint numSamples, const size_t frameStep)
2127 {
2128     FPUCtl mixer_mode{};
2129     uint total{0};
2130     while(const uint todo{numSamples - total})
2131     {
2132         const uint samplesToDo{renderSamples(todo)};
2133
2134         if(outBuffer) [[likely]]
2135         {
2136             /* Finally, interleave and convert samples, writing to the device's
2137              * output buffer.
2138              */
2139             switch(FmtType)
2140             {
2141 #define HANDLE_WRITE(T) case T:                                               \
2142     Write<T>(RealOut.Buffer, outBuffer, total, samplesToDo, frameStep); break;
2143             HANDLE_WRITE(DevFmtByte)
2144             HANDLE_WRITE(DevFmtUByte)
2145             HANDLE_WRITE(DevFmtShort)
2146             HANDLE_WRITE(DevFmtUShort)
2147             HANDLE_WRITE(DevFmtInt)
2148             HANDLE_WRITE(DevFmtUInt)
2149             HANDLE_WRITE(DevFmtFloat)
2150 #undef HANDLE_WRITE
2151             }
2152         }
2153
2154         total += samplesToDo;
2155     }
2156 }
2157
2158 void DeviceBase::handleDisconnect(const char *msg, ...)
2159 {
2160     IncrementRef(MixCount);
2161     if(Connected.exchange(false, std::memory_order_acq_rel))
2162     {
2163         AsyncEvent evt{AsyncEvent::Disconnected};
2164
2165         va_list args;
2166         va_start(args, msg);
2167         int msglen{vsnprintf(evt.u.disconnect.msg, sizeof(evt.u.disconnect.msg), msg, args)};
2168         va_end(args);
2169
2170         if(msglen < 0 || static_cast<size_t>(msglen) >= sizeof(evt.u.disconnect.msg))
2171             evt.u.disconnect.msg[sizeof(evt.u.disconnect.msg)-1] = 0;
2172
2173         for(ContextBase *ctx : *mContexts.load())
2174         {
2175             if(ctx->mEnabledEvts.load(std::memory_order_acquire).test(AsyncEvent::Disconnected))
2176             {
2177                 RingBuffer *ring{ctx->mAsyncEvents.get()};
2178                 auto evt_data = ring->getWriteVector().first;
2179                 if(evt_data.len > 0)
2180                 {
2181                     al::construct_at(reinterpret_cast<AsyncEvent*>(evt_data.buf), evt);
2182                     ring->writeAdvance(1);
2183                     ctx->mEventSem.post();
2184                 }
2185             }
2186
2187             if(!ctx->mStopVoicesOnDisconnect)
2188             {
2189                 ProcessVoiceChanges(ctx);
2190                 continue;
2191             }
2192
2193             auto voicelist = ctx->getVoicesSpanAcquired();
2194             auto stop_voice = [](Voice *voice) -> void
2195             {
2196                 voice->mCurrentBuffer.store(nullptr, std::memory_order_relaxed);
2197                 voice->mLoopBuffer.store(nullptr, std::memory_order_relaxed);
2198                 voice->mSourceID.store(0u, std::memory_order_relaxed);
2199                 voice->mPlayState.store(Voice::Stopped, std::memory_order_release);
2200             };
2201             std::for_each(voicelist.begin(), voicelist.end(), stop_voice);
2202         }
2203     }
2204     IncrementRef(MixCount);
2205 }