Alc/ALu.c

   1 /**
   2  * OpenAL cross platform audio library
   3  * Copyright (C) 1999-2007 by authors.
   4  * This library is free software; you can redistribute it and/or
   5  *  modify it under the terms of the GNU Library General Public
   6  *  License as published by the Free Software Foundation; either
   7  *  version 2 of the License, or (at your option) any later version.
   8  *
   9  * This library is distributed in the hope that it will be useful,
  10  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  11  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  12  *  Library General Public License for more details.
  13  *
  14  * You should have received a copy of the GNU Library General Public
  15  *  License along with this library; if not, write to the
  16  *  Free Software Foundation, Inc.,
  17  *  51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
  18  * Or go to http://www.gnu.org/copyleft/lgpl.html
  19  */
  20
  21 #include "config.h"
  22
  23 #include <math.h>
  24 #include <stdlib.h>
  25 #include <string.h>
  26 #include <ctype.h>
  27 #include <assert.h>
  28
  29 #include "alMain.h"
  30 #include "alSource.h"
  31 #include "alBuffer.h"
  32 #include "alListener.h"
  33 #include "alAuxEffectSlot.h"
  34 #include "alu.h"
  35 #include "bs2b.h"
  36 #include "hrtf.h"
  37 #include "uhjfilter.h"
  38 #include "static_assert.h"
  39
  40 #include "mixer_defs.h"
  41
  42 #include "backends/base.h"
  43
  44
  45 struct ChanMap {
  46     enum Channel channel;
  47     ALfloat angle;
  48     ALfloat elevation;
  49 };
  50
  51 /* Cone scalar */
  52 ALfloat ConeScale = 1.0f;
  53
  54 /* Localized Z scalar for mono sources */
  55 ALfloat ZScale = 1.0f;
  56
  57 extern inline ALfloat minf(ALfloat a, ALfloat b);
  58 extern inline ALfloat maxf(ALfloat a, ALfloat b);
  59 extern inline ALfloat clampf(ALfloat val, ALfloat min, ALfloat max);
  60
  61 extern inline ALdouble mind(ALdouble a, ALdouble b);
  62 extern inline ALdouble maxd(ALdouble a, ALdouble b);
  63 extern inline ALdouble clampd(ALdouble val, ALdouble min, ALdouble max);
  64
  65 extern inline ALuint minu(ALuint a, ALuint b);
  66 extern inline ALuint maxu(ALuint a, ALuint b);
  67 extern inline ALuint clampu(ALuint val, ALuint min, ALuint max);
  68
  69 extern inline ALint mini(ALint a, ALint b);
  70 extern inline ALint maxi(ALint a, ALint b);
  71 extern inline ALint clampi(ALint val, ALint min, ALint max);
  72
  73 extern inline ALint64 mini64(ALint64 a, ALint64 b);
  74 extern inline ALint64 maxi64(ALint64 a, ALint64 b);
  75 extern inline ALint64 clampi64(ALint64 val, ALint64 min, ALint64 max);
  76
  77 extern inline ALuint64 minu64(ALuint64 a, ALuint64 b);
  78 extern inline ALuint64 maxu64(ALuint64 a, ALuint64 b);
  79 extern inline ALuint64 clampu64(ALuint64 val, ALuint64 min, ALuint64 max);
  80
  81 extern inline ALfloat lerp(ALfloat val1, ALfloat val2, ALfloat mu);
  82 extern inline ALfloat resample_fir4(ALfloat val0, ALfloat val1, ALfloat val2, ALfloat val3, ALuint frac);
  83 extern inline ALfloat resample_fir8(ALfloat val0, ALfloat val1, ALfloat val2, ALfloat val3, ALfloat val4, ALfloat val5, ALfloat val6, ALfloat val7, ALuint frac);
  84
  85 extern inline void aluVectorSet(aluVector *restrict vector, ALfloat x, ALfloat y, ALfloat z, ALfloat w);
  86
  87 extern inline void aluMatrixfSetRow(aluMatrixf *matrix, ALuint row,
  88                                     ALfloat m0, ALfloat m1, ALfloat m2, ALfloat m3);
  89 extern inline void aluMatrixfSet(aluMatrixf *matrix,
  90                                  ALfloat m00, ALfloat m01, ALfloat m02, ALfloat m03,
  91                                  ALfloat m10, ALfloat m11, ALfloat m12, ALfloat m13,
  92                                  ALfloat m20, ALfloat m21, ALfloat m22, ALfloat m23,
  93                                  ALfloat m30, ALfloat m31, ALfloat m32, ALfloat m33);
  94
  95 extern inline void aluMatrixdSetRow(aluMatrixd *matrix, ALuint row,
  96                                     ALdouble m0, ALdouble m1, ALdouble m2, ALdouble m3);
  97 extern inline void aluMatrixdSet(aluMatrixd *matrix,
  98                                  ALdouble m00, ALdouble m01, ALdouble m02, ALdouble m03,
  99                                  ALdouble m10, ALdouble m11, ALdouble m12, ALdouble m13,
 100                                  ALdouble m20, ALdouble m21, ALdouble m22, ALdouble m23,
 101                                  ALdouble m30, ALdouble m31, ALdouble m32, ALdouble m33);
 102
 103
/* NOTE: HRTF and UHJ are set up a bit special in the device. Normally the
 * device's DryBuffer, NumChannels, ChannelName, and Channel fields correspond
 * to the output format, and the DryBuffer is then converted and written to the
 * backend's audio buffer.
 *
 * With HRTF or UHJ, these fields correspond to a virtual format, and the
 * actual output is stored in DryBuffer[NumChannels] for the left channel and
 * DryBuffer[NumChannels+1] for the right. As a final output step,
 * the virtual channels will have HRTF filters or UHJ encoding applied and
 * written to the actual output.
 *
 * Sources that get mixed using HRTF directly (or that want to skip HRTF or UHJ
 * completely) need to bypass the virtual output and write to the actual
 * output channels instead. This is the reason you'll see
 *
 * voice->Direct.OutBuffer = Device->RealOut.Buffer;
 * voice->Direct.OutChannels = Device->RealOut.NumChannels;
 *
 * at various points in the code where HRTF is explicitly used or bypassed.
 */
 125
 126 static inline HrtfMixerFunc SelectHrtfMixer(void)
 127 {
 128 #ifdef HAVE_SSE
 129     if((CPUCapFlags&CPU_CAP_SSE))
 130         return MixHrtf_SSE;
 131 #endif
 132 #ifdef HAVE_NEON
 133     if((CPUCapFlags&CPU_CAP_NEON))
 134         return MixHrtf_Neon;
 135 #endif
 136
 137     return MixHrtf_C;
 138 }
 139
 140
 141 static inline void aluCrossproduct(const ALfloat *inVector1, const ALfloat *inVector2, ALfloat *outVector)
 142 {
 143     outVector[0] = inVector1[1]*inVector2[2] - inVector1[2]*inVector2[1];
 144     outVector[1] = inVector1[2]*inVector2[0] - inVector1[0]*inVector2[2];
 145     outVector[2] = inVector1[0]*inVector2[1] - inVector1[1]*inVector2[0];
 146 }
 147
 148 static inline ALfloat aluDotproduct(const aluVector *vec1, const aluVector *vec2)
 149 {
 150     return vec1->v[0]*vec2->v[0] + vec1->v[1]*vec2->v[1] + vec1->v[2]*vec2->v[2];
 151 }
 152
 153 static inline ALfloat aluNormalize(ALfloat *vec)
 154 {
 155     ALfloat length = sqrtf(vec[0]*vec[0] + vec[1]*vec[1] + vec[2]*vec[2]);
 156     if(length > 0.0f)
 157     {
 158         ALfloat inv_length = 1.0f/length;
 159         vec[0] *= inv_length;
 160         vec[1] *= inv_length;
 161         vec[2] *= inv_length;
 162     }
 163     return length;
 164 }
 165
 166
 167 static inline void aluCrossproductd(const ALdouble *inVector1, const ALdouble *inVector2, ALdouble *outVector)
 168 {
 169     outVector[0] = inVector1[1]*inVector2[2] - inVector1[2]*inVector2[1];
 170     outVector[1] = inVector1[2]*inVector2[0] - inVector1[0]*inVector2[2];
 171     outVector[2] = inVector1[0]*inVector2[1] - inVector1[1]*inVector2[0];
 172 }
 173
 174 static inline ALdouble aluNormalized(ALdouble *vec)
 175 {
 176     ALdouble length = sqrt(vec[0]*vec[0] + vec[1]*vec[1] + vec[2]*vec[2]);
 177     if(length > 0.0)
 178     {
 179         ALdouble inv_length = 1.0/length;
 180         vec[0] *= inv_length;
 181         vec[1] *= inv_length;
 182         vec[2] *= inv_length;
 183     }
 184     return length;
 185 }
 186
 187 static inline ALvoid aluMatrixdFloat3(ALfloat *vec, ALfloat w, const aluMatrixd *mtx)
 188 {
 189     ALdouble v[4] = { vec[0], vec[1], vec[2], w };
 190
 191     vec[0] = (ALfloat)(v[0]*mtx->m[0][0] + v[1]*mtx->m[1][0] + v[2]*mtx->m[2][0] + v[3]*mtx->m[3][0]);
 192     vec[1] = (ALfloat)(v[0]*mtx->m[0][1] + v[1]*mtx->m[1][1] + v[2]*mtx->m[2][1] + v[3]*mtx->m[3][1]);
 193     vec[2] = (ALfloat)(v[0]*mtx->m[0][2] + v[1]*mtx->m[1][2] + v[2]*mtx->m[2][2] + v[3]*mtx->m[3][2]);
 194 }
 195
 196 static inline ALvoid aluMatrixdDouble3(ALdouble *vec, ALdouble w, const aluMatrixd *mtx)
 197 {
 198     ALdouble v[4] = { vec[0], vec[1], vec[2], w };
 199
 200     vec[0] = v[0]*mtx->m[0][0] + v[1]*mtx->m[1][0] + v[2]*mtx->m[2][0] + v[3]*mtx->m[3][0];
 201     vec[1] = v[0]*mtx->m[0][1] + v[1]*mtx->m[1][1] + v[2]*mtx->m[2][1] + v[3]*mtx->m[3][1];
 202     vec[2] = v[0]*mtx->m[0][2] + v[1]*mtx->m[1][2] + v[2]*mtx->m[2][2] + v[3]*mtx->m[3][2];
 203 }
 204
 205 static inline aluVector aluMatrixdVector(const aluMatrixd *mtx, const aluVector *vec)
 206 {
 207     aluVector v;
 208     v.v[0] = (ALfloat)(vec->v[0]*mtx->m[0][0] + vec->v[1]*mtx->m[1][0] + vec->v[2]*mtx->m[2][0] + vec->v[3]*mtx->m[3][0]);
 209     v.v[1] = (ALfloat)(vec->v[0]*mtx->m[0][1] + vec->v[1]*mtx->m[1][1] + vec->v[2]*mtx->m[2][1] + vec->v[3]*mtx->m[3][1]);
 210     v.v[2] = (ALfloat)(vec->v[0]*mtx->m[0][2] + vec->v[1]*mtx->m[1][2] + vec->v[2]*mtx->m[2][2] + vec->v[3]*mtx->m[3][2]);
 211     v.v[3] = (ALfloat)(vec->v[0]*mtx->m[0][3] + vec->v[1]*mtx->m[1][3] + vec->v[2]*mtx->m[2][3] + vec->v[3]*mtx->m[3][3]);
 212     return v;
 213 }
 214
 215
 216 /* Prepares the interpolator for a given rate (determined by increment).  A
 217  * result of AL_FALSE indicates that the filter output will completely cut
 218  * the input signal.
 219  *
 220  * With a bit of work, and a trade of memory for CPU cost, this could be
 221  * modified for use with an interpolated increment for buttery-smooth pitch
 222  * changes.
 223  */
 224 static ALboolean BsincPrepare(const ALuint increment, BsincState *state)
 225 {
 226     static const ALfloat scaleBase = 1.510578918e-01f, scaleRange = 1.177936623e+00f;
 227     static const ALuint m[BSINC_SCALE_COUNT] = { 24, 24, 24, 24, 24, 24, 24, 20, 20, 20, 16, 16, 16, 12, 12, 12 };
 228     static const ALuint to[4][BSINC_SCALE_COUNT] =
 229     {
 230         { 0, 24, 408, 792, 1176, 1560, 1944, 2328, 2648, 2968, 3288, 3544, 3800, 4056, 4248, 4440 },
 231         { 4632, 5016, 5400, 5784, 6168, 6552, 6936, 7320, 7640, 7960, 8280, 8536, 8792, 9048, 9240, 0 },
 232         { 0, 9432, 9816, 10200, 10584, 10968, 11352, 11736, 12056, 12376, 12696, 12952, 13208, 13464, 13656, 13848 },
 233         { 14040, 14424, 14808, 15192, 15576, 15960, 16344, 16728, 17048, 17368, 17688, 17944, 18200, 18456, 18648, 0 }
 234     };
 235     static const ALuint tm[2][BSINC_SCALE_COUNT] =
 236     {
 237         { 0, 24, 24, 24, 24, 24, 24, 20, 20, 20, 16, 16, 16, 12, 12, 12 },
 238         { 24, 24, 24, 24, 24, 24, 24, 20, 20, 20, 16, 16, 16, 12, 12, 0 }
 239     };
 240     ALfloat sf;
 241     ALuint si, pi;
 242     ALboolean uncut = AL_TRUE;
 243
 244     if(increment > FRACTIONONE)
 245     {
 246         sf = (ALfloat)FRACTIONONE / increment;
 247         if(sf < scaleBase)
 248         {
 249             /* Signal has been completely cut.  The return result can be used
 250              * to skip the filter (and output zeros) as an optimization.
 251              */
 252             sf = 0.0f;
 253             si = 0;
 254             uncut = AL_FALSE;
 255         }
 256         else
 257         {
 258             sf = (BSINC_SCALE_COUNT - 1) * (sf - scaleBase) * scaleRange;
 259             si = fastf2u(sf);
 260             /* The interpolation factor is fit to this diagonally-symmetric
 261              * curve to reduce the transition ripple caused by interpolating
 262              * different scales of the sinc function.
 263              */
 264             sf = 1.0f - cosf(asinf(sf - si));
 265         }
 266     }
 267     else
 268     {
 269         sf = 0.0f;
 270         si = BSINC_SCALE_COUNT - 1;
 271     }
 272
 273     state->sf = sf;
 274     state->m = m[si];
 275     state->l = -(ALint)((m[si] / 2) - 1);
 276     /* The CPU cost of this table re-mapping could be traded for the memory
 277      * cost of a complete table map (1024 elements large).
 278      */
 279     for(pi = 0;pi < BSINC_PHASE_COUNT;pi++)
 280     {
 281         state->coeffs[pi].filter  = &bsincTab[to[0][si] + tm[0][si]*pi];
 282         state->coeffs[pi].scDelta = &bsincTab[to[1][si] + tm[1][si]*pi];
 283         state->coeffs[pi].phDelta = &bsincTab[to[2][si] + tm[0][si]*pi];
 284         state->coeffs[pi].spDelta = &bsincTab[to[3][si] + tm[1][si]*pi];
 285     }
 286     return uncut;
 287 }
 288
 289
 290 static ALvoid CalcListenerParams(ALlistener *Listener)
 291 {
 292     ALdouble N[3], V[3], U[3], P[3];
 293
 294     /* AT then UP */
 295     N[0] = Listener->Forward[0];
 296     N[1] = Listener->Forward[1];
 297     N[2] = Listener->Forward[2];
 298     aluNormalized(N);
 299     V[0] = Listener->Up[0];
 300     V[1] = Listener->Up[1];
 301     V[2] = Listener->Up[2];
 302     aluNormalized(V);
 303     /* Build and normalize right-vector */
 304     aluCrossproductd(N, V, U);
 305     aluNormalized(U);
 306
 307     aluMatrixdSet(&Listener->Params.Matrix,
 308         U[0], V[0], -N[0], 0.0,
 309         U[1], V[1], -N[1], 0.0,
 310         U[2], V[2], -N[2], 0.0,
 311          0.0,  0.0,   0.0, 1.0
 312     );
 313
 314     P[0] = Listener->Position.v[0];
 315     P[1] = Listener->Position.v[1];
 316     P[2] = Listener->Position.v[2];
 317     aluMatrixdDouble3(P, 1.0, &Listener->Params.Matrix);
 318     aluMatrixdSetRow(&Listener->Params.Matrix, 3, -P[0], -P[1], -P[2], 1.0f);
 319
 320     Listener->Params.Velocity = aluMatrixdVector(&Listener->Params.Matrix, &Listener->Velocity);
 321 }
 322
 323 ALvoid CalcNonAttnSourceParams(ALvoice *voice, const ALsource *ALSource, const ALCcontext *ALContext)
 324 {
 325     static const struct ChanMap MonoMap[1] = {
 326         { FrontCenter, 0.0f, 0.0f }
 327     }, StereoMap[2] = {
 328         { FrontLeft,  DEG2RAD(-30.0f), DEG2RAD(0.0f) },
 329         { FrontRight, DEG2RAD( 30.0f), DEG2RAD(0.0f) }
 330     }, RearMap[2] = {
 331         { BackLeft,  DEG2RAD(-150.0f), DEG2RAD(0.0f) },
 332         { BackRight, DEG2RAD( 150.0f), DEG2RAD(0.0f) }
 333     }, QuadMap[4] = {
 334         { FrontLeft,  DEG2RAD( -45.0f), DEG2RAD(0.0f) },
 335         { FrontRight, DEG2RAD(  45.0f), DEG2RAD(0.0f) },
 336         { BackLeft,   DEG2RAD(-135.0f), DEG2RAD(0.0f) },
 337         { BackRight,  DEG2RAD( 135.0f), DEG2RAD(0.0f) }
 338     }, X51Map[6] = {
 339         { FrontLeft,   DEG2RAD( -30.0f), DEG2RAD(0.0f) },
 340         { FrontRight,  DEG2RAD(  30.0f), DEG2RAD(0.0f) },
 341         { FrontCenter, DEG2RAD(   0.0f), DEG2RAD(0.0f) },
 342         { LFE, 0.0f, 0.0f },
 343         { SideLeft,    DEG2RAD(-110.0f), DEG2RAD(0.0f) },
 344         { SideRight,   DEG2RAD( 110.0f), DEG2RAD(0.0f) }
 345     }, X61Map[7] = {
 346         { FrontLeft,    DEG2RAD(-30.0f), DEG2RAD(0.0f) },
 347         { FrontRight,   DEG2RAD( 30.0f), DEG2RAD(0.0f) },
 348         { FrontCenter,  DEG2RAD(  0.0f), DEG2RAD(0.0f) },
 349         { LFE, 0.0f, 0.0f },
 350         { BackCenter,   DEG2RAD(180.0f), DEG2RAD(0.0f) },
 351         { SideLeft,     DEG2RAD(-90.0f), DEG2RAD(0.0f) },
 352         { SideRight,    DEG2RAD( 90.0f), DEG2RAD(0.0f) }
 353     }, X71Map[8] = {
 354         { FrontLeft,   DEG2RAD( -30.0f), DEG2RAD(0.0f) },
 355         { FrontRight,  DEG2RAD(  30.0f), DEG2RAD(0.0f) },
 356         { FrontCenter, DEG2RAD(   0.0f), DEG2RAD(0.0f) },
 357         { LFE, 0.0f, 0.0f },
 358         { BackLeft,    DEG2RAD(-150.0f), DEG2RAD(0.0f) },
 359         { BackRight,   DEG2RAD( 150.0f), DEG2RAD(0.0f) },
 360         { SideLeft,    DEG2RAD( -90.0f), DEG2RAD(0.0f) },
 361         { SideRight,   DEG2RAD(  90.0f), DEG2RAD(0.0f) }
 362     };
 363
 364     const ALCdevice *Device = ALContext->Device;
 365     ALfloat SourceVolume,ListenerGain,MinVolume,MaxVolume;
 366     ALbufferlistitem *BufferListItem;
 367     enum FmtChannels Channels;
 368     ALfloat DryGain, DryGainHF, DryGainLF;
 369     ALfloat WetGain[MAX_SENDS];
 370     ALfloat WetGainHF[MAX_SENDS];
 371     ALfloat WetGainLF[MAX_SENDS];
 372     ALeffectslot *SendSlots[MAX_SENDS];
 373     ALuint NumSends, Frequency;
 374     ALboolean Relative;
 375     const struct ChanMap *chans = NULL;
 376     ALuint num_channels = 0;
 377     ALboolean DirectChannels;
 378     ALboolean isbformat = AL_FALSE;
 379     ALfloat Pitch;
 380     ALuint i, j, c;
 381
 382     /* Get device properties */
 383     NumSends  = Device->NumAuxSends;
 384     Frequency = Device->Frequency;
 385
 386     /* Get listener properties */
 387     ListenerGain = ALContext->Listener->Gain;
 388
 389     /* Get source properties */
 390     SourceVolume    = ALSource->Gain;
 391     MinVolume       = ALSource->MinGain;
 392     MaxVolume       = ALSource->MaxGain;
 393     Pitch           = ALSource->Pitch;
 394     Relative        = ALSource->HeadRelative;
 395     DirectChannels  = ALSource->DirectChannels;
 396
 397     voice->Direct.OutBuffer = Device->DryBuffer;
 398     voice->Direct.OutChannels = Device->NumChannels;
 399     for(i = 0;i < NumSends;i++)
 400     {
 401         SendSlots[i] = ALSource->Send[i].Slot;
 402         if(!SendSlots[i] && i == 0)
 403             SendSlots[i] = Device->DefaultSlot;
 404         if(!SendSlots[i] || SendSlots[i]->EffectType == AL_EFFECT_NULL)
 405         {
 406             SendSlots[i] = NULL;
 407             voice->Send[i].OutBuffer = NULL;
 408             voice->Send[i].OutChannels = 0;
 409         }
 410         else
 411         {
 412             voice->Send[i].OutBuffer = SendSlots[i]->WetBuffer;
 413             voice->Send[i].OutChannels = SendSlots[i]->NumChannels;
 414         }
 415     }
 416
 417     /* Calculate the stepping value */
 418     Channels = FmtMono;
 419     BufferListItem = ATOMIC_LOAD(&ALSource->queue);
 420     while(BufferListItem != NULL)
 421     {
 422         ALbuffer *ALBuffer;
 423         if((ALBuffer=BufferListItem->buffer) != NULL)
 424         {
 425             Pitch = Pitch * ALBuffer->Frequency / Frequency;
 426             if(Pitch > (ALfloat)MAX_PITCH)
 427                 voice->Step = MAX_PITCH<<FRACTIONBITS;
 428             else
 429                 voice->Step = maxi(fastf2i(Pitch*FRACTIONONE + 0.5f), 1);
 430             BsincPrepare(voice->Step, &voice->SincState);
 431
 432             Channels = ALBuffer->FmtChannels;
 433             break;
 434         }
 435         BufferListItem = BufferListItem->next;
 436     }
 437
 438     /* Calculate gains */
 439     DryGain  = clampf(SourceVolume, MinVolume, MaxVolume);
 440     DryGain  *= ALSource->Direct.Gain * ListenerGain;
 441     DryGainHF = ALSource->Direct.GainHF;
 442     DryGainLF = ALSource->Direct.GainLF;
 443     for(i = 0;i < NumSends;i++)
 444     {
 445         WetGain[i] = clampf(SourceVolume, MinVolume, MaxVolume);
 446         WetGain[i]  *= ALSource->Send[i].Gain * ListenerGain;
 447         WetGainHF[i] = ALSource->Send[i].GainHF;
 448         WetGainLF[i] = ALSource->Send[i].GainLF;
 449     }
 450
 451     switch(Channels)
 452     {
 453     case FmtMono:
 454         chans = MonoMap;
 455         num_channels = 1;
 456         break;
 457
 458     case FmtStereo:
 459         chans = StereoMap;
 460         num_channels = 2;
 461         break;
 462
 463     case FmtRear:
 464         chans = RearMap;
 465         num_channels = 2;
 466         break;
 467
 468     case FmtQuad:
 469         chans = QuadMap;
 470         num_channels = 4;
 471         break;
 472
 473     case FmtX51:
 474         chans = X51Map;
 475         num_channels = 6;
 476         break;
 477
 478     case FmtX61:
 479         chans = X61Map;
 480         num_channels = 7;
 481         break;
 482
 483     case FmtX71:
 484         chans = X71Map;
 485         num_channels = 8;
 486         break;
 487
 488     case FmtBFormat2D:
 489         num_channels = 3;
 490         isbformat = AL_TRUE;
 491         DirectChannels = AL_FALSE;
 492         break;
 493
 494     case FmtBFormat3D:
 495         num_channels = 4;
 496         isbformat = AL_TRUE;
 497         DirectChannels = AL_FALSE;
 498         break;
 499     }
 500
 501     if(isbformat)
 502     {
 503         ALfloat N[3], V[3], U[3];
 504         aluMatrixf matrix;
 505         ALfloat scale;
 506
 507         /* AT then UP */
 508         N[0] = ALSource->Orientation[0][0];
 509         N[1] = ALSource->Orientation[0][1];
 510         N[2] = ALSource->Orientation[0][2];
 511         aluNormalize(N);
 512         V[0] = ALSource->Orientation[1][0];
 513         V[1] = ALSource->Orientation[1][1];
 514         V[2] = ALSource->Orientation[1][2];
 515         aluNormalize(V);
 516         if(!Relative)
 517         {
 518             const aluMatrixd *lmatrix = &ALContext->Listener->Params.Matrix;
 519             aluMatrixdFloat3(N, 0.0f, lmatrix);
 520             aluMatrixdFloat3(V, 0.0f, lmatrix);
 521         }
 522         /* Build and normalize right-vector */
 523         aluCrossproduct(N, V, U);
 524         aluNormalize(U);
 525
 526         /* Build a rotate + conversion matrix (B-Format -> N3D), and include
 527          * scaling for first-order content on second- or third-order output.
 528          */
 529         scale = Device->AmbiScale * 1.732050808f;
 530         aluMatrixfSet(&matrix,
 531             1.414213562f,        0.0f,        0.0f,        0.0f,
 532                     0.0f, -N[0]*scale,  N[1]*scale, -N[2]*scale,
 533                     0.0f,  U[0]*scale, -U[1]*scale,  U[2]*scale,
 534                     0.0f, -V[0]*scale,  V[1]*scale, -V[2]*scale
 535         );
 536
 537         for(c = 0;c < num_channels;c++)
 538             ComputeFirstOrderGains(Device->AmbiCoeffs, Device->NumChannels, matrix.m[c], DryGain,
 539                                    voice->Direct.Gains[c].Target);
 540
 541         /* Rebuild the matrix, without the second- or third-order output
 542          * scaling (effects take first-order content, and will do the scaling
 543          * themselves when mixing to the output).
 544          */
 545         scale = 1.732050808f;
 546         aluMatrixfSetRow(&matrix, 1, 0.0f, -N[0]*scale,  N[1]*scale, -N[2]*scale);
 547         aluMatrixfSetRow(&matrix, 2, 0.0f,  U[0]*scale, -U[1]*scale,  U[2]*scale);
 548         aluMatrixfSetRow(&matrix, 3, 0.0f, -V[0]*scale,  V[1]*scale, -V[2]*scale);
 549         for(i = 0;i < NumSends;i++)
 550         {
 551             if(!SendSlots[i])
 552             {
 553                 for(c = 0;c < num_channels;c++)
 554                 {
 555                     for(j = 0;j < MAX_EFFECT_CHANNELS;j++)
 556                         voice->Send[i].Gains[c].Target[j] = 0.0f;
 557                 }
 558             }
 559             else
 560             {
 561                 for(c = 0;c < num_channels;c++)
 562                 {
 563                     const ALeffectslot *Slot = SendSlots[i];
 564                     ComputeFirstOrderGains(Slot->AmbiCoeffs, Slot->NumChannels, matrix.m[c],
 565                                            WetGain[i], voice->Send[i].Gains[c].Target);
 566                 }
 567             }
 568         }
 569
 570         voice->IsHrtf = AL_FALSE;
 571     }
 572     else
 573     {
 574         ALfloat coeffs[MAX_AMBI_COEFFS];
 575
 576         if(DirectChannels)
 577         {
 578             if(Device->Hrtf || Device->Uhj_Encoder)
 579             {
 580                 /* DirectChannels with HRTF or UHJ enabled. Skip the virtual
 581                  * channels and write FrontLeft and FrontRight inputs to the
 582                  * first and second outputs.
 583                  */
 584                 voice->Direct.OutBuffer = Device->RealOut.Buffer;
 585                 voice->Direct.OutChannels = Device->RealOut.NumChannels;
 586                 for(c = 0;c < num_channels;c++)
 587                 {
 588                     for(j = 0;j < MAX_OUTPUT_CHANNELS;j++)
 589                         voice->Direct.Gains[c].Target[j] = 0.0f;
 590
 591                     if(chans[c].channel == FrontLeft)
 592                         voice->Direct.Gains[c].Target[0] = DryGain;
 593                     else if(chans[c].channel == FrontRight)
 594                         voice->Direct.Gains[c].Target[1] = DryGain;
 595                 }
 596             }
 597             else for(c = 0;c < num_channels;c++)
 598             {
 599                 int idx;
 600                 for(j = 0;j < MAX_OUTPUT_CHANNELS;j++)
 601                     voice->Direct.Gains[c].Target[j] = 0.0f;
 602                 if((idx=GetChannelIdxByName(Device, chans[c].channel)) != -1)
 603                     voice->Direct.Gains[c].Target[idx] = DryGain;
 604             }
 605
 606             /* Auxiliary sends still use normal panning since they mix to B-Format, which can't
 607              * channel-match. */
 608             for(c = 0;c < num_channels;c++)
 609             {
 610                 CalcAngleCoeffs(chans[c].angle, chans[c].elevation, coeffs);
 611
 612                 for(i = 0;i < NumSends;i++)
 613                 {
 614                     if(!SendSlots[i])
 615                     {
 616                         for(j = 0;j < MAX_EFFECT_CHANNELS;j++)
 617                             voice->Send[i].Gains[c].Target[j] = 0.0f;
 618                     }
 619                     else
 620                     {
 621                         const ALeffectslot *Slot = SendSlots[i];
 622                         ComputePanningGains(Slot->AmbiCoeffs, Slot->NumChannels, coeffs,
 623                                             WetGain[i], voice->Send[i].Gains[c].Target);
 624                     }
 625                 }
 626             }
 627
 628             voice->IsHrtf = AL_FALSE;
 629         }
 630         else if(Device->Render_Mode == HrtfRender)
 631         {
 632             /* Full HRTF rendering. Skip the virtual channels and render each
 633              * input channel to the real outputs.
 634              */
 635             voice->Direct.OutBuffer = Device->RealOut.Buffer;
 636             voice->Direct.OutChannels = Device->RealOut.NumChannels;
 637             for(c = 0;c < num_channels;c++)
 638             {
 639                 if(chans[c].channel == LFE)
 640                 {
 641                     /* Skip LFE */
 642                     voice->Direct.Hrtf[c].Target.Delay[0] = 0;
 643                     voice->Direct.Hrtf[c].Target.Delay[1] = 0;
 644                     for(i = 0;i < HRIR_LENGTH;i++)
 645                     {
 646                         voice->Direct.Hrtf[c].Target.Coeffs[i][0] = 0.0f;
 647                         voice->Direct.Hrtf[c].Target.Coeffs[i][1] = 0.0f;
 648                     }
 649
 650                     for(i = 0;i < NumSends;i++)
 651                     {
 652                         for(j = 0;j < MAX_EFFECT_CHANNELS;j++)
 653                             voice->Send[i].Gains[c].Target[j] = 0.0f;
 654                     }
 655
 656                     continue;
 657                 }
 658
 659                 /* Get the static HRIR coefficients and delays for this channel. */
 660                 GetLerpedHrtfCoeffs(Device->Hrtf,
 661                     chans[c].elevation, chans[c].angle, 1.0f, DryGain,
 662                     voice->Direct.Hrtf[c].Target.Coeffs,
 663                     voice->Direct.Hrtf[c].Target.Delay
 664                 );
 665
 666                 /* Normal panning for auxiliary sends. */
 667                 CalcAngleCoeffs(chans[c].angle, chans[c].elevation, coeffs);
 668
 669                 for(i = 0;i < NumSends;i++)
 670                 {
 671                     if(!SendSlots[i])
 672                     {
 673                         for(j = 0;j < MAX_EFFECT_CHANNELS;j++)
 674                             voice->Send[i].Gains[c].Target[j] = 0.0f;
 675                     }
 676                     else
 677                     {
 678                         const ALeffectslot *Slot = SendSlots[i];
 679                         ComputePanningGains(Slot->AmbiCoeffs, Slot->NumChannels, coeffs,
 680                                             WetGain[i], voice->Send[i].Gains[c].Target);
 681                     }
 682                 }
 683             }
 684
 685             voice->IsHrtf = AL_TRUE;
 686         }
 687         else
 688         {
 689             /* Non-HRTF rendering. Use normal panning to the output. */
 690             for(c = 0;c < num_channels;c++)
 691             {
 692                 /* Special-case LFE */
 693                 if(chans[c].channel == LFE)
 694                 {
 695                     int idx;
 696                     for(j = 0;j < MAX_OUTPUT_CHANNELS;j++)
 697                         voice->Direct.Gains[c].Target[j] = 0.0f;
 698                     if((idx=GetChannelIdxByName(Device, chans[c].channel)) != -1)
 699                         voice->Direct.Gains[c].Target[idx] = DryGain;
 700
 701                     for(i = 0;i < NumSends;i++)
 702                     {
 703                         ALuint j;
 704                         for(j = 0;j < MAX_EFFECT_CHANNELS;j++)
 705                             voice->Send[i].Gains[c].Target[j] = 0.0f;
 706                     }
 707                     continue;
 708                 }
 709
 710                 if(Device->Render_Mode == StereoPair)
 711                 {
 712                     /* Clamp X so it remains within 30 degrees of 0 or 180 degree azimuth. */
 713                     ALfloat x = sinf(chans[c].angle) * cosf(chans[c].elevation);
 714                     coeffs[0] = clampf(-x, -0.5f, 0.5f) + 0.5;
 715                     voice->Direct.Gains[c].Target[0] = coeffs[0] * DryGain;
 716                     voice->Direct.Gains[c].Target[1] = (1.0f-coeffs[0]) * DryGain;
 717                     for(j = 2;j < MAX_OUTPUT_CHANNELS;j++)
 718                         voice->Direct.Gains[c].Target[j] = 0.0f;
 719
 720                     CalcAngleCoeffs(chans[c].angle, chans[c].elevation, coeffs);
 721                 }
 722                 else
 723                 {
 724                     CalcAngleCoeffs(chans[c].angle, chans[c].elevation, coeffs);
 725                     ComputePanningGains(Device->AmbiCoeffs, Device->NumChannels, coeffs, DryGain,
 726                                         voice->Direct.Gains[c].Target);
 727                 }
 728
 729                 for(i = 0;i < NumSends;i++)
 730                 {
 731                     if(!SendSlots[i])
 732                     {
 733                         ALuint j;
 734                         for(j = 0;j < MAX_EFFECT_CHANNELS;j++)
 735                             voice->Send[i].Gains[c].Target[j] = 0.0f;
 736                     }
 737                     else
 738                     {
 739                         const ALeffectslot *Slot = SendSlots[i];
 740                         ComputePanningGains(Slot->AmbiCoeffs, Slot->NumChannels, coeffs,
 741                                             WetGain[i], voice->Send[i].Gains[c].Target);
 742                     }
 743                 }
 744             }
 745
 746             voice->IsHrtf = AL_FALSE;
 747         }
 748     }
 749
 750     {
 751         ALfloat hfscale = ALSource->Direct.HFReference / Frequency;
 752         ALfloat lfscale = ALSource->Direct.LFReference / Frequency;
 753         DryGainHF = maxf(DryGainHF, 0.0001f);
 754         DryGainLF = maxf(DryGainLF, 0.0001f);
 755         for(c = 0;c < num_channels;c++)
 756         {
 757             voice->Direct.Filters[c].ActiveType = AF_None;
 758             if(DryGainHF != 1.0f) voice->Direct.Filters[c].ActiveType |= AF_LowPass;
 759             if(DryGainLF != 1.0f) voice->Direct.Filters[c].ActiveType |= AF_HighPass;
 760             ALfilterState_setParams(
 761                 &voice->Direct.Filters[c].LowPass, ALfilterType_HighShelf,
 762                 DryGainHF, hfscale, calc_rcpQ_from_slope(DryGainHF, 0.75f)
 763             );
 764             ALfilterState_setParams(
 765                 &voice->Direct.Filters[c].HighPass, ALfilterType_LowShelf,
 766                 DryGainLF, lfscale, calc_rcpQ_from_slope(DryGainLF, 0.75f)
 767             );
 768         }
 769     }
 770     for(i = 0;i < NumSends;i++)
 771     {
 772         ALfloat hfscale = ALSource->Send[i].HFReference / Frequency;
 773         ALfloat lfscale = ALSource->Send[i].LFReference / Frequency;
 774         WetGainHF[i] = maxf(WetGainHF[i], 0.0001f);
 775         WetGainLF[i] = maxf(WetGainLF[i], 0.0001f);
 776         for(c = 0;c < num_channels;c++)
 777         {
 778             voice->Send[i].Filters[c].ActiveType = AF_None;
 779             if(WetGainHF[i] != 1.0f) voice->Send[i].Filters[c].ActiveType |= AF_LowPass;
 780             if(WetGainLF[i] != 1.0f) voice->Send[i].Filters[c].ActiveType |= AF_HighPass;
 781             ALfilterState_setParams(
 782                 &voice->Send[i].Filters[c].LowPass, ALfilterType_HighShelf,
 783                 WetGainHF[i], hfscale, calc_rcpQ_from_slope(WetGainHF[i], 0.75f)
 784             );
 785             ALfilterState_setParams(
 786                 &voice->Send[i].Filters[c].HighPass, ALfilterType_LowShelf,
 787                 WetGainLF[i], lfscale, calc_rcpQ_from_slope(WetGainLF[i], 0.75f)
 788             );
 789         }
 790     }
 791 }
 792
 793 ALvoid CalcSourceParams(ALvoice *voice, const ALsource *ALSource, const ALCcontext *ALContext)
 794 {
 795     const ALCdevice *Device = ALContext->Device;
 796     aluVector Position, Velocity, Direction, SourceToListener;
 797     ALfloat InnerAngle,OuterAngle,Angle,Distance,ClampedDist;
 798     ALfloat MinVolume,MaxVolume,MinDist,MaxDist,Rolloff;
 799     ALfloat ConeVolume,ConeHF,SourceVolume,ListenerGain;
 800     ALfloat DopplerFactor, SpeedOfSound;
 801     ALfloat AirAbsorptionFactor;
 802     ALfloat RoomAirAbsorption[MAX_SENDS];
 803     ALbufferlistitem *BufferListItem;
 804     ALeffectslot *SendSlots[MAX_SENDS];
 805     ALfloat Attenuation;
 806     ALfloat RoomAttenuation[MAX_SENDS];
 807     ALfloat MetersPerUnit;
 808     ALfloat RoomRolloffBase;
 809     ALfloat RoomRolloff[MAX_SENDS];
 810     ALfloat DecayDistance[MAX_SENDS];
 811     ALfloat DryGain;
 812     ALfloat DryGainHF;
 813     ALfloat DryGainLF;
 814     ALboolean DryGainHFAuto;
 815     ALfloat WetGain[MAX_SENDS];
 816     ALfloat WetGainHF[MAX_SENDS];
 817     ALfloat WetGainLF[MAX_SENDS];
 818     ALboolean WetGainAuto;
 819     ALboolean WetGainHFAuto;
 820     ALfloat Pitch;
 821     ALuint Frequency;
 822     ALint NumSends;
 823     ALint i;
 824
 825     DryGainHF = 1.0f;
 826     DryGainLF = 1.0f;
 827     for(i = 0;i < MAX_SENDS;i++)
 828     {
 829         WetGainHF[i] = 1.0f;
 830         WetGainLF[i] = 1.0f;
 831     }
 832
 833     /* Get context/device properties */
 834     DopplerFactor = ALContext->DopplerFactor * ALSource->DopplerFactor;
 835     SpeedOfSound  = ALContext->SpeedOfSound * ALContext->DopplerVelocity;
 836     NumSends      = Device->NumAuxSends;
 837     Frequency     = Device->Frequency;
 838
 839     /* Get listener properties */
 840     ListenerGain  = ALContext->Listener->Gain;
 841     MetersPerUnit = ALContext->Listener->MetersPerUnit;
 842
 843     /* Get source properties */
 844     SourceVolume   = ALSource->Gain;
 845     MinVolume      = ALSource->MinGain;
 846     MaxVolume      = ALSource->MaxGain;
 847     Pitch          = ALSource->Pitch;
 848     Position       = ALSource->Position;
 849     Direction      = ALSource->Direction;
 850     Velocity       = ALSource->Velocity;
 851     MinDist        = ALSource->RefDistance;
 852     MaxDist        = ALSource->MaxDistance;
 853     Rolloff        = ALSource->RollOffFactor;
 854     InnerAngle     = ALSource->InnerAngle;
 855     OuterAngle     = ALSource->OuterAngle;
 856     AirAbsorptionFactor = ALSource->AirAbsorptionFactor;
 857     DryGainHFAuto   = ALSource->DryGainHFAuto;
 858     WetGainAuto     = ALSource->WetGainAuto;
 859     WetGainHFAuto   = ALSource->WetGainHFAuto;
 860     RoomRolloffBase = ALSource->RoomRolloffFactor;
 861
 862     voice->Direct.OutBuffer = Device->DryBuffer;
 863     voice->Direct.OutChannels = Device->NumChannels;
 864     for(i = 0;i < NumSends;i++)
 865     {
 866         SendSlots[i] = ALSource->Send[i].Slot;
 867
 868         if(!SendSlots[i] && i == 0)
 869             SendSlots[i] = Device->DefaultSlot;
 870         if(!SendSlots[i] || SendSlots[i]->EffectType == AL_EFFECT_NULL)
 871         {
 872             SendSlots[i] = NULL;
 873             RoomRolloff[i] = 0.0f;
 874             DecayDistance[i] = 0.0f;
 875             RoomAirAbsorption[i] = 1.0f;
 876         }
 877         else if(SendSlots[i]->AuxSendAuto)
 878         {
 879             RoomRolloff[i] = RoomRolloffBase;
 880             if(IsReverbEffect(SendSlots[i]->EffectType))
 881             {
 882                 RoomRolloff[i] += SendSlots[i]->EffectProps.Reverb.RoomRolloffFactor;
 883                 DecayDistance[i] = SendSlots[i]->EffectProps.Reverb.DecayTime *
 884                                    SPEEDOFSOUNDMETRESPERSEC;
 885                 RoomAirAbsorption[i] = SendSlots[i]->EffectProps.Reverb.AirAbsorptionGainHF;
 886             }
 887             else
 888             {
 889                 DecayDistance[i] = 0.0f;
 890                 RoomAirAbsorption[i] = 1.0f;
 891             }
 892         }
 893         else
 894         {
 895             /* If the slot's auxiliary send auto is off, the data sent to the
 896              * effect slot is the same as the dry path, sans filter effects */
 897             RoomRolloff[i] = Rolloff;
 898             DecayDistance[i] = 0.0f;
 899             RoomAirAbsorption[i] = AIRABSORBGAINHF;
 900         }
 901
 902         if(!SendSlots[i])
 903         {
 904             voice->Send[i].OutBuffer = NULL;
 905             voice->Send[i].OutChannels = 0;
 906         }
 907         else
 908         {
 909             voice->Send[i].OutBuffer = SendSlots[i]->WetBuffer;
 910             voice->Send[i].OutChannels = SendSlots[i]->NumChannels;
 911         }
 912     }
 913
 914     /* Transform source to listener space (convert to head relative) */
 915     if(ALSource->HeadRelative == AL_FALSE)
 916     {
 917         const aluMatrixd *Matrix = &ALContext->Listener->Params.Matrix;
 918         /* Transform source vectors */
 919         Position = aluMatrixdVector(Matrix, &Position);
 920         Velocity = aluMatrixdVector(Matrix, &Velocity);
 921         Direction = aluMatrixdVector(Matrix, &Direction);
 922     }
 923     else
 924     {
 925         const aluVector *lvelocity = &ALContext->Listener->Params.Velocity;
 926         /* Offset the source velocity to be relative of the listener velocity */
 927         Velocity.v[0] += lvelocity->v[0];
 928         Velocity.v[1] += lvelocity->v[1];
 929         Velocity.v[2] += lvelocity->v[2];
 930     }
 931
 932     aluNormalize(Direction.v);
 933     SourceToListener.v[0] = -Position.v[0];
 934     SourceToListener.v[1] = -Position.v[1];
 935     SourceToListener.v[2] = -Position.v[2];
 936     SourceToListener.v[3] = 0.0f;
 937     Distance = aluNormalize(SourceToListener.v);
 938
 939     /* Calculate distance attenuation */
 940     ClampedDist = Distance;
 941
 942     Attenuation = 1.0f;
 943     for(i = 0;i < NumSends;i++)
 944         RoomAttenuation[i] = 1.0f;
 945     switch(ALContext->SourceDistanceModel ? ALSource->DistanceModel :
 946                                             ALContext->DistanceModel)
 947     {
 948         case InverseDistanceClamped:
 949             ClampedDist = clampf(ClampedDist, MinDist, MaxDist);
 950             if(MaxDist < MinDist)
 951                 break;
 952             /*fall-through*/
 953         case InverseDistance:
 954             if(MinDist > 0.0f)
 955             {
 956                 ALfloat dist = lerp(MinDist, ClampedDist, Rolloff);
 957                 if(dist > 0.0f) Attenuation = MinDist / dist;
 958                 for(i = 0;i < NumSends;i++)
 959                 {
 960                     dist = lerp(MinDist, ClampedDist, RoomRolloff[i]);
 961                     if(dist > 0.0f) RoomAttenuation[i] = MinDist / dist;
 962                 }
 963             }
 964             break;
 965
 966         case LinearDistanceClamped:
 967             ClampedDist = clampf(ClampedDist, MinDist, MaxDist);
 968             if(MaxDist < MinDist)
 969                 break;
 970             /*fall-through*/
 971         case LinearDistance:
 972             if(MaxDist != MinDist)
 973             {
 974                 Attenuation = 1.0f - (Rolloff*(ClampedDist-MinDist)/(MaxDist - MinDist));
 975                 Attenuation = maxf(Attenuation, 0.0f);
 976                 for(i = 0;i < NumSends;i++)
 977                 {
 978                     RoomAttenuation[i] = 1.0f - (RoomRolloff[i]*(ClampedDist-MinDist)/(MaxDist - MinDist));
 979                     RoomAttenuation[i] = maxf(RoomAttenuation[i], 0.0f);
 980                 }
 981             }
 982             break;
 983
 984         case ExponentDistanceClamped:
 985             ClampedDist = clampf(ClampedDist, MinDist, MaxDist);
 986             if(MaxDist < MinDist)
 987                 break;
 988             /*fall-through*/
 989         case ExponentDistance:
 990             if(ClampedDist > 0.0f && MinDist > 0.0f)
 991             {
 992                 Attenuation = powf(ClampedDist/MinDist, -Rolloff);
 993                 for(i = 0;i < NumSends;i++)
 994                     RoomAttenuation[i] = powf(ClampedDist/MinDist, -RoomRolloff[i]);
 995             }
 996             break;
 997
 998         case DisableDistance:
 999             ClampedDist = MinDist;
1000             break;
1001     }
1002
1003     /* Source Gain + Attenuation */
1004     DryGain = SourceVolume * Attenuation;
1005     for(i = 0;i < NumSends;i++)
1006         WetGain[i] = SourceVolume * RoomAttenuation[i];
1007
1008     /* Distance-based air absorption */
1009     if(AirAbsorptionFactor > 0.0f && ClampedDist > MinDist)
1010     {
1011         ALfloat meters = (ClampedDist-MinDist) * MetersPerUnit;
1012         DryGainHF *= powf(AIRABSORBGAINHF, AirAbsorptionFactor*meters);
1013         for(i = 0;i < NumSends;i++)
1014             WetGainHF[i] *= powf(RoomAirAbsorption[i], AirAbsorptionFactor*meters);
1015     }
1016
1017     if(WetGainAuto)
1018     {
1019         ALfloat ApparentDist = 1.0f/maxf(Attenuation, 0.00001f) - 1.0f;
1020
1021         /* Apply a decay-time transformation to the wet path, based on the
1022          * attenuation of the dry path.
1023          *
1024          * Using the apparent distance, based on the distance attenuation, the
1025          * initial decay of the reverb effect is calculated and applied to the
1026          * wet path.
1027          */
1028         for(i = 0;i < NumSends;i++)
1029         {
1030             if(DecayDistance[i] > 0.0f)
1031                 WetGain[i] *= powf(0.001f/*-60dB*/, ApparentDist/DecayDistance[i]);
1032         }
1033     }
1034
1035     /* Calculate directional soundcones */
1036     Angle = RAD2DEG(acosf(aluDotproduct(&Direction, &SourceToListener)) * ConeScale) * 2.0f;
1037     if(Angle > InnerAngle && Angle <= OuterAngle)
1038     {
1039         ALfloat scale = (Angle-InnerAngle) / (OuterAngle-InnerAngle);
1040         ConeVolume = lerp(1.0f, ALSource->OuterGain, scale);
1041         ConeHF = lerp(1.0f, ALSource->OuterGainHF, scale);
1042     }
1043     else if(Angle > OuterAngle)
1044     {
1045         ConeVolume = ALSource->OuterGain;
1046         ConeHF = ALSource->OuterGainHF;
1047     }
1048     else
1049     {
1050         ConeVolume = 1.0f;
1051         ConeHF = 1.0f;
1052     }
1053
1054     DryGain *= ConeVolume;
1055     if(WetGainAuto)
1056     {
1057         for(i = 0;i < NumSends;i++)
1058             WetGain[i] *= ConeVolume;
1059     }
1060     if(DryGainHFAuto)
1061         DryGainHF *= ConeHF;
1062     if(WetGainHFAuto)
1063     {
1064         for(i = 0;i < NumSends;i++)
1065             WetGainHF[i] *= ConeHF;
1066     }
1067
1068     /* Clamp to Min/Max Gain */
1069     DryGain = clampf(DryGain, MinVolume, MaxVolume);
1070     for(i = 0;i < NumSends;i++)
1071         WetGain[i] = clampf(WetGain[i], MinVolume, MaxVolume);
1072
1073     /* Apply gain and frequency filters */
1074     DryGain   *= ALSource->Direct.Gain * ListenerGain;
1075     DryGainHF *= ALSource->Direct.GainHF;
1076     DryGainLF *= ALSource->Direct.GainLF;
1077     for(i = 0;i < NumSends;i++)
1078     {
1079         WetGain[i]   *= ALSource->Send[i].Gain * ListenerGain;
1080         WetGainHF[i] *= ALSource->Send[i].GainHF;
1081         WetGainLF[i] *= ALSource->Send[i].GainLF;
1082     }
1083
1084     /* Calculate velocity-based doppler effect */
1085     if(DopplerFactor > 0.0f)
1086     {
1087         const aluVector *lvelocity = &ALContext->Listener->Params.Velocity;
1088         ALfloat VSS, VLS;
1089
1090         if(SpeedOfSound < 1.0f)
1091         {
1092             DopplerFactor *= 1.0f/SpeedOfSound;
1093             SpeedOfSound   = 1.0f;
1094         }
1095
1096         VSS = aluDotproduct(&Velocity, &SourceToListener) * DopplerFactor;
1097         VLS = aluDotproduct(lvelocity, &SourceToListener) * DopplerFactor;
1098
1099         Pitch *= clampf(SpeedOfSound-VLS, 1.0f, SpeedOfSound*2.0f - 1.0f) /
1100                  clampf(SpeedOfSound-VSS, 1.0f, SpeedOfSound*2.0f - 1.0f);
1101     }
1102
1103     BufferListItem = ATOMIC_LOAD(&ALSource->queue);
1104     while(BufferListItem != NULL)
1105     {
1106         ALbuffer *ALBuffer;
1107         if((ALBuffer=BufferListItem->buffer) != NULL)
1108         {
1109             /* Calculate fixed-point stepping value, based on the pitch, buffer
1110              * frequency, and output frequency. */
1111             Pitch = Pitch * ALBuffer->Frequency / Frequency;
1112             if(Pitch > (ALfloat)MAX_PITCH)
1113                 voice->Step = MAX_PITCH<<FRACTIONBITS;
1114             else
1115                 voice->Step = maxi(fastf2i(Pitch*FRACTIONONE + 0.5f), 1);
1116             BsincPrepare(voice->Step, &voice->SincState);
1117
1118             break;
1119         }
1120         BufferListItem = BufferListItem->next;
1121     }
1122
1123     if(Device->Render_Mode == HrtfRender)
1124     {
1125         /* Full HRTF rendering. Skip the virtual channels and render to the
1126          * real outputs.
1127          */
1128         aluVector dir = {{ 0.0f, 0.0f, -1.0f, 0.0f }};
1129         ALfloat ev = 0.0f, az = 0.0f;
1130         ALfloat radius = ALSource->Radius;
1131         ALfloat dirfact = 1.0f;
1132         ALfloat coeffs[MAX_AMBI_COEFFS];
1133
1134         voice->Direct.OutBuffer = Device->RealOut.Buffer;
1135         voice->Direct.OutChannels = Device->RealOut.NumChannels;
1136
1137         if(Distance > FLT_EPSILON)
1138         {
1139             dir.v[0] = -SourceToListener.v[0];
1140             dir.v[1] = -SourceToListener.v[1];
1141             dir.v[2] = -SourceToListener.v[2] * ZScale;
1142
1143             /* Calculate elevation and azimuth only when the source is not at
1144              * the listener. This prevents +0 and -0 Z from producing
1145              * inconsistent panning. Also, clamp Y in case FP precision errors
1146              * cause it to land outside of -1..+1. */
1147             ev = asinf(clampf(dir.v[1], -1.0f, 1.0f));
1148             az = atan2f(dir.v[0], -dir.v[2]);
1149         }
1150         if(radius > 0.0f)
1151         {
1152             if(radius >= Distance)
1153                 dirfact *= Distance / radius * 0.5f;
1154             else
1155                 dirfact *= 1.0f - (asinf(radius / Distance) / F_PI);
1156         }
1157
1158         /* Get the HRIR coefficients and delays. */
1159         GetLerpedHrtfCoeffs(Device->Hrtf, ev, az, dirfact, DryGain,
1160                             voice->Direct.Hrtf[0].Target.Coeffs,
1161                             voice->Direct.Hrtf[0].Target.Delay);
1162
1163         dir.v[0] *= dirfact;
1164         dir.v[1] *= dirfact;
1165         dir.v[2] *= dirfact;
1166         CalcDirectionCoeffs(dir.v, coeffs);
1167
1168         for(i = 0;i < NumSends;i++)
1169         {
1170             if(!SendSlots[i])
1171             {
1172                 ALuint j;
1173                 for(j = 0;j < MAX_EFFECT_CHANNELS;j++)
1174                     voice->Send[i].Gains[0].Target[j] = 0.0f;
1175             }
1176             else
1177             {
1178                 const ALeffectslot *Slot = SendSlots[i];
1179                 ComputePanningGains(Slot->AmbiCoeffs, Slot->NumChannels, coeffs,
1180                                     WetGain[i], voice->Send[i].Gains[0].Target);
1181             }
1182         }
1183
1184         voice->IsHrtf = AL_TRUE;
1185     }
1186     else
1187     {
1188         /* Non-HRTF rendering. */
1189         ALfloat dir[3] = { 0.0f, 0.0f, -1.0f };
1190         ALfloat radius = ALSource->Radius;
1191         ALfloat coeffs[MAX_AMBI_COEFFS];
1192
1193         /* Get the localized direction, and compute panned gains. */
1194         if(Distance > FLT_EPSILON)
1195         {
1196             dir[0] = -SourceToListener.v[0];
1197             dir[1] = -SourceToListener.v[1];
1198             dir[2] = -SourceToListener.v[2] * ZScale;
1199         }
1200         if(radius > 0.0f)
1201         {
1202             ALfloat dirfact;
1203             if(radius >= Distance)
1204                 dirfact = Distance / radius * 0.5f;
1205             else
1206                 dirfact = 1.0f - (asinf(radius / Distance) / F_PI);
1207             dir[0] *= dirfact;
1208             dir[1] *= dirfact;
1209             dir[2] *= dirfact;
1210         }
1211
1212         if(Device->Render_Mode == StereoPair)
1213         {
1214             /* Clamp X so it remains within 30 degrees of 0 or 180 degree azimuth. */
1215             coeffs[0] = clampf(-dir[0], -0.5f, 0.5f) + 0.5;
1216             voice->Direct.Gains[0].Target[0] = coeffs[0] * DryGain;
1217             voice->Direct.Gains[0].Target[1] = (1.0f-coeffs[0]) * DryGain;
1218             for(i = 2;i < MAX_OUTPUT_CHANNELS;i++)
1219                 voice->Direct.Gains[0].Target[i] = 0.0f;
1220
1221             CalcDirectionCoeffs(dir, coeffs);
1222         }
1223         else
1224         {
1225             CalcDirectionCoeffs(dir, coeffs);
1226             ComputePanningGains(Device->AmbiCoeffs, Device->NumChannels, coeffs, DryGain,
1227                                 voice->Direct.Gains[0].Target);
1228         }
1229
1230         for(i = 0;i < NumSends;i++)
1231         {
1232             if(!SendSlots[i])
1233             {
1234                 ALuint j;
1235                 for(j = 0;j < MAX_EFFECT_CHANNELS;j++)
1236                     voice->Send[i].Gains[0].Target[j] = 0.0f;
1237             }
1238             else
1239             {
1240                 const ALeffectslot *Slot = SendSlots[i];
1241                 ComputePanningGains(Slot->AmbiCoeffs, Slot->NumChannels, coeffs,
1242                                     WetGain[i], voice->Send[i].Gains[0].Target);
1243             }
1244         }
1245
1246         voice->IsHrtf = AL_FALSE;
1247     }
1248
1249     {
1250         ALfloat hfscale = ALSource->Direct.HFReference / Frequency;
1251         ALfloat lfscale = ALSource->Direct.LFReference / Frequency;
1252         DryGainHF = maxf(DryGainHF, 0.0001f);
1253         DryGainLF = maxf(DryGainLF, 0.0001f);
1254         voice->Direct.Filters[0].ActiveType = AF_None;
1255         if(DryGainHF != 1.0f) voice->Direct.Filters[0].ActiveType |= AF_LowPass;
1256         if(DryGainLF != 1.0f) voice->Direct.Filters[0].ActiveType |= AF_HighPass;
1257         ALfilterState_setParams(
1258             &voice->Direct.Filters[0].LowPass, ALfilterType_HighShelf,
1259             DryGainHF, hfscale, calc_rcpQ_from_slope(DryGainHF, 0.75f)
1260         );
1261         ALfilterState_setParams(
1262             &voice->Direct.Filters[0].HighPass, ALfilterType_LowShelf,
1263             DryGainLF, lfscale, calc_rcpQ_from_slope(DryGainLF, 0.75f)
1264         );
1265     }
1266     for(i = 0;i < NumSends;i++)
1267     {
1268         ALfloat hfscale = ALSource->Send[i].HFReference / Frequency;
1269         ALfloat lfscale = ALSource->Send[i].LFReference / Frequency;
1270         WetGainHF[i] = maxf(WetGainHF[i], 0.0001f);
1271         WetGainLF[i] = maxf(WetGainLF[i], 0.0001f);
1272         voice->Send[i].Filters[0].ActiveType = AF_None;
1273         if(WetGainHF[i] != 1.0f) voice->Send[i].Filters[0].ActiveType |= AF_LowPass;
1274         if(WetGainLF[i] != 1.0f) voice->Send[i].Filters[0].ActiveType |= AF_HighPass;
1275         ALfilterState_setParams(
1276             &voice->Send[i].Filters[0].LowPass, ALfilterType_HighShelf,
1277             WetGainHF[i], hfscale, calc_rcpQ_from_slope(WetGainHF[i], 0.75f)
1278         );
1279         ALfilterState_setParams(
1280             &voice->Send[i].Filters[0].HighPass, ALfilterType_LowShelf,
1281             WetGainLF[i], lfscale, calc_rcpQ_from_slope(WetGainLF[i], 0.75f)
1282         );
1283     }
1284 }
1285
1286
1287 void UpdateContextSources(ALCcontext *ctx)
1288 {
1289     ALvoice *voice, *voice_end;
1290     ALsource *source;
1291
1292     if(ATOMIC_EXCHANGE(ALenum, &ctx->UpdateSources, AL_FALSE))
1293     {
1294         CalcListenerParams(ctx->Listener);
1295
1296         voice = ctx->Voices;
1297         voice_end = voice + ctx->VoiceCount;
1298         for(;voice != voice_end;++voice)
1299         {
1300             if(!(source=voice->Source)) continue;
1301             if(source->state != AL_PLAYING && source->state != AL_PAUSED)
1302                 voice->Source = NULL;
1303             else
1304             {
1305                 ATOMIC_STORE(&source->NeedsUpdate, AL_FALSE);
1306                 voice->Update(voice, source, ctx);
1307             }
1308         }
1309     }
1310     else
1311     {
1312         voice = ctx->Voices;
1313         voice_end = voice + ctx->VoiceCount;
1314         for(;voice != voice_end;++voice)
1315         {
1316             if(!(source=voice->Source)) continue;
1317             if(source->state != AL_PLAYING && source->state != AL_PAUSED)
1318                 voice->Source = NULL;
1319             else if(ATOMIC_EXCHANGE(ALenum, &source->NeedsUpdate, AL_FALSE))
1320                 voice->Update(voice, source, ctx);
1321         }
1322     }
1323 }
1324
1325
1326 /* Specialized function to clamp to [-1, +1] with only one branch. This also
1327  * converts NaN to 0. */
1328 static inline ALfloat aluClampf(ALfloat val)
1329 {
1330     if(fabsf(val) <= 1.0f) return val;
1331     return (ALfloat)((0.0f < val) - (val < 0.0f));
1332 }
1333
1334 static inline ALfloat aluF2F(ALfloat val)
1335 { return val; }
1336
1337 static inline ALint aluF2I(ALfloat val)
1338 {
1339     /* Floats only have a 24-bit mantissa, so [-16777215, +16777215] is the max
1340      * integer range normalized floats can be safely converted to.
1341      */
1342     return fastf2i(aluClampf(val)*16777215.0f)<<7;
1343 }
1344 static inline ALuint aluF2UI(ALfloat val)
1345 { return aluF2I(val)+2147483648u; }
1346
1347 static inline ALshort aluF2S(ALfloat val)
1348 { return fastf2i(aluClampf(val)*32767.0f); }
1349 static inline ALushort aluF2US(ALfloat val)
1350 { return aluF2S(val)+32768; }
1351
1352 static inline ALbyte aluF2B(ALfloat val)
1353 { return fastf2i(aluClampf(val)*127.0f); }
1354 static inline ALubyte aluF2UB(ALfloat val)
1355 { return aluF2B(val)+128; }
1356
1357 #define DECL_TEMPLATE(T, func)                                                \
1358 static void Write_##T(ALfloatBUFFERSIZE *InBuffer, ALvoid *OutBuffer,         \
1359                       ALuint SamplesToDo, ALuint numchans)                    \
1360 {                                                                             \
1361     ALuint i, j;                                                              \
1362     for(j = 0;j < numchans;j++)                                               \
1363     {                                                                         \
1364         const ALfloat *in = InBuffer[j];                                      \
1365         T *restrict out = (T*)OutBuffer + j;                                  \
1366         for(i = 0;i < SamplesToDo;i++)                                        \
1367             out[i*numchans] = func(in[i]);                                    \
1368     }                                                                         \
1369 }
1370
1371 DECL_TEMPLATE(ALfloat, aluF2F)
1372 DECL_TEMPLATE(ALuint, aluF2UI)
1373 DECL_TEMPLATE(ALint, aluF2I)
1374 DECL_TEMPLATE(ALushort, aluF2US)
1375 DECL_TEMPLATE(ALshort, aluF2S)
1376 DECL_TEMPLATE(ALubyte, aluF2UB)
1377 DECL_TEMPLATE(ALbyte, aluF2B)
1378
1379 #undef DECL_TEMPLATE
1380
1381
1382 ALvoid aluMixData(ALCdevice *device, ALvoid *buffer, ALsizei size)
1383 {
1384     ALuint SamplesToDo;
1385     ALvoice *voice, *voice_end;
1386     ALeffectslot *slot;
1387     ALsource *source;
1388     ALCcontext *ctx;
1389     FPUCtl oldMode;
1390     ALuint i, c;
1391
1392     SetMixerFPUMode(&oldMode);
1393
1394     while(size > 0)
1395     {
1396         IncrementRef(&device->MixCount);
1397
1398         SamplesToDo = minu(size, BUFFERSIZE);
1399         for(c = 0;c < device->VirtOut.NumChannels;c++)
1400             memset(device->VirtOut.Buffer[c], 0, SamplesToDo*sizeof(ALfloat));
1401         for(c = 0;c < device->RealOut.NumChannels;c++)
1402             memset(device->RealOut.Buffer[c], 0, SamplesToDo*sizeof(ALfloat));
1403
1404         V0(device->Backend,lock)();
1405
1406         if((slot=device->DefaultSlot) != NULL)
1407         {
1408             if(ATOMIC_EXCHANGE(ALenum, &slot->NeedsUpdate, AL_FALSE))
1409                 V(slot->EffectState,update)(device, slot);
1410             for(i = 0;i < slot->NumChannels;i++)
1411                 memset(slot->WetBuffer[i], 0, SamplesToDo*sizeof(ALfloat));
1412         }
1413
1414         ctx = ATOMIC_LOAD(&device->ContextList);
1415         while(ctx)
1416         {
1417             if(!ctx->DeferUpdates)
1418             {
1419                 UpdateContextSources(ctx);
1420 #define UPDATE_SLOT(iter) do {                                         \
1421     if(ATOMIC_EXCHANGE(ALenum, &(*iter)->NeedsUpdate, AL_FALSE))       \
1422         V((*iter)->EffectState,update)(device, *iter);                 \
1423     for(i = 0;i < (*iter)->NumChannels;i++)                            \
1424         memset((*iter)->WetBuffer[i], 0, SamplesToDo*sizeof(ALfloat)); \
1425 } while(0)
1426                 VECTOR_FOR_EACH(ALeffectslot*, ctx->ActiveAuxSlots, UPDATE_SLOT);
1427 #undef UPDATE_SLOT
1428             }
1429             else
1430             {
1431 #define CLEAR_WET_BUFFER(iter) do {                                    \
1432     for(i = 0;i < (*iter)->NumChannels;i++)                            \
1433         memset((*iter)->WetBuffer[i], 0, SamplesToDo*sizeof(ALfloat)); \
1434 } while(0)
1435                 VECTOR_FOR_EACH(ALeffectslot*, ctx->ActiveAuxSlots, CLEAR_WET_BUFFER);
1436 #undef CLEAR_WET_BUFFER
1437             }
1438
1439             /* source processing */
1440             voice = ctx->Voices;
1441             voice_end = voice + ctx->VoiceCount;
1442             for(;voice != voice_end;++voice)
1443             {
1444                 source = voice->Source;
1445                 if(source && source->state == AL_PLAYING)
1446                     MixSource(voice, source, device, SamplesToDo);
1447             }
1448
1449             /* effect slot processing */
1450             c = VECTOR_SIZE(ctx->ActiveAuxSlots);
1451             for(i = 0;i < c;i++)
1452             {
1453                 const ALeffectslot *slot = VECTOR_ELEM(ctx->ActiveAuxSlots, i);
1454                 ALeffectState *state = slot->EffectState;
1455                 V(state,process)(SamplesToDo, slot->WetBuffer, device->DryBuffer,
1456                                  device->NumChannels);
1457             }
1458
1459             ctx = ctx->next;
1460         }
1461
1462         if(device->DefaultSlot != NULL)
1463         {
1464             const ALeffectslot *slot = device->DefaultSlot;
1465             ALeffectState *state = slot->EffectState;
1466             V(state,process)(SamplesToDo, slot->WetBuffer, device->DryBuffer,
1467                              device->NumChannels);
1468         }
1469
1470         /* Increment the clock time. Every second's worth of samples is
1471          * converted and added to clock base so that large sample counts don't
1472          * overflow during conversion. This also guarantees an exact, stable
1473          * conversion. */
1474         device->SamplesDone += SamplesToDo;
1475         device->ClockBase += (device->SamplesDone/device->Frequency) * DEVICE_CLOCK_RES;
1476         device->SamplesDone %= device->Frequency;
1477         V0(device->Backend,unlock)();
1478
1479         if(device->Hrtf)
1480         {
1481             HrtfMixerFunc HrtfMix = SelectHrtfMixer();
1482             ALuint irsize = GetHrtfIrSize(device->Hrtf);
1483             MixHrtfParams hrtfparams;
1484             memset(&hrtfparams, 0, sizeof(hrtfparams));
1485             for(c = 0;c < device->VirtOut.NumChannels;c++)
1486             {
1487                 hrtfparams.Current = &device->Hrtf_Params[c];
1488                 hrtfparams.Target = &device->Hrtf_Params[c];
1489                 HrtfMix(device->RealOut.Buffer, device->VirtOut.Buffer[c], 0,
1490                     device->Hrtf_Offset, 0, irsize, &hrtfparams,
1491                     &device->Hrtf_State[c], SamplesToDo
1492                 );
1493             }
1494             device->Hrtf_Offset += SamplesToDo;
1495         }
1496         else
1497         {
1498             if(device->Uhj_Encoder)
1499             {
1500                 /* Encode to stereo-compatible 2-channel UHJ output. */
1501                 EncodeUhj2(device->Uhj_Encoder, device->RealOut.Buffer,
1502                            device->VirtOut.Buffer, SamplesToDo);
1503             }
1504             if(device->Bs2b)
1505             {
1506                 /* Apply binaural/crossfeed filter */
1507                 for(i = 0;i < SamplesToDo;i++)
1508                 {
1509                     float samples[2];
1510                     samples[0] = device->RealOut.Buffer[0][i];
1511                     samples[1] = device->RealOut.Buffer[1][i];
1512                     bs2b_cross_feed(device->Bs2b, samples);
1513                     device->RealOut.Buffer[0][i] = samples[0];
1514                     device->RealOut.Buffer[1][i] = samples[1];
1515                 }
1516             }
1517         }
1518
1519         if(buffer)
1520         {
1521             ALfloat (*OutBuffer)[BUFFERSIZE] = device->RealOut.Buffer;
1522             ALuint OutChannels = device->RealOut.NumChannels;;
1523
1524 #define WRITE(T, a, b, c, d) do {               \
1525     Write_##T((a), (b), (c), (d));              \
1526     buffer = (T*)buffer + (c)*(d);              \
1527 } while(0)
1528             switch(device->FmtType)
1529             {
1530                 case DevFmtByte:
1531                     WRITE(ALbyte, OutBuffer, buffer, SamplesToDo, OutChannels);
1532                     break;
1533                 case DevFmtUByte:
1534                     WRITE(ALubyte, OutBuffer, buffer, SamplesToDo, OutChannels);
1535                     break;
1536                 case DevFmtShort:
1537                     WRITE(ALshort, OutBuffer, buffer, SamplesToDo, OutChannels);
1538                     break;
1539                 case DevFmtUShort:
1540                     WRITE(ALushort, OutBuffer, buffer, SamplesToDo, OutChannels);
1541                     break;
1542                 case DevFmtInt:
1543                     WRITE(ALint, OutBuffer, buffer, SamplesToDo, OutChannels);
1544                     break;
1545                 case DevFmtUInt:
1546                     WRITE(ALuint, OutBuffer, buffer, SamplesToDo, OutChannels);
1547                     break;
1548                 case DevFmtFloat:
1549                     WRITE(ALfloat, OutBuffer, buffer, SamplesToDo, OutChannels);
1550                     break;
1551             }
1552 #undef WRITE
1553         }
1554
1555         size -= SamplesToDo;
1556         IncrementRef(&device->MixCount);
1557     }
1558
1559     RestoreFPUMode(&oldMode);
1560 }
1561
1562
1563 ALvoid aluHandleDisconnect(ALCdevice *device)
1564 {
1565     ALCcontext *Context;
1566
1567     device->Connected = ALC_FALSE;
1568
1569     Context = ATOMIC_LOAD(&device->ContextList);
1570     while(Context)
1571     {
1572         ALvoice *voice, *voice_end;
1573
1574         voice = Context->Voices;
1575         voice_end = voice + Context->VoiceCount;
1576         while(voice != voice_end)
1577         {
1578             ALsource *source = voice->Source;
1579             voice->Source = NULL;
1580
1581             if(source && source->state == AL_PLAYING)
1582             {
1583                 source->state = AL_STOPPED;
1584                 ATOMIC_STORE(&source->current_buffer, NULL);
1585                 source->position = 0;
1586                 source->position_fraction = 0;
1587             }
1588
1589             voice++;
1590         }
1591         Context->VoiceCount = 0;
1592
1593         Context = Context->next;
1594     }
1595 }