disabled SIMD adds in AudioMixer for windows

2025-04-23 01:04:06 +02:00 · 2014-07-15 12:23:02 -07:00 · 2014-07-15 12:23:02 -07:00 · a1b2bf59e9
commit a1b2bf59e9
parent 1047ec7c87
2 changed files with 34 additions and 2 deletions
--- a/assignment-client/src/audio/AudioMixer.cpp
+++ b/assignment-client/src/audio/AudioMixer.cpp
@ -231,6 +231,12 @@ void AudioMixer::addBufferToMixForListeningNodeWithBuffer(PositionalAudioRingBuf
            delayBufferSample[0] = correctBufferSample[0] * weakChannelAmplitudeRatio;
            delayBufferSample[1] = correctBufferSample[1] * weakChannelAmplitudeRatio;
            
+#ifdef _WIN32
+            _clientSamples[s + goodChannelOffset] += correctBufferSample[0];
+            _clientSamples[s + goodChannelOffset + SINGLE_STEREO_OFFSET] += correctBufferSample[1];
+            _clientSamples[delayedChannelIndex] += delayBufferSample[0];
+            _clientSamples[delayedChannelIndex + SINGLE_STEREO_OFFSET] += delayBufferSample[1];
+#else
            __m64 bufferSamples = _mm_set_pi16(_clientSamples[s + goodChannelOffset],
                                               _clientSamples[s + goodChannelOffset + SINGLE_STEREO_OFFSET],
                                               _clientSamples[delayedChannelIndex],
@ -247,6 +253,7 @@ void AudioMixer::addBufferToMixForListeningNodeWithBuffer(PositionalAudioRingBuf
            _clientSamples[s + goodChannelOffset + SINGLE_STEREO_OFFSET] = shortResults[2];
            _clientSamples[delayedChannelIndex] = shortResults[1];
            _clientSamples[delayedChannelIndex + SINGLE_STEREO_OFFSET] = shortResults[0];
+#endif
        }
        
        // The following code is pretty gross and redundant, but AFAIK it's the best way to avoid
@ -271,6 +278,13 @@ void AudioMixer::addBufferToMixForListeningNodeWithBuffer(PositionalAudioRingBuf
            while (i + 3 < numSamplesDelay) {
                // handle the first cases where we can MMX add four samples at once
                int parentIndex = i * 2;
+
+#ifdef _WIN32
+                _clientSamples[parentIndex + delayedChannelOffset] += delayNextOutputStart[i] * attenuationAndWeakChannelRatio;
+                _clientSamples[parentIndex + SINGLE_STEREO_OFFSET + delayedChannelOffset] += delayNextOutputStart[i + 1] * attenuationAndWeakChannelRatio;
+                _clientSamples[parentIndex + DOUBLE_STEREO_OFFSET + delayedChannelOffset] += delayNextOutputStart[i + 2] * attenuationAndWeakChannelRatio;
+                _clientSamples[parentIndex + TRIPLE_STEREO_OFFSET + delayedChannelOffset] += delayNextOutputStart[i + 3] * attenuationAndWeakChannelRatio;
+#else
                __m64 bufferSamples = _mm_set_pi16(_clientSamples[parentIndex + delayedChannelOffset],
                                                   _clientSamples[parentIndex + SINGLE_STEREO_OFFSET + delayedChannelOffset],
                                                   _clientSamples[parentIndex + DOUBLE_STEREO_OFFSET + delayedChannelOffset],
@ -286,7 +300,8 @@ void AudioMixer::addBufferToMixForListeningNodeWithBuffer(PositionalAudioRingBuf
                _clientSamples[parentIndex + SINGLE_STEREO_OFFSET + delayedChannelOffset] = shortResults[2];
                _clientSamples[parentIndex + DOUBLE_STEREO_OFFSET + delayedChannelOffset] = shortResults[1];
                _clientSamples[parentIndex + TRIPLE_STEREO_OFFSET + delayedChannelOffset] = shortResults[0];
-                
+#endif
+
                // push the index
                i += 4;
            }
@ -296,6 +311,11 @@ void AudioMixer::addBufferToMixForListeningNodeWithBuffer(PositionalAudioRingBuf
            if (i + 2 < numSamplesDelay) {
                // MMX add only three delayed samples
                
+#ifdef _WIN32
+                _clientSamples[parentIndex + delayedChannelOffset] += delayNextOutputStart[i] * attenuationAndWeakChannelRatio;
+                _clientSamples[parentIndex + SINGLE_STEREO_OFFSET + delayedChannelOffset] += delayNextOutputStart[i + 1] * attenuationAndWeakChannelRatio;
+                _clientSamples[parentIndex + DOUBLE_STEREO_OFFSET + delayedChannelOffset] += delayNextOutputStart[i + 2] * attenuationAndWeakChannelRatio;
+#else
                __m64 bufferSamples = _mm_set_pi16(_clientSamples[parentIndex + delayedChannelOffset],
                                                   _clientSamples[parentIndex + SINGLE_STEREO_OFFSET + delayedChannelOffset],
                                                   _clientSamples[parentIndex + DOUBLE_STEREO_OFFSET + delayedChannelOffset],
@ -310,8 +330,15 @@ void AudioMixer::addBufferToMixForListeningNodeWithBuffer(PositionalAudioRingBuf
                _clientSamples[parentIndex + delayedChannelOffset] = shortResults[3];
                _clientSamples[parentIndex + SINGLE_STEREO_OFFSET + delayedChannelOffset] = shortResults[2];
                _clientSamples[parentIndex + DOUBLE_STEREO_OFFSET + delayedChannelOffset] = shortResults[1];
+#endif
+
                
            } else if (i + 1 < numSamplesDelay) {
+
+#ifdef _WIN32
+                _clientSamples[parentIndex + delayedChannelOffset] += delayNextOutputStart[i] * attenuationAndWeakChannelRatio;
+                _clientSamples[parentIndex + SINGLE_STEREO_OFFSET + delayedChannelOffset] += delayNextOutputStart[i + 1] * attenuationAndWeakChannelRatio;
+#else
                // MMX add two delayed samples
                __m64 bufferSamples = _mm_set_pi16(_clientSamples[parentIndex + delayedChannelOffset],
                                                   _clientSamples[parentIndex + SINGLE_STEREO_OFFSET + delayedChannelOffset],
@ -324,9 +351,12 @@ void AudioMixer::addBufferToMixForListeningNodeWithBuffer(PositionalAudioRingBuf
                
                _clientSamples[parentIndex + delayedChannelOffset] = shortResults[3];
                _clientSamples[parentIndex + SINGLE_STEREO_OFFSET + delayedChannelOffset] = shortResults[2];
-                
+#endif
            } else if (i < numSamplesDelay) {
                // MMX add a single delayed sample
+#ifdef _WIN32
+                _clientSamples[parentIndex + delayedChannelOffset] += delayNextOutputStart[i] * attenuationAndWeakChannelRatio;
+#else
                __m64 bufferSamples = _mm_set_pi16(_clientSamples[parentIndex + delayedChannelOffset], 0, 0, 0);
                __m64 addSamples = _mm_set_pi16(delayNextOutputStart[i] * attenuationAndWeakChannelRatio, 0, 0, 0);
                
@ -334,6 +364,7 @@ void AudioMixer::addBufferToMixForListeningNodeWithBuffer(PositionalAudioRingBuf
                int16_t* shortResults = reinterpret_cast<int16_t*>(&mmxResult);
                
                _clientSamples[parentIndex + delayedChannelOffset] = shortResults[3];
+#endif
            }
        }
    } else {
--- a/libraries/audio/src/PositionalAudioRingBuffer.cpp
+++ b/libraries/audio/src/PositionalAudioRingBuffer.cpp
@ -149,6 +149,7 @@ void PositionalAudioRingBuffer::updateNextOutputTrailingLoudness() {
    // fixes bug on Windows where _nextOutputTrailingLoudness sometimes becomes NaN.  In that case,
    // revert _nextOutputTrailingLoudness to its previous value
    if (isNaN(_nextOutputTrailingLoudness)) {
+        printf("next output trailling loudness NaN!! --------------------------------------\n");
        _nextOutputTrailingLoudness = oldNextOutputTrailingLoudness;
    }
 }