sdatkinson · sdatkinson · Jan 2, 2024 · Dec 17, 2023 · Dec 17, 2023 · Jan 2, 2024
diff --git a/CMakeLists.txt b/CMakeLists.txt
@@ -7,6 +7,13 @@ set(CMAKE_MODULE_PATH "${CMAKE_SOURCE_DIR}/cmake")
 set(CMAKE_CXX_STANDARD 20)
 set(CMAKE_CXX_STANDARD_REQUIRED OFF)
 set(CMAKE_CXX_EXTENSIONS OFF)
+# The language level is already requested through CMAKE_CXX_STANDARD above, so
+# no raw -std= flag is added here. -stdlib=libc++ is a Clang-specific option, so
+# it is only appended for Clang-family compilers (Clang and AppleClang).
+# NOTE(review): CMAKE_CXX_COMPILER_ID is only populated once project() has run;
+# confirm project() is called earlier in this file.
+if (CMAKE_CXX_COMPILER_ID MATCHES "Clang")
+	string(APPEND CMAKE_CXX_FLAGS " -stdlib=libc++")
+endif()
 
 if (CMAKE_SYSTEM_NAME STREQUAL "Darwin")
 	include_directories(SYSTEM /usr/local/include)

diff --git a/dsp/ImpulseResponse.cpp b/dsp/ImpulseResponse.cpp
@@ -11,7 +11,8 @@
 #include "ImpulseResponse.h"
 
 dsp::ImpulseResponse::ImpulseResponse(const char* fileName, const double sampleRate)
-: mWavState(dsp::wav::LoadReturnCode::ERROR_OTHER), mSampleRate(sampleRate)
+: mWavState(dsp::wav::LoadReturnCode::ERROR_OTHER)
+, mSampleRate(sampleRate)
 {
   // Try to load the WAV
   this->mWavState = dsp::wav::Load(fileName, this->mRawAudio, this->mRawAudioSampleRate);

diff --git a/dsp/NoiseGate.cpp b/dsp/NoiseGate.cpp
@@ -5,7 +5,7 @@
 //  Created by Steven Atkinson on 2/5/23.
 //
 
-#include <algorithm>  // std::clamp
+#include <algorithm> // std::clamp
 #include <cstring> // memcpy
 #include <cmath> // pow
 #include <sstream>

diff --git a/dsp/ResamplingContainer/Dependencies/LanczosResampler.h b/dsp/ResamplingContainer/Dependencies/LanczosResampler.h
@@ -0,0 +1,367 @@
+// File: LanczosResampler.h
+// Created Date: Saturday December 16th 2023
+// Author: Steven Atkinson ([email protected])
+
+
+// This file originally came from the iPlug2 library and has been subsequently modified;
+// the following license is copied as required from
+// https://github.com/iPlug2/iPlug2/blob/40ebb560eba68f096221e99ef0ae826611fc2bda/LICENSE.txt
+// -------------------------------------------------------------------------------------
+
+/*
+iPlug 2 C++ Plug-in Framework.
+
+Copyright (C) the iPlug 2 Developers. Portions copyright other contributors, see each source file for more information.
+
+Based on WDL-OL/iPlug by Oli Larkin (2011-2018), and the original iPlug v1 (2008) by John Schwartz / Cockos
+
+LICENSE:
+
+This software is provided 'as-is', without any express or implied warranty.  In no event will the authors be held liable
+for any damages arising from the use of this software.
+
+Permission is granted to anyone to use this software for any purpose, including commercial applications, and to alter it
+and redistribute it freely, subject to the following restrictions:
+
+1. The origin of this software must not be misrepresented; you must not claim that you wrote the original software. If
+you use this software in a product, an acknowledgment in the product documentation would be appreciated but is not
+required.
+1. Altered source versions must be plainly marked as such, and must not be misrepresented as being the original
+software.
+1. This notice may not be removed or altered from any source distribution.
+
+iPlug 2 includes the following 3rd party libraries (see each license info):
+
+* Cockos WDL https://www.cockos.com/wdl
+* NanoVG https://github.com/memononen/nanovg
+* NanoSVG https://github.com/memononen/nanosvg
+* MetalNanoVG https://github.com/ollix/MetalNanoVG
+* RTAudio https://www.music.mcgill.ca/~gary/rtaudio
+* RTMidi https://www.music.mcgill.ca/~gary/rtmidi
+*/
+// -------------------------------------------------------------------------------------
+
+/*
+ This code is derived from
+ https://github.com/surge-synthesizer/sst-basic-blocks/blob/main/include/sst/basic-blocks/dsp/LanczosResampler.h
+
+ The following license info is copied from the above file:
+
+ * sst-basic-blocks - an open source library of core audio utilities
+ * built by Surge Synth Team.
+ *
+ * Provides a collection of tools useful on the audio thread for blocks,
+ * modulation, etc... or useful for adapting code to multiple environments.
+ *
+ * Copyright 2023, various authors, as described in the GitHub
+ * transaction log. Parts of this code are derived from similar
+ * functions original in Surge or ShortCircuit.
+ *
+ * sst-basic-blocks is released under the GNU General Public Licence v3
+ * or later (GPL-3.0-or-later). The license is found in the "LICENSE"
+ * file in the root of this repository, or at
+ * https://www.gnu.org/licenses/gpl-3.0.en.html
+ *
+ * All source in sst-basic-blocks available at
+ * https://github.com/surge-synthesizer/sst-basic-blocks
+
+ * A special note on licensing: This file (and only this file)
+ * has Paul Walker (baconpaul) as the sole author to date.
+ *
+ * In order to make this handy small function based on public
+ * information available to a set of open source projects
+ * adapting hardware to software, but which are licensed under
+ * MIT or BSD or similar licenses, this file and only this file
+ * can be used in an MIT/BSD context as well as a GPL3 context, by
+ * copying it and modifying it as you see fit.
+ *
+ * If you do that, you will need to replace the `sum_ps_to_float`
+ * call below with either an hadd if you are SSE3 or higher or
+ * an appropriate reduction operator from your toolkit.
+ *
+ * But basically: Need to resample 48k to variable rate with
+ * a small window and want to use this? Go for it!
+ *
+ * For avoidance of doubt, this license exception only
+ * applies to this file.
+ */
+
+#pragma once
+
+#include <algorithm>
+#include <utility>
+#include <cmath>
+#include <cstring>
+
+#if defined AUDIODSPTOOLS_SIMDE
+  #if defined(__arm64__)
+    #define SIMDE_ENABLE_NATIVE_ALIASES
+    #include "simde/x86/sse2.h"
+  #else
+    #include <emmintrin.h>
+  #endif
+#endif
+
+// #include "IPlugConstants.h"
+
+namespace dsp
+{
+/* LanczosResampler
+ *
+ * A class that implements Lanczos resampling, optionally using SIMD instructions.
+ * Define AUDIODSPTOOLS_SIMDE at project level in order to use SIMD and if on non-x86_64
+ * include the SIMDE library in your search paths in order to translate intel
+ * intrinsics to e.g. arm64
+ *
+ * See https://en.wikipedia.org/wiki/Lanczos_resampling
+ *
+ * Usage: feed input frames with PushBlock(), then collect output frames with PopBlock().
+ * GetNumSamplesRequiredFor() reports how many input frames have to be pushed before a
+ * given number of output frames can be popped.
+ *
+ * @tparam T the sampletype
+ * @tparam NCHANS the number of channels
+ * @tparam A The Lanczos filter size. A higher value makes the filter closer to an
+   ideal stop-band that rejects high-frequency content (anti-aliasing),
+   but at the expense of higher latency
+ */
+template <typename T = double, int NCHANS = 2, size_t A = 12>
+class LanczosResampler
+{
+private:
+#if defined(AUDIODSPTOOLS_SIMDE)
+  static_assert(std::is_same<T, float>::value, "LanczosResampler requires T to be float when using SIMD instructions");
+  static_assert(false, "SIMD version has not been checked! You need to remove this to use it at your own risk!");
+#endif
+
+  // The buffer size. This needs to be at least as large as the largest block of samples
+  // that the input side will see. It must be a power of two: indices are wrapped with
+  // `& (kBufferSize - 1)`.
+  static constexpr size_t kBufferSize = 4096;
+  // The filter width. 2x because the filter goes from -A to A
+  static constexpr size_t kFilterWidth = A * 2;
+  // The discretization resolution for the filter table.
+  static constexpr size_t kTablePoints = 8192;
+  static constexpr double kDeltaX = 1.0 / (kTablePoints);
+
+public:
+  /** Constructor
+   *
+   * Clears the input buffer and, the first time any instance with these template
+   * arguments is constructed, fills the shared kernel lookup tables.
+   *
+   * @param inputRate The input sample rate
+   * @param outputRate The output sample rate
+   */
+  LanczosResampler(float inputRate, float outputRate)
+  : mInputSampleRate(inputRate)
+  , mOutputSamplerate(outputRate)
+  , mPhaseOutIncr(mInputSampleRate / mOutputSamplerate)
+  {
+    ClearBuffer();
+
+    // Lanczos kernel: A * sin(pi * x) * sin(pi * x / A) / (pi * x)^2, with the
+    // removable singularity at x == 0 replaced by its limit, 1.
+    auto kernel = [](double x) {
+      if (std::fabs(x) < 1e-7)
+        return T(1.0);
+
+      // Defined locally so that this header does not depend on iPlug's constants.
+      constexpr double pi = 3.14159265358979323846;
+      return T(A * std::sin(pi * x) * std::sin(pi * x / A) / (pi * pi * x * x));
+    };
+
+    // NOTE: this flag is a plain bool with no synchronization, so the one-time table
+    // fill is not protected against concurrent construction from several threads.
+    if (!sTablesInitialized)
+    {
+      // Row t holds the kernel sampled at fractional offset t * kDeltaX for every tap.
+      for (size_t t = 0; t < kTablePoints + 1; ++t)
+      {
+        const double x0 = kDeltaX * t;
+
+        for (size_t i = 0; i < kFilterWidth; ++i)
+        {
+          const double x = x0 + i - A;
+          sTable[t][i] = kernel(x);
+        }
+      }
+
+      // Forward differences between neighbouring rows, used for linear interpolation
+      // of the coefficients between table points.
+      for (size_t t = 0; t < kTablePoints; ++t)
+      {
+        for (size_t i = 0; i < kFilterWidth; ++i)
+        {
+          sDeltaTable[t][i] = sTable[t + 1][i] - sTable[t][i];
+        }
+      }
+
+      for (size_t i = 0; i < kFilterWidth; ++i)
+      {
+        // Wrap at the end - delta is the same
+        sDeltaTable[kTablePoints][i] = sDeltaTable[0][i];
+      }
+      sTablesInitialized = true;
+    }
+  }
+
+  /** Number of input frames that must be pushed before nOutputSamples can be popped.
+   * @param nOutputSamples The number of output frames wanted
+   * @return The number of input frames to push (never negative)
+   */
+  inline size_t GetNumSamplesRequiredFor(size_t nOutputSamples) const
+  {
+    /*
+     * PopBlock() only produces a frame while (mPhaseIn - mPhaseOut) > A + 1, and every
+     * pushed frame advances mPhaseIn by mPhaseInIncr (1.0). To still satisfy that after
+     * nOutputSamples pops we need
+     *
+     *   mPhaseIn + res - mPhaseOut - mPhaseOutIncr * nOutputSamples > A + 1
+     *
+     * i.e.
+     *
+     *   res > (A + 1) - (mPhaseIn - mPhaseOut - mPhaseOutIncr * nOutputSamples)
+     */
+    auto res = A + 1.0 - (mPhaseIn - mPhaseOut - mPhaseOutIncr * nOutputSamples);
+
+    // One extra frame of margin; clamp at zero when enough input is already buffered.
+    return static_cast<size_t>(std::max(res + 1.0, 0.0));
+  }
+
+  /** Append nFrames input frames to the internal ring buffer.
+   * @param inputs Per-channel input pointers: NCHANS channels of at least nFrames samples
+   * @param nFrames The number of frames to push; see kBufferSize for the upper limit
+   */
+  inline void PushBlock(T** inputs, size_t nFrames)
+  {
+    for (size_t s = 0; s < nFrames; s++)
+    {
+      for (int c = 0; c < NCHANS; c++)
+      {
+        mInputBuffer[c][mWritePos] = inputs[c][s];
+        mInputBuffer[c][mWritePos + kBufferSize] = inputs[c][s]; // this way we can always wrap
+      }
+
+      mWritePos = (mWritePos + 1) & (kBufferSize - 1);
+      mPhaseIn += mPhaseInIncr;
+    }
+  }
+
+  /** Produce as many output frames as the buffered input allows, up to max.
+   * @param outputs Per-channel output pointers: NCHANS channels with room for max samples
+   * @param max The maximum number of frames to write
+   * @return The number of frames actually written
+   */
+  size_t PopBlock(T** outputs, size_t max)
+  {
+    size_t populated = 0;
+    // An output frame needs more than A + 1 input frames of lead over the read position.
+    while (populated < max && (mPhaseIn - mPhaseOut) > A + 1)
+    {
+      ReadSamples((mPhaseIn - mPhaseOut), outputs, static_cast<int>(populated));
+      mPhaseOut += mPhaseOutIncr;
+      populated++;
+    }
+    return populated;
+  }
+
+  /** Shift both phase accumulators so that mPhaseOut becomes zero.
+   * Their difference, which is all PopBlock() looks at, is unchanged.
+   */
+  inline void RenormalizePhases()
+  {
+    mPhaseIn -= mPhaseOut;
+    mPhaseOut = 0;
+  }
+
+  /** Zero the input buffer.
+   * NOTE(review): the write position and the phase accumulators are left as they are;
+   * confirm that callers do not expect them to be reset as well.
+   */
+  void Reset() { ClearBuffer(); }
+
+  /** Zero every sample of the input buffer (both mirrored halves, all channels). */
+  void ClearBuffer() { std::memset(mInputBuffer, 0, sizeof(mInputBuffer)); }
+
+private:
+#if defined(AUDIODSPTOOLS_SIMDE)
+  /** SSE variant of ReadSamples: computes one output frame, four filter taps at a time.
+   * @param xBack How far behind the write position to read, in input samples
+   * @param outputs Per-channel output pointers
+   * @param s Index of the output frame to write
+   */
+  inline void ReadSamples(double xBack, T** outputs, int s) const
+  {
+    float bufferReadPosition = static_cast<float>(mWritePos - xBack);
+    int bufferReadIndex = static_cast<int>(std::floor(bufferReadPosition));
+    float bufferFracPosition = 1.0f - (bufferReadPosition - static_cast<float>(bufferReadIndex));
+
+    bufferReadIndex = (bufferReadIndex + kBufferSize) & (kBufferSize - 1);
+    bufferReadIndex += (bufferReadIndex <= static_cast<int>(A)) * kBufferSize;
+
+    float tablePosition = bufferFracPosition * kTablePoints;
+    int tableIndex = static_cast<int>(tablePosition);
+    float tableFracPosition = (tablePosition - tableIndex);
+
+    __m128 sum[NCHANS];
+    for (auto& v : sum)
+    {
+      v = _mm_setzero_ps(); // Initialize sum vectors to zero
+    }
+
+    for (int i = 0; i < A; i += 4) // Process four samples at a time
+    {
+      // Load filter coefficients and input samples into SSE registers
+      __m128 f0 = _mm_load_ps(&sTable[tableIndex][i]);
+      __m128 df0 = _mm_load_ps(&sDeltaTable[tableIndex][i]);
+      __m128 f1 = _mm_load_ps(&sTable[tableIndex][A + i]);
+      __m128 df1 = _mm_load_ps(&sDeltaTable[tableIndex][A + i]);
+
+      // Interpolate filter coefficients
+      __m128 tfp = _mm_set1_ps(tableFracPosition);
+      f0 = _mm_add_ps(f0, _mm_mul_ps(df0, tfp));
+      f1 = _mm_add_ps(f1, _mm_mul_ps(df1, tfp));
+
+      for (int c = 0; c < NCHANS; c++)
+      {
+        // Load input data
+        __m128 d0 =
+          _mm_set_ps(mInputBuffer[c][bufferReadIndex - A + i + 3], mInputBuffer[c][bufferReadIndex - A + i + 2],
+                     mInputBuffer[c][bufferReadIndex - A + i + 1], mInputBuffer[c][bufferReadIndex - A + i]);
+        __m128 d1 = _mm_set_ps(mInputBuffer[c][bufferReadIndex + i + 3], mInputBuffer[c][bufferReadIndex + i + 2],
+                               mInputBuffer[c][bufferReadIndex + i + 1], mInputBuffer[c][bufferReadIndex + i]);
+
+        // Perform multiplication and accumulate
+        __m128 result0 = _mm_mul_ps(f0, d0);
+        __m128 result1 = _mm_mul_ps(f1, d1);
+        sum[c] = _mm_add_ps(sum[c], _mm_add_ps(result0, result1));
+      }
+    }
+
+    // Extract the final sums and store them in the output
+    for (int c = 0; c < NCHANS; c++)
+    {
+      float sumArray[4];
+      _mm_store_ps(sumArray, sum[c]);
+      outputs[c][s] = sumArray[0] + sumArray[1] + sumArray[2] + sumArray[3];
+    }
+  }
+#else // scalar
+  /** Compute one output frame by convolving the buffered input with the Lanczos kernel.
+   * @param xBack How far behind the write position to read, in input samples
+   * @param outputs Per-channel output pointers
+   * @param s Index of the output frame to write
+   */
+  inline void ReadSamples(double xBack, T** outputs, int s) const
+  {
+    // Split the (fractional) read position into an integer index and a fractional part.
+    double bufferReadPosition = mWritePos - xBack;
+    int bufferReadIndex = static_cast<int>(std::floor(bufferReadPosition));
+    double bufferFracPosition = 1.0 - (bufferReadPosition - bufferReadIndex);
+
+    // Wrap into the ring, then move to the mirrored upper half when close to the start
+    // so that `bufferReadIndex - A` below cannot run off the front of the buffer.
+    bufferReadIndex = (bufferReadIndex + kBufferSize) & (kBufferSize - 1);
+    bufferReadIndex += (bufferReadIndex <= static_cast<int>(A)) * kBufferSize;
+
+    // tableIndex can be exactly kTablePoints (fractional position of 1.0), which is why
+    // the tables have kTablePoints + 1 rows.
+    double tablePosition = bufferFracPosition * kTablePoints;
+    int tableIndex = static_cast<int>(tablePosition);
+    double tableFracPosition = (tablePosition - tableIndex);
+
+    T sum[NCHANS] = {0.0};
+
+    // Each pass handles one tap from the left half (f0) and one from the right half (f1).
+    for (size_t i = 0; i < A; i++)
+    {
+      // Linearly interpolate the coefficients between neighbouring table rows.
+      auto f0 = sTable[tableIndex][i];
+      const auto df0 = sDeltaTable[tableIndex][i];
+      f0 += df0 * tableFracPosition;
+
+      auto f1 = sTable[tableIndex][A + i];
+      const auto df1 = sDeltaTable[tableIndex][A + i];
+      f1 += df1 * tableFracPosition;
+
+      for (int c = 0; c < NCHANS; c++)
+      {
+        const auto d0 = mInputBuffer[c][bufferReadIndex - A + i];
+        const auto d1 = mInputBuffer[c][bufferReadIndex + i];
+        const auto rv = (f0 * d0) + (f1 * d1);
+        sum[c] += rv;
+      }
+    }
+
+    for (int c = 0; c < NCHANS; c++)
+    {
+      outputs[c][s] = sum[c];
+    }
+  }
+#endif
+
+  // Kernel lookup table and its row-to-row differences, shared by all instances that
+  // have the same template arguments.
+  static T sTable alignas(16)[kTablePoints + 1][kFilterWidth];
+  static T sDeltaTable alignas(16)[kTablePoints + 1][kFilterWidth];
+  // Set once the constructor has filled the tables.
+  static bool sTablesInitialized;
+
+  // Input history. Every sample is stored twice, kBufferSize apart (see PushBlock), so
+  // a filter window can always be read contiguously.
+  T mInputBuffer[NCHANS][kBufferSize * 2];
+  // Next write index in [0, kBufferSize).
+  int mWritePos = 0;
+  const float mInputSampleRate;
+  const float mOutputSamplerate;
+  // Input-side phase, advanced by mPhaseInIncr for every pushed frame.
+  double mPhaseIn = 0.0;
+  // Output-side phase, advanced by mPhaseOutIncr for every popped frame.
+  double mPhaseOut = 0.0;
+  double mPhaseInIncr = 1.0;
+  // Input frames consumed per output frame (input rate / output rate); set by the constructor.
+  double mPhaseOutIncr = 0.0;
+};
+
+// Out-of-class definitions of LanczosResampler's static data members. Each distinct
+// combination of template arguments gets its own copy of these.
+
+// Kernel lookup table: kTablePoints + 1 rows of kFilterWidth coefficients, 16-byte aligned.
+template <typename T, int NCHANS, size_t A>
+T LanczosResampler<T, NCHANS, A>::sTable alignas(
+  16)[LanczosResampler<T, NCHANS, A>::kTablePoints + 1][LanczosResampler::kFilterWidth];
+
+// Row-to-row differences of sTable, with the same shape and alignment.
+template <typename T, int NCHANS, size_t A>
+T LanczosResampler<T, NCHANS, A>::sDeltaTable alignas(
+  16)[LanczosResampler<T, NCHANS, A>::kTablePoints + 1][LanczosResampler::kFilterWidth];
+
+// Starts out false; the constructor sets it to true after filling both tables.
+template <typename T, int NCHANS, size_t A>
+bool LanczosResampler<T, NCHANS, A>::sTablesInitialized{false};
+
+} // namespace dsp