_mix_8cpp_source.html

/**********************************************************************


  Audacity: A Digital Audio Editor


  Mix.cpp


  Dominic Mazzoni

  Markus Meyer

  Vaughan Johnson


*******************************************************************//*******************************************************************/

#include "Mix.h"

#include "MixerSource.h"


#include <cmath>

#include "EffectStage.h"

#include "Dither.h"

#include "Resample.h"

#include "WideSampleSequence.h"

#include "float_cast.h"

#include <numeric>


namespace {
/// Make a vector of \p dim1 value-initialized elements, then hand each
/// element, in index order, to \p f so it can finish setting the element up.
/// \param dim1 number of elements in the result
/// \param f    callable invoked as f(element) with a mutable reference
template<typename T, typename F> std::vector<T>
initVector(size_t dim1, const F &f)
{
   std::vector<T> items(dim1);
   for (size_t index = 0; index < dim1; ++index)
      f(items[index]);
   return items;
}

/// Make a table of \p dim1 rows, each resized to \p dim2 value-initialized
/// elements.
template<typename T> std::vector<std::vector<T>>
initVector(size_t dim1, size_t dim2)
{
   // Delegate to the callable overload; the closure is what selects it
   const auto sizeRow = [dim2](auto &row){ row.resize(dim2); };
   return initVector<std::vector<T>>(dim1, sizeRow);
}
}


namespace {
// Find a block size acceptable to all stages; side-effects on instances
//
// Starting from bufferSize, each stage of each input is asked (through a
// freshly made instance) which block size it accepts, and the minimum over
// all answers is returned.  The instance made for each stage is stored in
// stage.mpFirstInstance so that it can be reused instead of calling the
// factory again.
//
// An input with a null sequence is a programming error: it asserts in debug
// builds and stops the scan, leaving later inputs unexamined.
size_t FindBufferSize(const Mixer::Inputs &inputs, size_t bufferSize)
{
   size_t blockSize = bufferSize;
   for (const auto &input : inputs) {
      // Test the pointer before anything dereferences it
      if (!input.pSequence) {
         assert(false);
         break;
      }
      for (const auto &stage : input.stages) {
         // Need an instance to query acceptable block size
         // (not const, so that the move below really transfers ownership)
         auto pInstance = stage.factory();
         if (pInstance)
            blockSize = std::min(blockSize, pInstance->SetBlockSize(blockSize));
         // Cache the first factory call
         stage.mpFirstInstance = move(pInstance);
      }
   }
   return blockSize;
}
}


// Construct a mixer over the given inputs.
//
// inputs          sequences to mix, each with its list of effect stages
// mayThrow        forwarded to each MixerSource
// warpOptions     forwarded to each MixerSource; its initialSpeed seeds the
//                 shared TimesAndSpeed
// startTime, stopTime
//                 initial time bounds; the current time starts at startTime
// numOutChannels  number of output channels
// outBufferSize   upper bound for the buffer size; the size actually used
//                 (see BufferSize()) may be smaller if a stage requires it
// outInterleaved  whether output goes to one interleaved buffer or to one
//                 buffer per channel
// outRate         output sample rate
// outFormat       sample format of the output buffers
// highQuality     forwarded to each MixerSource, and selects the dither type
// mixerSpec       optional custom down-mix map; used only when its channel
//                 and track counts match this mixer, otherwise ignored
// applyGain       how channel gains are treated when mixing
Mixer::Mixer(Inputs inputs,
   const bool mayThrow,
   const WarpOptions &warpOptions,
   const double startTime, const double stopTime,
   const unsigned numOutChannels,
   const size_t outBufferSize, const bool outInterleaved,
   double outRate, sampleFormat outFormat,
   const bool highQuality, MixerSpec *const mixerSpec,
   ApplyGain applyGain
)  : mNumChannels{ numOutChannels }
   , mInputs{ move(inputs) }
   , mBufferSize{ FindBufferSize(mInputs, outBufferSize) }
   , mApplyGain{ applyGain }
   , mHighQuality{ highQuality }
   , mFormat{ outFormat }
   , mInterleaved{ outInterleaved }

   , mTimesAndSpeed{ std::make_shared<TimesAndSpeed>( TimesAndSpeed{
      startTime, stopTime, warpOptions.initialSpeed, startTime
   } ) }

   // PRL:  Bug2536: see other comments below for the last, padding argument
   // TODO: more-than-two-channels
   // Issue 3565 workaround:  allocate one extra buffer when applying a
   // GVerb effect stage.  It is simply discarded
   // See also issue 3854, when the number of out channels expected by the
   // plug-in is yet larger
   , mFloatBuffers{ 3, mBufferSize, 1, 1 }

   // non-interleaved
   , mTemp{ initVector<float>(mNumChannels, mBufferSize) }
   , mBuffer{ initVector<SampleBuffer>(mInterleaved ? 1 : mNumChannels,
      [format = mFormat,
         size = mBufferSize * (mInterleaved ? mNumChannels : 1)
      ](auto &buffer){ buffer.Allocate(size, format); }
   )}
   , mEffectiveFormat{ floatSample }
{
   assert(BufferSize() <= outBufferSize);

   // A null sequence is reported by the assertion in the loop below; until
   // then count it as contributing no channels rather than dereferencing it
   const auto channelsOf = [](const auto &input) -> size_t {
      return input.pSequence ? input.pSequence->NChannels() : 0;
   };

   const auto nChannelsIn =
   std::accumulate(mInputs.begin(), mInputs.end(), size_t{},
      [&](auto sum, const auto &input){
         return sum + channelsOf(input); });

   // Examine the temporary instances that were made in FindBufferSize
   // This finds a sufficient, but not necessary, condition to do dithering
   bool needsDither = std::any_of(mInputs.begin(), mInputs.end(),
      [](const Input &input){
         return std::any_of(input.stages.begin(), input.stages.end(),
            [](const MixerOptions::StageSpecification &spec){
               return spec.mpFirstInstance &&
                  spec.mpFirstInstance->NeedsDither(); } ); } );

   auto pMixerSpec = ( mixerSpec &&
      mixerSpec->GetNumChannels() == mNumChannels &&
      mixerSpec->GetNumTracks() == nChannelsIn
   ) ? mixerSpec : nullptr;
   mHasMixerSpec = pMixerSpec != nullptr;

   // Reserve vectors first so we can take safe references to pushed elements
   mSources.reserve(nChannelsIn);
   // Accumulate in size_t: an int initial value would narrow each partial sum
   const auto nStages = std::accumulate(mInputs.begin(), mInputs.end(),
      size_t{},
      [&](auto sum, const auto &input){
         return sum + input.stages.size() * channelsOf(input); });
   mSettings.reserve(nStages);
   mStageBuffers.reserve(nStages);

   // Index of the first channel of the current input among all input
   // channels; selects the row of the custom down-mix map
   size_t i = 0;
   for (auto &input : mInputs) {
      const auto &sequence = input.pSequence;
      if (!sequence) {
         assert(false);
         break;
      }
      // Advance i past this input's channels however the iteration ends
      auto increment = finally([&]{ i += sequence->NChannels(); });

      auto &source = mSources.emplace_back(sequence, BufferSize(), outRate,
         warpOptions, highQuality, mayThrow, mTimesAndSpeed,
         (pMixerSpec ? &pMixerSpec->mMap[i] : nullptr));
      // Each successfully created stage becomes the upstream of the next
      AudioGraph::Source *pDownstream = &source;
      for (const auto &stage : input.stages) {
         // Make a mutable copy of stage.settings
         auto &settings = mSettings.emplace_back(stage.settings);
         // TODO: more-than-two-channels
         // Like mFloatBuffers but padding not needed for soxr
         // Allocate one extra buffer to hold dummy zero inputs
         // (Issue 3854)
         auto &stageInput = mStageBuffers.emplace_back(3, mBufferSize, 1);
         const auto &factory = [&stage]{
            // Avoid unnecessary repeated calls to the factory
            return stage.mpFirstInstance
               ? move(stage.mpFirstInstance)
               : stage.factory();
         };
         auto &pNewDownstream =
         mStages.emplace_back(EffectStage::Create(-1,
            *pDownstream, stageInput,
            factory, settings, outRate, std::nullopt, *sequence
         ));
         if (pNewDownstream)
            pDownstream = pNewDownstream.get();
         else {
            // Just omit the failed stage from rendering
            // TODO propagate the error?
            mStageBuffers.pop_back();
            mSettings.pop_back();
         }
      }
      mDecoratedSources.emplace_back(Source{ source, *pDownstream });
   }

   // Decide once at construction time
   std::tie(mNeedsDither, mEffectiveFormat) = NeedsDither(needsDither, outRate);
}


// Defaulted destructor, defined out of line in this translation unit
Mixer::~Mixer() = default;


// Decide whether output must be dithered, and how wide the output
// effectively is.
//
// needsDither  true if the caller already knows dither is required
// rate         the output sample rate, compared with each sequence's rate
//
// Returns { true, mFormat } when dither is needed.  Otherwise returns
// { false, widest effective format found among the source sequences }.
std::pair<bool, sampleFormat>
Mixer::NeedsDither(bool needsDither, double rate) const
{
   // Running maximum of the effective formats of all source sequences
   auto widest = narrowestSampleFormat;

   // The incoming needsDither may already be true; everything below can only
   // turn it on, never off.

   // Any source with variable rates goes through MixVariableRates(), which
   // means nontrivial resampling
   const bool anyVariableRate = std::any_of(mSources.begin(), mSources.end(),
      [](const auto &source){ return source.VariableRates(); });
   if (anyVariableRate)
      needsDither = true;

   // Mixing down to one channel without a custom map
   const bool monoMixdown = mApplyGain == ApplyGain::Mixdown &&
      !mHasMixerSpec && mNumChannels == 1;

   for (const auto &source : mSources) {
      const auto &sequence = source.GetSequence();

      // A differing rate also leads to MixVariableRates(); a multichannel
      // sequence in a mono mixdown likewise requires dither
      const bool resampled = sequence.GetRate() != rate;
      if (resampled || (monoMixdown && sequence.NChannels() > 1))
         needsDither = true;
      else if (mApplyGain != ApplyGain::Discard) {
         for (int channel = 0; channel < 2; ++channel) {
            const auto gain = sequence.GetChannelGain(channel);
            // Fractional gain may be applied even in MixSameRate
            if (gain != 0.0 && gain != 1.0)
               needsDither = true;
         }
      }

      // All tracks are examined, ignoring the mixer's time bounds.  Honoring
      // the bounds could avoid dither in more cases, but some mixers change
      // their bounds after construction, as when scrubbing.

      // Varying or non-unit gain may be applied even in MixSameRate
      if (!sequence.HasTrivialEnvelope())
         needsDither = true;

      // Real, not just nominal, precision loss would happen in at least one
      // clip when its effective format is wider than the output format
      const auto effective = sequence.WidestEffectiveFormat();
      if (effective > mFormat)
         needsDither = true;
      widest = std::max(widest, effective);
   }

   if (!needsDither) {
      // Results will not be dithered
      assert(widest <= mFormat);
      return { false, widest };
   }

   // Results will be dithered to width mFormat
   return { true, mFormat };
}


// Zero every sample of every channel of the accumulation buffers in mTemp
void Mixer::Clear()
{
   std::for_each(mTemp.begin(), mTemp.end(), [](auto &channel){
      std::fill(channel.begin(), channel.end(), 0);
   });
}


// Accumulate one input channel into the selected output channels.
//
// numChannels   number of output channels to consider
// channelFlags  numChannels entries; output c receives input only when
//               channelFlags[c] is nonzero
// gains         numChannels entries; factor applied to the input for output c
// src           first of len contiguous input samples
// dests         output accumulators; dests[c] must hold at least len samples
//               for every flagged c
// len           number of samples to mix; nothing happens when not positive
static void MixBuffers(unsigned numChannels,
   const unsigned char *channelFlags, const float *gains,
   const float &src, std::vector<std::vector<float>> &dests, int len)
{
   const float *const input = &src;
   for (unsigned channel = 0; channel != numChannels; ++channel) {
      if (channelFlags[channel]) {
         float *const output = dests[channel].data();
         const float gain = gains[channel];
         for (int k = 0; k < len; ++k)
            output[k] += input[k] * gain;   // the actual mixing process
      }
   }
}


// Allocate an uninitialized array of `count` objects of type T with alloca().
// `count` is parenthesized so that an expression argument such as `n + 1` is
// multiplied as a whole by sizeof(T).
#define stackAllocate(T, count) static_cast<T*>(alloca((count) * sizeof(T)))


// Mix up to maxToProcess samples from every source into the output buffers.
//
// Each decorated source is asked to Acquire() samples into mFloatBuffers;
// the channels it produced are scaled by per-channel gains and accumulated
// into mTemp by MixBuffers().  Afterwards mTemp is converted, with or
// without dither as decided at construction, into mBuffer in mFormat.
//
// maxToProcess must not exceed BufferSize() (asserted).
// Returns the largest sample count produced by any source, or 0 as soon as
// any source fails to Acquire().
size_t Mixer::Process(const size_t maxToProcess)

{

   assert(maxToProcess <= BufferSize());


   // MB: this is wrong! mT represented warped time, and mTime is too inaccurate to use

   // it here. It's also unnecessary I think.

   //if (mT >= mT1)

   //   return 0;


   size_t maxOut = 0;

   // Scratch arrays with one entry per output channel, for this call only
   const auto channelFlags = stackAllocate(unsigned char, mNumChannels);

   const auto gains = stackAllocate(float, mNumChannels);

   // When gains are discarded, every output channel is mixed at unity
   if (mApplyGain == ApplyGain::Discard)

      std::fill(gains, gains + mNumChannels, 1.0f);


   // Decides which output buffers an input channel accumulates into
   // Overwrites and returns the channelFlags array.  Precedence: a custom
   // map row if given; else a mono sequence goes to every output; else input
   // channel 0 goes to output 0, and input channel 1 goes to output 1 when
   // there are at least two outputs, otherwise to output 0.  Any other input
   // channel of a non-mono sequence gets no output.

   auto findChannelFlags = [&channelFlags, numChannels = mNumChannels]

   (const bool *map, const WideSampleSequence &sequence, size_t iChannel){

      const auto end = channelFlags + numChannels;

      std::fill(channelFlags, end, 0);

      if (map)

         // ignore left and right when downmixing is customized

         std::copy(map, map + numChannels, channelFlags);

      else if (IsMono(sequence))

         std::fill(channelFlags, end, 1);

      else if (iChannel == 0)

         channelFlags[0] = 1;

      else if (iChannel == 1) {

         if (numChannels >= 2)

            channelFlags[1] = 1;

         else

            channelFlags[0] = 1;

      }

      return channelFlags;

   };


   // Bind the shared time bounds and current position; the third member is
   // not used here
   auto &[mT0, mT1, _, mTime] = *mTimesAndSpeed;

   // Remember the position at entry, to bound the position afterwards
   auto oldTime = mTime;

   // backwards (as possibly in scrubbing)

   const auto backwards = (mT0 > mT1);


   Clear();

   // TODO: more-than-two-channels

   auto maxChannels = std::max(2u, mFloatBuffers.Channels());


   for (auto &[ upstream, downstream ] : mDecoratedSources) {

      auto oResult = downstream.Acquire(mFloatBuffers, maxToProcess);

      // One of MixVariableRates or MixSameRate assigns into mTemp[*][*] which

      // are the sources for the CopySamples calls, and they copy into

      // mBuffer[*][*]

      // NOTE(review): this early return skips the conversion into mBuffer
      // below, even if earlier sources were already mixed into mTemp --
      // confirm that callers treat 0 as "no valid output"
      if (!oResult)

         return 0;

      auto result = *oResult;

      maxOut = std::max(maxOut, result);


      // Insert effect stages here!  Passing them all channels of the track


      // Mix no more input channels than the source has or the buffers hold
      const auto limit = std::min<size_t>(upstream.Channels(), maxChannels);

      for (size_t j = 0; j < limit; ++j) {

         const auto pFloat = (const float *)mFloatBuffers.GetReadPosition(j);

         auto &sequence = upstream.GetSequence();

         if (mApplyGain != ApplyGain::Discard) {

            // With several outputs, each output c uses the gain of channel c;
            // with a single output, it uses the gain of input channel j
            for (size_t c = 0; c < mNumChannels; ++c) {

               if (mNumChannels > 1)

                  gains[c] = sequence.GetChannelGain(c);

               else

                  gains[c] = sequence.GetChannelGain(j);

            }

            // Mono mixdown without a custom map: divide by the number of
            // input channels mixed, so that they are averaged, not summed
            if(mApplyGain == ApplyGain::Mixdown && !mHasMixerSpec && mNumChannels == 1)

               gains[0] /= static_cast<float>(limit);

         }


         const auto flags =

            findChannelFlags(upstream.MixerSpec(j), sequence, j);

         MixBuffers(mNumChannels, flags, gains, *pFloat, mTemp, result);

      }


      downstream.Release();

      mFloatBuffers.Advance(result);

      mFloatBuffers.Rotate();

   }


   // Keep the position between its value at entry and the end bound mT1.
   // NOTE(review): mTime is not assigned above in this function; presumably
   // the sources advance it through the shared TimesAndSpeed -- confirm
   if (backwards)

      mTime = std::clamp(mTime, mT1, oldTime);

   else

      mTime = std::clamp(mTime, oldTime, mT1);


   // Interleaved output steps over the samples of the other channels
   const auto dstStride = (mInterleaved ? mNumChannels : 1);

   auto ditherType = mNeedsDither

      ? (mHighQuality ? gHighQualityDither : gLowQualityDither)

      : DitherType::none;

   // Convert each accumulated float channel into the output format; for
   // interleaved output, channel c starts c samples into the single buffer
   for (size_t c = 0; c < mNumChannels; ++c)

      CopySamples((constSamplePtr)mTemp[c].data(), floatSample,

         (mInterleaved

            ? mBuffer[0].ptr() + (c * SAMPLE_SIZE(mFormat))

            : mBuffer[c].ptr()

         ),

         mFormat, maxOut, ditherType,

         1, dstStride);


   // MB: this doesn't take warping into account, replaced with code based on mSamplePos

   //mT += (maxOut / mRate);


   assert(maxOut <= maxToProcess);

   return maxOut;

}


// Pointer to the samples of the first output buffer, which is the only
// buffer when the output is interleaved
constSamplePtr Mixer::GetBuffer()
{
   const auto &first = mBuffer.front();
   return first.ptr();
}


// Pointer to the samples of the output buffer at index channel.
// The index is not range-checked.
constSamplePtr Mixer::GetBuffer(int channel)
{
   const auto &selected = mBuffer[channel];
   return selected.ptr();
}


// The effective output format that was determined by NeedsDither() at
// construction
sampleFormat Mixer::EffectiveFormat() const
{
   const sampleFormat effective = mEffectiveFormat;
   return effective;
}


// Current position, read from the shared TimesAndSpeed
double Mixer::MixGetCurrentTime()
{
   const auto &times = *mTimesAndSpeed;
   return times.mTime;
}


// Move the current position to t, limited to the range spanned by the two
// time bounds, and tell every source about the new position.
//
// t          requested position
// bSkipping  forwarded unchanged to each source's Reposition()
void Mixer::Reposition(double t, bool bSkipping)
{
   const auto &[start, stop, unusedSpeed, unusedTime] = *mTimesAndSpeed;

   // The bounds may run backwards, so order them before clamping
   const bool reversed = stop < start;
   const auto &lowest = reversed ? stop : start;
   const auto &highest = reversed ? start : stop;

   auto &position = mTimesAndSpeed->mTime;
   position = t;
   position = std::clamp(position, lowest, highest);

   for (auto &source : mSources)
      source.Reposition(position, bSkipping);
}


// Replace both time bounds and the speed, then reposition to t0.
//
// t0, t1     new time bounds; t1 may be less than t0
// speed      must be finite (asserted); only its magnitude is stored
// bSkipping  forwarded to Reposition()
void Mixer::SetTimesAndSpeed(double t0, double t1, double speed, bool bSkipping)
{
   wxASSERT(std::isfinite(speed));

   auto &[start, stop, rate, unusedTime] = *mTimesAndSpeed;
   rate = fabs(speed);
   start = t0;
   stop = t1;

   Reposition(t0, bSkipping);
}


// Set the speed for keyboard scrubbing.  When the sign of speed disagrees
// with the direction implied by the current time bounds, the bounds are
// replaced by the widest possible range in the new direction and the mixer
// is repositioned to startTime.
//
// speed      must be finite (asserted); only its magnitude is stored
// startTime  position to resume from when the direction changes
void Mixer::SetSpeedForKeyboardScrubbing(double speed, double startTime)
{
   wxASSERT(std::isfinite(speed));
   auto &[start, stop, rate, unusedTime] = *mTimesAndSpeed;

   // Has the direction changed, and if so, which way?
   const bool nowForward = speed > 0.0 && stop < start;
   const bool nowBackward = speed < 0.0 && stop > start;

   if (nowForward || nowBackward) {
      // It's safe to use 0 and std::numeric_limits<double>::max(),
      // because Mixer::MixVariableRates() doesn't sample past the start
      // or end of the audio in a track.
      constexpr auto farthest = std::numeric_limits<double>::max();
      start = nowForward ? 0.0 : farthest;
      stop = nowForward ? farthest : 0.0;

      Reposition(startTime, true);
   }

   // Stored only after any repositioning above
   rate = fabs(speed);
}

BufferSize
constexpr int BufferSize
Definition: AVIOContextWrapper.cpp:18

factory
static RegisteredToolbarFactory factory
Definition: AudioSetupToolBar.cpp:778

min
int min(int a, int b)
Definition: CompareAudioCommand.cpp:114

Dither.h

none
@ none
Definition: Dither.h:20

EffectStage.h

_
#define _(s)
Definition: Internat.h:73

MixBuffers
static void MixBuffers(unsigned numChannels, const unsigned char *channelFlags, const float *gains, const float &src, std::vector< std::vector< float > > &dests, int len)
Definition: Mix.cpp:256

stackAllocate
#define stackAllocate(T, count)
Definition: Mix.cpp:269

Mix.h

MixerSource.h

Resample.h

gLowQualityDither
DitherType gLowQualityDither
These global variables are assigned at application startup or after change of preferences.
Definition: SampleFormat.cpp:47

gHighQualityDither
DitherType gHighQualityDither
Definition: SampleFormat.cpp:48

CopySamples
void CopySamples(constSamplePtr src, sampleFormat srcFormat, samplePtr dst, sampleFormat dstFormat, size_t len, DitherType ditherType, unsigned int srcStride, unsigned int dstStride)
Copy samples from any format to any other format; apply dithering only if narrowing the format.
Definition: SampleFormat.cpp:109

floatSample
constexpr sampleFormat floatSample
Definition: SampleFormat.h:45

sampleFormat
sampleFormat
The ordering of these values with operator < agrees with the order of increasing bit width.
Definition: SampleFormat.h:30

sampleFormat::narrowestSampleFormat
@ narrowestSampleFormat
Two synonyms for previous values that might change if more values were added.

sampleFormat::floatSample
@ floatSample

SAMPLE_SIZE
#define SAMPLE_SIZE(SampleFormat)
Definition: SampleFormat.h:52

constSamplePtr
const char * constSamplePtr
Definition: SampleFormat.h:58

settings
static Settings & settings()
Definition: TrackInfo.cpp:69

WideSampleSequence.h

AudioGraph::Buffers::Advance
void Advance(size_t count)
Move the positions.
Definition: AudioGraphBuffers.cpp:89

AudioGraph::Buffers::Rotate
size_t Rotate()
Shift all data at and after the old position to position 0.
Definition: AudioGraphBuffers.cpp:144

AudioGraph::Buffers::Channels
unsigned Channels() const
Definition: AudioGraphBuffers.h:50

AudioGraph::Buffers::GetReadPosition
constSamplePtr GetReadPosition(unsigned iChannel) const
Get accumulated data for one channel.
Definition: AudioGraphBuffers.cpp:155

AudioGraph::Source
Upstream producer of sample streams, taking Buffers as external context.
Definition: AudioGraphSource.h:27

EffectStage::Create
static std::unique_ptr< EffectStage > Create(int channel, Source &upstream, Buffers &inBuffers, const Factory &factory, EffectSettings &settings, double sampleRate, std::optional< sampleCount > genLength, const WideSampleSequence &sequence)
Satisfies postcondition of constructor or returns null.
Definition: EffectStage.cpp:79

Mixer::mFloatBuffers
AudioGraph::Buffers mFloatBuffers
Definition: Mix.h:155

Mixer::ApplyGain
ApplyGain
Definition: Mix.h:48

Mixer::ApplyGain::Mixdown
@ Mixdown

Mixer::ApplyGain::Discard
@ Discard

Mixer::mApplyGain
const ApplyGain mApplyGain
Definition: Mix.h:140

Mixer::mBuffer
const std::vector< SampleBuffer > mBuffer
Definition: Mix.h:163

Mixer::Inputs
std::vector< Input > Inputs
Definition: Mix.h:45

Mixer::SetSpeedForKeyboardScrubbing
void SetSpeedForKeyboardScrubbing(double speed, double startTime)
Definition: Mix.cpp:423

Mixer::mDecoratedSources
std::vector< Source > mDecoratedSources
Definition: Mix.h:171

Mixer::EffectiveFormat
sampleFormat EffectiveFormat() const
Deduce the effective width of the output, which may be narrower than the stored format.
Definition: Mix.cpp:388

Mixer::mFormat
const sampleFormat mFormat
Definition: Mix.h:142

Mixer::~Mixer
virtual ~Mixer()

Mixer::mTemp
std::vector< std::vector< float > > mTemp
Definition: Mix.h:160

Mixer::NeedsDither
std::pair< bool, sampleFormat > NeedsDither(bool needsDither, double rate) const
Definition: Mix.cpp:189

Mixer::mNumChannels
const unsigned mNumChannels
Definition: Mix.h:128

Mixer::mEffectiveFormat
sampleFormat mEffectiveFormat
Definition: Mix.h:146

Mixer::GetBuffer
constSamplePtr GetBuffer()
Retrieve the main buffer or the interleaved buffer.
Definition: Mix.cpp:378

Mixer::mInterleaved
const bool mInterleaved
Definition: Mix.h:143

Mixer::Clear
void Clear()
Definition: Mix.cpp:250

Mixer::mNeedsDither
bool mNeedsDither
Definition: Mix.h:147

Mixer::Mixer
Mixer(Inputs inputs, bool mayThrow, const WarpOptions &warpOptions, double startTime, double stopTime, unsigned numOutChannels, size_t outBufferSize, bool outInterleaved, double outRate, sampleFormat outFormat, bool highQuality=true, MixerSpec *mixerSpec=nullptr, ApplyGain applyGain=ApplyGain::MapChannels)
Definition: Mix.cpp:71

Mixer::MixGetCurrentTime
double MixGetCurrentTime()
Current time in seconds (unwarped, i.e. always between startTime and stopTime)
Definition: Mix.cpp:393

Mixer::mHighQuality
const bool mHighQuality
Definition: Mix.h:141

Mixer::mSources
std::vector< MixerSource > mSources
Definition: Mix.h:165

Mixer::Process
size_t Process()
Definition: Mix.h:98

Mixer::BufferSize
size_t BufferSize() const
Definition: Mix.h:79

Mixer::Reposition
void Reposition(double t, bool bSkipping=false)
Reposition processing to absolute time next time Process() is called.
Definition: Mix.cpp:398

Mixer::SetTimesAndSpeed
void SetTimesAndSpeed(double t0, double t1, double speed, bool bSkipping=false)
Used in scrubbing and other nonuniform playback policies.
Definition: Mix.cpp:413

Mixer::mTimesAndSpeed
const std::shared_ptr< TimesAndSpeed > mTimesAndSpeed
Definition: Mix.h:150

Mixer::mHasMixerSpec
bool mHasMixerSpec
Definition: Mix.h:148

MixerOptions::Downmix
A matrix of booleans, one row per input channel, column per output.
Definition: MixerOptions.h:32

MixerSource::VariableRates
bool VariableRates() const
Definition: MixerSource.h:65

SampleBuffer
Definition: SampleFormat.h:124

WideSampleSequence
Definition: WideSampleSequence.h:24

size
size_t size
Definition: ffmpeg-2.3.6-single-header.h:412

float_cast.h

AudioGraph::IsMono
bool IsMono(const Channel &channel)
Whether the channel is mono.
Definition: AudioGraphChannel.h:32

anonymous_namespace{ExportPCM.cpp}::format
int format
Definition: ExportPCM.cpp:49

anonymous_namespace{Mix.cpp}::FindBufferSize
size_t FindBufferSize(const Mixer::Inputs &inputs, size_t bufferSize)
Definition: Mix.cpp:48

anonymous_namespace{Mix.cpp}::initVector
std::vector< std::vector< T > > initVector(size_t dim1, size_t dim2)
Definition: Mix.cpp:39

anonymous_namespace{StretchingSequenceIntegrationTest.cpp}::iChannel
constexpr auto iChannel
Definition: StretchingSequenceIntegrationTest.cpp:24

details::end
const char * end(const char *str) noexcept
Definition: StringUtils.h:106

staffpad::vo::copy
void copy(const T *src, T *dst, int32_t n)
Definition: VectorOps.h:40

std
STL namespace.

MixerOptions::TimesAndSpeed
Definition: MixerOptions.h:92

MixerOptions::Warp
Immutable structure is an argument to Mixer's constructor.
Definition: MixerOptions.h:56