gecko/content/media/AudioSegment.cpp

/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
/* This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this file,
 * You can obtain one at http://mozilla.org/MPL/2.0/. */

#include "AudioSegment.h"

#include "AudioStream.h"
#include "AudioChannelFormat.h"
#include "Latency.h"

namespace mozilla {

/**
 * Interleaves planar audio into a single buffer while converting the sample
 * type and applying a gain.
 *
 * aSourceChannels holds aChannels pointers, each of which is read at indices
 * [0, aLength). Every source sample is converted to float with
 * AudioSampleToFloat, multiplied by aVolume, and converted to DestT with
 * FloatToAudioSample. The results are stored frame by frame: the samples of
 * channels 0..aChannels-1 for frame 0 come first, followed by those for
 * frame 1, and so on, for a total of aLength*aChannels values in aOutput.
 */
template <class SrcT, class DestT>
static void
InterleaveAndConvertBuffer(const SrcT** aSourceChannels,
                           int32_t aLength, float aVolume,
                           int32_t aChannels,
                           DestT* aOutput)
{
  // Write cursor; advances by one sample for every (frame, channel) pair.
  DestT* cursor = aOutput;
  for (int32_t frame = 0; frame < aLength; ++frame) {
    for (int32_t ch = 0; ch < aChannels; ++ch) {
      const SrcT* plane = aSourceChannels[ch];
      float scaled = AudioSampleToFloat(plane[frame])*aVolume;
      *cursor++ = FloatToAudioSample<DestT>(scaled);
    }
  }
}

/**
 * Type-erased entry point for interleaving planar audio.
 *
 * aSourceChannels points to aChannels untyped channel pointers whose real
 * sample type is selected by aSourceFormat. The pointers are reinterpreted as
 * the matching sample type and handed to the templated
 * InterleaveAndConvertBuffer, which writes aLength frames, scaled by aVolume,
 * to aOutput. A format value not listed in the switch leaves aOutput
 * untouched.
 */
void
InterleaveAndConvertBuffer(const void** aSourceChannels,
                           AudioSampleFormat aSourceFormat,
                           int32_t aLength, float aVolume,
                           int32_t aChannels,
                           AudioDataValue* aOutput)
{
  switch (aSourceFormat) {
  case AUDIO_FORMAT_S16: {
    // Source planes hold 16-bit integer samples.
    const int16_t** planes =
      reinterpret_cast<const int16_t**>(aSourceChannels);
    InterleaveAndConvertBuffer(planes, aLength, aVolume, aChannels, aOutput);
    break;
  }
  case AUDIO_FORMAT_FLOAT32: {
    // Source planes hold 32-bit float samples.
    const float** planes =
      reinterpret_cast<const float**>(aSourceChannels);
    InterleaveAndConvertBuffer(planes, aLength, aVolume, aChannels, aOutput);
    break;
  }
  }
}

void
AudioSegment::ApplyVolume(float aVolume)
{
  for (ChunkIterator ci(*this); !ci.IsEnded(); ci.Next()) {
    ci->mVolume *= aVolume;
  }
}

// Number of frames handled per processing step, and the unit used to size the
// inline scratch arrays in this file. 640 frames is a little more than 10ms of
// 48KHz audio.
static const int AUDIO_PROCESSING_FRAMES = 640;
// Block of zero bytes handed to AudioChannelsUpMix as the data for channels
// that have no source. Presumably MAX_AUDIO_SAMPLE_SIZE is the byte size of
// the widest sample format, making this AUDIO_PROCESSING_FRAMES samples of
// silence in any format (confirm against its declaration).
static const uint8_t gZeroChannel[MAX_AUDIO_SAMPLE_SIZE*AUDIO_PROCESSING_FRAMES] = {};

/**
 * Mixes planar audio down to aOutputChannels channels and writes the result,
 * scaled by aVolume, interleaved into aOutput.
 *
 * @param aChannelData    One pointer per source channel; each is read at
 *                        sample indices [0, aDuration).
 * @param aSourceFormat   Sample type of aChannelData. Anything other than
 *                        AUDIO_FORMAT_FLOAT32 is treated as AUDIO_FORMAT_S16
 *                        (asserted) and converted to float first.
 * @param aDuration       Number of frames to process.
 * @param aVolume         Gain applied while interleaving.
 * @param aOutputChannels Number of channels to produce.
 * @param aOutput         Receives aDuration*aOutputChannels interleaved
 *                        samples.
 *
 * When there are more source channels than aOutputChannels they are combined
 * with AudioChannelsDownMix. Otherwise no mixing is needed: the (float)
 * source channels are interleaved as they are, and any output channel that has
 * no corresponding source channel is filled with silence.
 */
void
DownmixAndInterleave(const nsTArray<const void*>& aChannelData,
                     AudioSampleFormat aSourceFormat, int32_t aDuration,
                     float aVolume, uint32_t aOutputChannels,
                     AudioDataValue* aOutput)
{
  nsAutoTArray<const void*,GUESS_AUDIO_CHANNELS> channelData;
  nsAutoTArray<float,AUDIO_PROCESSING_FRAMES*GUESS_AUDIO_CHANNELS> downmixConversionBuffer;
  nsAutoTArray<float,AUDIO_PROCESSING_FRAMES*GUESS_AUDIO_CHANNELS> downmixOutputBuffer;

  // Build channelData so that every entry points at float samples, converting
  // 16-bit input into downmixConversionBuffer (one contiguous run of aDuration
  // samples per channel) when necessary.
  channelData.SetLength(aChannelData.Length());
  if (aSourceFormat != AUDIO_FORMAT_FLOAT32) {
    NS_ASSERTION(aSourceFormat == AUDIO_FORMAT_S16, "unknown format");
    downmixConversionBuffer.SetLength(aDuration*aChannelData.Length());
    for (uint32_t i = 0; i < aChannelData.Length(); ++i) {
      float* conversionBuf = downmixConversionBuffer.Elements() + (i*aDuration);
      const int16_t* sourceBuf = static_cast<const int16_t*>(aChannelData[i]);
      for (uint32_t j = 0; j < (uint32_t)aDuration; ++j) {
        conversionBuf[j] = AudioSampleToFloat(sourceBuf[j]);
      }
      channelData[i] = conversionBuf;
    }
  } else {
    for (uint32_t i = 0; i < aChannelData.Length(); ++i) {
      channelData[i] = aChannelData[i];
    }
  }

  nsAutoTArray<const void*,GUESS_AUDIO_CHANNELS> outputChannelData;
  outputChannelData.SetLength(aOutputChannels);
  if (channelData.Length() > aOutputChannels) {
    // Real down-mix: each output channel gets its own run of aDuration floats
    // in downmixOutputBuffer, which AudioChannelsDownMix fills in.
    downmixOutputBuffer.SetLength(aDuration*aOutputChannels);
    nsAutoTArray<float*,GUESS_AUDIO_CHANNELS> outputChannelBuffers;
    outputChannelBuffers.SetLength(aOutputChannels);
    for (uint32_t i = 0; i < aOutputChannels; ++i) {
      outputChannelData[i] = outputChannelBuffers[i] =
          downmixOutputBuffer.Elements() + aDuration*i;
    }
    AudioChannelsDownMix(channelData, outputChannelBuffers.Elements(),
                         aOutputChannels, aDuration);
  } else {
    // Nothing to mix down. Interleaving from downmixOutputBuffer here would
    // read samples that were never written, so read the float source channels
    // directly instead and pad any missing channels with silence.
    float* silence = nullptr;
    if (channelData.Length() < aOutputChannels) {
      // A single zeroed run is shared by every missing channel; it is only
      // ever read.
      downmixOutputBuffer.SetLength(uint32_t(aDuration));
      silence = downmixOutputBuffer.Elements();
      for (uint32_t j = 0; j < (uint32_t)aDuration; ++j) {
        silence[j] = 0.0f;
      }
    }
    for (uint32_t i = 0; i < aOutputChannels; ++i) {
      if (i < channelData.Length()) {
        outputChannelData[i] = channelData[i];
      } else {
        outputChannelData[i] = silence;
      }
    }
  }
  InterleaveAndConvertBuffer(outputChannelData.Elements(), AUDIO_FORMAT_FLOAT32,
                             aDuration, aVolume, aOutputChannels, aOutput);
}

void
AudioSegment::WriteTo(uint64_t aID, AudioStream* aOutput)
{
  uint32_t outputChannels = aOutput->GetChannels();
  nsAutoTArray<AudioDataValue,AUDIO_PROCESSING_FRAMES*GUESS_AUDIO_CHANNELS> buf;
  nsAutoTArray<const void*,GUESS_AUDIO_CHANNELS> channelData;

  for (ChunkIterator ci(*this); !ci.IsEnded(); ci.Next()) {
    AudioChunk& c = *ci;
    TrackTicks offset = 0;
    while (offset < c.mDuration) {
      TrackTicks durationTicks =
        std::min<TrackTicks>(c.mDuration - offset, AUDIO_PROCESSING_FRAMES);
      if (uint64_t(outputChannels)*durationTicks > INT32_MAX || offset > INT32_MAX) {
        NS_ERROR("Buffer overflow");
        return;
      }
      uint32_t duration = uint32_t(durationTicks);
      buf.SetLength(outputChannels*duration);
      if (c.mBuffer) {
        channelData.SetLength(c.mChannelData.Length());
        for (uint32_t i = 0; i < channelData.Length(); ++i) {
          channelData[i] =
            AddAudioSampleOffset(c.mChannelData[i], c.mBufferFormat, int32_t(offset));
        }

        if (channelData.Length() < outputChannels) {
          // Up-mix. Note that this might actually make channelData have more
          // than outputChannels temporarily.
          AudioChannelsUpMix(&channelData, outputChannels, gZeroChannel);
        }

        if (channelData.Length() > outputChannels) {
          // Down-mix.
          DownmixAndInterleave(channelData, c.mBufferFormat, duration,
                               c.mVolume, outputChannels, buf.Elements());
        } else {
          InterleaveAndConvertBuffer(channelData.Elements(), c.mBufferFormat,
                                     duration, c.mVolume,
                                     outputChannels,
                                     buf.Elements());
        }
      } else {
        // Assumes that a bit pattern of zeroes == 0.0f
        memset(buf.Elements(), 0, buf.Length()*sizeof(AudioDataValue));
      }
      aOutput->Write(buf.Elements(), int32_t(duration), &(c.mTimeStamp));
      if(!c.mTimeStamp.IsNull()) {
        TimeStamp now = TimeStamp::Now();
        // would be more efficient to c.mTimeStamp to ms on create time then pass here
        LogTime(AsyncLatencyLogger::AudioMediaStreamTrack, aID,
                (now - c.mTimeStamp).ToMilliseconds(), c.mTimeStamp);
      }
      offset += duration;
    }
  }
  aOutput->Start();
}

}
Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00			`/* -- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -- */`
			`/* This Source Code Form is subject to the terms of the Mozilla Public`
			`* License, v. 2.0. If a copy of the MPL was not distributed with this file,`
			`* You can obtain one at http://mozilla.org/MPL/2.0/. */`

			`#include "AudioSegment.h"`

			`#include "AudioStream.h"`
Bug 830707. Part 2: Mix channels to output channel count when playing audio. r=jesup --HG-- extra : rebase_source : a13d8ec691689e3aa57cd42c9d437f91197d4253 2013-01-31 20:27:02 -08:00			`#include "AudioChannelFormat.h"`
Bug 904617: Part 3 - Log latency, and adds a python script to understand the log r=padenot,jesup,ehugg 2013-01-28 10:22:37 -08:00			`#include "Latency.h"`
Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00
			`namespace mozilla {`

			`template <class SrcT, class DestT>`
			`static void`
Bug 827537. Refactor AudioChunk to support having separate buffers for each channel. r=jesup --HG-- extra : rebase_source : 0aa26e1c3181d9fe5158520d4b33248bae0fa5d0 2012-11-21 21:04:27 -08:00			`InterleaveAndConvertBuffer(const SrcT** aSourceChannels,`
			`int32_t aLength, float aVolume,`
Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00			`int32_t aChannels,`
			`DestT* aOutput)`
			`{`
			`DestT* output = aOutput;`
			`for (int32_t i = 0; i < aLength; ++i) {`
			`for (int32_t channel = 0; channel < aChannels; ++channel) {`
Bug 827537. Refactor AudioChunk to support having separate buffers for each channel. r=jesup --HG-- extra : rebase_source : 0aa26e1c3181d9fe5158520d4b33248bae0fa5d0 2012-11-21 21:04:27 -08:00			`float v = AudioSampleToFloat(aSourceChannels[channel][i])*aVolume;`
Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00			`*output = FloatToAudioSample<DestT>(v);`
			`++output;`
			`}`
			`}`
			`}`

Bug 842243 - Part 0: Modify MediaSegment and AudioSegment for use by MediaEncoder. r=roc 2013-06-03 02:59:50 -07:00			`void`
Bug 827537. Refactor AudioChunk to support having separate buffers for each channel. r=jesup --HG-- extra : rebase_source : 0aa26e1c3181d9fe5158520d4b33248bae0fa5d0 2012-11-21 21:04:27 -08:00			`InterleaveAndConvertBuffer(const void** aSourceChannels,`
			`AudioSampleFormat aSourceFormat,`
			`int32_t aLength, float aVolume,`
Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00			`int32_t aChannels,`
			`AudioDataValue* aOutput)`
			`{`
			`switch (aSourceFormat) {`
			`case AUDIO_FORMAT_FLOAT32:`
Bug 827537. Refactor AudioChunk to support having separate buffers for each channel. r=jesup --HG-- extra : rebase_source : 0aa26e1c3181d9fe5158520d4b33248bae0fa5d0 2012-11-21 21:04:27 -08:00			`InterleaveAndConvertBuffer(reinterpret_cast<const float**>(aSourceChannels),`
Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00			`aLength,`
			`aVolume,`
			`aChannels,`
			`aOutput);`
			`break;`
			`case AUDIO_FORMAT_S16:`
Bug 827537. Refactor AudioChunk to support having separate buffers for each channel. r=jesup --HG-- extra : rebase_source : 0aa26e1c3181d9fe5158520d4b33248bae0fa5d0 2012-11-21 21:04:27 -08:00			`InterleaveAndConvertBuffer(reinterpret_cast<const int16_t**>(aSourceChannels),`
Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00			`aLength,`
			`aVolume,`
			`aChannels,`
			`aOutput);`
			`break;`
			`}`
			`}`

			`void`
			`AudioSegment::ApplyVolume(float aVolume)`
			`{`
			`for (ChunkIterator ci(*this); !ci.IsEnded(); ci.Next()) {`
			`ci->mVolume *= aVolume;`
			`}`
			`}`

Bug 830707. Part 2: Mix channels to output channel count when playing audio. r=jesup --HG-- extra : rebase_source : a13d8ec691689e3aa57cd42c9d437f91197d4253 2013-01-31 20:27:02 -08:00			`static const int AUDIO_PROCESSING_FRAMES = 640; /* > 10ms of 48KHz audio */`
			`static const uint8_t gZeroChannel[MAX_AUDIO_SAMPLE_SIZE*AUDIO_PROCESSING_FRAMES] = {0};`
Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00
Bug 842243 - Part 0: Modify MediaSegment and AudioSegment for use by MediaEncoder. r=roc 2013-06-03 02:59:50 -07:00			`void`
			`DownmixAndInterleave(const nsTArray<const void*>& aChannelData,`
			`AudioSampleFormat aSourceFormat, int32_t aDuration,`
Bug 881775 - Set the correct channel count in DownmixAndInterleave, and avoid unnecessary downmixing; r=roc 2013-06-11 14:50:21 -07:00			`float aVolume, uint32_t aOutputChannels,`
Bug 842243 - Part 0: Modify MediaSegment and AudioSegment for use by MediaEncoder. r=roc 2013-06-03 02:59:50 -07:00			`AudioDataValue* aOutput)`
			`{`
			`nsAutoTArray<const void*,GUESS_AUDIO_CHANNELS> channelData;`
			`nsAutoTArray<float,AUDIO_PROCESSING_FRAMES*GUESS_AUDIO_CHANNELS> downmixConversionBuffer;`
			`nsAutoTArray<float,AUDIO_PROCESSING_FRAMES*GUESS_AUDIO_CHANNELS> downmixOutputBuffer;`

Bug 881775 - Set the correct channel count in DownmixAndInterleave, and avoid unnecessary downmixing; r=roc 2013-06-11 14:50:21 -07:00			`channelData.SetLength(aChannelData.Length());`
Bug 842243 - Part 0: Modify MediaSegment and AudioSegment for use by MediaEncoder. r=roc 2013-06-03 02:59:50 -07:00			`if (aSourceFormat != AUDIO_FORMAT_FLOAT32) {`
			`NS_ASSERTION(aSourceFormat == AUDIO_FORMAT_S16, "unknown format");`
			`downmixConversionBuffer.SetLength(aDuration*aChannelData.Length());`
			`for (uint32_t i = 0; i < aChannelData.Length(); ++i) {`
			`float* conversionBuf = downmixConversionBuffer.Elements() + (i*aDuration);`
			`const int16_t* sourceBuf = static_cast<const int16_t*>(aChannelData[i]);`
			`for (uint32_t j = 0; j < (uint32_t)aDuration; ++j) {`
			`conversionBuf[j] = AudioSampleToFloat(sourceBuf[j]);`
			`}`
			`channelData[i] = conversionBuf;`
			`}`
			`} else {`
			`for (uint32_t i = 0; i < aChannelData.Length(); ++i) {`
			`channelData[i] = aChannelData[i];`
			`}`
			`}`

			`downmixOutputBuffer.SetLength(aDuration*aOutputChannels);`
			`nsAutoTArray<float*,GUESS_AUDIO_CHANNELS> outputChannelBuffers;`
			`nsAutoTArray<const void*,GUESS_AUDIO_CHANNELS> outputChannelData;`
			`outputChannelBuffers.SetLength(aOutputChannels);`
			`outputChannelData.SetLength(aOutputChannels);`
			`for (uint32_t i = 0; i < (uint32_t)aOutputChannels; ++i) {`
			`outputChannelData[i] = outputChannelBuffers[i] =`
			`downmixOutputBuffer.Elements() + aDuration*i;`
			`}`
Bug 881775 - Set the correct channel count in DownmixAndInterleave, and avoid unnecessary downmixing; r=roc 2013-06-11 14:50:21 -07:00			`if (channelData.Length() > aOutputChannels) {`
			`AudioChannelsDownMix(channelData, outputChannelBuffers.Elements(),`
			`aOutputChannels, aDuration);`
			`}`
Bug 842243 - Part 0: Modify MediaSegment and AudioSegment for use by MediaEncoder. r=roc 2013-06-03 02:59:50 -07:00			`InterleaveAndConvertBuffer(outputChannelData.Elements(), AUDIO_FORMAT_FLOAT32,`
			`aDuration, aVolume, aOutputChannels, aOutput);`
			`}`

Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00			`void`
Bug 904617: Part 3 - Log latency, and adds a python script to understand the log r=padenot,jesup,ehugg 2013-01-28 10:22:37 -08:00			`AudioSegment::WriteTo(uint64_t aID, AudioStream* aOutput)`
Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00			`{`
Bug 830707. Part 2: Mix channels to output channel count when playing audio. r=jesup --HG-- extra : rebase_source : a13d8ec691689e3aa57cd42c9d437f91197d4253 2013-01-31 20:27:02 -08:00			`uint32_t outputChannels = aOutput->GetChannels();`
			`nsAutoTArray<AudioDataValue,AUDIO_PROCESSING_FRAMES*GUESS_AUDIO_CHANNELS> buf;`
			`nsAutoTArray<const void*,GUESS_AUDIO_CHANNELS> channelData;`

Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00			`for (ChunkIterator ci(*this); !ci.IsEnded(); ci.Next()) {`
			`AudioChunk& c = *ci;`
Bug 830707. Part 2: Mix channels to output channel count when playing audio. r=jesup --HG-- extra : rebase_source : a13d8ec691689e3aa57cd42c9d437f91197d4253 2013-01-31 20:27:02 -08:00			`TrackTicks offset = 0;`
			`while (offset < c.mDuration) {`
			`TrackTicks durationTicks =`
			`std::min<TrackTicks>(c.mDuration - offset, AUDIO_PROCESSING_FRAMES);`
			`if (uint64_t(outputChannels)*durationTicks > INT32_MAX \|\| offset > INT32_MAX) {`
			`NS_ERROR("Buffer overflow");`
			`return;`
			`}`
			`uint32_t duration = uint32_t(durationTicks);`
			`buf.SetLength(outputChannels*duration);`
			`if (c.mBuffer) {`
			`channelData.SetLength(c.mChannelData.Length());`
			`for (uint32_t i = 0; i < channelData.Length(); ++i) {`
			`channelData[i] =`
			`AddAudioSampleOffset(c.mChannelData[i], c.mBufferFormat, int32_t(offset));`
			`}`

			`if (channelData.Length() < outputChannels) {`
			`// Up-mix. Note that this might actually make channelData have more`
			`// than outputChannels temporarily.`
			`AudioChannelsUpMix(&channelData, outputChannels, gZeroChannel);`
			`}`

			`if (channelData.Length() > outputChannels) {`
			`// Down-mix.`
Bug 842243 - Part 0: Modify MediaSegment and AudioSegment for use by MediaEncoder. r=roc 2013-06-03 02:59:50 -07:00			`DownmixAndInterleave(channelData, c.mBufferFormat, duration,`
Bug 882956 - Fix WebAudio stack-buffer-overflow crash. r=ehsan. 2013-06-14 00:16:41 -07:00			`c.mVolume, outputChannels, buf.Elements());`
Bug 830707. Part 2: Mix channels to output channel count when playing audio. r=jesup --HG-- extra : rebase_source : a13d8ec691689e3aa57cd42c9d437f91197d4253 2013-01-31 20:27:02 -08:00			`} else {`
			`InterleaveAndConvertBuffer(channelData.Elements(), c.mBufferFormat,`
			`duration, c.mVolume,`
			`outputChannels,`
			`buf.Elements());`
			`}`
			`} else {`
			`// Assumes that a bit pattern of zeroes == 0.0f`
			`memset(buf.Elements(), 0, buf.Length()*sizeof(AudioDataValue));`
			`}`
Bug 920325: Add WebRTC latency logging from capture to RTP and from RTP to speakers r=padenot 2013-10-25 15:13:42 -07:00			`aOutput->Write(buf.Elements(), int32_t(duration), &(c.mTimeStamp));`
			`if(!c.mTimeStamp.IsNull()) {`
			`TimeStamp now = TimeStamp::Now();`
			`// would be more efficient to c.mTimeStamp to ms on create time then pass here`
			`LogTime(AsyncLatencyLogger::AudioMediaStreamTrack, aID,`
			`(now - c.mTimeStamp).ToMilliseconds(), c.mTimeStamp);`
			`}`
Bug 830707. Part 2: Mix channels to output channel count when playing audio. r=jesup --HG-- extra : rebase_source : a13d8ec691689e3aa57cd42c9d437f91197d4253 2013-01-31 20:27:02 -08:00			`offset += duration;`
Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00			`}`
			`}`
Bug 833578 - Start AudioSegment playing after first write rather than waiting for AudioStream's buffer to fill. r=roc 2013-01-22 21:53:10 -08:00			`aOutput->Start();`
Bug 815194 - Remove more ns prefixes on content/media classes + whitespace fixes. r=cpearce 2012-11-28 11:40:07 -08:00			`}`

			`}`