Bug 1109248: revert removal of webrtc audio ExternalRecording interface rs=jesup

2024-09-13 09:24:08 -07:00 · 2015-01-29 18:33:36 -05:00 · 2015-01-29 18:33:36 -05:00 · 05d3f1973f
commit 05d3f1973f
parent 00e69d533a
7 changed files with 395 additions and 19 deletions
--- a/media/webrtc/trunk/webrtc/engine_configurations.h
+++ b/media/webrtc/trunk/webrtc/engine_configurations.h
@ -67,6 +67,7 @@
 #define WEBRTC_VOICE_ENGINE_AGC                 // Near-end AGC
 #define WEBRTC_VOICE_ENGINE_ECHO                // Near-end AEC
 #define WEBRTC_VOICE_ENGINE_NR                  // Near-end NS
+#define WEBRTC_VOE_EXTERNAL_REC_AND_PLAYOUT

 #if !defined(WEBRTC_ANDROID) && !defined(WEBRTC_IOS)
 #define WEBRTC_VOICE_ENGINE_TYPING_DETECTION    // Typing detection
--- a/media/webrtc/trunk/webrtc/voice_engine/include/voe_external_media.h
+++ b/media/webrtc/trunk/webrtc/voice_engine/include/voe_external_media.h
@ -7,6 +7,28 @@
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
+
+// In some cases it is desirable to use an audio source or sink which may
+// not be available to the VoiceEngine, such as a DV camera. This sub-API
+// contains functions that allow for the use of such external recording
+// sources and playout sinks. It also describes how recorded data, or data
+// to be played out, can be modified outside the VoiceEngine.
+//
+// Usage example, omitting error checking:
+//
+//  using namespace webrtc;
+//  VoiceEngine* voe = VoiceEngine::Create();
+//  VoEBase* base = VoEBase::GetInterface(voe);
+//  VoEExternalMedia* media = VoEExternalMedia::GetInterface(voe);
+//  base->Init();
+//  ...
+//  media->SetExternalRecordingStatus(true);
+//  ...
+//  base->Terminate();
+//  base->Release();
+//  media->Release();
+//  VoiceEngine::Delete(voe);
+//
 #ifndef WEBRTC_VOICE_ENGINE_VOE_EXTERNAL_MEDIA_H
 #define WEBRTC_VOICE_ENGINE_VOE_EXTERNAL_MEDIA_H

@ -61,6 +83,37 @@ public:
    virtual int DeRegisterExternalMediaProcessing(
        int channel, ProcessingTypes type) = 0;

+    // Enables or disables external recording.
+    virtual int SetExternalRecordingStatus(bool enable) = 0;
+
+    // Enables or disables external playout.
+    virtual int SetExternalPlayoutStatus(bool enable) = 0;
+
+    // This function accepts externally recorded audio. During transmission,
+    // call it at as regular an interval as possible. |lengthSamples| must be
+    // a non-zero multiple of the 10 ms frame size (samplingFreqHz / 100).
+    virtual int ExternalRecordingInsertData(
+        const int16_t speechData10ms[], int lengthSamples,
+        int samplingFreqHz, int current_delay_ms) = 0;
+
+
+    // This function inserts audio written to the OS audio drivers for use
+    // as the far-end signal for AEC processing.  The length of the block
+    // must be 160, 320, 441 or 480 samples (for 16000, 32000, 44100 or
+    // 48000 Hz sampling rates respectively).
+    virtual int ExternalPlayoutData(
+        int16_t speechData10ms[], int samplingFreqHz, int num_channels,
+        int current_delay_ms, int& lengthSamples) = 0;
+
+    // This function gets audio for an external playout sink.
+    // During transmission, this function should be called every ~10 ms
+    // to obtain a new 10 ms frame of audio. The length of the block will
+    // be 160, 320, 441 or 480 samples (for 16000, 32000, 44100 or
+    // 48000 Hz sampling rates respectively).
+    virtual int ExternalPlayoutGetData(
+        int16_t speechData10ms[], int samplingFreqHz,
+        int current_delay_ms, int& lengthSamples) = 0;
+
    // Pulls an audio frame from the specified |channel| for external mixing.
    // If the |desired_sample_rate_hz| is 0, the signal will be returned with
    // its native frequency, otherwise it will be resampled. Valid frequencies
@ -71,25 +124,6 @@ public:
    // Sets the state of external mixing. Cannot be changed during playback.
    virtual int SetExternalMixing(int channel, bool enable) = 0;

-    // Don't use. To be removed.
-    virtual int SetExternalRecordingStatus(bool enable) { return -1; }
-    virtual int SetExternalPlayoutStatus(bool enable) { return -1; }
-    virtual int ExternalRecordingInsertData(
-        const int16_t speechData10ms[], int lengthSamples,
-        int samplingFreqHz, int current_delay_ms) { return -1; }
-
-    // This function inserts audio written to the OS audio drivers for use
-    // as the far-end signal for AEC processing.  The length of the block
-    // must be 160, 320, 441 or 480 samples (for 16000, 32000, 44100 or
-    // 48000 kHz sampling rates respectively).
-    virtual int ExternalPlayoutData(
-        int16_t speechData10ms[], int samplingFreqHz, int num_channels,
-        int current_delay_ms, int& lengthSamples) = 0;
-
-    virtual int ExternalPlayoutGetData(
-        int16_t speechData10ms[], int samplingFreqHz,
-        int current_delay_ms, int& lengthSamples) { return -1; }
-
 protected:
    VoEExternalMedia() {}
    virtual ~VoEExternalMedia() {}
--- a/media/webrtc/trunk/webrtc/voice_engine/test/auto_test/standard/external_media_test.cc
+++ b/media/webrtc/trunk/webrtc/voice_engine/test/auto_test/standard/external_media_test.cc
@ -28,6 +28,43 @@ class ExternalMediaTest : public AfterStreamingFixture {
  }
 };

+TEST_F(ExternalMediaTest, ManualCanRecordAndPlaybackUsingExternalPlayout) {
+  SwitchToManualMicrophone();
+
+  EXPECT_EQ(0, voe_base_->StopSend(channel_));
+  EXPECT_EQ(0, voe_base_->StopPlayout(channel_));
+  EXPECT_EQ(0, voe_xmedia_->SetExternalPlayoutStatus(true));
+  EXPECT_EQ(0, voe_base_->StartPlayout(channel_));
+  EXPECT_EQ(0, voe_base_->StartSend(channel_));
+
+  TEST_LOG("Recording data for 2 seconds starting now: please speak.\n");
+  int16_t recording[32000];
+  for (int i = 0; i < 200; i++) {
+    int sample_length = 0;
+    EXPECT_EQ(0, voe_xmedia_->ExternalPlayoutGetData(
+        &(recording[i * 160]), 16000, 100, sample_length));
+    EXPECT_EQ(160, sample_length);
+    Sleep(10);
+  }
+
+  EXPECT_EQ(0, voe_base_->StopSend(channel_));
+  EXPECT_EQ(0, voe_base_->StopPlayout(channel_));
+  EXPECT_EQ(0, voe_xmedia_->SetExternalPlayoutStatus(false));
+  EXPECT_EQ(0, voe_base_->StartPlayout(channel_));
+  EXPECT_EQ(0, voe_xmedia_->SetExternalRecordingStatus(true));
+  EXPECT_EQ(0, voe_base_->StartSend(channel_));
+
+  TEST_LOG("Playing back recording, you should hear what you said earlier.\n");
+  for (int i = 0; i < 200; i++) {
+    EXPECT_EQ(0, voe_xmedia_->ExternalRecordingInsertData(
+        &(recording[i * 160]), 160, 16000, 20));
+    Sleep(10);
+  }
+
+  EXPECT_EQ(0, voe_base_->StopSend(channel_));
+  EXPECT_EQ(0, voe_xmedia_->SetExternalRecordingStatus(false));
+}
+
 TEST_F(ExternalMediaTest,
    ManualRegisterExternalMediaProcessingOnAllChannelsAffectsPlayout) {
  TEST_LOG("Enabling external media processing: audio should be affected.\n");
--- a/media/webrtc/trunk/webrtc/voice_engine/voe_base_impl.cc
+++ b/media/webrtc/trunk/webrtc/voice_engine/voe_base_impl.cc
@ -787,6 +787,16 @@ int VoEBaseImpl::GetVersion(char version[1024])
    accLen += len;
    assert(accLen < kVoiceEngineVersionMaxMessageSize);
 #endif
+#ifdef WEBRTC_VOE_EXTERNAL_REC_AND_PLAYOUT
+    len = AddExternalRecAndPlayoutBuild(versionPtr);
+    if (len == -1)
+    {
+        return -1;
+    }
+    versionPtr += len;
+    accLen += len;
+    assert(accLen < kVoiceEngineVersionMaxMessageSize);
+ #endif

    memcpy(version, versionBuf, accLen);
    version[accLen] = '\0';
@ -831,6 +841,13 @@ int32_t VoEBaseImpl::AddExternalTransportBuild(char* str) const
 }
 #endif

+#ifdef WEBRTC_VOE_EXTERNAL_REC_AND_PLAYOUT
+int32_t VoEBaseImpl::AddExternalRecAndPlayoutBuild(char* str) const
+{
+    return sprintf(str, "External recording and playout build\n");
+}
+#endif
+
 int VoEBaseImpl::LastError()
 {
    WEBRTC_TRACE(kTraceApiCall, kTraceVoice, VoEId(_shared->instance_id(), -1),
--- a/media/webrtc/trunk/webrtc/voice_engine/voe_base_impl.h
+++ b/media/webrtc/trunk/webrtc/voice_engine/voe_base_impl.h
@ -153,6 +153,9 @@ private:
    int InitializeChannel(voe::ChannelOwner* channel_owner);
 #ifdef WEBRTC_EXTERNAL_TRANSPORT
    int32_t AddExternalTransportBuild(char* str) const;
+#endif
+#ifdef WEBRTC_VOE_EXTERNAL_REC_AND_PLAYOUT
+    int32_t AddExternalRecAndPlayoutBuild(char* str) const;
 #endif
    VoiceEngineObserver* _voiceEngineObserverPtr;
    CriticalSectionWrapper& _callbackCritSect;
--- a/media/webrtc/trunk/webrtc/voice_engine/voe_external_media_impl.cc
+++ b/media/webrtc/trunk/webrtc/voice_engine/voe_external_media_impl.cc
@ -143,6 +143,265 @@ int VoEExternalMediaImpl::DeRegisterExternalMediaProcessing(
    return -1;
 }

+int VoEExternalMediaImpl::SetExternalRecordingStatus(bool enable)
+{
+    WEBRTC_TRACE(kTraceApiCall, kTraceVoice, VoEId(shared_->instance_id(), -1),
+                 "SetExternalRecordingStatus(enable=%d)", enable);
+#ifdef WEBRTC_VOE_EXTERNAL_REC_AND_PLAYOUT
+    if (shared_->audio_device()->Recording())
+    {
+        shared_->SetLastError(VE_ALREADY_SENDING, kTraceError,
+            "SetExternalRecordingStatus() cannot set state while sending");
+        return -1;
+    }
+    shared_->set_ext_recording(enable);
+    return 0;
+#else
+    shared_->SetLastError(VE_FUNC_NOT_SUPPORTED, kTraceError,
+        "SetExternalRecordingStatus() external recording is not supported");
+    return -1;
+#endif
+}
+
+int VoEExternalMediaImpl::ExternalRecordingInsertData(
+        const int16_t speechData10ms[],
+        int lengthSamples,
+        int samplingFreqHz,
+        int current_delay_ms)
+{
+    WEBRTC_TRACE(kTraceStream, kTraceVoice, VoEId(shared_->instance_id(), -1),
+                 "ExternalRecordingInsertData(speechData10ms=0x%x,"
+                 " lengthSamples=%u, samplingFreqHz=%d, current_delay_ms=%d)",
+                 &speechData10ms[0], lengthSamples, samplingFreqHz,
+              current_delay_ms);
+#ifdef WEBRTC_VOE_EXTERNAL_REC_AND_PLAYOUT
+    if (!shared_->statistics().Initialized())
+    {
+        shared_->SetLastError(VE_NOT_INITED, kTraceError);
+        return -1;
+    }
+    if (!shared_->ext_recording())
+    {
+       shared_->SetLastError(VE_INVALID_OPERATION, kTraceError,
+           "ExternalRecordingInsertData() external recording is not enabled");
+        return -1;
+    }
+    if (shared_->NumOfSendingChannels() == 0)
+    {
+        shared_->SetLastError(VE_ALREADY_SENDING, kTraceError,
+            "SetExternalRecordingStatus() no channel is sending");
+        return -1;
+    }
+    if ((16000 != samplingFreqHz) && (32000 != samplingFreqHz) &&
+        (48000 != samplingFreqHz) && (44100 != samplingFreqHz))
+    {
+         shared_->SetLastError(VE_INVALID_ARGUMENT, kTraceError,
+             "SetExternalRecordingStatus() invalid sample rate");
+        return -1;
+    }
+    if ((0 == lengthSamples) ||
+        ((lengthSamples % (samplingFreqHz / 100)) != 0))
+    {
+         shared_->SetLastError(VE_INVALID_ARGUMENT, kTraceError,
+             "SetExternalRecordingStatus() invalid buffer size");
+        return -1;
+    }
+    if (current_delay_ms < 0)
+    {
+        shared_->SetLastError(VE_INVALID_ARGUMENT, kTraceError,
+            "SetExternalRecordingStatus() invalid delay)");
+        return -1;
+    }
+
+    uint16_t blockSize = samplingFreqHz / 100;
+    uint32_t nBlocks = lengthSamples / blockSize;
+    int16_t totalDelayMS = 0;
+    uint16_t playoutDelayMS = 0;
+
+    for (uint32_t i = 0; i < nBlocks; i++)
+    {
+        if (!shared_->ext_playout())
+        {
+            // Use real playout delay if external playout is not enabled.
+            if (shared_->audio_device()->PlayoutDelay(&playoutDelayMS) != 0) {
+              shared_->SetLastError(VE_AUDIO_DEVICE_MODULE_ERROR, kTraceWarning,
+                  "PlayoutDelay() unable to get the playout delay");
+            }
+            totalDelayMS = current_delay_ms + playoutDelayMS;
+        }
+        else
+        {
+            // Use the stored delay value given in the last call
+            // to ExternalPlayoutGetData.
+            totalDelayMS = current_delay_ms + playout_delay_ms_;
+            // Compensate for block sizes larger than 10ms
+            totalDelayMS -= (int16_t)(i*10);
+            if (totalDelayMS < 0)
+                totalDelayMS = 0;
+        }
+        shared_->transmit_mixer()->PrepareDemux(
+            (const int8_t*)(&speechData10ms[i*blockSize]),
+            blockSize,
+            1,
+            samplingFreqHz,
+            totalDelayMS,
+            0,
+            0,
+            false); // Typing detection not supported
+
+        shared_->transmit_mixer()->DemuxAndMix();
+        shared_->transmit_mixer()->EncodeAndSend();
+    }
+    return 0;
+#else
+       shared_->SetLastError(VE_FUNC_NOT_SUPPORTED, kTraceError,
+        "ExternalRecordingInsertData() external recording is not supported");
+    return -1;
+#endif
+}
+
+int VoEExternalMediaImpl::SetExternalPlayoutStatus(bool enable)
+{
+    WEBRTC_TRACE(kTraceApiCall, kTraceVoice, VoEId(shared_->instance_id(), -1),
+                 "SetExternalPlayoutStatus(enable=%d)", enable);
+#ifdef WEBRTC_VOE_EXTERNAL_REC_AND_PLAYOUT
+    if (shared_->audio_device()->Playing())
+    {
+        shared_->SetLastError(VE_ALREADY_SENDING, kTraceError,
+            "SetExternalPlayoutStatus() cannot set state while playing");
+        return -1;
+    }
+    shared_->set_ext_playout(enable);
+    return 0;
+#else
+    shared_->SetLastError(VE_FUNC_NOT_SUPPORTED, kTraceError,
+        "SetExternalPlayoutStatus() external playout is not supported");
+    return -1;
+#endif
+}
+
+// This inserts a copy of the raw audio sent to the output drivers to use
+// as the "far end" signal for the AEC.  Currently only 10ms chunks are
+// supported unfortunately.  Since we have to rechunk to 10ms to call this,
+// there isn't much gained by allowing N*10ms here; external code can loop
+// if needed.
+int VoEExternalMediaImpl::ExternalPlayoutData(
+    int16_t speechData10ms[],
+    int samplingFreqHz,
+    int num_channels,
+    int current_delay_ms,
+    int& lengthSamples)
+{
+    WEBRTC_TRACE(kTraceStream, kTraceVoice, VoEId(shared_->instance_id(), -1),
+                 "ExternalPlayoutData(speechData10ms=0x%x,"
+                 " lengthSamples=%u, samplingFreqHz=%d, current_delay_ms=%d)",
+                 &speechData10ms[0], lengthSamples, samplingFreqHz,
+                 current_delay_ms);
+
+#ifdef WEBRTC_VOE_EXTERNAL_REC_AND_PLAYOUT
+    if (!shared_->statistics().Initialized())
+    {
+        shared_->SetLastError(VE_NOT_INITED, kTraceError);
+        return -1;
+    }
+    // FIX(jesup) - check if this is enabled?
+    if (shared_->NumOfSendingChannels() == 0)
+    {
+        shared_->SetLastError(VE_ALREADY_SENDING, kTraceError,
+            "SetExternalRecordingStatus() no channel is sending");
+        return -1;
+    }
+    if ((16000 != samplingFreqHz) && (32000 != samplingFreqHz) &&
+        (48000 != samplingFreqHz) && (44100 != samplingFreqHz))
+    {
+         shared_->SetLastError(VE_INVALID_ARGUMENT, kTraceError,
+             "SetExternalRecordingStatus() invalid sample rate");
+        return -1;
+    }
+    if (current_delay_ms < 0)
+    {
+        shared_->SetLastError(VE_INVALID_ARGUMENT, kTraceError,
+            "SetExternalRecordingStatus() invalid delay)");
+        return -1;
+    }
+
+    // Far-end data is inserted without going through neteq/etc.
+    // Only supports 10ms chunks; AnalyzeReverseStream() enforces that
+    // lower down.
+    AudioFrame audioFrame;
+    audioFrame.UpdateFrame(-1, 0xFFFFFFFF,
+                           speechData10ms,
+                           lengthSamples,
+                           samplingFreqHz,
+                           AudioFrame::kNormalSpeech,
+                           AudioFrame::kVadUnknown,
+                           num_channels);
+
+    shared_->output_mixer()->APMAnalyzeReverseStream(audioFrame);
+#endif
+    return 0;
+}
+
+int VoEExternalMediaImpl::ExternalPlayoutGetData(
+    int16_t speechData10ms[],
+    int samplingFreqHz,
+    int current_delay_ms,
+    int& lengthSamples)
+{
+    WEBRTC_TRACE(kTraceStream, kTraceVoice, VoEId(shared_->instance_id(), -1),
+                 "ExternalPlayoutGetData(speechData10ms=0x%x, samplingFreqHz=%d"
+                 ",  current_delay_ms=%d)", &speechData10ms[0], samplingFreqHz,
+                 current_delay_ms);
+#ifdef WEBRTC_VOE_EXTERNAL_REC_AND_PLAYOUT
+    if (!shared_->statistics().Initialized())
+    {
+        shared_->SetLastError(VE_NOT_INITED, kTraceError);
+        return -1;
+    }
+    if (!shared_->ext_playout())
+    {
+       shared_->SetLastError(VE_INVALID_OPERATION, kTraceError,
+           "ExternalPlayoutGetData() external playout is not enabled");
+        return -1;
+    }
+    if ((16000 != samplingFreqHz) && (32000 != samplingFreqHz) &&
+        (48000 != samplingFreqHz) && (44100 != samplingFreqHz))
+    {
+        shared_->SetLastError(VE_INVALID_ARGUMENT, kTraceError,
+            "ExternalPlayoutGetData() invalid sample rate");
+        return -1;
+    }
+    if (current_delay_ms < 0)
+    {
+        shared_->SetLastError(VE_INVALID_ARGUMENT, kTraceError,
+            "ExternalPlayoutGetData() invalid delay)");
+        return -1;
+    }
+
+    AudioFrame audioFrame;
+
+    // Retrieve mixed output at the specified rate
+    shared_->output_mixer()->MixActiveChannels();
+    shared_->output_mixer()->DoOperationsOnCombinedSignal(true);
+    shared_->output_mixer()->GetMixedAudio(samplingFreqHz, 1, &audioFrame);
+
+    // Deliver audio (PCM) samples to the external sink
+    memcpy(speechData10ms,
+           audioFrame.data_,
+           sizeof(int16_t)*(audioFrame.samples_per_channel_));
+    lengthSamples = audioFrame.samples_per_channel_;
+
+    // Store current playout delay (to be used by ExternalRecordingInsertData).
+    playout_delay_ms_ = current_delay_ms;
+
+    return 0;
+#else
+    shared_->SetLastError(VE_FUNC_NOT_SUPPORTED, kTraceError,
+       "ExternalPlayoutGetData() external playout is not supported");
+    return -1;
+#endif
+}
+
 int VoEExternalMediaImpl::GetAudioFrame(int channel, int desired_sample_rate_hz,
                                        AudioFrame* frame) {
    WEBRTC_TRACE(kTraceApiCall, kTraceVoice,
--- a/media/webrtc/trunk/webrtc/voice_engine/voe_external_media_impl.h
+++ b/media/webrtc/trunk/webrtc/voice_engine/voe_external_media_impl.h
@ -29,6 +29,28 @@ public:
        int channel,
        ProcessingTypes type);

+    virtual int SetExternalRecordingStatus(bool enable);
+
+    virtual int SetExternalPlayoutStatus(bool enable);
+
+    virtual int ExternalRecordingInsertData(
+        const int16_t speechData10ms[],
+        int lengthSamples,
+        int samplingFreqHz,
+        int current_delay_ms);
+
+    // Insertion of far-end data as actually played out to the OS audio driver
+    virtual int ExternalPlayoutData(
+        int16_t speechData10ms[],
+        int samplingFreqHz,
+        int num_channels,
+        int current_delay_ms,
+        int& lengthSamples);
+
+    virtual int ExternalPlayoutGetData(int16_t speechData10ms[],
+                                       int samplingFreqHz,
+                                       int current_delay_ms,
+                                       int& lengthSamples);

    virtual int GetAudioFrame(int channel, int desired_sample_rate_hz,
                              AudioFrame* frame);
@ -40,6 +62,9 @@ protected:
    virtual ~VoEExternalMediaImpl();

 private:
+#ifdef WEBRTC_VOE_EXTERNAL_REC_AND_PLAYOUT
+    int playout_delay_ms_;
+#endif
    voe::SharedData* shared_;
 };