1 files changed, 393 insertions, 0 deletions
diff --git a/third_party/libwebrtc/audio/utility/channel_mixer_unittest.cc b/third_party/libwebrtc/audio/utility/channel_mixer_unittest.cc
new file mode 100644
index 0000000000..94cb1ac7e3
--- /dev/null
+++ b/third_party/libwebrtc/audio/utility/channel_mixer_unittest.cc
@@ -0,0 +1,393 @@
+/*
+ *  Copyright (c) 2019 The WebRTC project authors. All Rights Reserved.
+ *
+ *  Use of this source code is governed by a BSD-style license
+ *  that can be found in the LICENSE file in the root of the source
+ *  tree. An additional intellectual property rights grant can be found
+ *  in the file PATENTS.  All contributing project authors may
+ *  be found in the AUTHORS file in the root of the source tree.
+ */
+
+#include "audio/utility/channel_mixer.h"
+
+#include <memory>
+
+#include "api/audio/audio_frame.h"
+#include "api/audio/channel_layout.h"
+#include "audio/utility/channel_mixing_matrix.h"
+#include "rtc_base/arraysize.h"
+#include "rtc_base/strings/string_builder.h"
+#include "test/gtest.h"
+
+namespace webrtc {
+
+namespace {
+
+constexpr uint32_t kTimestamp = 27;
+constexpr int kSampleRateHz = 16000;
+constexpr size_t kSamplesPerChannel = kSampleRateHz / 100;
+
+class ChannelMixerTest : public ::testing::Test {
+ protected:
+  ChannelMixerTest() {
+    // Use 10ms audio frames by default. Don't set values yet.
+    frame_.samples_per_channel_ = kSamplesPerChannel;
+    frame_.sample_rate_hz_ = kSampleRateHz;
+    EXPECT_TRUE(frame_.muted());
+  }
+
+  virtual ~ChannelMixerTest() {}
+
+  AudioFrame frame_;
+};
+
+void SetFrameData(int16_t data, AudioFrame* frame) {
+  int16_t* frame_data = frame->mutable_data();
+  for (size_t i = 0; i < frame->samples_per_channel() * frame->num_channels();
+       i++) {
+    frame_data[i] = data;
+  }
+}
+
+void SetMonoData(int16_t center, AudioFrame* frame) {
+  frame->num_channels_ = 1;
+  int16_t* frame_data = frame->mutable_data();
+  for (size_t i = 0; i < frame->samples_per_channel(); ++i) {
+    frame_data[i] = center;
+  }
+  EXPECT_FALSE(frame->muted());
+}
+
+void SetStereoData(int16_t left, int16_t right, AudioFrame* frame) {
+  ASSERT_LE(2 * frame->samples_per_channel(), frame->max_16bit_samples());
+  frame->num_channels_ = 2;
+  int16_t* frame_data = frame->mutable_data();
+  for (size_t i = 0; i < frame->samples_per_channel() * 2; i += 2) {
+    frame_data[i] = left;
+    frame_data[i + 1] = right;
+  }
+  EXPECT_FALSE(frame->muted());
+}
+
+void SetFiveOneData(int16_t front_left,
+                    int16_t front_right,
+                    int16_t center,
+                    int16_t lfe,
+                    int16_t side_left,
+                    int16_t side_right,
+                    AudioFrame* frame) {
+  ASSERT_LE(6 * frame->samples_per_channel(), frame->max_16bit_samples());
+  frame->num_channels_ = 6;
+  int16_t* frame_data = frame->mutable_data();
+  for (size_t i = 0; i < frame->samples_per_channel() * 6; i += 6) {
+    frame_data[i] = front_left;
+    frame_data[i + 1] = front_right;
+    frame_data[i + 2] = center;
+    frame_data[i + 3] = lfe;
+    frame_data[i + 4] = side_left;
+    frame_data[i + 5] = side_right;
+  }
+  EXPECT_FALSE(frame->muted());
+}
+
+void SetSevenOneData(int16_t front_left,
+                     int16_t front_right,
+                     int16_t center,
+                     int16_t lfe,
+                     int16_t side_left,
+                     int16_t side_right,
+                     int16_t back_left,
+                     int16_t back_right,
+                     AudioFrame* frame) {
+  ASSERT_LE(8 * frame->samples_per_channel(), frame->max_16bit_samples());
+  frame->num_channels_ = 8;
+  int16_t* frame_data = frame->mutable_data();
+  for (size_t i = 0; i < frame->samples_per_channel() * 8; i += 8) {
+    frame_data[i] = front_left;
+    frame_data[i + 1] = front_right;
+    frame_data[i + 2] = center;
+    frame_data[i + 3] = lfe;
+    frame_data[i + 4] = side_left;
+    frame_data[i + 5] = side_right;
+    frame_data[i + 6] = back_left;
+    frame_data[i + 7] = back_right;
+  }
+  EXPECT_FALSE(frame->muted());
+}
+
+bool AllSamplesEquals(int16_t sample, const AudioFrame* frame) {
+  const int16_t* frame_data = frame->data();
+  for (size_t i = 0; i < frame->samples_per_channel() * frame->num_channels();
+       i++) {
+    if (frame_data[i] != sample) {
+      return false;
+    }
+  }
+  return true;
+}
+
+void VerifyFramesAreEqual(const AudioFrame& frame1, const AudioFrame& frame2) {
+  EXPECT_EQ(frame1.num_channels(), frame2.num_channels());
+  EXPECT_EQ(frame1.samples_per_channel(), frame2.samples_per_channel());
+  const int16_t* frame1_data = frame1.data();
+  const int16_t* frame2_data = frame2.data();
+  for (size_t i = 0; i < frame1.samples_per_channel() * frame1.num_channels();
+       i++) {
+    EXPECT_EQ(frame1_data[i], frame2_data[i]);
+  }
+  EXPECT_EQ(frame1.muted(), frame2.muted());
+}
+
+}  // namespace
+
+// Test all possible layout conversions can be constructed and mixed. Don't
+// care about the actual content, simply run through all mixing combinations
+// and ensure that nothing fails.
+TEST_F(ChannelMixerTest, ConstructAllPossibleLayouts) {
+  for (ChannelLayout input_layout = CHANNEL_LAYOUT_MONO;
+       input_layout <= CHANNEL_LAYOUT_MAX;
+       input_layout = static_cast<ChannelLayout>(input_layout + 1)) {
+    for (ChannelLayout output_layout = CHANNEL_LAYOUT_MONO;
+         output_layout <= CHANNEL_LAYOUT_MAX;
+         output_layout = static_cast<ChannelLayout>(output_layout + 1)) {
+      // DISCRETE, BITSTREAM can't be tested here based on the current approach.
+      // CHANNEL_LAYOUT_STEREO_AND_KEYBOARD_MIC is not mixable.
+      // Stereo down mix should never be the output layout.
+      if (input_layout == CHANNEL_LAYOUT_BITSTREAM ||
+          input_layout == CHANNEL_LAYOUT_DISCRETE ||
+          input_layout == CHANNEL_LAYOUT_STEREO_AND_KEYBOARD_MIC ||
+          output_layout == CHANNEL_LAYOUT_BITSTREAM ||
+          output_layout == CHANNEL_LAYOUT_DISCRETE ||
+          output_layout == CHANNEL_LAYOUT_STEREO_AND_KEYBOARD_MIC ||
+          output_layout == CHANNEL_LAYOUT_STEREO_DOWNMIX) {
+        continue;
+      }
+
+      rtc::StringBuilder ss;
+      ss << "Input Layout: " << input_layout
+         << ", Output Layout: " << output_layout;
+      SCOPED_TRACE(ss.str());
+      ChannelMixer mixer(input_layout, output_layout);
+
+      frame_.UpdateFrame(kTimestamp, nullptr, kSamplesPerChannel, kSampleRateHz,
+                         AudioFrame::kNormalSpeech, AudioFrame::kVadActive,
+                         ChannelLayoutToChannelCount(input_layout));
+      EXPECT_TRUE(frame_.muted());
+      mixer.Transform(&frame_);
+    }
+  }
+}
+
+// Ensure that the audio frame is untouched when input and output channel
+// layouts are identical, i.e., the transformation should have no effect.
+// Exclude invalid mixing combinations.
+TEST_F(ChannelMixerTest, NoMixingForIdenticalChannelLayouts) {
+  for (ChannelLayout input_layout = CHANNEL_LAYOUT_MONO;
+       input_layout <= CHANNEL_LAYOUT_MAX;
+       input_layout = static_cast<ChannelLayout>(input_layout + 1)) {
+    for (ChannelLayout output_layout = CHANNEL_LAYOUT_MONO;
+         output_layout <= CHANNEL_LAYOUT_MAX;
+         output_layout = static_cast<ChannelLayout>(output_layout + 1)) {
+      if (input_layout != output_layout ||
+          input_layout == CHANNEL_LAYOUT_BITSTREAM ||
+          input_layout == CHANNEL_LAYOUT_DISCRETE ||
+          input_layout == CHANNEL_LAYOUT_STEREO_AND_KEYBOARD_MIC ||
+          output_layout == CHANNEL_LAYOUT_STEREO_DOWNMIX) {
+        continue;
+      }
+      ChannelMixer mixer(input_layout, output_layout);
+      frame_.num_channels_ = ChannelLayoutToChannelCount(input_layout);
+      SetFrameData(99, &frame_);
+      mixer.Transform(&frame_);
+      EXPECT_EQ(ChannelLayoutToChannelCount(input_layout),
+                static_cast<int>(frame_.num_channels()));
+      EXPECT_TRUE(AllSamplesEquals(99, &frame_));
+    }
+  }
+}
+
+TEST_F(ChannelMixerTest, StereoToMono) {
+  ChannelMixer mixer(CHANNEL_LAYOUT_STEREO, CHANNEL_LAYOUT_MONO);
+  //
+  //                      Input: stereo
+  //                      LEFT  RIGHT
+  // Output: mono CENTER  0.5   0.5
+  //
+  SetStereoData(7, 3, &frame_);
+  EXPECT_EQ(2u, frame_.num_channels());
+  mixer.Transform(&frame_);
+  EXPECT_EQ(1u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_MONO, frame_.channel_layout());
+
+  AudioFrame mono_frame;
+  mono_frame.samples_per_channel_ = frame_.samples_per_channel();
+  SetMonoData(5, &mono_frame);
+  VerifyFramesAreEqual(mono_frame, frame_);
+
+  SetStereoData(-32768, -32768, &frame_);
+  EXPECT_EQ(2u, frame_.num_channels());
+  mixer.Transform(&frame_);
+  EXPECT_EQ(1u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_MONO, frame_.channel_layout());
+  SetMonoData(-32768, &mono_frame);
+  VerifyFramesAreEqual(mono_frame, frame_);
+}
+
+TEST_F(ChannelMixerTest, StereoToMonoMuted) {
+  ASSERT_TRUE(frame_.muted());
+  ChannelMixer mixer(CHANNEL_LAYOUT_STEREO, CHANNEL_LAYOUT_MONO);
+  mixer.Transform(&frame_);
+  EXPECT_EQ(1u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_MONO, frame_.channel_layout());
+  EXPECT_TRUE(frame_.muted());
+}
+
+TEST_F(ChannelMixerTest, FiveOneToSevenOneMuted) {
+  ASSERT_TRUE(frame_.muted());
+  ChannelMixer mixer(CHANNEL_LAYOUT_5_1, CHANNEL_LAYOUT_7_1);
+  mixer.Transform(&frame_);
+  EXPECT_EQ(8u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_7_1, frame_.channel_layout());
+  EXPECT_TRUE(frame_.muted());
+}
+
+TEST_F(ChannelMixerTest, FiveOneToMono) {
+  ChannelMixer mixer(CHANNEL_LAYOUT_5_1, CHANNEL_LAYOUT_MONO);
+  //
+  //                      Input: 5.1
+  //                      LEFT   RIGHT  CENTER  LFE    SIDE_LEFT  SIDE_RIGHT
+  // Output: mono CENTER  0.707  0.707  1       0.707  0.707      0.707
+  //
+  // a = [10, 20, 15, 2, 5, 5]
+  // b = [1/sqrt(2), 1/sqrt(2), 1.0, 1/sqrt(2), 1/sqrt(2), 1/sqrt(2)] =>
+  // a * b (dot product) = 44.69848480983499,
+  // which is truncated into 44 using 16 bit representation.
+  //
+  SetFiveOneData(10, 20, 15, 2, 5, 5, &frame_);
+  EXPECT_EQ(6u, frame_.num_channels());
+  mixer.Transform(&frame_);
+  EXPECT_EQ(1u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_MONO, frame_.channel_layout());
+
+  AudioFrame mono_frame;
+  mono_frame.samples_per_channel_ = frame_.samples_per_channel();
+  SetMonoData(44, &mono_frame);
+  VerifyFramesAreEqual(mono_frame, frame_);
+
+  SetFiveOneData(-32768, -32768, -32768, -32768, -32768, -32768, &frame_);
+  EXPECT_EQ(6u, frame_.num_channels());
+  mixer.Transform(&frame_);
+  EXPECT_EQ(1u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_MONO, frame_.channel_layout());
+  SetMonoData(-32768, &mono_frame);
+  VerifyFramesAreEqual(mono_frame, frame_);
+}
+
+TEST_F(ChannelMixerTest, FiveOneToSevenOne) {
+  ChannelMixer mixer(CHANNEL_LAYOUT_5_1, CHANNEL_LAYOUT_7_1);
+  //
+  //                        Input: 5.1
+  //                        LEFT   RIGHT  CENTER  LFE    SIDE_LEFT  SIDE_RIGHT
+  // Output: 7.1 LEFT       1      0      0       0      0          0
+  //             RIGHT      0      1      0       0      0          0
+  //             CENTER     0      0      1       0      0          0
+  //             LFE        0      0      0       1      0          0
+  //             SIDE_LEFT  0      0      0       0      1          0
+  //             SIDE_RIGHT 0      0      0       0      0          1
+  //             BACK_LEFT  0      0      0       0      0          0
+  //             BACK_RIGHT 0      0      0       0      0          0
+  //
+  SetFiveOneData(10, 20, 15, 2, 5, 5, &frame_);
+  EXPECT_EQ(6u, frame_.num_channels());
+  mixer.Transform(&frame_);
+  EXPECT_EQ(8u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_7_1, frame_.channel_layout());
+
+  AudioFrame seven_one_frame;
+  seven_one_frame.samples_per_channel_ = frame_.samples_per_channel();
+  SetSevenOneData(10, 20, 15, 2, 5, 5, 0, 0, &seven_one_frame);
+  VerifyFramesAreEqual(seven_one_frame, frame_);
+
+  SetFiveOneData(-32768, 32767, -32768, 32767, -32768, 32767, &frame_);
+  EXPECT_EQ(6u, frame_.num_channels());
+  mixer.Transform(&frame_);
+  EXPECT_EQ(8u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_7_1, frame_.channel_layout());
+  SetSevenOneData(-32768, 32767, -32768, 32767, -32768, 32767, 0, 0,
+                  &seven_one_frame);
+  VerifyFramesAreEqual(seven_one_frame, frame_);
+}
+
+TEST_F(ChannelMixerTest, FiveOneBackToStereo) {
+  ChannelMixer mixer(CHANNEL_LAYOUT_5_1_BACK, CHANNEL_LAYOUT_STEREO);
+  //
+  //                      Input: 5.1
+  //                      LEFT   RIGHT  CENTER  LFE    BACK_LEFT  BACK_RIGHT
+  // Output: stereo LEFT  1      0      0.707   0.707  0.707      0
+  //                RIGHT 0      1      0.707   0.707  0          0.707
+  //
+  SetFiveOneData(20, 30, 15, 2, 5, 5, &frame_);
+  EXPECT_EQ(6u, frame_.num_channels());
+  mixer.Transform(&frame_);
+  EXPECT_EQ(2u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_STEREO, frame_.channel_layout());
+
+  AudioFrame stereo_frame;
+  stereo_frame.samples_per_channel_ = frame_.samples_per_channel();
+  SetStereoData(35, 45, &stereo_frame);
+  VerifyFramesAreEqual(stereo_frame, frame_);
+
+  SetFiveOneData(-32768, -32768, -32768, -32768, -32768, -32768, &frame_);
+  EXPECT_EQ(6u, frame_.num_channels());
+  mixer.Transform(&frame_);
+  EXPECT_EQ(2u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_STEREO, frame_.channel_layout());
+  SetStereoData(-32768, -32768, &stereo_frame);
+  VerifyFramesAreEqual(stereo_frame, frame_);
+}
+
+TEST_F(ChannelMixerTest, MonoToStereo) {
+  ChannelMixer mixer(CHANNEL_LAYOUT_MONO, CHANNEL_LAYOUT_STEREO);
+  //
+  //                       Input: mono
+  //                       CENTER
+  // Output: stereo LEFT   1
+  //                RIGHT  1
+  //
+  SetMonoData(44, &frame_);
+  EXPECT_EQ(1u, frame_.num_channels());
+  mixer.Transform(&frame_);
+  EXPECT_EQ(2u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_STEREO, frame_.channel_layout());
+
+  AudioFrame stereo_frame;
+  stereo_frame.samples_per_channel_ = frame_.samples_per_channel();
+  SetStereoData(44, 44, &stereo_frame);
+  VerifyFramesAreEqual(stereo_frame, frame_);
+}
+
+TEST_F(ChannelMixerTest, StereoToFiveOne) {
+  ChannelMixer mixer(CHANNEL_LAYOUT_STEREO, CHANNEL_LAYOUT_5_1);
+  //
+  //                         Input: Stereo
+  //                         LEFT   RIGHT
+  // Output: 5.1 LEFT        1      0
+  //             RIGHT       0      1
+  //             CENTER      0      0
+  //             LFE         0      0
+  //             SIDE_LEFT   0      0
+  //             SIDE_RIGHT  0      0
+  //
+  SetStereoData(50, 60, &frame_);
+  EXPECT_EQ(2u, frame_.num_channels());
+  mixer.Transform(&frame_);
+  EXPECT_EQ(6u, frame_.num_channels());
+  EXPECT_EQ(CHANNEL_LAYOUT_5_1, frame_.channel_layout());
+
+  AudioFrame five_one_frame;
+  five_one_frame.samples_per_channel_ = frame_.samples_per_channel();
+  SetFiveOneData(50, 60, 0, 0, 0, 0, &five_one_frame);
+  VerifyFramesAreEqual(five_one_frame, frame_);
+}
+
+}  // namespace webrtc