/* * Copyright (c) 2020 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #include "audio/voip/audio_ingress.h" #include "api/audio_codecs/builtin_audio_decoder_factory.h" #include "api/audio_codecs/builtin_audio_encoder_factory.h" #include "api/call/transport.h" #include "api/task_queue/default_task_queue_factory.h" #include "api/units/time_delta.h" #include "audio/voip/audio_egress.h" #include "modules/audio_mixer/sine_wave_generator.h" #include "modules/rtp_rtcp/source/rtp_rtcp_impl2.h" #include "rtc_base/event.h" #include "rtc_base/logging.h" #include "test/gmock.h" #include "test/gtest.h" #include "test/mock_transport.h" #include "test/run_loop.h" #include "test/time_controller/simulated_time_controller.h" namespace webrtc { namespace { using ::testing::Invoke; using ::testing::NiceMock; using ::testing::Unused; constexpr int16_t kAudioLevel = 3004; // Used for sine wave level. class AudioIngressTest : public ::testing::Test { public: const SdpAudioFormat kPcmuFormat = {"pcmu", 8000, 1}; AudioIngressTest() : wave_generator_(1000.0, kAudioLevel) { receive_statistics_ = ReceiveStatistics::Create(time_controller_.GetClock()); RtpRtcpInterface::Configuration rtp_config; rtp_config.clock = time_controller_.GetClock(); rtp_config.audio = true; rtp_config.receive_statistics = receive_statistics_.get(); rtp_config.rtcp_report_interval_ms = 5000; rtp_config.outgoing_transport = &transport_; rtp_config.local_media_ssrc = 0xdeadc0de; rtp_rtcp_ = ModuleRtpRtcpImpl2::Create(rtp_config); rtp_rtcp_->SetSendingMediaStatus(false); rtp_rtcp_->SetRTCPStatus(RtcpMode::kCompound); encoder_factory_ = CreateBuiltinAudioEncoderFactory(); decoder_factory_ = CreateBuiltinAudioDecoderFactory(); } void SetUp() override { constexpr int kPcmuPayload = 0; ingress_ = std::make_unique( rtp_rtcp_.get(), time_controller_.GetClock(), receive_statistics_.get(), decoder_factory_); ingress_->SetReceiveCodecs({{kPcmuPayload, kPcmuFormat}}); egress_ = std::make_unique( rtp_rtcp_.get(), time_controller_.GetClock(), time_controller_.GetTaskQueueFactory()); egress_->SetEncoder(kPcmuPayload, kPcmuFormat, encoder_factory_->MakeAudioEncoder( kPcmuPayload, kPcmuFormat, absl::nullopt)); egress_->StartSend(); ingress_->StartPlay(); rtp_rtcp_->SetSendingStatus(true); } void TearDown() override { rtp_rtcp_->SetSendingStatus(false); ingress_->StopPlay(); egress_->StopSend(); egress_.reset(); ingress_.reset(); } std::unique_ptr GetAudioFrame(int order) { auto frame = std::make_unique(); frame->sample_rate_hz_ = kPcmuFormat.clockrate_hz; frame->samples_per_channel_ = kPcmuFormat.clockrate_hz / 100; // 10 ms. frame->num_channels_ = kPcmuFormat.num_channels; frame->timestamp_ = frame->samples_per_channel_ * order; wave_generator_.GenerateNextFrame(frame.get()); return frame; } GlobalSimulatedTimeController time_controller_{Timestamp::Micros(123456789)}; SineWaveGenerator wave_generator_; NiceMock transport_; std::unique_ptr receive_statistics_; std::unique_ptr rtp_rtcp_; rtc::scoped_refptr encoder_factory_; rtc::scoped_refptr decoder_factory_; std::unique_ptr ingress_; std::unique_ptr egress_; }; TEST_F(AudioIngressTest, PlayingAfterStartAndStop) { EXPECT_EQ(ingress_->IsPlaying(), true); ingress_->StopPlay(); EXPECT_EQ(ingress_->IsPlaying(), false); } TEST_F(AudioIngressTest, GetAudioFrameAfterRtpReceived) { rtc::Event event; auto handle_rtp = [&](rtc::ArrayView packet, Unused) { ingress_->ReceivedRTPPacket(packet); event.Set(); return true; }; EXPECT_CALL(transport_, SendRtp).WillRepeatedly(Invoke(handle_rtp)); egress_->SendAudioData(GetAudioFrame(0)); egress_->SendAudioData(GetAudioFrame(1)); time_controller_.AdvanceTime(TimeDelta::Zero()); ASSERT_TRUE(event.Wait(TimeDelta::Seconds(1))); AudioFrame audio_frame; EXPECT_EQ( ingress_->GetAudioFrameWithInfo(kPcmuFormat.clockrate_hz, &audio_frame), AudioMixer::Source::AudioFrameInfo::kNormal); EXPECT_FALSE(audio_frame.muted()); EXPECT_EQ(audio_frame.num_channels_, 1u); EXPECT_EQ(audio_frame.samples_per_channel_, static_cast(kPcmuFormat.clockrate_hz / 100)); EXPECT_EQ(audio_frame.sample_rate_hz_, kPcmuFormat.clockrate_hz); EXPECT_NE(audio_frame.timestamp_, 0u); EXPECT_EQ(audio_frame.elapsed_time_ms_, 0); } TEST_F(AudioIngressTest, TestSpeechOutputLevelAndEnergyDuration) { // Per audio_level's kUpdateFrequency, we need more than 10 audio samples to // get audio level from output source. constexpr int kNumRtp = 6; int rtp_count = 0; rtc::Event event; auto handle_rtp = [&](rtc::ArrayView packet, Unused) { ingress_->ReceivedRTPPacket(packet); if (++rtp_count == kNumRtp) { event.Set(); } return true; }; EXPECT_CALL(transport_, SendRtp).WillRepeatedly(Invoke(handle_rtp)); for (int i = 0; i < kNumRtp * 2; i++) { egress_->SendAudioData(GetAudioFrame(i)); time_controller_.AdvanceTime(TimeDelta::Millis(10)); } event.Wait(/*give_up_after=*/TimeDelta::Seconds(1)); for (int i = 0; i < kNumRtp * 2; ++i) { AudioFrame audio_frame; EXPECT_EQ( ingress_->GetAudioFrameWithInfo(kPcmuFormat.clockrate_hz, &audio_frame), AudioMixer::Source::AudioFrameInfo::kNormal); } EXPECT_EQ(ingress_->GetOutputAudioLevel(), kAudioLevel); constexpr double kExpectedEnergy = 0.00016809565587789564; constexpr double kExpectedDuration = 0.11999999999999998; EXPECT_DOUBLE_EQ(ingress_->GetOutputTotalEnergy(), kExpectedEnergy); EXPECT_DOUBLE_EQ(ingress_->GetOutputTotalDuration(), kExpectedDuration); } TEST_F(AudioIngressTest, PreferredSampleRate) { rtc::Event event; auto handle_rtp = [&](rtc::ArrayView packet, Unused) { ingress_->ReceivedRTPPacket(packet); event.Set(); return true; }; EXPECT_CALL(transport_, SendRtp).WillRepeatedly(Invoke(handle_rtp)); egress_->SendAudioData(GetAudioFrame(0)); egress_->SendAudioData(GetAudioFrame(1)); time_controller_.AdvanceTime(TimeDelta::Zero()); ASSERT_TRUE(event.Wait(TimeDelta::Seconds(1))); AudioFrame audio_frame; EXPECT_EQ( ingress_->GetAudioFrameWithInfo(kPcmuFormat.clockrate_hz, &audio_frame), AudioMixer::Source::AudioFrameInfo::kNormal); EXPECT_EQ(ingress_->PreferredSampleRate(), kPcmuFormat.clockrate_hz); } // This test highlights the case where caller invokes StopPlay() which then // AudioIngress should play silence frame afterwards. TEST_F(AudioIngressTest, GetMutedAudioFrameAfterRtpReceivedAndStopPlay) { // StopPlay before we start sending RTP packet with sine wave. ingress_->StopPlay(); // Send 6 RTP packets to generate more than 100 ms audio sample to get // valid speech level. constexpr int kNumRtp = 6; int rtp_count = 0; rtc::Event event; auto handle_rtp = [&](rtc::ArrayView packet, Unused) { ingress_->ReceivedRTPPacket(packet); if (++rtp_count == kNumRtp) { event.Set(); } return true; }; EXPECT_CALL(transport_, SendRtp).WillRepeatedly(Invoke(handle_rtp)); for (int i = 0; i < kNumRtp * 2; i++) { egress_->SendAudioData(GetAudioFrame(i)); time_controller_.AdvanceTime(TimeDelta::Millis(10)); } event.Wait(/*give_up_after=*/TimeDelta::Seconds(1)); for (int i = 0; i < kNumRtp * 2; ++i) { AudioFrame audio_frame; EXPECT_EQ( ingress_->GetAudioFrameWithInfo(kPcmuFormat.clockrate_hz, &audio_frame), AudioMixer::Source::AudioFrameInfo::kMuted); const int16_t* audio_data = audio_frame.data(); size_t length = audio_frame.samples_per_channel_ * audio_frame.num_channels_; for (size_t j = 0; j < length; ++j) { EXPECT_EQ(audio_data[j], 0); } } // Now we should still see valid speech output level as StopPlay won't affect // the measurement. EXPECT_EQ(ingress_->GetOutputAudioLevel(), kAudioLevel); } } // namespace } // namespace webrtc