/* * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #include "voice_engine/audio_level.h" #include "common_audio/signal_processing/include/signal_processing_library.h" #include "modules/include/module_common_types.h" namespace webrtc { namespace voe { // Number of bars on the indicator. // Note that the number of elements is specified because we are indexing it // in the range of 0-32 constexpr int8_t kPermutation[33] = {0, 1, 2, 3, 4, 4, 5, 5, 5, 5, 6, 6, 6, 6, 6, 7, 7, 7, 7, 8, 8, 8, 9, 9, 9, 9, 9, 9, 9, 9, 9, 9, 9}; AudioLevel::AudioLevel() : abs_max_(0), count_(0), current_level_(0), current_level_full_range_(0) { WebRtcSpl_Init(); } AudioLevel::~AudioLevel() {} int8_t AudioLevel::Level() const { rtc::CritScope cs(&crit_sect_); return current_level_; } int16_t AudioLevel::LevelFullRange() const { rtc::CritScope cs(&crit_sect_); return current_level_full_range_; } void AudioLevel::Clear() { rtc::CritScope cs(&crit_sect_); abs_max_ = 0; count_ = 0; current_level_ = 0; current_level_full_range_ = 0; } double AudioLevel::TotalEnergy() const { rtc::CritScope cs(&crit_sect_); return total_energy_; } double AudioLevel::TotalDuration() const { rtc::CritScope cs(&crit_sect_); return total_duration_; } void AudioLevel::ComputeLevel(const AudioFrame& audioFrame, double duration) { // Check speech level (works for 2 channels as well) int16_t abs_value = audioFrame.muted() ? 0 : WebRtcSpl_MaxAbsValueW16( audioFrame.data(), audioFrame.samples_per_channel_ * audioFrame.num_channels_); // Protect member access using a lock since this method is called on a // dedicated audio thread in the RecordedDataIsAvailable() callback. rtc::CritScope cs(&crit_sect_); if (abs_value > abs_max_) abs_max_ = abs_value; // Update level approximately 10 times per second if (count_++ == kUpdateFrequency) { current_level_full_range_ = abs_max_; count_ = 0; // Highest value for a int16_t is 0x7fff = 32767 // Divide with 1000 to get in the range of 0-32 which is the range of the // permutation vector int32_t position = abs_max_ / 1000; // Make it less likely that the bar stays at position 0. I.e. only if it's // in the range 0-250 (instead of 0-1000) if ((position == 0) && (abs_max_ > 250)) { position = 1; } current_level_ = kPermutation[position]; // Decay the absolute maximum (divide by 4) abs_max_ >>= 2; } // See the description for "totalAudioEnergy" in the WebRTC stats spec // (https://w3c.github.io/webrtc-stats/#dom-rtcmediastreamtrackstats-totalaudioenergy) // for an explanation of these formulas. In short, we need a value that can // be used to compute RMS audio levels over different time intervals, by // taking the difference between the results from two getStats calls. To do // this, the value needs to be of units "squared sample value * time". double additional_energy = static_cast(current_level_full_range_) / INT16_MAX; additional_energy *= additional_energy; total_energy_ += additional_energy * duration; total_duration_ += duration; } } // namespace voe } // namespace webrtc