webrtc/modules/audio_coding/codecs/opus/audio_encoder_opus.cc - Issue 1322973004: Fold AudioEncoderMutable into AudioEncoder

Unified Diff: webrtc/modules/audio_coding/codecs/opus/audio_encoder_opus.cc

Issue 1322973004: Fold AudioEncoderMutable into AudioEncoder (Closed) Base URL: https://chromium.googlesource.com/external/webrtc.git@master

Patch Set: review fixes Created 5 years, 3 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

« no previous file with comments | « webrtc/modules/audio_coding/codecs/opus/audio_encoder_mutable_opus_test.cc ('k') | webrtc/modules/audio_coding/codecs/opus/interface/audio_encoder_opus.h » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: webrtc/modules/audio_coding/codecs/opus/audio_encoder_opus.cc

diff --git a/webrtc/modules/audio_coding/codecs/opus/audio_encoder_opus.cc b/webrtc/modules/audio_coding/codecs/opus/audio_encoder_opus.cc

index 37ce8733fed21268db49a942eb3cb1c7a7a1b76b..e750aa1323b9bfdfa1b42be7a7869202d41307c6 100644

--- a/webrtc/modules/audio_coding/codecs/opus/audio_encoder_opus.cc

+++ b/webrtc/modules/audio_coding/codecs/opus/audio_encoder_opus.cc

@@ -11,6 +11,7 @@

#include "webrtc/modules/audio_coding/codecs/opus/interface/audio_encoder_opus.h"

#include "webrtc/base/checks.h"

+#include "webrtc/base/safe_conversions.h"

#include "webrtc/common_types.h"

#include "webrtc/modules/audio_coding/codecs/opus/interface/opus_interface.h"

@@ -18,36 +19,63 @@ namespace webrtc {

namespace {

+const int kSampleRateHz = 48000;

const int kMinBitrateBps = 500;

const int kMaxBitrateBps = 512000;

-// TODO(tlegrand): Remove this code when we have proper APIs to set the

-// complexity at a higher level.

-#if defined(WEBRTC_ANDROID) || defined(WEBRTC_IOS) || defined(WEBRTC_ARCH_ARM)

-// If we are on Android, iOS and/or ARM, use a lower complexity setting as

-// default, to save encoder complexity.

-const int kDefaultComplexity = 5;

-#else

-const int kDefaultComplexity = 9;

-#endif

+AudioEncoderOpus::Config CreateConfig(const CodecInst& codec_inst) {

+ AudioEncoderOpus::Config config;

+ config.frame_size_ms = rtc::CheckedDivExact(codec_inst.pacsize, 48);

+ config.num_channels = codec_inst.channels;

+ config.bitrate_bps = codec_inst.rate;

+ config.payload_type = codec_inst.pltype;

+ config.application = config.num_channels == 1 ? AudioEncoderOpus::kVoip

+ : AudioEncoderOpus::kAudio;

+ return config;

-// We always encode at 48 kHz.

-const int kSampleRateHz = 48000;

+// Optimize the loss rate to configure Opus. Basically, optimized loss rate is

+// the input loss rate rounded down to various levels, because a robustly good

+// audio quality is achieved by lowering the packet loss down.

+// Additionally, to prevent toggling, margins are used, i.e., when jumping to

+// a loss rate from below, a higher threshold is used than jumping to the same

+// level from above.

+double OptimizePacketLossRate(double new_loss_rate, double old_loss_rate) {

+ DCHECK_GE(new_loss_rate, 0.0);

+ DCHECK_LE(new_loss_rate, 1.0);

+ DCHECK_GE(old_loss_rate, 0.0);

+ DCHECK_LE(old_loss_rate, 1.0);

+ const double kPacketLossRate20 = 0.20;

+ const double kPacketLossRate10 = 0.10;

+ const double kPacketLossRate5 = 0.05;

+ const double kPacketLossRate1 = 0.01;

+ const double kLossRate20Margin = 0.02;

+ const double kLossRate10Margin = 0.01;

+ const double kLossRate5Margin = 0.01;

+ if (new_loss_rate >=

+ kPacketLossRate20 +

+ kLossRate20Margin *

+ (kPacketLossRate20 - old_loss_rate > 0 ? 1 : -1)) {

+ return kPacketLossRate20;

+ } else if (new_loss_rate >=

+ kPacketLossRate10 +

+ kLossRate10Margin *

+ (kPacketLossRate10 - old_loss_rate > 0 ? 1 : -1)) {

+ return kPacketLossRate10;

+ } else if (new_loss_rate >=

+ kPacketLossRate5 +

+ kLossRate5Margin *

+ (kPacketLossRate5 - old_loss_rate > 0 ? 1 : -1)) {

+ return kPacketLossRate5;

+ } else if (new_loss_rate >= kPacketLossRate1) {

+ return kPacketLossRate1;

+ } else {

+ return 0.0;

+ }

} // namespace

-AudioEncoderOpus::Config::Config()

- : frame_size_ms(20),

- num_channels(1),

- payload_type(120),

- application(kVoip),

- bitrate_bps(64000),

- fec_enabled(false),

- max_playback_rate_hz(48000),

- complexity(kDefaultComplexity),

- dtx_enabled(false) {

bool AudioEncoderOpus::Config::IsOk() const {

if (frame_size_ms <= 0 || frame_size_ms % 10 != 0)

return false;

@@ -61,119 +89,45 @@ bool AudioEncoderOpus::Config::IsOk() const {

}

AudioEncoderOpus::AudioEncoderOpus(const Config& config)

- : num_10ms_frames_per_packet_(

- static_cast<size_t>(rtc::CheckedDivExact(config.frame_size_ms, 10))),

- num_channels_(config.num_channels),

- payload_type_(config.payload_type),

- application_(config.application),

- dtx_enabled_(config.dtx_enabled),

- samples_per_10ms_frame_(static_cast<size_t>(

- rtc::CheckedDivExact(kSampleRateHz, 100) * num_channels_)),

- packet_loss_rate_(0.0) {

- CHECK(config.IsOk());

- input_buffer_.reserve(num_10ms_frames_per_packet_ * samples_per_10ms_frame_);

- CHECK_EQ(0, WebRtcOpus_EncoderCreate(&inst_, num_channels_, application_));

- SetTargetBitrate(config.bitrate_bps);

- if (config.fec_enabled) {

- CHECK_EQ(0, WebRtcOpus_EnableFec(inst_));

- } else {

- CHECK_EQ(0, WebRtcOpus_DisableFec(inst_));

- }

- CHECK_EQ(0,

- WebRtcOpus_SetMaxPlaybackRate(inst_, config.max_playback_rate_hz));

- CHECK_EQ(0, WebRtcOpus_SetComplexity(inst_, config.complexity));

- if (config.dtx_enabled) {

- CHECK_EQ(0, WebRtcOpus_EnableDtx(inst_));

- } else {

- CHECK_EQ(0, WebRtcOpus_DisableDtx(inst_));

- }

+ : packet_loss_rate_(0.0), inst_(nullptr) {

+ CHECK(RecreateEncoderInstance(config));

}

+AudioEncoderOpus::AudioEncoderOpus(const CodecInst& codec_inst)

+ : AudioEncoderOpus(CreateConfig(codec_inst)) {}

AudioEncoderOpus::~AudioEncoderOpus() {

CHECK_EQ(0, WebRtcOpus_EncoderFree(inst_));

}

-int AudioEncoderOpus::SampleRateHz() const {

- return kSampleRateHz;

-int AudioEncoderOpus::NumChannels() const {

- return num_channels_;

size_t AudioEncoderOpus::MaxEncodedBytes() const {

// Calculate the number of bytes we expect the encoder to produce,

// then multiply by two to give a wide margin for error.

- size_t bytes_per_millisecond =

- static_cast<size_t>(bitrate_bps_ / (1000 * 8) + 1);

- size_t approx_encoded_bytes =

- num_10ms_frames_per_packet_ * 10 * bytes_per_millisecond;

+ const size_t bytes_per_millisecond =

+ static_cast<size_t>(config_.bitrate_bps / (1000 * 8) + 1);

+ const size_t approx_encoded_bytes =

+ Num10msFramesPerPacket() * 10 * bytes_per_millisecond;

return 2 * approx_encoded_bytes;

}

-size_t AudioEncoderOpus::Num10MsFramesInNextPacket() const {

- return num_10ms_frames_per_packet_;

+int AudioEncoderOpus::SampleRateHz() const {

+ return kSampleRateHz;

}

-size_t AudioEncoderOpus::Max10MsFramesInAPacket() const {

- return num_10ms_frames_per_packet_;

+int AudioEncoderOpus::NumChannels() const {

+ return config_.num_channels;

}

-int AudioEncoderOpus::GetTargetBitrate() const {

- return bitrate_bps_;

+size_t AudioEncoderOpus::Num10MsFramesInNextPacket() const {

+ return Num10msFramesPerPacket();

}

-void AudioEncoderOpus::SetTargetBitrate(int bits_per_second) {

- bitrate_bps_ = std::max(std::min(bits_per_second, kMaxBitrateBps),

- kMinBitrateBps);

- CHECK_EQ(WebRtcOpus_SetBitRate(inst_, bitrate_bps_), 0);

+size_t AudioEncoderOpus::Max10MsFramesInAPacket() const {

+ return Num10msFramesPerPacket();

}

-void AudioEncoderOpus::SetProjectedPacketLossRate(double fraction) {

- DCHECK_GE(fraction, 0.0);

- DCHECK_LE(fraction, 1.0);

- // Optimize the loss rate to configure Opus. Basically, optimized loss rate is

- // the input loss rate rounded down to various levels, because a robustly good

- // audio quality is achieved by lowering the packet loss down.

- // Additionally, to prevent toggling, margins are used, i.e., when jumping to

- // a loss rate from below, a higher threshold is used than jumping to the same

- // level from above.

- const double kPacketLossRate20 = 0.20;

- const double kPacketLossRate10 = 0.10;

- const double kPacketLossRate5 = 0.05;

- const double kPacketLossRate1 = 0.01;

- const double kLossRate20Margin = 0.02;

- const double kLossRate10Margin = 0.01;

- const double kLossRate5Margin = 0.01;

- double opt_loss_rate;

- if (fraction >=

- kPacketLossRate20 +

- kLossRate20Margin *

- (kPacketLossRate20 - packet_loss_rate_ > 0 ? 1 : -1)) {

- opt_loss_rate = kPacketLossRate20;

- } else if (fraction >=

- kPacketLossRate10 +

- kLossRate10Margin *

- (kPacketLossRate10 - packet_loss_rate_ > 0 ? 1 : -1)) {

- opt_loss_rate = kPacketLossRate10;

- } else if (fraction >=

- kPacketLossRate5 +

- kLossRate5Margin *

- (kPacketLossRate5 - packet_loss_rate_ > 0 ? 1 : -1)) {

- opt_loss_rate = kPacketLossRate5;

- } else if (fraction >= kPacketLossRate1) {

- opt_loss_rate = kPacketLossRate1;

- } else {

- opt_loss_rate = 0;

- }

- if (packet_loss_rate_ != opt_loss_rate) {

- // Ask the encoder to change the target packet loss rate.

- CHECK_EQ(WebRtcOpus_SetPacketLossRate(

- inst_, static_cast<int32_t>(opt_loss_rate * 100 + .5)),

- 0);

- packet_loss_rate_ = opt_loss_rate;

- }

+int AudioEncoderOpus::GetTargetBitrate() const {

+ return config_.bitrate_bps;

}

AudioEncoder::EncodedInfo AudioEncoderOpus::EncodeInternal(

@@ -184,75 +138,118 @@ AudioEncoder::EncodedInfo AudioEncoderOpus::EncodeInternal(

if (input_buffer_.empty())

first_timestamp_in_buffer_ = rtp_timestamp;

input_buffer_.insert(input_buffer_.end(), audio,

- audio + samples_per_10ms_frame_);

+ audio + SamplesPer10msFrame());

if (input_buffer_.size() <

- (num_10ms_frames_per_packet_ * samples_per_10ms_frame_)) {

+ (static_cast<size_t>(Num10msFramesPerPacket()) * SamplesPer10msFrame())) {

return EncodedInfo();

}

- CHECK_EQ(input_buffer_.size(),

- num_10ms_frames_per_packet_ * samples_per_10ms_frame_);

+ CHECK_EQ(input_buffer_.size(), static_cast<size_t>(Num10msFramesPerPacket()) *

+ SamplesPer10msFrame());

int status = WebRtcOpus_Encode(

inst_, &input_buffer_[0],

rtc::CheckedDivExact(input_buffer_.size(),

- static_cast<size_t>(num_channels_)),

- max_encoded_bytes, encoded);

+ static_cast<size_t>(config_.num_channels)),

+ rtc::saturated_cast<int16_t>(max_encoded_bytes), encoded);

CHECK_GE(status, 0); // Fails only if fed invalid data.

input_buffer_.clear();

EncodedInfo info;

info.encoded_bytes = static_cast<size_t>(status);

info.encoded_timestamp = first_timestamp_in_buffer_;

- info.payload_type = payload_type_;

+ info.payload_type = config_.payload_type;

info.send_even_if_empty = true; // Allows Opus to send empty packets.

info.speech = (status > 0);

return info;

}

-namespace {

-AudioEncoderOpus::Config CreateConfig(const CodecInst& codec_inst) {

- AudioEncoderOpus::Config config;

- config.frame_size_ms = rtc::CheckedDivExact(codec_inst.pacsize, 48);

- config.num_channels = codec_inst.channels;

- config.bitrate_bps = codec_inst.rate;

- config.payload_type = codec_inst.pltype;

- config.application = (config.num_channels == 1 ? AudioEncoderOpus::kVoip

- : AudioEncoderOpus::kAudio);

- return config;

+void AudioEncoderOpus::Reset() {

+ CHECK(RecreateEncoderInstance(config_));

}

-} // namespace

-AudioEncoderMutableOpus::AudioEncoderMutableOpus(const CodecInst& codec_inst)

- : AudioEncoderMutableImpl<AudioEncoderOpus>(CreateConfig(codec_inst)) {

-bool AudioEncoderMutableOpus::SetFec(bool enable) {

- auto conf = config();

+bool AudioEncoderOpus::SetFec(bool enable) {

+ auto conf = config_;

conf.fec_enabled = enable;

- return Reconstruct(conf);

+ return RecreateEncoderInstance(conf);

}

-bool AudioEncoderMutableOpus::SetDtx(bool enable) {

- auto conf = config();

+bool AudioEncoderOpus::SetDtx(bool enable) {

+ auto conf = config_;

conf.dtx_enabled = enable;

- return Reconstruct(conf);

+ return RecreateEncoderInstance(conf);

}

-bool AudioEncoderMutableOpus::SetApplication(Application application) {

- auto conf = config();

+bool AudioEncoderOpus::SetApplication(Application application) {

+ auto conf = config_;

switch (application) {

- case kApplicationSpeech:

+ case Application::kSpeech:

conf.application = AudioEncoderOpus::kVoip;

break;

- case kApplicationAudio:

+ case Application::kAudio:

conf.application = AudioEncoderOpus::kAudio;

break;

}

- return Reconstruct(conf);

+ return RecreateEncoderInstance(conf);

}

-bool AudioEncoderMutableOpus::SetMaxPlaybackRate(int frequency_hz) {

- auto conf = config();

+bool AudioEncoderOpus::SetMaxPlaybackRate(int frequency_hz) {

+ auto conf = config_;

conf.max_playback_rate_hz = frequency_hz;

- return Reconstruct(conf);

+ return RecreateEncoderInstance(conf);

+void AudioEncoderOpus::SetProjectedPacketLossRate(double fraction) {

+ double opt_loss_rate = OptimizePacketLossRate(fraction, packet_loss_rate_);

+ if (packet_loss_rate_ != opt_loss_rate) {

+ packet_loss_rate_ = opt_loss_rate;

+ CHECK_EQ(0, WebRtcOpus_SetPacketLossRate(

+ inst_, static_cast<int32_t>(packet_loss_rate_ * 100 + .5)));

+ }

+void AudioEncoderOpus::SetTargetBitrate(int bits_per_second) {

+ config_.bitrate_bps =

+ std::max(std::min(bits_per_second, kMaxBitrateBps), kMinBitrateBps);

+ DCHECK(config_.IsOk());

+ CHECK_EQ(0, WebRtcOpus_SetBitRate(inst_, config_.bitrate_bps));

+int AudioEncoderOpus::Num10msFramesPerPacket() const {

+ return rtc::CheckedDivExact(config_.frame_size_ms, 10);

+int AudioEncoderOpus::SamplesPer10msFrame() const {

+ return rtc::CheckedDivExact(kSampleRateHz, 100) * config_.num_channels;

+// If the given config is OK, recreate the Opus encoder instance with those

+// settings, save the config, and return true. Otherwise, do nothing and return

+// false.

+bool AudioEncoderOpus::RecreateEncoderInstance(const Config& config) {

+ if (!config.IsOk())

+ return false;

+ if (inst_)

+ CHECK_EQ(0, WebRtcOpus_EncoderFree(inst_));

+ input_buffer_.clear();

+ input_buffer_.reserve(Num10msFramesPerPacket() * SamplesPer10msFrame());

+ CHECK_EQ(0, WebRtcOpus_EncoderCreate(&inst_, config.num_channels,

+ config.application));

+ CHECK_EQ(0, WebRtcOpus_SetBitRate(inst_, config.bitrate_bps));

+ if (config.fec_enabled) {

+ CHECK_EQ(0, WebRtcOpus_EnableFec(inst_));

+ } else {

+ CHECK_EQ(0, WebRtcOpus_DisableFec(inst_));

+ }

+ CHECK_EQ(0,

+ WebRtcOpus_SetMaxPlaybackRate(inst_, config.max_playback_rate_hz));

+ CHECK_EQ(0, WebRtcOpus_SetComplexity(inst_, config.complexity));

+ if (config.dtx_enabled) {

+ CHECK_EQ(0, WebRtcOpus_EnableDtx(inst_));

+ } else {

+ CHECK_EQ(0, WebRtcOpus_DisableDtx(inst_));

+ }

+ CHECK_EQ(0, WebRtcOpus_SetPacketLossRate(

+ inst_, static_cast<int32_t>(packet_loss_rate_ * 100 + .5)));

+ config_ = config;

+ return true;

}

} // namespace webrtc