webrtc/media/engine/webrtcvoiceengine.cc - Issue 2705093002: Injectable audio encoders: WebRtcVoiceEngine and company

Unified Diff: webrtc/media/engine/webrtcvoiceengine.cc

Issue 2705093002: Injectable audio encoders: WebRtcVoiceEngine and company (Closed)

Patch Set: Channel::GetSendCodec asks both its acm and its codec manager. Created 3 years, 8 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Index: webrtc/media/engine/webrtcvoiceengine.cc

diff --git a/webrtc/media/engine/webrtcvoiceengine.cc b/webrtc/media/engine/webrtcvoiceengine.cc

index 2384ac28f173870959c97b6bc78224f931a03464..ab363420084abe181a44246056ed063c44a20b61 100644

--- a/webrtc/media/engine/webrtcvoiceengine.cc

+++ b/webrtc/media/engine/webrtcvoiceengine.cc

@@ -37,7 +37,7 @@

#include "webrtc/media/engine/payload_type_mapper.h"

#include "webrtc/media/engine/webrtcmediaengine.h"

#include "webrtc/media/engine/webrtcvoe.h"

-#include "webrtc/modules/audio_coding/acm2/rent_a_codec.h"

+#include "webrtc/modules/audio_coding/codecs/builtin_audio_encoder_factory.h"

#include "webrtc/modules/audio_mixer/audio_mixer_impl.h"

#include "webrtc/modules/audio_processing/include/audio_processing.h"

#include "webrtc/system_wrappers/include/field_trial.h"

@@ -66,27 +66,9 @@ constexpr int kNackRtpHistoryMs = 5000;

#error "Set WEBRTC_INTELLIGIBILITY_ENHANCER to either 0 or 1"

#endif

-// Codec parameters for Opus.

-// draft-spittka-payload-rtp-opus-03

-// Recommended bitrates:

-// 8-12 kb/s for NB speech,

-// 16-20 kb/s for WB speech,

-// 28-40 kb/s for FB speech,

-// 48-64 kb/s for FB mono music, and

-// 64-128 kb/s for FB stereo music.

-// The current implementation applies the following values to mono signals,

-// and multiplies them by 2 for stereo.

-const int kOpusBitrateNbBps = 12000;

-const int kOpusBitrateWbBps = 20000;

-const int kOpusBitrateFbBps = 32000;

-// Opus bitrate should be in the range between 6000 and 510000.

+// For SendSideBwe, Opus bitrate should be in the range between 6000 and 32000.

const int kOpusMinBitrateBps = 6000;

-const int kOpusMaxBitrateBps = 510000;

-// iSAC bitrate should be <= 56000.

-const int kIsacMaxBitrateBps = 56000;

+const int kOpusBitrateFbBps = 32000;

// Default audio dscp value.

// See http://tools.ietf.org/html/rfc2474 for details.

@@ -125,8 +107,15 @@ bool ValidateStreamParams(const StreamParams& sp) {

// Dumps an AudioCodec in RFC 2327-ish format.

std::string ToString(const AudioCodec& codec) {

std::stringstream ss;

- ss << codec.name << "/" << codec.clockrate << "/" << codec.channels

- << " (" << codec.id << ")";

+ ss << codec.name << "/" << codec.clockrate << "/" << codec.channels;

+ if (!codec.params.empty()) {

+ ss << " {";

+ for (const auto& param : codec.params) {

+ ss << " " << param.first << "=" << param.second;

+ }

+ ss << " }";

+ }

+ ss << " (" << codec.id << ")";

return ss.str();

}

@@ -134,10 +123,6 @@ bool IsCodec(const AudioCodec& codec, const char* ref_name) {

return (_stricmp(codec.name.c_str(), ref_name) == 0);

}

-bool IsCodec(const webrtc::CodecInst& codec, const char* ref_name) {

- return (_stricmp(codec.plname, ref_name) == 0);

bool FindCodec(const std::vector<AudioCodec>& codecs,

const AudioCodec& codec,

AudioCodec* found_codec) {

@@ -165,12 +150,6 @@ bool VerifyUniquePayloadTypes(const std::vector<AudioCodec>& codecs) {

return it == payload_types.end();

}

-// Return true if codec.params[feature] == "1", false otherwise.

-bool IsCodecFeatureEnabled(const AudioCodec& codec, const char* feature) {

- int value;

- return codec.GetParam(feature, &value) && value == 1;

rtc::Optional<std::string> GetAudioNetworkAdaptorConfig(

const AudioOptions& options) {

if (options.audio_network_adaptor && *options.audio_network_adaptor &&

@@ -182,85 +161,6 @@ rtc::Optional<std::string> GetAudioNetworkAdaptorConfig(

return rtc::Optional<std::string>();

}

-// Returns integer parameter params[feature] if it is defined. Returns

-// |default_value| otherwise.

-int GetCodecFeatureInt(const AudioCodec& codec,

- const char* feature,

- int default_value) {

- int value = 0;

- if (codec.GetParam(feature, &value)) {

- return value;

- }

- return default_value;

-// Use params[kCodecParamMaxAverageBitrate] if it is defined, use codec.bitrate

-// otherwise. If the value (either from params or codec.bitrate) <=0, use the

-// default configuration. If the value is beyond feasible bit rate of Opus,

-// clamp it. Returns the Opus bit rate for operation.

-int GetOpusBitrate(const AudioCodec& codec, int max_playback_rate) {

- int bitrate = 0;

- bool use_param = true;

- if (!codec.GetParam(kCodecParamMaxAverageBitrate, &bitrate)) {

- bitrate = codec.bitrate;

- use_param = false;

- }

- if (bitrate <= 0) {

- if (max_playback_rate <= 8000) {

- bitrate = kOpusBitrateNbBps;

- } else if (max_playback_rate <= 16000) {

- bitrate = kOpusBitrateWbBps;

- } else {

- bitrate = kOpusBitrateFbBps;

- }

- if (IsCodecFeatureEnabled(codec, kCodecParamStereo)) {

- bitrate *= 2;

- }

- } else if (bitrate < kOpusMinBitrateBps || bitrate > kOpusMaxBitrateBps) {

- bitrate = (bitrate < kOpusMinBitrateBps) ? kOpusMinBitrateBps

- : kOpusMaxBitrateBps;

- std::string rate_source =

- use_param ? "Codec parameter \"maxaveragebitrate\"" :

- "Supplied Opus bitrate";

- LOG(LS_WARNING) << rate_source

- << " is invalid and is replaced by: "

- << bitrate;

- }

- return bitrate;

-void GetOpusConfig(const AudioCodec& codec,

- webrtc::CodecInst* voe_codec,

- bool* enable_codec_fec,

- int* max_playback_rate,

- bool* enable_codec_dtx,

- int* min_ptime_ms,

- int* max_ptime_ms) {

- *enable_codec_fec = IsCodecFeatureEnabled(codec, kCodecParamUseInbandFec);

- *enable_codec_dtx = IsCodecFeatureEnabled(codec, kCodecParamUseDtx);

- *max_playback_rate = GetCodecFeatureInt(codec, kCodecParamMaxPlaybackRate,

- kOpusDefaultMaxPlaybackRate);

- *max_ptime_ms =

- GetCodecFeatureInt(codec, kCodecParamMaxPTime, kOpusDefaultMaxPTime);

- *min_ptime_ms =

- GetCodecFeatureInt(codec, kCodecParamMinPTime, kOpusDefaultMinPTime);

- if (*max_ptime_ms < *min_ptime_ms) {

- // If min ptime or max ptime defined by codec parameter is wrong, we use

- // the default values.

- *max_ptime_ms = kOpusDefaultMaxPTime;

- *min_ptime_ms = kOpusDefaultMinPTime;

- }

- // If OPUS, change what we send according to the "stereo" codec

- // parameter, and not the "channels" parameter. We set

- // voe_codec.channels to 2 if "stereo=1" and 1 otherwise. If

- // the bitrate is not specified, i.e. is <= zero, we set it to the

- // appropriate default value for mono or stereo Opus.

- voe_codec->channels = IsCodecFeatureEnabled(codec, kCodecParamStereo) ? 2 : 1;

- voe_codec->rate = GetOpusBitrate(codec, *max_playback_rate);

webrtc::AudioState::Config MakeAudioStateConfig(

VoEWrapper* voe_wrapper,

rtc::scoped_refptr<webrtc::AudioMixer> audio_mixer) {

@@ -274,283 +174,41 @@ webrtc::AudioState::Config MakeAudioStateConfig(

return config;

}

-class WebRtcVoiceCodecs final {

- public:

- // TODO(solenberg): Do this filtering once off-line, add a simple AudioCodec

- // list and add a test which verifies VoE supports the listed codecs.

- static std::vector<AudioCodec> SupportedSendCodecs() {

- std::vector<AudioCodec> result;

- // Iterate first over our preferred codecs list, so that the results are

- // added in order of preference.

- for (size_t i = 0; i < arraysize(kCodecPrefs); ++i) {

- const CodecPref* pref = &kCodecPrefs[i];

- for (webrtc::CodecInst voe_codec : webrtc::acm2::RentACodec::Database()) {

- // Change the sample rate of G722 to 8000 to match SDP.

- MaybeFixupG722(&voe_codec, 8000);

- // Skip uncompressed formats.

- if (IsCodec(voe_codec, kL16CodecName)) {

- continue;

- }

- if (!IsCodec(voe_codec, pref->name) ||

- pref->clockrate != voe_codec.plfreq ||

- pref->channels != voe_codec.channels) {

- // Not a match.

- continue;

- }

- AudioCodec codec(pref->payload_type, voe_codec.plname, voe_codec.plfreq,

- voe_codec.rate, voe_codec.channels);

- LOG(LS_INFO) << "Adding supported codec: " << ToString(codec);

- if (IsCodec(codec, kIsacCodecName)) {

- // Indicate auto-bitrate in signaling.

- codec.bitrate = 0;

- }

- if (IsCodec(codec, kOpusCodecName)) {

- // Only add fmtp parameters that differ from the spec.

- if (kPreferredMinPTime != kOpusDefaultMinPTime) {

- codec.params[kCodecParamMinPTime] =

- rtc::ToString(kPreferredMinPTime);

- }

- if (kPreferredMaxPTime != kOpusDefaultMaxPTime) {

- codec.params[kCodecParamMaxPTime] =

- rtc::ToString(kPreferredMaxPTime);

- }

- codec.SetParam(kCodecParamUseInbandFec, 1);

- codec.AddFeedbackParam(

- FeedbackParam(kRtcpFbParamTransportCc, kParamValueEmpty));

- // TODO(hellner): Add ptime, sprop-stereo, and stereo

- // when they can be set to values other than the default.

- }

- result.push_back(codec);

- }

- return result;

- }

- static bool ToCodecInst(const AudioCodec& in,

- webrtc::CodecInst* out) {

- for (webrtc::CodecInst voe_codec : webrtc::acm2::RentACodec::Database()) {

- // Change the sample rate of G722 to 8000 to match SDP.

- MaybeFixupG722(&voe_codec, 8000);

- AudioCodec codec(voe_codec.pltype, voe_codec.plname, voe_codec.plfreq,

- voe_codec.rate, voe_codec.channels);

- bool multi_rate = IsCodecMultiRate(voe_codec);

- // Allow arbitrary rates for ISAC to be specified.

- if (multi_rate) {

- // Set codec.bitrate to 0 so the check for codec.Matches() passes.

- codec.bitrate = 0;

- }

- if (codec.Matches(in)) {

- if (out) {

- // Fixup the payload type.

- voe_codec.pltype = in.id;

- // Set bitrate if specified.

- if (multi_rate && in.bitrate != 0) {

- voe_codec.rate = in.bitrate;

- }

- // Reset G722 sample rate to 16000 to match WebRTC.

- MaybeFixupG722(&voe_codec, 16000);

- *out = voe_codec;

- }

- return true;

- }

- return false;

- }

- static bool IsCodecMultiRate(const webrtc::CodecInst& codec) {

- for (size_t i = 0; i < arraysize(kCodecPrefs); ++i) {

- if (IsCodec(codec, kCodecPrefs[i].name) &&

- kCodecPrefs[i].clockrate == codec.plfreq) {

- return kCodecPrefs[i].is_multi_rate;

- }

- return false;

- }

- static int MaxBitrateBps(const webrtc::CodecInst& codec) {

- for (size_t i = 0; i < arraysize(kCodecPrefs); ++i) {

- if (IsCodec(codec, kCodecPrefs[i].name) &&

- kCodecPrefs[i].clockrate == codec.plfreq) {

- return kCodecPrefs[i].max_bitrate_bps;

- }

- return 0;

- }

- static rtc::ArrayView<const int> GetPacketSizesMs(

- const webrtc::CodecInst& codec) {

- for (size_t i = 0; i < arraysize(kCodecPrefs); ++i) {

- if (IsCodec(codec, kCodecPrefs[i].name)) {

- size_t num_packet_sizes = kMaxNumPacketSize;

- for (int index = 0; index < kMaxNumPacketSize; index++) {

- if (kCodecPrefs[i].packet_sizes_ms[index] == 0) {

- num_packet_sizes = index;

- break;

- }

- return rtc::ArrayView<const int>(kCodecPrefs[i].packet_sizes_ms,

- num_packet_sizes);

- }

- return rtc::ArrayView<const int>();

- }

- // If the AudioCodec param kCodecParamPTime is set, then we will set it to

- // codec pacsize if it's valid, or we will pick the next smallest value we

- // support.

- // TODO(Brave): Query supported packet sizes from ACM when the API is ready.

- static bool SetPTimeAsPacketSize(webrtc::CodecInst* codec, int ptime_ms) {

- for (const CodecPref& codec_pref : kCodecPrefs) {

- if ((IsCodec(*codec, codec_pref.name) &&

- codec_pref.clockrate == codec->plfreq) ||

- IsCodec(*codec, kG722CodecName)) {

- int packet_size_ms = SelectPacketSize(codec_pref, ptime_ms);

- if (packet_size_ms) {

- // Convert unit from milli-seconds to samples.

- codec->pacsize = (codec->plfreq / 1000) * packet_size_ms;

- return true;

- }

- return false;

- }

- static const AudioCodec* GetPreferredCodec(

- const std::vector<AudioCodec>& codecs,

- webrtc::CodecInst* out) {

- RTC_DCHECK(out);

- // Select the preferred send codec (the first non-telephone-event/CN codec).

- for (const AudioCodec& codec : codecs) {

- if (IsCodec(codec, kDtmfCodecName) || IsCodec(codec, kCnCodecName)) {

- // Skip telephone-event/CN codecs - they will be handled later.

- continue;

- }

- // We'll use the first codec in the list to actually send audio data.

- // Be sure to use the payload type requested by the remote side.

- // Ignore codecs we don't know about. The negotiation step should prevent

- // this, but double-check to be sure.

- if (!ToCodecInst(codec, out)) {

- LOG(LS_WARNING) << "Unknown codec " << ToString(codec);

- continue;

- }

- return &codec;

- }

- return nullptr;

- }

- private:

- static const int kMaxNumPacketSize = 6;

- struct CodecPref {

- const char* name;

- int clockrate;

- size_t channels;

- int payload_type;

- bool is_multi_rate;

- int packet_sizes_ms[kMaxNumPacketSize];

- int max_bitrate_bps;

- };

- // Note: keep the supported packet sizes in ascending order.

- static const CodecPref kCodecPrefs[14];

- static int SelectPacketSize(const CodecPref& codec_pref, int ptime_ms) {

- int selected_packet_size_ms = codec_pref.packet_sizes_ms[0];

- for (int packet_size_ms : codec_pref.packet_sizes_ms) {

- if (packet_size_ms && packet_size_ms <= ptime_ms) {

- selected_packet_size_ms = packet_size_ms;

- }

- return selected_packet_size_ms;

- }

- // Changes RTP timestamp rate of G722. This is due to the "bug" in the RFC

- // which says that G722 should be advertised as 8 kHz although it is a 16 kHz

- // codec.

- static void MaybeFixupG722(webrtc::CodecInst* voe_codec, int new_plfreq) {

- if (IsCodec(*voe_codec, kG722CodecName)) {

- // If the DCHECK triggers, the codec definition in WebRTC VoiceEngine

- // has changed, and this special case is no longer needed.

- RTC_DCHECK(voe_codec->plfreq != new_plfreq);

- voe_codec->plfreq = new_plfreq;

- }

-};

-const WebRtcVoiceCodecs::CodecPref WebRtcVoiceCodecs::kCodecPrefs[14] = {

-#if WEBRTC_OPUS_SUPPORT_120MS_PTIME

- {kOpusCodecName, 48000, 2, 111, true, {10, 20, 40, 60, 120},

- kOpusMaxBitrateBps},

-#else

- {kOpusCodecName, 48000, 2, 111, true, {10, 20, 40, 60}, kOpusMaxBitrateBps},

-#endif

- {kIsacCodecName, 16000, 1, 103, true, {30, 60}, kIsacMaxBitrateBps},

- {kIsacCodecName, 32000, 1, 104, true, {30}, kIsacMaxBitrateBps},

- // G722 should be advertised as 8000 Hz because of the RFC "bug".

- {kG722CodecName, 8000, 1, 9, false, {10, 20, 30, 40, 50, 60}},

- {kIlbcCodecName, 8000, 1, 102, false, {20, 30, 40, 60}},

- {kPcmuCodecName, 8000, 1, 0, false, {10, 20, 30, 40, 50, 60}},

- {kPcmaCodecName, 8000, 1, 8, false, {10, 20, 30, 40, 50, 60}},

- {kCnCodecName, 32000, 1, 106, false, {}},

- {kCnCodecName, 16000, 1, 105, false, {}},

- {kCnCodecName, 8000, 1, 13, false, {}},

- {kDtmfCodecName, 48000, 1, 110, false, {}},

- {kDtmfCodecName, 32000, 1, 112, false, {}},

- {kDtmfCodecName, 16000, 1, 113, false, {}},

- {kDtmfCodecName, 8000, 1, 126, false, {}}

-};

// |max_send_bitrate_bps| is the bitrate from "b=" in SDP.

// |rtp_max_bitrate_bps| is the bitrate from RtpSender::SetParameters.

rtc::Optional<int> ComputeSendBitrate(int max_send_bitrate_bps,

rtc::Optional<int> rtp_max_bitrate_bps,

- const webrtc::CodecInst& codec_inst) {

+ const webrtc::AudioCodecSpec& spec) {

// If application-configured bitrate is set, take minimum of that and SDP

// bitrate.

const int bps = rtp_max_bitrate_bps

? MinPositive(max_send_bitrate_bps, *rtp_max_bitrate_bps)

: max_send_bitrate_bps;

- const int codec_rate = codec_inst.rate;

if (bps <= 0) {

- return rtc::Optional<int>(codec_rate);

- }

- if (codec_inst.pltype == -1) {

- return rtc::Optional<int>(codec_rate);

- ;

- }

- if (WebRtcVoiceCodecs::IsCodecMultiRate(codec_inst)) {

- // If codec is multi-rate then just set the bitrate.

- return rtc::Optional<int>(

- std::min(bps, WebRtcVoiceCodecs::MaxBitrateBps(codec_inst)));

+ return rtc::Optional<int>(spec.info.default_bitrate_bps);

}

- if (bps < codec_inst.rate) {

+ if (bps < spec.info.min_bitrate_bps) {

// If codec is not multi-rate and |bps| is less than the fixed bitrate then

// fail. If codec is not multi-rate and |bps| exceeds or equal the fixed

// bitrate then ignore.

- LOG(LS_ERROR) << "Failed to set codec " << codec_inst.plname

+ LOG(LS_ERROR) << "Failed to set codec " << spec.format.name

<< " to bitrate " << bps << " bps"

- << ", requires at least " << codec_inst.rate << " bps.";

+ << ", requires at least " << spec.info.min_bitrate_bps

+ << " bps.";

return rtc::Optional<int>();

}

- return rtc::Optional<int>(codec_rate);

+ if (spec.info.HasFixedBitrate()) {

+ return rtc::Optional<int>(spec.info.default_bitrate_bps);

+ } else {

+ // If codec is multi-rate then just set the bitrate.

+ return rtc::Optional<int>(std::min(bps, spec.info.max_bitrate_bps));

+ }

}

} // namespace

-bool WebRtcVoiceEngine::ToCodecInst(const AudioCodec& in,

- webrtc::CodecInst* out) {

- return WebRtcVoiceCodecs::ToCodecInst(in, out);

WebRtcVoiceEngine::WebRtcVoiceEngine(

webrtc::AudioDeviceModule* adm,

const rtc::scoped_refptr<webrtc::AudioDecoderFactory>& decoder_factory,

@@ -565,7 +223,10 @@ WebRtcVoiceEngine::WebRtcVoiceEngine(

const rtc::scoped_refptr<webrtc::AudioDecoderFactory>& decoder_factory,

rtc::scoped_refptr<webrtc::AudioMixer> audio_mixer,

VoEWrapper* voe_wrapper)

- : adm_(adm), decoder_factory_(decoder_factory), voe_wrapper_(voe_wrapper) {

+ : adm_(adm),

+ encoder_factory_(webrtc::CreateBuiltinAudioEncoderFactory()),

+ decoder_factory_(decoder_factory),

+ voe_wrapper_(voe_wrapper) {

RTC_DCHECK(worker_thread_checker_.CalledOnValidThread());

LOG(LS_INFO) << "WebRtcVoiceEngine::WebRtcVoiceEngine";

RTC_DCHECK(voe_wrapper);

@@ -575,13 +236,13 @@ WebRtcVoiceEngine::WebRtcVoiceEngine(

// Load our audio codec list.

LOG(LS_INFO) << "Supported send codecs in order of preference:";

- send_codecs_ = WebRtcVoiceCodecs::SupportedSendCodecs();

+ send_codecs_ = CollectCodecs(encoder_factory_->GetSupportedEncoders());

for (const AudioCodec& codec : send_codecs_) {

LOG(LS_INFO) << ToString(codec);

}

LOG(LS_INFO) << "Supported recv codecs in order of preference:";

- recv_codecs_ = CollectRecvCodecs();

+ recv_codecs_ = CollectCodecs(decoder_factory_->GetSupportedDecoders());

for (const AudioCodec& codec : recv_codecs_) {

LOG(LS_INFO) << ToString(codec);

}

@@ -1056,11 +717,10 @@ webrtc::voe::TransmitMixer* WebRtcVoiceEngine::transmit_mixer() {

return transmit_mixer_;

}

-AudioCodecs WebRtcVoiceEngine::CollectRecvCodecs() const {

+AudioCodecs WebRtcVoiceEngine::CollectCodecs(

+ const std::vector<webrtc::AudioCodecSpec>& specs) const {

PayloadTypeMapper mapper;

AudioCodecs out;

- const std::vector<webrtc::AudioCodecSpec>& specs =

- decoder_factory_->GetSupportedDecoders();

// Only generate CN payload types for these clockrates:

std::map<int, bool, std::greater<int>> generate_cn = {{ 8000, false },

@@ -1140,12 +800,14 @@ class WebRtcVoiceMediaChannel::WebRtcAudioSendStream

webrtc::AudioTransport* voe_audio_transport,

uint32_t ssrc,

const std::string& c_name,

- const webrtc::AudioSendStream::Config::SendCodecSpec& send_codec_spec,

+ const rtc::Optional<webrtc::AudioSendStream::Config::SendCodecSpec>&

+ send_codec_spec,

const std::vector<webrtc::RtpExtension>& extensions,

int max_send_bitrate_bps,

const rtc::Optional<std::string>& audio_network_adaptor_config,

webrtc::Call* call,

- webrtc::Transport* send_transport)

+ webrtc::Transport* send_transport,

+ const rtc::scoped_refptr<webrtc::AudioEncoderFactory>& encoder_factory)

: voe_audio_transport_(voe_audio_transport),

call_(call),

config_(send_transport),

@@ -1157,13 +819,20 @@ class WebRtcVoiceMediaChannel::WebRtcAudioSendStream

// TODO(solenberg): Once we're not using FakeWebRtcVoiceEngine anymore:

// RTC_DCHECK(voe_audio_transport);

RTC_DCHECK(call);

+ RTC_DCHECK(encoder_factory);

config_.rtp.ssrc = ssrc;

config_.rtp.c_name = c_name;

config_.voe_channel_id = ch;

config_.rtp.extensions = extensions;

config_.audio_network_adaptor_config = audio_network_adaptor_config;

+ config_.encoder_factory = encoder_factory;

rtp_parameters_.encodings[0].ssrc = rtc::Optional<uint32_t>(ssrc);

- RecreateAudioSendStream(send_codec_spec);

+ if (send_codec_spec) {

+ UpdateSendCodecSpec(*send_codec_spec);

+ }

+ stream_ = call_->CreateAudioSendStream(config_);

}

~WebRtcAudioSendStream() override {

@@ -1172,56 +841,45 @@ class WebRtcVoiceMediaChannel::WebRtcAudioSendStream

call_->DestroyAudioSendStream(stream_);

}

- void RecreateAudioSendStream(

+ void SetSendCodecSpec(

const webrtc::AudioSendStream::Config::SendCodecSpec& send_codec_spec) {

- RTC_DCHECK(worker_thread_checker_.CalledOnValidThread());

- send_codec_spec_ = send_codec_spec;

- config_.rtp.nack.rtp_history_ms =

- send_codec_spec_.nack_enabled ? kNackRtpHistoryMs : 0;

- config_.send_codec_spec = send_codec_spec_;

- auto send_rate = ComputeSendBitrate(

- max_send_bitrate_bps_, rtp_parameters_.encodings[0].max_bitrate_bps,

- send_codec_spec.codec_inst);

- if (send_rate) {

- // Apply a send rate that abides by |max_send_bitrate_bps_| and

- // |rtp_parameters_| when possible. Otherwise use the codec rate.

- config_.send_codec_spec.codec_inst.rate = *send_rate;

- }

- RecreateAudioSendStream();

+ UpdateSendCodecSpec(send_codec_spec);

+ ReconfigureAudioSendStream();

}

- void RecreateAudioSendStream(

- const std::vector<webrtc::RtpExtension>& extensions) {

+ void SetRtpExtensions(const std::vector<webrtc::RtpExtension>& extensions) {

RTC_DCHECK(worker_thread_checker_.CalledOnValidThread());

config_.rtp.extensions = extensions;

- RecreateAudioSendStream();

+ ReconfigureAudioSendStream();

}

- void RecreateAudioSendStream(

+ void SetAudioNetworkAdaptorConfig(

const rtc::Optional<std::string>& audio_network_adaptor_config) {

RTC_DCHECK(worker_thread_checker_.CalledOnValidThread());

if (config_.audio_network_adaptor_config == audio_network_adaptor_config) {

return;

}

config_.audio_network_adaptor_config = audio_network_adaptor_config;

- RecreateAudioSendStream();

+ UpdateAllowedBitrateRange();

+ ReconfigureAudioSendStream();

}

bool SetMaxSendBitrate(int bps) {

RTC_DCHECK(worker_thread_checker_.CalledOnValidThread());

- auto send_rate =

- ComputeSendBitrate(bps, rtp_parameters_.encodings[0].max_bitrate_bps,

- send_codec_spec_.codec_inst);

+ RTC_DCHECK(config_.send_codec_spec);

+ RTC_DCHECK(audio_codec_spec_);

+ auto send_rate = ComputeSendBitrate(

+ bps, rtp_parameters_.encodings[0].max_bitrate_bps, *audio_codec_spec_);

if (!send_rate) {

return false;

}

max_send_bitrate_bps_ = bps;

- if (config_.send_codec_spec.codec_inst.rate != *send_rate) {

- // Recreate AudioSendStream with new bit rate.

- config_.send_codec_spec.codec_inst.rate = *send_rate;

- RecreateAudioSendStream();

+ if (send_rate != config_.send_codec_spec->target_bitrate_bps) {

+ config_.send_codec_spec->target_bitrate_bps = send_rate;

+ ReconfigureAudioSendStream();

}

return true;

}

@@ -1337,11 +995,15 @@ class WebRtcVoiceMediaChannel::WebRtcAudioSendStream

if (!ValidateRtpParameters(parameters)) {

return false;

}

- auto send_rate = ComputeSendBitrate(max_send_bitrate_bps_,

- parameters.encodings[0].max_bitrate_bps,

- send_codec_spec_.codec_inst);

- if (!send_rate) {

- return false;

+ rtc::Optional<int> send_rate;

+ if (audio_codec_spec_) {

+ send_rate = ComputeSendBitrate(max_send_bitrate_bps_,

+ parameters.encodings[0].max_bitrate_bps,

+ *audio_codec_spec_);

+ if (!send_rate) {

+ return false;

+ }

}

const rtc::Optional<int> old_rtp_max_bitrate =

@@ -1350,9 +1012,12 @@ class WebRtcVoiceMediaChannel::WebRtcAudioSendStream

rtp_parameters_ = parameters;

if (rtp_parameters_.encodings[0].max_bitrate_bps != old_rtp_max_bitrate) {

- // Recreate AudioSendStream with new bit rate.

- config_.send_codec_spec.codec_inst.rate = *send_rate;

- RecreateAudioSendStream();

+ // Reconfigure AudioSendStream with new bit rate.

+ if (send_rate) {

+ config_.send_codec_spec->target_bitrate_bps = send_rate;

+ }

+ UpdateAllowedBitrateRange();

+ ReconfigureAudioSendStream();

} else {

// parameters.encodings[0].active could have changed.

UpdateSendState();

@@ -1372,18 +1037,17 @@ class WebRtcVoiceMediaChannel::WebRtcAudioSendStream

}

- void RecreateAudioSendStream() {

+ void UpdateAllowedBitrateRange() {

RTC_DCHECK(worker_thread_checker_.CalledOnValidThread());

- if (stream_) {

- call_->DestroyAudioSendStream(stream_);

- stream_ = nullptr;

- }

- RTC_DCHECK(!stream_);

- if (webrtc::field_trial::IsEnabled("WebRTC-Audio-SendSideBwe")) {

+ const bool is_opus =

+ config_.send_codec_spec &&

+ !STR_CASE_CMP(config_.send_codec_spec->format.name.c_str(),

+ kOpusCodecName);

+ if (is_opus && webrtc::field_trial::IsEnabled("WebRTC-Audio-SendSideBwe")) {

config_.min_bitrate_bps = kOpusMinBitrateBps;

// This means that when RtpParameters is reset, we may change the

- // encoder's bit rate immediately (through call_->CreateAudioSendStream),

+ // encoder's bit rate immediately (through ReconfigureAudioSendStream()),

// meanwhile change the cap to the output of BWE.

config_.max_bitrate_bps =

rtp_parameters_.encodings[0].max_bitrate_bps

@@ -1393,48 +1057,65 @@ class WebRtcVoiceMediaChannel::WebRtcAudioSendStream

// TODO(mflodman): Keep testing this and set proper values.

// Note: This is an early experiment currently only supported by Opus.

if (send_side_bwe_with_overhead_) {

- auto packet_sizes_ms = WebRtcVoiceCodecs::GetPacketSizesMs(

- config_.send_codec_spec.codec_inst);

- if (!packet_sizes_ms.empty()) {

- int max_packet_size_ms =

- *std::max_element(packet_sizes_ms.begin(), packet_sizes_ms.end());

- // Audio network adaptor will just use 20ms and 60ms frame lengths.

- // The adaptor will only be active for the Opus encoder.

- if (config_.audio_network_adaptor_config &&

- IsCodec(config_.send_codec_spec.codec_inst, kOpusCodecName)) {

-#if WEBRTC_OPUS_SUPPORT_120MS_PTIME

- max_packet_size_ms = 120;

-#else

- max_packet_size_ms = 60;

-#endif

- }

- // OverheadPerPacket = Ipv4(20B) + UDP(8B) + SRTP(10B) + RTP(12)

- constexpr int kOverheadPerPacket = 20 + 8 + 10 + 12;

- int min_overhead_bps =

- kOverheadPerPacket * 8 * 1000 / max_packet_size_ms;

- // We assume that |config_.max_bitrate_bps| before the next line is

- // a hard limit on the payload bitrate, so we add min_overhead_bps to

- // it to ensure that, when overhead is deducted, the payload rate

- // never goes beyond the limit.

- // Note: this also means that if a higher overhead is forced, we

- // cannot reach the limit.

- // TODO(minyue): Reconsider this when the signaling to BWE is done

- // through a dedicated API.

- config_.max_bitrate_bps += min_overhead_bps;

- // In contrast to max_bitrate_bps, we let min_bitrate_bps always be

- // reachable.

- config_.min_bitrate_bps += min_overhead_bps;

- }

+ const int max_packet_size_ms =

+ WEBRTC_OPUS_SUPPORT_120MS_PTIME ? 120 : 60;

+ // OverheadPerPacket = Ipv4(20B) + UDP(8B) + SRTP(10B) + RTP(12)

+ constexpr int kOverheadPerPacket = 20 + 8 + 10 + 12;

+ int min_overhead_bps =

+ kOverheadPerPacket * 8 * 1000 / max_packet_size_ms;

+ // We assume that |config_.max_bitrate_bps| before the next line is

+ // a hard limit on the payload bitrate, so we add min_overhead_bps to

+ // it to ensure that, when overhead is deducted, the payload rate

+ // never goes beyond the limit.

+ // Note: this also means that if a higher overhead is forced, we

+ // cannot reach the limit.

+ // TODO(minyue): Reconsider this when the signaling to BWE is done

+ // through a dedicated API.

+ config_.max_bitrate_bps += min_overhead_bps;

+ // In contrast to max_bitrate_bps, we let min_bitrate_bps always be

+ // reachable.

+ config_.min_bitrate_bps += min_overhead_bps;

}

- stream_ = call_->CreateAudioSendStream(config_);

- RTC_CHECK(stream_);

- UpdateSendState();

+ }

+ void UpdateSendCodecSpec(

+ const webrtc::AudioSendStream::Config::SendCodecSpec& send_codec_spec) {

+ RTC_DCHECK(worker_thread_checker_.CalledOnValidThread());

+ config_.rtp.nack.rtp_history_ms =

+ send_codec_spec.nack_enabled ? kNackRtpHistoryMs : 0;

+ config_.send_codec_spec =

+ rtc::Optional<webrtc::AudioSendStream::Config::SendCodecSpec>(

+ send_codec_spec);

+ auto info =

+ config_.encoder_factory->QueryAudioEncoder(send_codec_spec.format);

+ RTC_DCHECK(info);

+ // If a specific target bitrate has been set for the stream, use that as

+ // the new default bitrate when computing send bitrate.

+ if (send_codec_spec.target_bitrate_bps) {

+ info->default_bitrate_bps = std::max(

+ info->min_bitrate_bps,

+ std::min(info->max_bitrate_bps, *send_codec_spec.target_bitrate_bps));

+ }

+ audio_codec_spec_.emplace(

+ webrtc::AudioCodecSpec{send_codec_spec.format, *info});

+ config_.send_codec_spec->target_bitrate_bps = ComputeSendBitrate(

+ max_send_bitrate_bps_, rtp_parameters_.encodings[0].max_bitrate_bps,

+ *audio_codec_spec_);

+ UpdateAllowedBitrateRange();

+ }

+ void ReconfigureAudioSendStream() {

+ RTC_DCHECK(worker_thread_checker_.CalledOnValidThread());

+ RTC_DCHECK(stream_);

+ stream_->Reconfigure(config_);

}

rtc::ThreadChecker worker_thread_checker_;

@@ -1455,7 +1136,7 @@ class WebRtcVoiceMediaChannel::WebRtcAudioSendStream

bool muted_ = false;

int max_send_bitrate_bps_;

webrtc::RtpParameters rtp_parameters_;

- webrtc::AudioSendStream::Config::SendCodecSpec send_codec_spec_;

+ rtc::Optional<webrtc::AudioCodecSpec> audio_codec_spec_;

RTC_DISALLOW_IMPLICIT_CONSTRUCTORS(WebRtcAudioSendStream);

};

@@ -1661,7 +1342,7 @@ bool WebRtcVoiceMediaChannel::SetSendParameters(

if (send_rtp_extensions_ != filtered_extensions) {

send_rtp_extensions_.swap(filtered_extensions);

for (auto& it : send_streams_) {

- it.second->RecreateAudioSendStream(send_rtp_extensions_);

+ it.second->SetRtpExtensions(send_rtp_extensions_);

}

@@ -1828,10 +1509,10 @@ bool WebRtcVoiceMediaChannel::SetOptions(const AudioOptions& options) {

return false;

}

- rtc::Optional<std::string> audio_network_adatptor_config =

+ rtc::Optional<std::string> audio_network_adaptor_config =

GetAudioNetworkAdaptorConfig(options_);

for (auto& it : send_streams_) {

- it.second->RecreateAudioSendStream(audio_network_adatptor_config);

+ it.second->SetAudioNetworkAdaptorConfig(audio_network_adaptor_config);

}

LOG(LS_INFO) << "Set voice channel options. Current options: "

@@ -1941,86 +1622,66 @@ bool WebRtcVoiceMediaChannel::SetSendCodecs(

}

- // Scan through the list to figure out the codec to use for sending, along

- // with the proper configuration for VAD, CNG, NACK and Opus-specific

- // parameters.

- // TODO(solenberg): Refactor this logic once we create AudioEncoders here.

- webrtc::AudioSendStream::Config::SendCodecSpec send_codec_spec;

+ // Scan through the list to figure out the codec to use for sending.

+ rtc::Optional<webrtc::AudioSendStream::Config::SendCodecSpec> send_codec_spec;

webrtc::Call::Config::BitrateConfig bitrate_config;

- {

- send_codec_spec.nack_enabled = send_codec_spec_.nack_enabled;

- // Find send codec (the first non-telephone-event/CN codec).

- const AudioCodec* codec = WebRtcVoiceCodecs::GetPreferredCodec(

- codecs, &send_codec_spec.codec_inst);

- if (!codec) {

- LOG(LS_WARNING) << "Received empty list of codecs.";

- return false;

- }

- send_codec_spec.transport_cc_enabled = HasTransportCc(*codec);

- send_codec_spec.nack_enabled = HasNack(*codec);

- bitrate_config = GetBitrateConfigForCodec(*codec);

- // For Opus as the send codec, we are to determine inband FEC, maximum

- // playback rate, and opus internal dtx.

- if (IsCodec(*codec, kOpusCodecName)) {

- GetOpusConfig(*codec, &send_codec_spec.codec_inst,

- &send_codec_spec.enable_codec_fec,

- &send_codec_spec.opus_max_playback_rate,

- &send_codec_spec.enable_opus_dtx,

- &send_codec_spec.min_ptime_ms,

- &send_codec_spec.max_ptime_ms);

- }

+ rtc::Optional<webrtc::AudioCodecInfo> voice_codec_info;

+ for (const AudioCodec& voice_codec : codecs) {

+ if (!(IsCodec(voice_codec, kCnCodecName) ||

+ IsCodec(voice_codec, kDtmfCodecName) ||

+ IsCodec(voice_codec, kRedCodecName))) {

+ webrtc::SdpAudioFormat format(voice_codec.name, voice_codec.clockrate,

+ voice_codec.channels, voice_codec.params);

+ voice_codec_info = engine()->encoder_factory_->QueryAudioEncoder(format);

+ if (!voice_codec_info) {

+ LOG(LS_WARNING) << "Unknown codec " << ToString(voice_codec);

+ continue;

+ }

- // Set packet size if the AudioCodec param kCodecParamPTime is set.

- int ptime_ms = 0;

- if (codec->GetParam(kCodecParamPTime, &ptime_ms)) {

- if (!WebRtcVoiceCodecs::SetPTimeAsPacketSize(

- &send_codec_spec.codec_inst, ptime_ms)) {

- LOG(LS_WARNING) << "Failed to set packet size for codec "

- << send_codec_spec.codec_inst.plname;

- return false;

+ send_codec_spec =

+ rtc::Optional<webrtc::AudioSendStream::Config::SendCodecSpec>(

+ {voice_codec.id, format});

+ if (voice_codec.bitrate > 0) {

+ send_codec_spec->target_bitrate_bps =

+ rtc::Optional<int>(voice_codec.bitrate);

}

+ send_codec_spec->transport_cc_enabled = HasTransportCc(voice_codec);

+ send_codec_spec->nack_enabled = HasNack(voice_codec);

+ bitrate_config = GetBitrateConfigForCodec(voice_codec);

+ break;

}

+ }

+ if (!send_codec_spec) {

+ return false;

+ }

+ RTC_DCHECK(voice_codec_info);

+ if (voice_codec_info->allow_comfort_noise) {

// Loop through the codecs list again to find the CN codec.

// TODO(solenberg): Break out into a separate function?

for (const AudioCodec& cn_codec : codecs) {

- // Ignore codecs we don't know about. The negotiation step should prevent

- // this, but double-check to be sure.

- webrtc::CodecInst voe_codec = {0};

- if (!WebRtcVoiceEngine::ToCodecInst(cn_codec, &voe_codec)) {

- LOG(LS_WARNING) << "Unknown codec " << ToString(cn_codec);

- continue;

- }

if (IsCodec(cn_codec, kCnCodecName) &&

- cn_codec.clockrate == codec->clockrate) {

- // Turn voice activity detection/comfort noise on if supported.

- // Set the wideband CN payload type appropriately.

- // (narrowband always uses the static payload type 13).

- int cng_plfreq = -1;

+ cn_codec.clockrate == send_codec_spec->format.clockrate_hz) {

switch (cn_codec.clockrate) {

case 8000:

case 16000:

case 32000:

- cng_plfreq = cn_codec.clockrate;

+ send_codec_spec->cng_payload_type = rtc::Optional<int>(cn_codec.id);

break;

default:

LOG(LS_WARNING) << "CN frequency " << cn_codec.clockrate

<< " not supported.";

- continue;

+ break;

}

- send_codec_spec.cng_payload_type = cn_codec.id;

- send_codec_spec.cng_plfreq = cng_plfreq;

break;

}

// Find the telephone-event PT exactly matching the preferred send codec.

for (const AudioCodec& dtmf_codec : dtmf_codecs) {

- if (dtmf_codec.clockrate == codec->clockrate) {

+ if (dtmf_codec.clockrate == send_codec_spec->format.clockrate_hz) {

dtmf_payload_type_ = rtc::Optional<int>(dtmf_codec.id);

dtmf_payload_freq_ = dtmf_codec.clockrate;

break;

@@ -2032,7 +1693,7 @@ bool WebRtcVoiceMediaChannel::SetSendCodecs(

send_codec_spec_ = std::move(send_codec_spec);

// Apply new settings to all streams.

for (const auto& kv : send_streams_) {

- kv.second->RecreateAudioSendStream(send_codec_spec_);

+ kv.second->SetSendCodecSpec(*send_codec_spec_);

}

} else {

// If the codec isn't changing, set the start bitrate to -1 which means

@@ -2043,12 +1704,12 @@ bool WebRtcVoiceMediaChannel::SetSendCodecs(

// Check if the transport cc feedback or NACK status has changed on the

// preferred send codec, and in that case reconfigure all receive streams.

- if (recv_transport_cc_enabled_ != send_codec_spec_.transport_cc_enabled ||

- recv_nack_enabled_ != send_codec_spec_.nack_enabled) {

+ if (recv_transport_cc_enabled_ != send_codec_spec_->transport_cc_enabled ||

+ recv_nack_enabled_ != send_codec_spec_->nack_enabled) {

LOG(LS_INFO) << "Recreate all the receive streams because the send "

"codec has changed.";

- recv_transport_cc_enabled_ = send_codec_spec_.transport_cc_enabled;

- recv_nack_enabled_ = send_codec_spec_.nack_enabled;

+ recv_transport_cc_enabled_ = send_codec_spec_->transport_cc_enabled;

+ recv_nack_enabled_ = send_codec_spec_->nack_enabled;

for (auto& kv : recv_streams_) {

kv.second->RecreateAudioReceiveStream(recv_transport_cc_enabled_,

recv_nack_enabled_);

@@ -2171,7 +1832,7 @@ bool WebRtcVoiceMediaChannel::AddSendStream(const StreamParams& sp) {

WebRtcAudioSendStream* stream = new WebRtcAudioSendStream(

channel, audio_transport, ssrc, sp.cname, send_codec_spec_,

send_rtp_extensions_, max_send_bitrate_bps_, audio_network_adaptor_config,

- call_, this);

+ call_, this, engine()->encoder_factory_);

send_streams_.insert(std::make_pair(ssrc, stream));

// At this point the stream's local SSRC has been updated. If it is the first

« no previous file with comments | « webrtc/media/engine/webrtcvoiceengine.h ('k') | webrtc/media/engine/webrtcvoiceengine_unittest.cc » ('j') | webrtc/voice_engine/channel.cc » ('J')