Index: webrtc/modules/audio_mixer/source/new_audio_conference_mixer_impl.cc
diff --git a/webrtc/modules/audio_mixer/source/new_audio_conference_mixer_impl.cc b/webrtc/modules/audio_mixer/source/new_audio_conference_mixer_impl.cc
index 861fb14b581da2ec03f9e4dbf089d1300ba57b2e..c1a49f221bcaf815158e1e58a5fc4fa66f1a89fb 100644
--- a/webrtc/modules/audio_mixer/source/new_audio_conference_mixer_impl.cc
+++ b/webrtc/modules/audio_mixer/source/new_audio_conference_mixer_impl.cc
@@ -11,7 +11,6 @@
 #include "webrtc/modules/audio_mixer/source/new_audio_conference_mixer_impl.h"
 
 #include <algorithm>
-#include <functional>
 
 #include "webrtc/modules/audio_conference_mixer/source/audio_frame_manipulator.h"
 #include "webrtc/modules/audio_mixer/include/audio_mixer_defines.h"
@@ -23,43 +22,15 @@
 namespace webrtc {
 namespace {
 
-class SourceFrame {
- public:
-  SourceFrame(MixerAudioSource* p,
-              AudioFrame* a,
-              bool m,
-              bool was_mixed_before)
-      : audio_source_(p),
-        audio_frame_(a),
-        muted_(m),
-        was_mixed_before_(was_mixed_before) {
-    if (!muted_) {
-      energy_ = CalculateEnergy(*a);
-    }
-  }
-
-  // a.shouldMixBefore(b) is used to select mixer participants.
-  bool shouldMixBefore(const SourceFrame& other) const {
-    if (muted_ != other.muted_) {
-      return other.muted_;
-    }
-
-    auto our_activity = audio_frame_->vad_activity_;
-    auto other_activity = other.audio_frame_->vad_activity_;
-
-    if (our_activity != other_activity) {
-      return our_activity == AudioFrame::kVadActive;
-    }
-
-    return energy_ > other.energy_;
-  }
-
-  MixerAudioSource* audio_source_;
-  AudioFrame* audio_frame_;
-  bool muted_;
-  uint32_t energy_;
-  bool was_mixed_before_;
+struct AudioSourceWithFrame {
+  AudioSourceWithFrame(MixerAudioSource* p, AudioFrame* a, bool m)
+      : audio_source(p), audio_frame(a), muted(m) {}
+  MixerAudioSource* audio_source;
+  AudioFrame* audio_frame;
+  bool muted;
 };
+
+typedef std::list<AudioSourceWithFrame*> AudioSourceWithFrameList;
 
 // Mix |frame| into |mixed_frame|, with saturation protection and upmixing.
 // These effects are applied to |frame| itself prior to mixing. Assumes that
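For reference, the deleted SourceFrame comparator implemented source selection
as a single sort: unmuted sources rank before muted ones, VAD-active before
inactive, and higher energy breaks the remaining ties; the mixer then takes
the sorted prefix. A standalone sketch of that ordering (Candidate, MixBefore
and PickSources are illustrative names, not part of the mixer's API):

    #include <algorithm>
    #include <cstddef>
    #include <cstdint>
    #include <vector>

    struct Candidate {
      bool muted;
      bool vad_active;
      uint32_t energy;  // Only meaningful when !muted.
    };

    // True if |a| should be mixed before |b|: unmuted beats muted,
    // VAD-active beats inactive, then higher energy wins.
    bool MixBefore(const Candidate& a, const Candidate& b) {
      if (a.muted != b.muted)
        return b.muted;
      if (a.vad_active != b.vad_active)
        return a.vad_active;
      return a.energy > b.energy;
    }

    // Sort all candidates and keep the first |max_mixed| of them.
    std::vector<Candidate> PickSources(std::vector<Candidate> all,
                                       size_t max_mixed) {
      std::sort(all.begin(), all.end(), MixBefore);
      if (all.size() > max_mixed)
        all.resize(max_mixed);
      return all;
    }

The struct and typedef added above restore the older bookkeeping style, in
which each passive frame stays paired with its source so the passive lists
can be backfilled later in UpdateToMix().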
@@ -196,6 +167,7 @@
   size_t remainingAudioSourcesAllowedToMix = kMaximumAmountOfMixedAudioSources;
   RTC_DCHECK(thread_checker_.CalledOnValidThread());
   AudioFrameList mixList;
+  AudioFrameList rampOutList;
   AudioFrameList additionalFramesList;
   std::map<int, MixerAudioSource*> mixedAudioSourcesMap;
   {
@@ -242,17 +214,20 @@
       }
     }
 
-    mixList = UpdateToMix(remainingAudioSourcesAllowedToMix);
-    remainingAudioSourcesAllowedToMix -= mixList.size();
+    UpdateToMix(&mixList, &rampOutList, &mixedAudioSourcesMap,
+                &remainingAudioSourcesAllowedToMix);
+
     GetAdditionalAudio(&additionalFramesList);
+    UpdateMixedStatus(mixedAudioSourcesMap);
   }
 
   // TODO(aleloi): it might be better to decide the number of channels
   // with an API instead of dynamically.
 
   // Find the max channels over all mixing lists.
-  const size_t num_mixed_channels =
-      std::max(MaxNumChannels(&mixList), MaxNumChannels(&additionalFramesList));
+  const size_t num_mixed_channels = std::max(
+      MaxNumChannels(&mixList), std::max(MaxNumChannels(&additionalFramesList),
+                                         MaxNumChannels(&rampOutList)));
 
   audio_frame_for_mixing->UpdateFrame(
       -1, _timeStamp, NULL, 0, _outputFrequency, AudioFrame::kNormalSpeech,
@@ -270,6 +245,7 @@
   {
     CriticalSectionScoped cs(_crit.get());
     MixAnonomouslyFromList(audio_frame_for_mixing, additionalFramesList);
+    MixAnonomouslyFromList(audio_frame_for_mixing, rampOutList);
 
     if (audio_frame_for_mixing->samples_per_channel_ == 0) {
       // Nothing was mixed, set the audio samples to silence.
@@ -280,6 +256,10 @@
       LimitMixedAudio(audio_frame_for_mixing);
     }
   }
+
+  ClearAudioFrameList(&mixList);
+  ClearAudioFrameList(&rampOutList);
+  ClearAudioFrameList(&additionalFramesList);
 
   return;
 }
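The nested std::max above widens the mixed output to the largest channel
count found in any of the three lists (mix, additional, and ramp-out), so the
ramp-out frames are accounted for when sizing the output frame. A minimal
standalone sketch of that decision, with Frame and FrameList as stand-ins for
webrtc::AudioFrame and AudioFrameList:

    #include <algorithm>
    #include <cstddef>
    #include <list>

    struct Frame {
      size_t num_channels;
    };
    using FrameList = std::list<Frame>;

    // Largest channel count in one list; mixed output is at least mono.
    size_t MaxNumChannels(const FrameList& frames) {
      size_t max_channels = 1;
      for (const Frame& f : frames)
        max_channels = std::max(max_channels, f.num_channels);
      return max_channels;
    }

    size_t OutputChannels(const FrameList& mix, const FrameList& additional,
                          const FrameList& ramp_out) {
      return std::max(MaxNumChannels(mix),
                      std::max(MaxNumChannels(additional),
                               MaxNumChannels(ramp_out)));
    }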
@@ -446,62 +426,177 @@
   return highestFreq;
 }
 
-AudioFrameList NewAudioConferenceMixerImpl::UpdateToMix(
-    size_t maxAudioFrameCounter) const {
-  AudioFrameList result;
-  std::vector<SourceFrame> audioSourceMixingDataList;
-
-  // Get audio source audio and put it in the struct vector.
-  for (MixerAudioSource* audio_source : audio_source_list_) {
-    auto audio_frame_with_info = audio_source->GetAudioFrameWithMuted(
-        _id, static_cast<int>(_outputFrequency));
-
-    auto audio_frame_info = audio_frame_with_info.audio_frame_info;
-    AudioFrame* audio_source_audio_frame = audio_frame_with_info.audio_frame;
-
-    if (audio_frame_info == MixerAudioSource::AudioFrameInfo::kError) {
+void NewAudioConferenceMixerImpl::UpdateToMix(
+    AudioFrameList* mixList,
+    AudioFrameList* rampOutList,
+    std::map<int, MixerAudioSource*>* mixAudioSourceList,
+    size_t* maxAudioFrameCounter) const {
+  WEBRTC_TRACE(kTraceStream, kTraceAudioMixerServer, _id,
+               "UpdateToMix(mixList,rampOutList,mixAudioSourceList,%d)",
+               static_cast<int>(*maxAudioFrameCounter));
+  const size_t mixListStartSize = mixList->size();
+  AudioFrameList activeList;
+  // Struct needed by the passive lists to keep track of which AudioFrame
+  // belongs to which MixerAudioSource.
+  AudioSourceWithFrameList passiveWasNotMixedList;
+  AudioSourceWithFrameList passiveWasMixedList;
+  for (MixerAudioSourceList::const_iterator audio_source =
+           audio_source_list_.begin();
+       audio_source != audio_source_list_.end(); ++audio_source) {
+    // Stop keeping track of passive audio sources if there are already
+    // enough audio sources available (they won't be mixed anyway).
+    bool mustAddToPassiveList =
+        (*maxAudioFrameCounter >
+         (activeList.size() + passiveWasMixedList.size() +
+          passiveWasNotMixedList.size()));
+
+    const bool wasMixed = (*audio_source)->_mixHistory->WasMixed();
+
+    auto audio_frame_with_info =
+        (*audio_source)->GetAudioFrameWithMuted(_id, _outputFrequency);
+    auto ret = audio_frame_with_info.audio_frame_info;
+    AudioFrame* audio_frame = audio_frame_with_info.audio_frame;
+    if (ret == MixerAudioSource::AudioFrameInfo::kError) {
+      continue;
+    }
+    const bool muted = (ret == MixerAudioSource::AudioFrameInfo::kMuted);
+    if (audio_source_list_.size() != 1) {
+      // TODO(wu): Issue 3390, add support for multiple audio sources case.
+      audio_frame->ntp_time_ms_ = -1;
+    }
+
+    // TODO(aleloi): this assert triggers in some test cases where SRTP is
+    // used, which prevents NetEQ from producing a VAD decision. Temporarily
+    // disable this assert until the problem is fixed on a higher level.
+    // RTC_DCHECK_NE(audio_frame->vad_activity_, AudioFrame::kVadUnknown);
+    if (audio_frame->vad_activity_ == AudioFrame::kVadUnknown) {
       WEBRTC_TRACE(kTraceWarning, kTraceAudioMixerServer, _id,
-                   "failed to GetAudioFrameWithMuted() from participant");
-      continue;
-    }
-    audioSourceMixingDataList.emplace_back(
-        audio_source, audio_source_audio_frame,
-        audio_frame_info == MixerAudioSource::AudioFrameInfo::kMuted,
-        audio_source->_mixHistory->WasMixed());
-  }
-
-  // Sort frames by sorting function.
-  std::sort(audioSourceMixingDataList.begin(), audioSourceMixingDataList.end(),
-            std::mem_fn(&SourceFrame::shouldMixBefore));
-
-  // Go through list in order and put things in mixList.
-  for (SourceFrame& p : audioSourceMixingDataList) {
-    // Filter muted.
-    if (p.muted_) {
-      p.audio_source_->_mixHistory->SetIsMixed(false);
-      continue;
-    }
-
-    // Add frame to result vector for mixing.
-    bool is_mixed = false;
-    if (maxAudioFrameCounter > 0) {
-      --maxAudioFrameCounter;
-      if (!p.was_mixed_before_) {
-        RampIn(*p.audio_frame_);
+                   "invalid VAD state from audio source");
+    }
+
+    if (audio_frame->vad_activity_ == AudioFrame::kVadActive) {
+      if (!wasMixed && !muted) {
+        RampIn(*audio_frame);
       }
-      result.emplace_back(p.audio_frame_, false);
-      is_mixed = true;
-    }
-
-    // Ramp out unmuted.
-    if (p.was_mixed_before_ && !is_mixed) {
-      RampOut(*p.audio_frame_);
-      result.emplace_back(p.audio_frame_, false);
-    }
-
-    p.audio_source_->_mixHistory->SetIsMixed(is_mixed);
-  }
-  return result;
+
+      if (activeList.size() >= *maxAudioFrameCounter) {
+        // There are already more active audio sources than should be
+        // mixed. Only keep the ones with the highest energy.
+        AudioFrameList::iterator replaceItem;
+        uint32_t lowestEnergy = muted ? 0 : CalculateEnergy(*audio_frame);
+
+        bool found_replace_item = false;
+        for (AudioFrameList::iterator iter = activeList.begin();
+             iter != activeList.end(); ++iter) {
+          const uint32_t energy = muted ? 0 : CalculateEnergy(*iter->frame);
+          if (energy < lowestEnergy) {
+            replaceItem = iter;
+            lowestEnergy = energy;
+            found_replace_item = true;
+          }
+        }
+        if (found_replace_item) {
+          RTC_DCHECK(!muted);  // Cannot replace with a muted frame.
+          FrameAndMuteInfo replaceFrame = *replaceItem;
+
+          bool replaceWasMixed = false;
+          std::map<int, MixerAudioSource*>::const_iterator it =
+              mixAudioSourceList->find(replaceFrame.frame->id_);
+
+          // When a frame is pushed to |activeList| it is also pushed
+          // to |mixAudioSourceList| with the frame's id. This means
+          // that the find() call above should never fail.
+          RTC_DCHECK(it != mixAudioSourceList->end());
+          replaceWasMixed = it->second->_mixHistory->WasMixed();
+
+          mixAudioSourceList->erase(replaceFrame.frame->id_);
+          activeList.erase(replaceItem);
+
+          activeList.push_front(FrameAndMuteInfo(audio_frame, muted));
+          (*mixAudioSourceList)[audio_frame->id_] = *audio_source;
+          RTC_DCHECK_LE(mixAudioSourceList->size(),
+                        static_cast<size_t>(kMaximumAmountOfMixedAudioSources));
+
+          if (replaceWasMixed) {
+            if (!replaceFrame.muted) {
+              RampOut(*replaceFrame.frame);
+            }
+            rampOutList->push_back(replaceFrame);
+            RTC_DCHECK_LE(
+                rampOutList->size(),
+                static_cast<size_t>(kMaximumAmountOfMixedAudioSources));
+          }
+        } else {
+          if (wasMixed) {
+            if (!muted) {
+              RampOut(*audio_frame);
+            }
+            rampOutList->push_back(FrameAndMuteInfo(audio_frame, muted));
+            RTC_DCHECK_LE(
+                rampOutList->size(),
+                static_cast<size_t>(kMaximumAmountOfMixedAudioSources));
+          }
+        }
+      } else {
+        activeList.push_front(FrameAndMuteInfo(audio_frame, muted));
+        (*mixAudioSourceList)[audio_frame->id_] = *audio_source;
+        RTC_DCHECK_LE(mixAudioSourceList->size(),
+                      static_cast<size_t>(kMaximumAmountOfMixedAudioSources));
+      }
+    } else {
+      if (wasMixed) {
+        AudioSourceWithFrame* part_struct =
+            new AudioSourceWithFrame(*audio_source, audio_frame, muted);
+        passiveWasMixedList.push_back(part_struct);
+      } else if (mustAddToPassiveList) {
+        if (!muted) {
+          RampIn(*audio_frame);
+        }
+        AudioSourceWithFrame* part_struct =
+            new AudioSourceWithFrame(*audio_source, audio_frame, muted);
+        passiveWasNotMixedList.push_back(part_struct);
+      }
+    }
+  }
+  RTC_DCHECK_LE(activeList.size(), *maxAudioFrameCounter);
+  // At this point it is known which audio sources should be mixed. Transfer
+  // this information to this function's output parameters.
+  for (AudioFrameList::const_iterator iter = activeList.begin();
+       iter != activeList.end(); ++iter) {
+    mixList->push_back(*iter);
+  }
+  activeList.clear();
+  // Always mix a constant number of AudioFrames. If there aren't enough
+  // active audio sources, mix passive ones, starting with those that were
+  // mixed last iteration.
+  for (AudioSourceWithFrameList::const_iterator iter =
+           passiveWasMixedList.begin();
+       iter != passiveWasMixedList.end(); ++iter) {
+    if (mixList->size() < *maxAudioFrameCounter + mixListStartSize) {
+      mixList->push_back(
+          FrameAndMuteInfo((*iter)->audio_frame, (*iter)->muted));
+      (*mixAudioSourceList)[(*iter)->audio_frame->id_] = (*iter)->audio_source;
+      RTC_DCHECK_LE(mixAudioSourceList->size(),
+                    static_cast<size_t>(kMaximumAmountOfMixedAudioSources));
+    }
+    delete *iter;
+  }
+  // And finally the ones that have not been mixed for a while.
+  for (AudioSourceWithFrameList::const_iterator iter =
+           passiveWasNotMixedList.begin();
+       iter != passiveWasNotMixedList.end(); ++iter) {
+    if (mixList->size() < *maxAudioFrameCounter + mixListStartSize) {
+      mixList->push_back(
+          FrameAndMuteInfo((*iter)->audio_frame, (*iter)->muted));
+      (*mixAudioSourceList)[(*iter)->audio_frame->id_] = (*iter)->audio_source;
+      RTC_DCHECK_LE(mixAudioSourceList->size(),
+                    static_cast<size_t>(kMaximumAmountOfMixedAudioSources));
+    }
+    delete *iter;
+  }
+  RTC_DCHECK_GE(*maxAudioFrameCounter + mixListStartSize, mixList->size());
+  *maxAudioFrameCounter += mixListStartSize - mixList->size();
 }
 
 void NewAudioConferenceMixerImpl::GetAdditionalAudio(
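The heart of the restored UpdateToMix() is the eviction step in the
VAD-active branch above: once |activeList| is full, a new frame only enters
by displacing the current lowest-energy entry, and a displaced frame that was
mixed last round is faded out via |rampOutList| rather than cut. A standalone
sketch of that policy (Entry, RampOut and TryReplaceLowestEnergy are
illustrative names, not the mixer's real types):

    #include <cstdint>
    #include <list>

    struct Entry {
      uint32_t energy;
      bool was_mixed_before;
    };

    void RampOut(Entry&) {
      // Stand-in for the real fade applied to the frame's samples.
    }

    // Returns true if |candidate| displaced an existing entry.
    bool TryReplaceLowestEnergy(std::list<Entry>* active,
                                Entry candidate,
                                std::list<Entry>* ramp_out) {
      auto lowest = active->end();
      uint32_t lowest_energy = candidate.energy;
      for (auto it = active->begin(); it != active->end(); ++it) {
        if (it->energy < lowest_energy) {
          lowest = it;
          lowest_energy = it->energy;
        }
      }
      if (lowest == active->end())
        return false;  // Candidate is no louder than any active entry.
      if (lowest->was_mixed_before) {
        RampOut(*lowest);  // Fade out instead of cutting abruptly.
        ramp_out->push_back(*lowest);
      }
      active->erase(lowest);
      active->push_front(candidate);
      return true;
    }

When the candidate does not displace anyone but was itself mixed last round,
the real code ramps the candidate out instead, so an audible source never
vanishes within a single frame.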
@@ -538,6 +633,38 @@
   }
 }
 
+void NewAudioConferenceMixerImpl::UpdateMixedStatus(
+    const std::map<int, MixerAudioSource*>& mixedAudioSourcesMap) const {
+  WEBRTC_TRACE(kTraceStream, kTraceAudioMixerServer, _id,
+               "UpdateMixedStatus(mixedAudioSourcesMap)");
+  RTC_DCHECK_LE(mixedAudioSourcesMap.size(),
+                static_cast<size_t>(kMaximumAmountOfMixedAudioSources));
+
+  // Loop through all audio sources. If they are in the mix map, they
+  // were mixed.
+  for (MixerAudioSourceList::const_iterator audio_source =
+           audio_source_list_.begin();
+       audio_source != audio_source_list_.end(); ++audio_source) {
+    bool isMixed = false;
+    for (std::map<int, MixerAudioSource*>::const_iterator it =
+             mixedAudioSourcesMap.begin();
+         it != mixedAudioSourcesMap.end(); ++it) {
+      if (it->second == *audio_source) {
+        isMixed = true;
+        break;
+      }
+    }
+    (*audio_source)->_mixHistory->SetIsMixed(isMixed);
+  }
+}
+
+void NewAudioConferenceMixerImpl::ClearAudioFrameList(
+    AudioFrameList* audioFrameList) const {
+  WEBRTC_TRACE(kTraceStream, kTraceAudioMixerServer, _id,
+               "ClearAudioFrameList(audioFrameList)");
+  audioFrameList->clear();
+}
+
 bool NewAudioConferenceMixerImpl::IsAudioSourceInList(
     const MixerAudioSource& audio_source,
     const MixerAudioSourceList& audioSourceList) const {
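UpdateMixedStatus(), restored in the last hunk, derives each source's mix
flag purely from map membership. A standalone sketch of the computation
(Source and the containers are illustrative stand-ins):

    #include <map>
    #include <vector>

    struct Source {
      bool mixed = false;
    };

    void UpdateMixedStatus(const std::vector<Source*>& sources,
                           const std::map<int, Source*>& mixed_by_id) {
      for (Source* source : sources) {
        bool is_mixed = false;
        // The map is keyed by frame id, not by source, so membership has
        // to be checked by scanning the values rather than with find().
        for (const auto& kv : mixed_by_id) {
          if (kv.second == source) {
            is_mixed = true;
            break;
          }
        }
        source->mixed = is_mixed;
      }
    }

The scan is O(sources * mixed), but the map is bounded by
kMaximumAmountOfMixedAudioSources, so the cost stays small in practice.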