webrtc/modules/audio_processing/test/conversational_speech/simulator.cc - Issue 2790933002: Conversational speech tool, simulator + unit tests

Side by Side Diff: webrtc/modules/audio_processing/test/conversational_speech/simulator.cc

Issue 2790933002: Conversational speech tool, simulator + unit tests (Closed)

Patch Set: Using AppendFolder() to build paths to folders Created 3 years, 8 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

« webrtc/modules/audio_processing/test/conversational_speech/simulator.h ('K') | « webrtc/modules/audio_processing/test/conversational_speech/simulator.h ('k') | no next file » | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

OLD	NEW
(Empty)
	1 /*

	2 * Copyright (c) 2017 The WebRTC project authors. All Rights Reserved.

	3 *

	4 * Use of this source code is governed by a BSD-style license

	5 * that can be found in the LICENSE file in the root of the source

	6 * tree. An additional intellectual property rights grant can be found

	7 * in the file PATENTS. All contributing project authors may

	8 * be found in the AUTHORS file in the root of the source tree.

	9 */

	10

	#include "webrtc/modules/audio_processing/test/conversational_speech/simulator.h"

	#include <set>
	#include <utility>
	#include <vector>

	#include "webrtc/base/array_view.h"
	#include "webrtc/base/checks.h"
	#include "webrtc/base/constructormagic.h"
	#include "webrtc/base/logging.h"
	#include "webrtc/base/pathutils.h"
	#include "webrtc/base/ptr_util.h"
	#include "webrtc/common_audio/wav_file.h"
	#include "webrtc/modules/audio_processing/test/conversational_speech/wavreader_interface.h"

	24

	25 namespace webrtc {

	26 namespace test {

	27 namespace {

	28

	29 using conversational_speech::MultiEndCall;

	30 using conversational_speech::SpeakerOutputFilePaths;

	31 using conversational_speech::WavReaderInterface;

	32

	33 // Combines output path and speaker names to define the output file paths for

	34 // the near-end and far=end audio tracks.

	35 std::unique_ptr<std::map<std::string, SpeakerOutputFilePaths>>
	minyue-webrtc 2017/04/07 13:24:30 I don't know the benefit of passing a unique_ptr o I don't know the benefit of passing a unique_ptr of a map. Map has clear copy-ctor, passing by value should not be bad. WDYT? AleBzk 2017/04/10 08:24:48 I'm not a move semantics expert, but I'd say that Show quoted text On 2017/04/07 13:24:30, minyue-webrtc wrote: > I don't know the benefit of passing a unique_ptr of a map. Map has clear > copy-ctor, passing by value should not be bad. WDYT? I'm not a move semantics expert, but I'd say that in this case returning a unique pointer should be more lightweight than copying a map - the map keys are strings, the values are pairs of strings. However, it's also true that the map is not expected huge. But I don't see too much overhead in the code for using unique pointers. This is why I personally prefer this solution. But please, let me know if the comparison above (namely, passing unique ptr vs copying a map) is wrong.
	36 InitSpeakerOutputFilePaths(const std::set<std::string>& speaker_names,

	37 const std::string& output_path) {

	38 // Create map.

	39 auto speaker_output_file_paths_map = rtc::MakeUnique<

	40 std::map<std::string, SpeakerOutputFilePaths>>();

	41

	42 // Add near-end and far-end output paths into the map.

	43 for (const auto& speaker_name : speaker_names) {

	44 const rtc::Pathname near_end_path(

	45 output_path, "s_" + speaker_name + "-near_end.wav");

	46 LOG(LS_VERBOSE) << "creating " << near_end_path.pathname();

	47

	48 const rtc::Pathname far_end_path(

	49 output_path, "s_" + speaker_name + "-far_end.wav");

	50 LOG(LS_VERBOSE) << "creating " << far_end_path.pathname();

	51

	52 // Add to map.

	53 speaker_output_file_paths_map->emplace(

	54 std::piecewise_construct,

	55 std::forward_as_tuple(speaker_name),

	56 std::forward_as_tuple(near_end_path.pathname(),

	57 far_end_path.pathname()));

	58 }

	59

	60 return speaker_output_file_paths_map;

	61 }

	62

	63 // Class that provides one WavWriter for the near-end and one for the far-end

	64 // output track of a speaker.

	65 class SpeakerWavWriters {

	66 public:

	67 SpeakerWavWriters(

	68 const SpeakerOutputFilePaths& output_file_paths, int sample_rate)

	69 : near_end_(output_file_paths.near_end, sample_rate, 1u),

	70 far_end_(output_file_paths.far_end, sample_rate, 1u) {}

	71 WavWriter& near_end() {

	72 return near_end_;

	73 }

	74 WavWriter& far_end() {

	75 return far_end_;

	76 }

	77 private:

	78 WavWriter near_end_;

	79 WavWriter far_end_;

	80

	81 // RTC_DISALLOW_COPY_AND_ASSIGN(SpeakerWavWriters);
	minyue-webrtc 2017/04/07 13:24:30 why commented out? why commented out? AleBzk 2017/04/10 08:24:48 yet another leftover. Removed. Show quoted text On 2017/04/07 13:24:30, minyue-webrtc wrote: > why commented out? yet another leftover. Removed.
	82 };

	83

	84 // Initializes one WavWriter instance for each speaker and both the near-end and

	85 // far-end output tracks.

	86 std::unique_ptr<std::map<std::string, SpeakerWavWriters>>

	87 InitSpeakersWavWriters(const std::map<std::string, SpeakerOutputFilePaths>&

	88 speaker_output_file_paths, int sample_rate) {

	89 // Create map.

	90 auto speaker_wav_writers_map = rtc::MakeUnique<

	91 std::map<std::string, SpeakerWavWriters>>();

	92

	93 // Add SpeakerWavWriters instance into the map.

	94 for (auto it = speaker_output_file_paths.begin();

	95 it != speaker_output_file_paths.end(); ++it) {

	96 speaker_wav_writers_map->emplace(

	97 std::piecewise_construct,

	98 std::forward_as_tuple(it->first),

	99 std::forward_as_tuple(it->second, sample_rate));

	100 }

	101

	102 return speaker_wav_writers_map;

	103 }

	104

	105 // Reads all the samples for each audio track.

	106 std::unique_ptr<std::map<std::string, std::vector<int16_t>>> PreloadAudioTracks(

	107 const std::map<std::string, std::unique_ptr<WavReaderInterface>>&

	108 audiotrack_readers) {

	109 // Create map.

	110 auto audiotracks_map = rtc::MakeUnique<

	111 std::map<std::string, std::vector<int16_t>>>();

	112

	113 // Add audio track vectors.

	114 for (auto it = audiotrack_readers.begin(); it != audiotrack_readers.end();

	115 ++it) {

	116 // Add map entry.

	117 audiotracks_map->emplace(

	118 std::piecewise_construct,

	119 std::forward_as_tuple(it->first),

	120 std::forward_as_tuple(it->second->NumSamples()));

	121

	122 // Read samples.

	123 it->second->ReadInt16Samples(audiotracks_map->at(it->first));

	124 }

	125

	126 return audiotracks_map;

	127 }

	128

	129 // Writes all the values in source_samples via wav_writer. If the number of

	130 // previously written samples in wav_writer is less than interval.begin, it adds
	minyue-webrtc 2017/04/07 13:24:31 \|interval_begin\|, (1. underscore, 2. put \|\| on var \|interval_begin\|, (1. underscore, 2. put \|\| on var names) AleBzk 2017/04/10 08:24:48 Done. Show quoted text On 2017/04/07 13:24:31, minyue-webrtc wrote: > \|interval_begin\|, (1. underscore, 2. put \|\| on var names) Done.
	131 // zeros as left padding. The padding corresponds to intervals during which a

	132 // speaker is not active.

	133 void PadLeftWriteChunk(const std::vector<int16_t>& source_samples,
	minyue-webrtc 2017/04/07 13:24:30 consider using ArrayView instead of vector consider using ArrayView instead of vector AleBzk 2017/04/10 08:24:48 Done. Show quoted text On 2017/04/07 13:24:30, minyue-webrtc wrote: > consider using ArrayView instead of vector Done.
	134 std::size_t interval_begin, WavWriter* wav_writer) {
	minyue-webrtc 2017/04/07 13:24:30 no need for std:: no need for std:: AleBzk 2017/04/10 08:24:48 Done. Show quoted text On 2017/04/07 13:24:30, minyue-webrtc wrote: > no need for std:: Done.
	135 // Add left padding.

	136 RTC_CHECK(wav_writer);

	137 std::size_t padding_size = interval_begin - wav_writer->num_samples();

	138 RTC_CHECK(padding_size >= 0);
	minyue-webrtc 2017/04/07 13:24:30 size_t never is negative RTC_CHECK_GE(interval_be size_t never is negative RTC_CHECK_GE(interval_begin, wav_writer->num_samples()) before subtraction AleBzk 2017/04/10 08:24:48 Done. Show quoted text On 2017/04/07 13:24:30, minyue-webrtc wrote: > size_t never is negative > > RTC_CHECK_GE(interval_begin, wav_writer->num_samples()) before subtraction Done.
	139 if (padding_size > 0) {
	minyue-webrtc 2017/04/07 13:24:30 no need for "if" if you check before no need for "if" if you check before AleBzk 2017/04/10 08:24:48 I still need it because padding_size can be 0. If Show quoted text On 2017/04/07 13:24:30, minyue-webrtc wrote: > no need for "if" if you check before I still need it because padding_size can be 0. If so, I don't have to write anything.
	140 const std::vector<int16_t> padding(padding_size, 0);

	141 wav_writer->WriteSamples(padding.data(), padding_size);

	142 }

	143

	144 // Write source samples.

	145 wav_writer->WriteSamples(source_samples.data(), source_samples.size());

	146 }

	147

	148 // Appends zeros via wav_writer. The number of zeros is always non-negative and

	149 // equal to the difference between the previously written samples and

	150 // duration_samples.

	151 void PadRight(WavWriter* wav_writer, std::size_t duration_samples) {
	minyue-webrtc 2017/04/07 13:24:30 duration is normally a time concept. Say either du duration is normally a time concept. Say either duration_ms or simply pad_samples minyue-webrtc 2017/04/07 13:24:31 This looks similar to PadLeftWriteChunk but functi This looks similar to PadLeftWriteChunk but function names differ too much AleBzk 2017/04/10 08:24:48 duration_samples -> pad_samples done PadRight -> Show quoted text On 2017/04/07 13:24:30, minyue-webrtc wrote: > duration is normally a time concept. Say either duration_ms or simply > pad_samples duration_samples -> pad_samples done PadRight -> PadRightWrite done I'm not using Chunk here because only zeros are written and no chunk is copied - as done instead in PadLeftWriteChunk.
	152 RTC_CHECK(wav_writer);

	153 std::size_t padding_size = duration_samples - wav_writer->num_samples();

	154 RTC_CHECK(padding_size >= 0);
	minyue-webrtc 2017/04/07 13:24:31 again, checking something always true :) again, checking something always true :) AleBzk 2017/04/10 08:24:48 Done. Show quoted text On 2017/04/07 13:24:31, minyue-webrtc wrote: > again, checking something always true :) Done.
	155 if (padding_size > 0) {

	156 const std::vector<int16_t> padding(padding_size, 0);

	157 wav_writer->WriteSamples(padding.data(), padding_size);

	158 }

	159 }

	160

	161 } // namespace

	162

	163 namespace conversational_speech {

	164

	165 std::unique_ptr<std::map<std::string, SpeakerOutputFilePaths>> Simulate(
	minyue-webrtc 2017/04/07 13:24:30 Are you not gonna write this in any class? Are you not gonna write this in any class? minyue-webrtc 2017/04/07 13:24:31 and same comment on unique_ptr<map> and same comment on unique_ptr<map> AleBzk 2017/04/10 08:24:48 Are you not gonna write this in any class? No. In Show quoted text On 2017/04/07 13:24:31, minyue-webrtc wrote: > and same comment on unique_ptr<map> Are you not gonna write this in any class? No. In this way, I'm hiding a lot of includes in the .cc file making .h lightweight to include. unique_ptr<map> See my previous answer. It applies here as well. Let me know what you think.
	166 const MultiEndCall& multiend_call, const std::string& output_path) {

	167 // Set output file paths and initialize wav writers.

	168 const auto& speaker_names = multiend_call.speaker_names();

	169 auto speaker_output_file_paths = InitSpeakerOutputFilePaths(

	170 speaker_names, output_path);

	171 auto speakers_wav_writers = InitSpeakersWavWriters(

	172 *speaker_output_file_paths, multiend_call.sample_rate());

	173

	174 // Preload all the input audio tracks.

	175 const auto& audiotrack_readers = multiend_call.audiotrack_readers();

	176 auto audiotracks = PreloadAudioTracks(audiotrack_readers);

	177

	178 // TODO(alessiob): When speaker_names.size() == 2, near-end and far-end

	179 // across the 2 speakers are symmetric; hence, the code below could be

	180 // replaced by only creating the near-end or the far-end. However, this would

	181 // require to split the unit tests and document the behavior in README.md.

	182 // In practice, it should not be an issue since the files are not expected to

	183 // be signinificant.

	184

	185 // Write near-end and far-end output tracks.

	186 const auto& speaking_turns = multiend_call.speaking_turns();

	187 for (const auto& speaking_turn : speaking_turns) {

	188 const std::string& active_speaker_name = speaking_turn.speaker_name;

	189 auto source_audiotrack = audiotracks->at(

	190 speaking_turn.audiotrack_file_name);

	191

	192 // Write active speaker's chunk to active speaker's near-end.

	193 PadLeftWriteChunk(source_audiotrack, speaking_turn.begin,

	194 &speakers_wav_writers->at(

	195 active_speaker_name).near_end());

	196

	197 // Write active speaker's chunk to other participants' far-ends.

	198 for (const std::string& speaker_name : speaker_names) {

	199 if (speaker_name == active_speaker_name)

	200 continue;

	201 PadLeftWriteChunk(source_audiotrack, speaking_turn.begin,

	202 &speakers_wav_writers->at(speaker_name).far_end());

	203 }

	204 }

	205

	206 // Finalize all the output tracks with right padding.

	207 // This is required to make all the output tracks duration equal.

	208 std::size_t duration_samples = multiend_call.total_duration_samples();

	209 for (const std::string& speaker_name : speaker_names) {

	210 PadRight(&speakers_wav_writers->at(speaker_name).near_end(),

	211 duration_samples);

	212 PadRight(&speakers_wav_writers->at(speaker_name).far_end(),

	213 duration_samples);

	214 }

	215

	216 return speaker_output_file_paths;

	217 }

	218

	219 } // namespace conversational_speech

	220 } // namespace test

	221 } // namespace webrtc

OLD	NEW