Chromium Code Reviews| OLD | NEW |
|---|---|
| (Empty) | |
| 1 /* | |
| 2 * Copyright (c) 2017 The WebRTC project authors. All Rights Reserved. | |
| 3 * | |
| 4 * Use of this source code is governed by a BSD-style license | |
| 5 * that can be found in the LICENSE file in the root of the source | |
| 6 * tree. An additional intellectual property rights grant can be found | |
| 7 * in the file PATENTS. All contributing project authors may | |
| 8 * be found in the AUTHORS file in the root of the source tree. | |
| 9 */ | |
| 10 | |
| 11 #include "webrtc/modules/audio_processing/test/conversational_speech/simulator.h " | |
| 12 | |
| 13 #include <set> | |
| 14 #include <utility> | |
| 15 #include <vector> | |
| 16 | |
| 17 #include "webrtc/base/array_view.h" | |
| 18 #include "webrtc/base/constructormagic.h" | |
| 19 #include "webrtc/base/logging.h" | |
| 20 #include "webrtc/base/pathutils.h" | |
| 21 #include "webrtc/base/ptr_util.h" | |
| 22 #include "webrtc/common_audio/wav_file.h" | |
| 23 #include "webrtc/modules/audio_processing/test/conversational_speech/wavreader_i nterface.h" | |
| 24 | |
| 25 namespace webrtc { | |
| 26 namespace test { | |
| 27 namespace { | |
| 28 | |
| 29 using conversational_speech::MultiEndCall; | |
| 30 using conversational_speech::SpeakerOutputFilePaths; | |
| 31 using conversational_speech::WavReaderInterface; | |
| 32 | |
| 33 // Combines output path and speaker names to define the output file paths for | |
| 34 // the near-end and far=end audio tracks. | |
| 35 std::unique_ptr<std::map<std::string, SpeakerOutputFilePaths>> | |
|
minyue-webrtc
2017/04/07 13:24:30
I don't know the benefit of passing a unique_ptr o
AleBzk
2017/04/10 08:24:48
I'm not a move semantics expert, but I'd say that
| |
| 36 InitSpeakerOutputFilePaths(const std::set<std::string>& speaker_names, | |
| 37 const std::string& output_path) { | |
| 38 // Create map. | |
| 39 auto speaker_output_file_paths_map = rtc::MakeUnique< | |
| 40 std::map<std::string, SpeakerOutputFilePaths>>(); | |
| 41 | |
| 42 // Add near-end and far-end output paths into the map. | |
| 43 for (const auto& speaker_name : speaker_names) { | |
| 44 const rtc::Pathname near_end_path( | |
| 45 output_path, "s_" + speaker_name + "-near_end.wav"); | |
| 46 LOG(LS_VERBOSE) << "creating " << near_end_path.pathname(); | |
| 47 | |
| 48 const rtc::Pathname far_end_path( | |
| 49 output_path, "s_" + speaker_name + "-far_end.wav"); | |
| 50 LOG(LS_VERBOSE) << "creating " << far_end_path.pathname(); | |
| 51 | |
| 52 // Add to map. | |
| 53 speaker_output_file_paths_map->emplace( | |
| 54 std::piecewise_construct, | |
| 55 std::forward_as_tuple(speaker_name), | |
| 56 std::forward_as_tuple(near_end_path.pathname(), | |
| 57 far_end_path.pathname())); | |
| 58 } | |
| 59 | |
| 60 return speaker_output_file_paths_map; | |
| 61 } | |
| 62 | |
| 63 // Class that provides one WavWriter for the near-end and one for the far-end | |
| 64 // output track of a speaker. | |
| 65 class SpeakerWavWriters { | |
| 66 public: | |
| 67 SpeakerWavWriters( | |
| 68 const SpeakerOutputFilePaths& output_file_paths, int sample_rate) | |
| 69 : near_end_(output_file_paths.near_end, sample_rate, 1u), | |
| 70 far_end_(output_file_paths.far_end, sample_rate, 1u) {} | |
| 71 WavWriter& near_end() { | |
| 72 return near_end_; | |
| 73 } | |
| 74 WavWriter& far_end() { | |
| 75 return far_end_; | |
| 76 } | |
| 77 private: | |
| 78 WavWriter near_end_; | |
| 79 WavWriter far_end_; | |
| 80 | |
| 81 // RTC_DISALLOW_COPY_AND_ASSIGN(SpeakerWavWriters); | |
|
minyue-webrtc
2017/04/07 13:24:30
why commented out?
AleBzk
2017/04/10 08:24:48
yet another leftover. Removed.
| |
| 82 }; | |
| 83 | |
| 84 // Initializes one WavWriter instance for each speaker and both the near-end and | |
| 85 // far-end output tracks. | |
| 86 std::unique_ptr<std::map<std::string, SpeakerWavWriters>> | |
| 87 InitSpeakersWavWriters(const std::map<std::string, SpeakerOutputFilePaths>& | |
| 88 speaker_output_file_paths, int sample_rate) { | |
| 89 // Create map. | |
| 90 auto speaker_wav_writers_map = rtc::MakeUnique< | |
| 91 std::map<std::string, SpeakerWavWriters>>(); | |
| 92 | |
| 93 // Add SpeakerWavWriters instance into the map. | |
| 94 for (auto it = speaker_output_file_paths.begin(); | |
| 95 it != speaker_output_file_paths.end(); ++it) { | |
| 96 speaker_wav_writers_map->emplace( | |
| 97 std::piecewise_construct, | |
| 98 std::forward_as_tuple(it->first), | |
| 99 std::forward_as_tuple(it->second, sample_rate)); | |
| 100 } | |
| 101 | |
| 102 return speaker_wav_writers_map; | |
| 103 } | |
| 104 | |
| 105 // Reads all the samples for each audio track. | |
| 106 std::unique_ptr<std::map<std::string, std::vector<int16_t>>> PreloadAudioTracks( | |
| 107 const std::map<std::string, std::unique_ptr<WavReaderInterface>>& | |
| 108 audiotrack_readers) { | |
| 109 // Create map. | |
| 110 auto audiotracks_map = rtc::MakeUnique< | |
| 111 std::map<std::string, std::vector<int16_t>>>(); | |
| 112 | |
| 113 // Add audio track vectors. | |
| 114 for (auto it = audiotrack_readers.begin(); it != audiotrack_readers.end(); | |
| 115 ++it) { | |
| 116 // Add map entry. | |
| 117 audiotracks_map->emplace( | |
| 118 std::piecewise_construct, | |
| 119 std::forward_as_tuple(it->first), | |
| 120 std::forward_as_tuple(it->second->NumSamples())); | |
| 121 | |
| 122 // Read samples. | |
| 123 it->second->ReadInt16Samples(audiotracks_map->at(it->first)); | |
| 124 } | |
| 125 | |
| 126 return audiotracks_map; | |
| 127 } | |
| 128 | |
| 129 // Writes all the values in source_samples via wav_writer. If the number of | |
| 130 // previously written samples in wav_writer is less than interval.begin, it adds | |
|
minyue-webrtc
2017/04/07 13:24:31
|interval_begin|, (1. underscore, 2. put || on var
AleBzk
2017/04/10 08:24:48
Done.
| |
| 131 // zeros as left padding. The padding corresponds to intervals during which a | |
| 132 // speaker is not active. | |
| 133 void PadLeftWriteChunk(const std::vector<int16_t>& source_samples, | |
|
minyue-webrtc
2017/04/07 13:24:30
consider using ArrayView instead of vector
AleBzk
2017/04/10 08:24:48
Done.
| |
| 134 std::size_t interval_begin, WavWriter* wav_writer) { | |
|
minyue-webrtc
2017/04/07 13:24:30
no need for std::
AleBzk
2017/04/10 08:24:48
Done.
| |
| 135 // Add left padding. | |
| 136 RTC_CHECK(wav_writer); | |
| 137 std::size_t padding_size = interval_begin - wav_writer->num_samples(); | |
| 138 RTC_CHECK(padding_size >= 0); | |
|
minyue-webrtc
2017/04/07 13:24:30
size_t never is negative
RTC_CHECK_GE(interval_be
AleBzk
2017/04/10 08:24:48
Done.
| |
| 139 if (padding_size > 0) { | |
|
minyue-webrtc
2017/04/07 13:24:30
no need for "if" if you check before
AleBzk
2017/04/10 08:24:48
I still need it because padding_size can be 0. If
| |
| 140 const std::vector<int16_t> padding(padding_size, 0); | |
| 141 wav_writer->WriteSamples(padding.data(), padding_size); | |
| 142 } | |
| 143 | |
| 144 // Write source samples. | |
| 145 wav_writer->WriteSamples(source_samples.data(), source_samples.size()); | |
| 146 } | |
| 147 | |
| 148 // Appends zeros via wav_writer. The number of zeros is always non-negative and | |
| 149 // equal to the difference between the previously written samples and | |
| 150 // duration_samples. | |
| 151 void PadRight(WavWriter* wav_writer, std::size_t duration_samples) { | |
|
minyue-webrtc
2017/04/07 13:24:30
duration is normally a time concept. Say either du
minyue-webrtc
2017/04/07 13:24:31
This looks similar to PadLeftWriteChunk but functi
AleBzk
2017/04/10 08:24:48
duration_samples -> pad_samples done
PadRight ->
| |
| 152 RTC_CHECK(wav_writer); | |
| 153 std::size_t padding_size = duration_samples - wav_writer->num_samples(); | |
| 154 RTC_CHECK(padding_size >= 0); | |
|
minyue-webrtc
2017/04/07 13:24:31
again, checking something always true :)
AleBzk
2017/04/10 08:24:48
Done.
| |
| 155 if (padding_size > 0) { | |
| 156 const std::vector<int16_t> padding(padding_size, 0); | |
| 157 wav_writer->WriteSamples(padding.data(), padding_size); | |
| 158 } | |
| 159 } | |
| 160 | |
| 161 } // namespace | |
| 162 | |
| 163 namespace conversational_speech { | |
| 164 | |
| 165 std::unique_ptr<std::map<std::string, SpeakerOutputFilePaths>> Simulate( | |
|
minyue-webrtc
2017/04/07 13:24:30
Are you not gonna write this in any class?
minyue-webrtc
2017/04/07 13:24:31
and same comment on unique_ptr<map>
AleBzk
2017/04/10 08:24:48
Are you not gonna write this in any class?
No. In
| |
| 166 const MultiEndCall& multiend_call, const std::string& output_path) { | |
| 167 // Set output file paths and initialize wav writers. | |
| 168 const auto& speaker_names = multiend_call.speaker_names(); | |
| 169 auto speaker_output_file_paths = InitSpeakerOutputFilePaths( | |
| 170 speaker_names, output_path); | |
| 171 auto speakers_wav_writers = InitSpeakersWavWriters( | |
| 172 *speaker_output_file_paths, multiend_call.sample_rate()); | |
| 173 | |
| 174 // Preload all the input audio tracks. | |
| 175 const auto& audiotrack_readers = multiend_call.audiotrack_readers(); | |
| 176 auto audiotracks = PreloadAudioTracks(audiotrack_readers); | |
| 177 | |
| 178 // TODO(alessiob): When speaker_names.size() == 2, near-end and far-end | |
| 179 // across the 2 speakers are symmetric; hence, the code below could be | |
| 180 // replaced by only creating the near-end or the far-end. However, this would | |
| 181 // require to split the unit tests and document the behavior in README.md. | |
| 182 // In practice, it should not be an issue since the files are not expected to | |
| 183 // be signinificant. | |
| 184 | |
| 185 // Write near-end and far-end output tracks. | |
| 186 const auto& speaking_turns = multiend_call.speaking_turns(); | |
| 187 for (const auto& speaking_turn : speaking_turns) { | |
| 188 const std::string& active_speaker_name = speaking_turn.speaker_name; | |
| 189 auto source_audiotrack = audiotracks->at( | |
| 190 speaking_turn.audiotrack_file_name); | |
| 191 | |
| 192 // Write active speaker's chunk to active speaker's near-end. | |
| 193 PadLeftWriteChunk(source_audiotrack, speaking_turn.begin, | |
| 194 &speakers_wav_writers->at( | |
| 195 active_speaker_name).near_end()); | |
| 196 | |
| 197 // Write active speaker's chunk to other participants' far-ends. | |
| 198 for (const std::string& speaker_name : speaker_names) { | |
| 199 if (speaker_name == active_speaker_name) | |
| 200 continue; | |
| 201 PadLeftWriteChunk(source_audiotrack, speaking_turn.begin, | |
| 202 &speakers_wav_writers->at(speaker_name).far_end()); | |
| 203 } | |
| 204 } | |
| 205 | |
| 206 // Finalize all the output tracks with right padding. | |
| 207 // This is required to make all the output tracks duration equal. | |
| 208 std::size_t duration_samples = multiend_call.total_duration_samples(); | |
| 209 for (const std::string& speaker_name : speaker_names) { | |
| 210 PadRight(&speakers_wav_writers->at(speaker_name).near_end(), | |
| 211 duration_samples); | |
| 212 PadRight(&speakers_wav_writers->at(speaker_name).far_end(), | |
| 213 duration_samples); | |
| 214 } | |
| 215 | |
| 216 return speaker_output_file_paths; | |
| 217 } | |
| 218 | |
| 219 } // namespace conversational_speech | |
| 220 } // namespace test | |
| 221 } // namespace webrtc | |
| OLD | NEW |