Index: webrtc/modules/interface/module_common_types.h |
diff --git a/webrtc/modules/interface/module_common_types.h b/webrtc/modules/interface/module_common_types.h |
deleted file mode 100644 |
index 8d968707038267e16ad1fe2e6e1355a35f395a18..0000000000000000000000000000000000000000 |
--- a/webrtc/modules/interface/module_common_types.h |
+++ /dev/null |
@@ -1,812 +0,0 @@ |
-/* |
- * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. |
- * |
- * Use of this source code is governed by a BSD-style license |
- * that can be found in the LICENSE file in the root of the source |
- * tree. An additional intellectual property rights grant can be found |
- * in the file PATENTS. All contributing project authors may |
- * be found in the AUTHORS file in the root of the source tree. |
- */ |
- |
-#ifndef WEBRTC_MODULES_INCLUDE_MODULE_COMMON_TYPES_H_ |
-#define WEBRTC_MODULES_INCLUDE_MODULE_COMMON_TYPES_H_ |
- |
-#pragma message("WARNING: webrtc/modules/include is DEPRECATED; use webrtc/modules/include") |
- |
-#include <assert.h> |
-#include <string.h> // memcpy |
- |
-#include <algorithm> |
-#include <limits> |
- |
-#include "webrtc/base/constructormagic.h" |
-#include "webrtc/common_types.h" |
-#include "webrtc/common_video/rotation.h" |
-#include "webrtc/typedefs.h" |
- |
-namespace webrtc { |
- |
-struct RTPAudioHeader { |
- uint8_t numEnergy; // number of valid entries in arrOfEnergy |
- uint8_t arrOfEnergy[kRtpCsrcSize]; // one energy byte (0-9) per channel |
- bool isCNG; // is this CNG |
- uint8_t channel; // number of channels 2 = stereo |
-}; |
- |
-const int16_t kNoPictureId = -1; |
-const int16_t kMaxOneBytePictureId = 0x7F; // 7 bits |
-const int16_t kMaxTwoBytePictureId = 0x7FFF; // 15 bits |
-const int16_t kNoTl0PicIdx = -1; |
-const uint8_t kNoTemporalIdx = 0xFF; |
-const uint8_t kNoSpatialIdx = 0xFF; |
-const uint8_t kNoGofIdx = 0xFF; |
-const size_t kMaxVp9RefPics = 3; |
-const size_t kMaxVp9FramesInGof = 0xFF; // 8 bits |
-const size_t kMaxVp9NumberOfSpatialLayers = 8; |
-const int kNoKeyIdx = -1; |
- |
-struct RTPVideoHeaderVP8 { |
- void InitRTPVideoHeaderVP8() { |
- nonReference = false; |
- pictureId = kNoPictureId; |
- tl0PicIdx = kNoTl0PicIdx; |
- temporalIdx = kNoTemporalIdx; |
- layerSync = false; |
- keyIdx = kNoKeyIdx; |
- partitionId = 0; |
- beginningOfPartition = false; |
- } |
- |
- bool nonReference; // Frame is discardable. |
- int16_t pictureId; // Picture ID index, 15 bits; |
- // kNoPictureId if PictureID does not exist. |
- int16_t tl0PicIdx; // TL0PIC_IDX, 8 bits; |
- // kNoTl0PicIdx means no value provided. |
- uint8_t temporalIdx; // Temporal layer index, or kNoTemporalIdx. |
- bool layerSync; // This frame is a layer sync frame. |
- // Disabled if temporalIdx == kNoTemporalIdx. |
- int keyIdx; // 5 bits; kNoKeyIdx means not used. |
- int partitionId; // VP8 partition ID |
- bool beginningOfPartition; // True if this packet is the first |
- // in a VP8 partition. Otherwise false |
-}; |
- |
-enum TemporalStructureMode { |
- kTemporalStructureMode1, // 1 temporal layer structure - i.e., IPPP... |
- kTemporalStructureMode2, // 2 temporal layers 0-1-0-1... |
- kTemporalStructureMode3 // 3 temporal layers 0-2-1-2-0-2-1-2... |
-}; |
- |
-struct GofInfoVP9 { |
- void SetGofInfoVP9(TemporalStructureMode tm) { |
- switch (tm) { |
- case kTemporalStructureMode1: |
- num_frames_in_gof = 1; |
- temporal_idx[0] = 0; |
- temporal_up_switch[0] = false; |
- num_ref_pics[0] = 1; |
- pid_diff[0][0] = 1; |
- break; |
- case kTemporalStructureMode2: |
- num_frames_in_gof = 2; |
- temporal_idx[0] = 0; |
- temporal_up_switch[0] = false; |
- num_ref_pics[0] = 1; |
- pid_diff[0][0] = 2; |
- |
- temporal_idx[1] = 1; |
- temporal_up_switch[1] = true; |
- num_ref_pics[1] = 1; |
- pid_diff[1][0] = 1; |
- break; |
- case kTemporalStructureMode3: |
- num_frames_in_gof = 4; |
- temporal_idx[0] = 0; |
- temporal_up_switch[0] = false; |
- num_ref_pics[0] = 1; |
- pid_diff[0][0] = 4; |
- |
- temporal_idx[1] = 2; |
- temporal_up_switch[1] = true; |
- num_ref_pics[1] = 1; |
- pid_diff[1][0] = 1; |
- |
- temporal_idx[2] = 1; |
- temporal_up_switch[2] = true; |
- num_ref_pics[2] = 1; |
- pid_diff[2][0] = 2; |
- |
- temporal_idx[3] = 2; |
- temporal_up_switch[3] = false; |
- num_ref_pics[3] = 2; |
- pid_diff[3][0] = 1; |
- pid_diff[3][1] = 2; |
- break; |
- default: |
- assert(false); |
- } |
- } |
- |
- void CopyGofInfoVP9(const GofInfoVP9& src) { |
- num_frames_in_gof = src.num_frames_in_gof; |
- for (size_t i = 0; i < num_frames_in_gof; ++i) { |
- temporal_idx[i] = src.temporal_idx[i]; |
- temporal_up_switch[i] = src.temporal_up_switch[i]; |
- num_ref_pics[i] = src.num_ref_pics[i]; |
- for (uint8_t r = 0; r < num_ref_pics[i]; ++r) { |
- pid_diff[i][r] = src.pid_diff[i][r]; |
- } |
- } |
- } |
- |
- size_t num_frames_in_gof; |
- uint8_t temporal_idx[kMaxVp9FramesInGof]; |
- bool temporal_up_switch[kMaxVp9FramesInGof]; |
- uint8_t num_ref_pics[kMaxVp9FramesInGof]; |
- uint8_t pid_diff[kMaxVp9FramesInGof][kMaxVp9RefPics]; |
-}; |
- |
-struct RTPVideoHeaderVP9 { |
- void InitRTPVideoHeaderVP9() { |
- inter_pic_predicted = false; |
- flexible_mode = false; |
- beginning_of_frame = false; |
- end_of_frame = false; |
- ss_data_available = false; |
- picture_id = kNoPictureId; |
- max_picture_id = kMaxTwoBytePictureId; |
- tl0_pic_idx = kNoTl0PicIdx; |
- temporal_idx = kNoTemporalIdx; |
- spatial_idx = kNoSpatialIdx; |
- temporal_up_switch = false; |
- inter_layer_predicted = false; |
- gof_idx = kNoGofIdx; |
- num_ref_pics = 0; |
- num_spatial_layers = 1; |
- } |
- |
- bool inter_pic_predicted; // This layer frame is dependent on previously |
- // coded frame(s). |
- bool flexible_mode; // This frame is in flexible mode. |
- bool beginning_of_frame; // True if this packet is the first in a VP9 layer |
- // frame. |
- bool end_of_frame; // True if this packet is the last in a VP9 layer frame. |
- bool ss_data_available; // True if SS data is available in this payload |
- // descriptor. |
- int16_t picture_id; // PictureID index, 15 bits; |
- // kNoPictureId if PictureID does not exist. |
- int16_t max_picture_id; // Maximum picture ID index; either 0x7F or 0x7FFF; |
- int16_t tl0_pic_idx; // TL0PIC_IDX, 8 bits; |
- // kNoTl0PicIdx means no value provided. |
- uint8_t temporal_idx; // Temporal layer index, or kNoTemporalIdx. |
- uint8_t spatial_idx; // Spatial layer index, or kNoSpatialIdx. |
- bool temporal_up_switch; // True if upswitch to higher frame rate is possible |
- // starting from this frame. |
- bool inter_layer_predicted; // Frame is dependent on directly lower spatial |
- // layer frame. |
- |
- uint8_t gof_idx; // Index to predefined temporal frame info in SS data. |
- |
- uint8_t num_ref_pics; // Number of reference pictures used by this layer |
- // frame. |
- uint8_t pid_diff[kMaxVp9RefPics]; // P_DIFF signaled to derive the PictureID |
- // of the reference pictures. |
- int16_t ref_picture_id[kMaxVp9RefPics]; // PictureID of reference pictures. |
- |
- // SS data. |
- size_t num_spatial_layers; // Always populated. |
- bool spatial_layer_resolution_present; |
- uint16_t width[kMaxVp9NumberOfSpatialLayers]; |
- uint16_t height[kMaxVp9NumberOfSpatialLayers]; |
- GofInfoVP9 gof; |
-}; |
- |
-// The packetization types that we support: single, aggregated, and fragmented. |
-enum H264PacketizationTypes { |
- kH264SingleNalu, // This packet contains a single NAL unit. |
- kH264StapA, // This packet contains STAP-A (single time |
- // aggregation) packets. If this packet has an |
- // associated NAL unit type, it'll be for the |
- // first such aggregated packet. |
- kH264FuA, // This packet contains a FU-A (fragmentation |
- // unit) packet, meaning it is a part of a frame |
- // that was too large to fit into a single packet. |
-}; |
- |
-struct RTPVideoHeaderH264 { |
- uint8_t nalu_type; // The NAL unit type. If this is a header for a |
- // fragmented packet, it's the NAL unit type of |
- // the original data. If this is the header for an |
- // aggregated packet, it's the NAL unit type of |
- // the first NAL unit in the packet. |
- H264PacketizationTypes packetization_type; |
-}; |
- |
-union RTPVideoTypeHeader { |
- RTPVideoHeaderVP8 VP8; |
- RTPVideoHeaderVP9 VP9; |
- RTPVideoHeaderH264 H264; |
-}; |
- |
-enum RtpVideoCodecTypes { |
- kRtpVideoNone, |
- kRtpVideoGeneric, |
- kRtpVideoVp8, |
- kRtpVideoVp9, |
- kRtpVideoH264 |
-}; |
-// Since RTPVideoHeader is used as a member of a union, it can't have a |
-// non-trivial default constructor. |
-struct RTPVideoHeader { |
- uint16_t width; // size |
- uint16_t height; |
- VideoRotation rotation; |
- |
- bool isFirstPacket; // first packet in frame |
- uint8_t simulcastIdx; // Index if the simulcast encoder creating |
- // this frame, 0 if not using simulcast. |
- RtpVideoCodecTypes codec; |
- RTPVideoTypeHeader codecHeader; |
-}; |
-union RTPTypeHeader { |
- RTPAudioHeader Audio; |
- RTPVideoHeader Video; |
-}; |
- |
-struct WebRtcRTPHeader { |
- RTPHeader header; |
- FrameType frameType; |
- RTPTypeHeader type; |
- // NTP time of the capture time in local timebase in milliseconds. |
- int64_t ntp_time_ms; |
-}; |
- |
-class RTPFragmentationHeader { |
- public: |
- RTPFragmentationHeader() |
- : fragmentationVectorSize(0), |
- fragmentationOffset(NULL), |
- fragmentationLength(NULL), |
- fragmentationTimeDiff(NULL), |
- fragmentationPlType(NULL) {}; |
- |
- ~RTPFragmentationHeader() { |
- delete[] fragmentationOffset; |
- delete[] fragmentationLength; |
- delete[] fragmentationTimeDiff; |
- delete[] fragmentationPlType; |
- } |
- |
- void CopyFrom(const RTPFragmentationHeader& src) { |
- if (this == &src) { |
- return; |
- } |
- |
- if (src.fragmentationVectorSize != fragmentationVectorSize) { |
- // new size of vectors |
- |
- // delete old |
- delete[] fragmentationOffset; |
- fragmentationOffset = NULL; |
- delete[] fragmentationLength; |
- fragmentationLength = NULL; |
- delete[] fragmentationTimeDiff; |
- fragmentationTimeDiff = NULL; |
- delete[] fragmentationPlType; |
- fragmentationPlType = NULL; |
- |
- if (src.fragmentationVectorSize > 0) { |
- // allocate new |
- if (src.fragmentationOffset) { |
- fragmentationOffset = new size_t[src.fragmentationVectorSize]; |
- } |
- if (src.fragmentationLength) { |
- fragmentationLength = new size_t[src.fragmentationVectorSize]; |
- } |
- if (src.fragmentationTimeDiff) { |
- fragmentationTimeDiff = new uint16_t[src.fragmentationVectorSize]; |
- } |
- if (src.fragmentationPlType) { |
- fragmentationPlType = new uint8_t[src.fragmentationVectorSize]; |
- } |
- } |
- // set new size |
- fragmentationVectorSize = src.fragmentationVectorSize; |
- } |
- |
- if (src.fragmentationVectorSize > 0) { |
- // copy values |
- if (src.fragmentationOffset) { |
- memcpy(fragmentationOffset, src.fragmentationOffset, |
- src.fragmentationVectorSize * sizeof(size_t)); |
- } |
- if (src.fragmentationLength) { |
- memcpy(fragmentationLength, src.fragmentationLength, |
- src.fragmentationVectorSize * sizeof(size_t)); |
- } |
- if (src.fragmentationTimeDiff) { |
- memcpy(fragmentationTimeDiff, src.fragmentationTimeDiff, |
- src.fragmentationVectorSize * sizeof(uint16_t)); |
- } |
- if (src.fragmentationPlType) { |
- memcpy(fragmentationPlType, src.fragmentationPlType, |
- src.fragmentationVectorSize * sizeof(uint8_t)); |
- } |
- } |
- } |
- |
- void VerifyAndAllocateFragmentationHeader(const size_t size) { |
- assert(size <= std::numeric_limits<uint16_t>::max()); |
- const uint16_t size16 = static_cast<uint16_t>(size); |
- if (fragmentationVectorSize < size16) { |
- uint16_t oldVectorSize = fragmentationVectorSize; |
- { |
- // offset |
- size_t* oldOffsets = fragmentationOffset; |
- fragmentationOffset = new size_t[size16]; |
- memset(fragmentationOffset + oldVectorSize, 0, |
- sizeof(size_t) * (size16 - oldVectorSize)); |
- // copy old values |
- memcpy(fragmentationOffset, oldOffsets, |
- sizeof(size_t) * oldVectorSize); |
- delete[] oldOffsets; |
- } |
- // length |
- { |
- size_t* oldLengths = fragmentationLength; |
- fragmentationLength = new size_t[size16]; |
- memset(fragmentationLength + oldVectorSize, 0, |
- sizeof(size_t) * (size16 - oldVectorSize)); |
- memcpy(fragmentationLength, oldLengths, |
- sizeof(size_t) * oldVectorSize); |
- delete[] oldLengths; |
- } |
- // time diff |
- { |
- uint16_t* oldTimeDiffs = fragmentationTimeDiff; |
- fragmentationTimeDiff = new uint16_t[size16]; |
- memset(fragmentationTimeDiff + oldVectorSize, 0, |
- sizeof(uint16_t) * (size16 - oldVectorSize)); |
- memcpy(fragmentationTimeDiff, oldTimeDiffs, |
- sizeof(uint16_t) * oldVectorSize); |
- delete[] oldTimeDiffs; |
- } |
- // payload type |
- { |
- uint8_t* oldTimePlTypes = fragmentationPlType; |
- fragmentationPlType = new uint8_t[size16]; |
- memset(fragmentationPlType + oldVectorSize, 0, |
- sizeof(uint8_t) * (size16 - oldVectorSize)); |
- memcpy(fragmentationPlType, oldTimePlTypes, |
- sizeof(uint8_t) * oldVectorSize); |
- delete[] oldTimePlTypes; |
- } |
- fragmentationVectorSize = size16; |
- } |
- } |
- |
- uint16_t fragmentationVectorSize; // Number of fragmentations |
- size_t* fragmentationOffset; // Offset of pointer to data for each |
- // fragmentation |
- size_t* fragmentationLength; // Data size for each fragmentation |
- uint16_t* fragmentationTimeDiff; // Timestamp difference relative "now" for |
- // each fragmentation |
- uint8_t* fragmentationPlType; // Payload type of each fragmentation |
- |
- private: |
- RTC_DISALLOW_COPY_AND_ASSIGN(RTPFragmentationHeader); |
-}; |
- |
-struct RTCPVoIPMetric { |
- // RFC 3611 4.7 |
- uint8_t lossRate; |
- uint8_t discardRate; |
- uint8_t burstDensity; |
- uint8_t gapDensity; |
- uint16_t burstDuration; |
- uint16_t gapDuration; |
- uint16_t roundTripDelay; |
- uint16_t endSystemDelay; |
- uint8_t signalLevel; |
- uint8_t noiseLevel; |
- uint8_t RERL; |
- uint8_t Gmin; |
- uint8_t Rfactor; |
- uint8_t extRfactor; |
- uint8_t MOSLQ; |
- uint8_t MOSCQ; |
- uint8_t RXconfig; |
- uint16_t JBnominal; |
- uint16_t JBmax; |
- uint16_t JBabsMax; |
-}; |
- |
-// Types for the FEC packet masks. The type |kFecMaskRandom| is based on a |
-// random loss model. The type |kFecMaskBursty| is based on a bursty/consecutive |
-// loss model. The packet masks are defined in |
-// modules/rtp_rtcp/fec_private_tables_random(bursty).h |
-enum FecMaskType { |
- kFecMaskRandom, |
- kFecMaskBursty, |
-}; |
- |
-// Struct containing forward error correction settings. |
-struct FecProtectionParams { |
- int fec_rate; |
- bool use_uep_protection; |
- int max_fec_frames; |
- FecMaskType fec_mask_type; |
-}; |
- |
-// Interface used by the CallStats class to distribute call statistics. |
-// Callbacks will be triggered as soon as the class has been registered to a |
-// CallStats object using RegisterStatsObserver. |
-class CallStatsObserver { |
- public: |
- virtual void OnRttUpdate(int64_t avg_rtt_ms, int64_t max_rtt_ms) = 0; |
- |
- virtual ~CallStatsObserver() {} |
-}; |
- |
-struct VideoContentMetrics { |
- VideoContentMetrics() |
- : motion_magnitude(0.0f), |
- spatial_pred_err(0.0f), |
- spatial_pred_err_h(0.0f), |
- spatial_pred_err_v(0.0f) {} |
- |
- void Reset() { |
- motion_magnitude = 0.0f; |
- spatial_pred_err = 0.0f; |
- spatial_pred_err_h = 0.0f; |
- spatial_pred_err_v = 0.0f; |
- } |
- float motion_magnitude; |
- float spatial_pred_err; |
- float spatial_pred_err_h; |
- float spatial_pred_err_v; |
-}; |
- |
-/* This class holds up to 60 ms of super-wideband (32 kHz) stereo audio. It |
- * allows for adding and subtracting frames while keeping track of the resulting |
- * states. |
- * |
- * Notes |
- * - The total number of samples in |data_| is |
- * samples_per_channel_ * num_channels_ |
- * |
- * - Stereo data is interleaved starting with the left channel. |
- * |
- * - The +operator assume that you would never add exactly opposite frames when |
- * deciding the resulting state. To do this use the -operator. |
- */ |
-class AudioFrame { |
- public: |
- // Stereo, 32 kHz, 60 ms (2 * 32 * 60) |
- static const size_t kMaxDataSizeSamples = 3840; |
- |
- enum VADActivity { |
- kVadActive = 0, |
- kVadPassive = 1, |
- kVadUnknown = 2 |
- }; |
- enum SpeechType { |
- kNormalSpeech = 0, |
- kPLC = 1, |
- kCNG = 2, |
- kPLCCNG = 3, |
- kUndefined = 4 |
- }; |
- |
- AudioFrame(); |
- virtual ~AudioFrame() {} |
- |
- // Resets all members to their default state (except does not modify the |
- // contents of |data_|). |
- void Reset(); |
- |
- // |interleaved_| is not changed by this method. |
- void UpdateFrame(int id, uint32_t timestamp, const int16_t* data, |
- size_t samples_per_channel, int sample_rate_hz, |
- SpeechType speech_type, VADActivity vad_activity, |
- int num_channels = 1, uint32_t energy = -1); |
- |
- AudioFrame& Append(const AudioFrame& rhs); |
- |
- void CopyFrom(const AudioFrame& src); |
- |
- void Mute(); |
- |
- AudioFrame& operator>>=(const int rhs); |
- AudioFrame& operator+=(const AudioFrame& rhs); |
- AudioFrame& operator-=(const AudioFrame& rhs); |
- |
- int id_; |
- // RTP timestamp of the first sample in the AudioFrame. |
- uint32_t timestamp_; |
- // Time since the first frame in milliseconds. |
- // -1 represents an uninitialized value. |
- int64_t elapsed_time_ms_; |
- // NTP time of the estimated capture time in local timebase in milliseconds. |
- // -1 represents an uninitialized value. |
- int64_t ntp_time_ms_; |
- int16_t data_[kMaxDataSizeSamples]; |
- size_t samples_per_channel_; |
- int sample_rate_hz_; |
- int num_channels_; |
- SpeechType speech_type_; |
- VADActivity vad_activity_; |
- // Note that there is no guarantee that |energy_| is correct. Any user of this |
- // member must verify that the value is correct. |
- // TODO(henrike) Remove |energy_|. |
- // See https://code.google.com/p/webrtc/issues/detail?id=3315. |
- uint32_t energy_; |
- bool interleaved_; |
- |
- private: |
- RTC_DISALLOW_COPY_AND_ASSIGN(AudioFrame); |
-}; |
- |
-inline AudioFrame::AudioFrame() |
- : data_() { |
- Reset(); |
-} |
- |
-inline void AudioFrame::Reset() { |
- id_ = -1; |
- // TODO(wu): Zero is a valid value for |timestamp_|. We should initialize |
- // to an invalid value, or add a new member to indicate invalidity. |
- timestamp_ = 0; |
- elapsed_time_ms_ = -1; |
- ntp_time_ms_ = -1; |
- samples_per_channel_ = 0; |
- sample_rate_hz_ = 0; |
- num_channels_ = 0; |
- speech_type_ = kUndefined; |
- vad_activity_ = kVadUnknown; |
- energy_ = 0xffffffff; |
- interleaved_ = true; |
-} |
- |
-inline void AudioFrame::UpdateFrame(int id, |
- uint32_t timestamp, |
- const int16_t* data, |
- size_t samples_per_channel, |
- int sample_rate_hz, |
- SpeechType speech_type, |
- VADActivity vad_activity, |
- int num_channels, |
- uint32_t energy) { |
- id_ = id; |
- timestamp_ = timestamp; |
- samples_per_channel_ = samples_per_channel; |
- sample_rate_hz_ = sample_rate_hz; |
- speech_type_ = speech_type; |
- vad_activity_ = vad_activity; |
- num_channels_ = num_channels; |
- energy_ = energy; |
- |
- assert(num_channels >= 0); |
- const size_t length = samples_per_channel * num_channels; |
- assert(length <= kMaxDataSizeSamples); |
- if (data != NULL) { |
- memcpy(data_, data, sizeof(int16_t) * length); |
- } else { |
- memset(data_, 0, sizeof(int16_t) * length); |
- } |
-} |
- |
-inline void AudioFrame::CopyFrom(const AudioFrame& src) { |
- if (this == &src) return; |
- |
- id_ = src.id_; |
- timestamp_ = src.timestamp_; |
- elapsed_time_ms_ = src.elapsed_time_ms_; |
- ntp_time_ms_ = src.ntp_time_ms_; |
- samples_per_channel_ = src.samples_per_channel_; |
- sample_rate_hz_ = src.sample_rate_hz_; |
- speech_type_ = src.speech_type_; |
- vad_activity_ = src.vad_activity_; |
- num_channels_ = src.num_channels_; |
- energy_ = src.energy_; |
- interleaved_ = src.interleaved_; |
- |
- assert(num_channels_ >= 0); |
- const size_t length = samples_per_channel_ * num_channels_; |
- assert(length <= kMaxDataSizeSamples); |
- memcpy(data_, src.data_, sizeof(int16_t) * length); |
-} |
- |
-inline void AudioFrame::Mute() { |
- memset(data_, 0, samples_per_channel_ * num_channels_ * sizeof(int16_t)); |
-} |
- |
-inline AudioFrame& AudioFrame::operator>>=(const int rhs) { |
- assert((num_channels_ > 0) && (num_channels_ < 3)); |
- if ((num_channels_ > 2) || (num_channels_ < 1)) return *this; |
- |
- for (size_t i = 0; i < samples_per_channel_ * num_channels_; i++) { |
- data_[i] = static_cast<int16_t>(data_[i] >> rhs); |
- } |
- return *this; |
-} |
- |
-inline AudioFrame& AudioFrame::Append(const AudioFrame& rhs) { |
- // Sanity check |
- assert((num_channels_ > 0) && (num_channels_ < 3)); |
- assert(interleaved_ == rhs.interleaved_); |
- if ((num_channels_ > 2) || (num_channels_ < 1)) return *this; |
- if (num_channels_ != rhs.num_channels_) return *this; |
- |
- if ((vad_activity_ == kVadActive) || rhs.vad_activity_ == kVadActive) { |
- vad_activity_ = kVadActive; |
- } else if (vad_activity_ == kVadUnknown || rhs.vad_activity_ == kVadUnknown) { |
- vad_activity_ = kVadUnknown; |
- } |
- if (speech_type_ != rhs.speech_type_) { |
- speech_type_ = kUndefined; |
- } |
- |
- size_t offset = samples_per_channel_ * num_channels_; |
- for (size_t i = 0; i < rhs.samples_per_channel_ * rhs.num_channels_; i++) { |
- data_[offset + i] = rhs.data_[i]; |
- } |
- samples_per_channel_ += rhs.samples_per_channel_; |
- return *this; |
-} |
- |
-namespace { |
-inline int16_t ClampToInt16(int32_t input) { |
- if (input < -0x00008000) { |
- return -0x8000; |
- } else if (input > 0x00007FFF) { |
- return 0x7FFF; |
- } else { |
- return static_cast<int16_t>(input); |
- } |
-} |
-} |
- |
-inline AudioFrame& AudioFrame::operator+=(const AudioFrame& rhs) { |
- // Sanity check |
- assert((num_channels_ > 0) && (num_channels_ < 3)); |
- assert(interleaved_ == rhs.interleaved_); |
- if ((num_channels_ > 2) || (num_channels_ < 1)) return *this; |
- if (num_channels_ != rhs.num_channels_) return *this; |
- |
- bool noPrevData = false; |
- if (samples_per_channel_ != rhs.samples_per_channel_) { |
- if (samples_per_channel_ == 0) { |
- // special case we have no data to start with |
- samples_per_channel_ = rhs.samples_per_channel_; |
- noPrevData = true; |
- } else { |
- return *this; |
- } |
- } |
- |
- if ((vad_activity_ == kVadActive) || rhs.vad_activity_ == kVadActive) { |
- vad_activity_ = kVadActive; |
- } else if (vad_activity_ == kVadUnknown || rhs.vad_activity_ == kVadUnknown) { |
- vad_activity_ = kVadUnknown; |
- } |
- |
- if (speech_type_ != rhs.speech_type_) speech_type_ = kUndefined; |
- |
- if (noPrevData) { |
- memcpy(data_, rhs.data_, |
- sizeof(int16_t) * rhs.samples_per_channel_ * num_channels_); |
- } else { |
- // IMPROVEMENT this can be done very fast in assembly |
- for (size_t i = 0; i < samples_per_channel_ * num_channels_; i++) { |
- int32_t wrap_guard = |
- static_cast<int32_t>(data_[i]) + static_cast<int32_t>(rhs.data_[i]); |
- data_[i] = ClampToInt16(wrap_guard); |
- } |
- } |
- energy_ = 0xffffffff; |
- return *this; |
-} |
- |
-inline AudioFrame& AudioFrame::operator-=(const AudioFrame& rhs) { |
- // Sanity check |
- assert((num_channels_ > 0) && (num_channels_ < 3)); |
- assert(interleaved_ == rhs.interleaved_); |
- if ((num_channels_ > 2) || (num_channels_ < 1)) return *this; |
- |
- if ((samples_per_channel_ != rhs.samples_per_channel_) || |
- (num_channels_ != rhs.num_channels_)) { |
- return *this; |
- } |
- if ((vad_activity_ != kVadPassive) || rhs.vad_activity_ != kVadPassive) { |
- vad_activity_ = kVadUnknown; |
- } |
- speech_type_ = kUndefined; |
- |
- for (size_t i = 0; i < samples_per_channel_ * num_channels_; i++) { |
- int32_t wrap_guard = |
- static_cast<int32_t>(data_[i]) - static_cast<int32_t>(rhs.data_[i]); |
- data_[i] = ClampToInt16(wrap_guard); |
- } |
- energy_ = 0xffffffff; |
- return *this; |
-} |
- |
-inline bool IsNewerSequenceNumber(uint16_t sequence_number, |
- uint16_t prev_sequence_number) { |
- // Distinguish between elements that are exactly 0x8000 apart. |
- // If s1>s2 and |s1-s2| = 0x8000: IsNewer(s1,s2)=true, IsNewer(s2,s1)=false |
- // rather than having IsNewer(s1,s2) = IsNewer(s2,s1) = false. |
- if (static_cast<uint16_t>(sequence_number - prev_sequence_number) == 0x8000) { |
- return sequence_number > prev_sequence_number; |
- } |
- return sequence_number != prev_sequence_number && |
- static_cast<uint16_t>(sequence_number - prev_sequence_number) < 0x8000; |
-} |
- |
-inline bool IsNewerTimestamp(uint32_t timestamp, uint32_t prev_timestamp) { |
- // Distinguish between elements that are exactly 0x80000000 apart. |
- // If t1>t2 and |t1-t2| = 0x80000000: IsNewer(t1,t2)=true, |
- // IsNewer(t2,t1)=false |
- // rather than having IsNewer(t1,t2) = IsNewer(t2,t1) = false. |
- if (static_cast<uint32_t>(timestamp - prev_timestamp) == 0x80000000) { |
- return timestamp > prev_timestamp; |
- } |
- return timestamp != prev_timestamp && |
- static_cast<uint32_t>(timestamp - prev_timestamp) < 0x80000000; |
-} |
- |
-inline uint16_t LatestSequenceNumber(uint16_t sequence_number1, |
- uint16_t sequence_number2) { |
- return IsNewerSequenceNumber(sequence_number1, sequence_number2) |
- ? sequence_number1 |
- : sequence_number2; |
-} |
- |
-inline uint32_t LatestTimestamp(uint32_t timestamp1, uint32_t timestamp2) { |
- return IsNewerTimestamp(timestamp1, timestamp2) ? timestamp1 : timestamp2; |
-} |
- |
-// Utility class to unwrap a sequence number to a larger type, for easier |
-// handling large ranges. Note that sequence numbers will never be unwrapped |
-// to a negative value. |
-class SequenceNumberUnwrapper { |
- public: |
- SequenceNumberUnwrapper() : last_seq_(-1) {} |
- |
- // Get the unwrapped sequence, but don't update the internal state. |
- int64_t UnwrapWithoutUpdate(uint16_t sequence_number) { |
- if (last_seq_ == -1) |
- return sequence_number; |
- |
- uint16_t cropped_last = static_cast<uint16_t>(last_seq_); |
- int64_t delta = sequence_number - cropped_last; |
- if (IsNewerSequenceNumber(sequence_number, cropped_last)) { |
- if (delta < 0) |
- delta += (1 << 16); // Wrap forwards. |
- } else if (delta > 0 && (last_seq_ + delta - (1 << 16)) >= 0) { |
- // If sequence_number is older but delta is positive, this is a backwards |
- // wrap-around. However, don't wrap backwards past 0 (unwrapped). |
- delta -= (1 << 16); |
- } |
- |
- return last_seq_ + delta; |
- } |
- |
- // Only update the internal state to the specified last (unwrapped) sequence. |
- void UpdateLast(int64_t last_sequence) { last_seq_ = last_sequence; } |
- |
- // Unwrap the sequence number and update the internal state. |
- int64_t Unwrap(uint16_t sequence_number) { |
- int64_t unwrapped = UnwrapWithoutUpdate(sequence_number); |
- UpdateLast(unwrapped); |
- return unwrapped; |
- } |
- |
- private: |
- int64_t last_seq_; |
-}; |
- |
-} // namespace webrtc |
- |
-#endif // WEBRTC_MODULES_INCLUDE_MODULE_COMMON_TYPES_H_ |