
The main purpose was the interface-> include rename, but other files were also moved, eliminating the "main" dir. To avoid breaking downstream, the "interface" directories were copied into a new "video_coding/include" dir. The old headers got pragma warnings added about deprecation (a very short deprecation since I plan to remove them as soon downstream is updated). Other files also moved: video_coding/main/source -> video_coding video_coding/main/test -> video_coding/test BUG=webrtc:5095 TESTED=Passing compile-trybots with --clobber flag: git cl try --clobber --bot=win_compile_rel --bot=linux_compile_rel --bot=android_compile_rel --bot=mac_compile_rel --bot=ios_rel --bot=linux_gn_rel --bot=win_x64_gn_rel --bot=mac_x64_gn_rel --bot=android_gn_rel -m tryserver.webrtc R=stefan@webrtc.org, tommi@webrtc.org Review URL: https://codereview.webrtc.org/1417283007 . Cr-Commit-Position: refs/heads/master@{#10694}
287 lines
9.5 KiB
C++
287 lines
9.5 KiB
C++
/*
|
|
* Copyright (c) 2011 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#include "webrtc/modules/video_coding/decoding_state.h"
|
|
|
|
#include "webrtc/modules/include/module_common_types.h"
|
|
#include "webrtc/modules/video_coding/frame_buffer.h"
|
|
#include "webrtc/modules/video_coding/jitter_buffer_common.h"
|
|
#include "webrtc/modules/video_coding/packet.h"
|
|
|
|
namespace webrtc {
|
|
|
|
VCMDecodingState::VCMDecodingState()
|
|
: sequence_num_(0),
|
|
time_stamp_(0),
|
|
picture_id_(kNoPictureId),
|
|
temporal_id_(kNoTemporalIdx),
|
|
tl0_pic_id_(kNoTl0PicIdx),
|
|
full_sync_(true),
|
|
in_initial_state_(true) {
|
|
memset(frame_decoded_, 0, sizeof(frame_decoded_));
|
|
}
|
|
|
|
VCMDecodingState::~VCMDecodingState() {}
|
|
|
|
void VCMDecodingState::Reset() {
|
|
// TODO(mikhal): Verify - not always would want to reset the sync
|
|
sequence_num_ = 0;
|
|
time_stamp_ = 0;
|
|
picture_id_ = kNoPictureId;
|
|
temporal_id_ = kNoTemporalIdx;
|
|
tl0_pic_id_ = kNoTl0PicIdx;
|
|
full_sync_ = true;
|
|
in_initial_state_ = true;
|
|
memset(frame_decoded_, 0, sizeof(frame_decoded_));
|
|
}
|
|
|
|
uint32_t VCMDecodingState::time_stamp() const {
|
|
return time_stamp_;
|
|
}
|
|
|
|
uint16_t VCMDecodingState::sequence_num() const {
|
|
return sequence_num_;
|
|
}
|
|
|
|
bool VCMDecodingState::IsOldFrame(const VCMFrameBuffer* frame) const {
|
|
assert(frame != NULL);
|
|
if (in_initial_state_)
|
|
return false;
|
|
return !IsNewerTimestamp(frame->TimeStamp(), time_stamp_);
|
|
}
|
|
|
|
bool VCMDecodingState::IsOldPacket(const VCMPacket* packet) const {
|
|
assert(packet != NULL);
|
|
if (in_initial_state_)
|
|
return false;
|
|
return !IsNewerTimestamp(packet->timestamp, time_stamp_);
|
|
}
|
|
|
|
void VCMDecodingState::SetState(const VCMFrameBuffer* frame) {
|
|
assert(frame != NULL && frame->GetHighSeqNum() >= 0);
|
|
if (!UsingFlexibleMode(frame))
|
|
UpdateSyncState(frame);
|
|
sequence_num_ = static_cast<uint16_t>(frame->GetHighSeqNum());
|
|
time_stamp_ = frame->TimeStamp();
|
|
picture_id_ = frame->PictureId();
|
|
temporal_id_ = frame->TemporalId();
|
|
tl0_pic_id_ = frame->Tl0PicId();
|
|
|
|
if (UsingFlexibleMode(frame)) {
|
|
uint16_t frame_index = picture_id_ % kFrameDecodedLength;
|
|
if (in_initial_state_) {
|
|
frame_decoded_cleared_to_ = frame_index;
|
|
} else if (frame->FrameType() == kVideoFrameKey) {
|
|
memset(frame_decoded_, 0, sizeof(frame_decoded_));
|
|
frame_decoded_cleared_to_ = frame_index;
|
|
} else {
|
|
if (AheadOfFramesDecodedClearedTo(frame_index)) {
|
|
while (frame_decoded_cleared_to_ != frame_index) {
|
|
frame_decoded_cleared_to_ =
|
|
(frame_decoded_cleared_to_ + 1) % kFrameDecodedLength;
|
|
frame_decoded_[frame_decoded_cleared_to_] = false;
|
|
}
|
|
}
|
|
}
|
|
frame_decoded_[frame_index] = true;
|
|
}
|
|
|
|
in_initial_state_ = false;
|
|
}
|
|
|
|
void VCMDecodingState::CopyFrom(const VCMDecodingState& state) {
|
|
sequence_num_ = state.sequence_num_;
|
|
time_stamp_ = state.time_stamp_;
|
|
picture_id_ = state.picture_id_;
|
|
temporal_id_ = state.temporal_id_;
|
|
tl0_pic_id_ = state.tl0_pic_id_;
|
|
full_sync_ = state.full_sync_;
|
|
in_initial_state_ = state.in_initial_state_;
|
|
frame_decoded_cleared_to_ = state.frame_decoded_cleared_to_;
|
|
memcpy(frame_decoded_, state.frame_decoded_, sizeof(frame_decoded_));
|
|
}
|
|
|
|
bool VCMDecodingState::UpdateEmptyFrame(const VCMFrameBuffer* frame) {
|
|
bool empty_packet = frame->GetHighSeqNum() == frame->GetLowSeqNum();
|
|
if (in_initial_state_ && empty_packet) {
|
|
// Drop empty packets as long as we are in the initial state.
|
|
return true;
|
|
}
|
|
if ((empty_packet && ContinuousSeqNum(frame->GetHighSeqNum())) ||
|
|
ContinuousFrame(frame)) {
|
|
// Continuous empty packets or continuous frames can be dropped if we
|
|
// advance the sequence number.
|
|
sequence_num_ = frame->GetHighSeqNum();
|
|
time_stamp_ = frame->TimeStamp();
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
void VCMDecodingState::UpdateOldPacket(const VCMPacket* packet) {
|
|
assert(packet != NULL);
|
|
if (packet->timestamp == time_stamp_) {
|
|
// Late packet belonging to the last decoded frame - make sure we update the
|
|
// last decoded sequence number.
|
|
sequence_num_ = LatestSequenceNumber(packet->seqNum, sequence_num_);
|
|
}
|
|
}
|
|
|
|
void VCMDecodingState::SetSeqNum(uint16_t new_seq_num) {
|
|
sequence_num_ = new_seq_num;
|
|
}
|
|
|
|
bool VCMDecodingState::in_initial_state() const {
|
|
return in_initial_state_;
|
|
}
|
|
|
|
bool VCMDecodingState::full_sync() const {
|
|
return full_sync_;
|
|
}
|
|
|
|
void VCMDecodingState::UpdateSyncState(const VCMFrameBuffer* frame) {
|
|
if (in_initial_state_)
|
|
return;
|
|
if (frame->TemporalId() == kNoTemporalIdx ||
|
|
frame->Tl0PicId() == kNoTl0PicIdx) {
|
|
full_sync_ = true;
|
|
} else if (frame->FrameType() == kVideoFrameKey || frame->LayerSync()) {
|
|
full_sync_ = true;
|
|
} else if (full_sync_) {
|
|
// Verify that we are still in sync.
|
|
// Sync will be broken if continuity is true for layers but not for the
|
|
// other methods (PictureId and SeqNum).
|
|
if (UsingPictureId(frame)) {
|
|
// First check for a valid tl0PicId.
|
|
if (frame->Tl0PicId() - tl0_pic_id_ > 1) {
|
|
full_sync_ = false;
|
|
} else {
|
|
full_sync_ = ContinuousPictureId(frame->PictureId());
|
|
}
|
|
} else {
|
|
full_sync_ = ContinuousSeqNum(static_cast<uint16_t>(
|
|
frame->GetLowSeqNum()));
|
|
}
|
|
}
|
|
}
|
|
|
|
bool VCMDecodingState::ContinuousFrame(const VCMFrameBuffer* frame) const {
|
|
// Check continuity based on the following hierarchy:
|
|
// - Temporal layers (stop here if out of sync).
|
|
// - Picture Id when available.
|
|
// - Sequence numbers.
|
|
// Return true when in initial state.
|
|
// Note that when a method is not applicable it will return false.
|
|
assert(frame != NULL);
|
|
// A key frame is always considered continuous as it doesn't refer to any
|
|
// frames and therefore won't introduce any errors even if prior frames are
|
|
// missing.
|
|
if (frame->FrameType() == kVideoFrameKey)
|
|
return true;
|
|
// When in the initial state we always require a key frame to start decoding.
|
|
if (in_initial_state_)
|
|
return false;
|
|
if (ContinuousLayer(frame->TemporalId(), frame->Tl0PicId()))
|
|
return true;
|
|
// tl0picId is either not used, or should remain unchanged.
|
|
if (frame->Tl0PicId() != tl0_pic_id_)
|
|
return false;
|
|
// Base layers are not continuous or temporal layers are inactive.
|
|
// In the presence of temporal layers, check for Picture ID/sequence number
|
|
// continuity if sync can be restored by this frame.
|
|
if (!full_sync_ && !frame->LayerSync())
|
|
return false;
|
|
if (UsingPictureId(frame)) {
|
|
if (UsingFlexibleMode(frame)) {
|
|
return ContinuousFrameRefs(frame);
|
|
} else {
|
|
return ContinuousPictureId(frame->PictureId());
|
|
}
|
|
} else {
|
|
return ContinuousSeqNum(static_cast<uint16_t>(frame->GetLowSeqNum()));
|
|
}
|
|
}
|
|
|
|
bool VCMDecodingState::ContinuousPictureId(int picture_id) const {
|
|
int next_picture_id = picture_id_ + 1;
|
|
if (picture_id < picture_id_) {
|
|
// Wrap
|
|
if (picture_id_ >= 0x80) {
|
|
// 15 bits used for picture id
|
|
return ((next_picture_id & 0x7FFF) == picture_id);
|
|
} else {
|
|
// 7 bits used for picture id
|
|
return ((next_picture_id & 0x7F) == picture_id);
|
|
}
|
|
}
|
|
// No wrap
|
|
return (next_picture_id == picture_id);
|
|
}
|
|
|
|
bool VCMDecodingState::ContinuousSeqNum(uint16_t seq_num) const {
|
|
return seq_num == static_cast<uint16_t>(sequence_num_ + 1);
|
|
}
|
|
|
|
bool VCMDecodingState::ContinuousLayer(int temporal_id,
|
|
int tl0_pic_id) const {
|
|
// First, check if applicable.
|
|
if (temporal_id == kNoTemporalIdx || tl0_pic_id == kNoTl0PicIdx)
|
|
return false;
|
|
// If this is the first frame to use temporal layers, make sure we start
|
|
// from base.
|
|
else if (tl0_pic_id_ == kNoTl0PicIdx && temporal_id_ == kNoTemporalIdx &&
|
|
temporal_id == 0)
|
|
return true;
|
|
|
|
// Current implementation: Look for base layer continuity.
|
|
if (temporal_id != 0)
|
|
return false;
|
|
return (static_cast<uint8_t>(tl0_pic_id_ + 1) == tl0_pic_id);
|
|
}
|
|
|
|
bool VCMDecodingState::ContinuousFrameRefs(const VCMFrameBuffer* frame) const {
|
|
uint8_t num_refs = frame->CodecSpecific()->codecSpecific.VP9.num_ref_pics;
|
|
for (uint8_t r = 0; r < num_refs; ++r) {
|
|
uint16_t frame_ref = frame->PictureId() -
|
|
frame->CodecSpecific()->codecSpecific.VP9.p_diff[r];
|
|
uint16_t frame_index = frame_ref % kFrameDecodedLength;
|
|
if (AheadOfFramesDecodedClearedTo(frame_index) ||
|
|
!frame_decoded_[frame_index]) {
|
|
return false;
|
|
}
|
|
}
|
|
return true;
|
|
}
|
|
|
|
bool VCMDecodingState::UsingPictureId(const VCMFrameBuffer* frame) const {
|
|
return (frame->PictureId() != kNoPictureId && picture_id_ != kNoPictureId);
|
|
}
|
|
|
|
bool VCMDecodingState::UsingFlexibleMode(const VCMFrameBuffer* frame) const {
|
|
return frame->CodecSpecific()->codecType == kVideoCodecVP9 &&
|
|
frame->CodecSpecific()->codecSpecific.VP9.flexible_mode;
|
|
}
|
|
|
|
// TODO(philipel): change how check work, this check practially
|
|
// limits the max p_diff to 64.
|
|
bool VCMDecodingState::AheadOfFramesDecodedClearedTo(uint16_t index) const {
|
|
// No way of knowing for sure if we are actually ahead of
|
|
// frame_decoded_cleared_to_. We just make the assumption
|
|
// that we are not trying to reference back to a very old
|
|
// index, but instead are referencing a newer index.
|
|
uint16_t diff =
|
|
index > frame_decoded_cleared_to_
|
|
? kFrameDecodedLength - (index - frame_decoded_cleared_to_)
|
|
: frame_decoded_cleared_to_ - index;
|
|
return diff > kFrameDecodedLength / 2;
|
|
}
|
|
|
|
} // namespace webrtc
|