123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224 |
/*
 *  Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS. All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
- #ifndef MODULES_VIDEO_CODING_RTP_FRAME_REFERENCE_FINDER_H_
- #define MODULES_VIDEO_CODING_RTP_FRAME_REFERENCE_FINDER_H_
- #include <array>
- #include <deque>
- #include <map>
- #include <memory>
- #include <set>
- #include <utility>
- #include "modules/include/module_common_types_public.h"
- #include "modules/rtp_rtcp/source/rtp_video_header.h"
- #include "modules/video_coding/codecs/vp9/include/vp9_globals.h"
- #include "rtc_base/numerics/sequence_number_util.h"
- #include "rtc_base/thread_annotations.h"
- namespace webrtc {
- namespace video_coding {
// Forward declarations. This header only refers to these types through
// pointers and std::unique_ptr, so their full definitions are not required
// here.
class EncodedFrame;
class RtpFrameObject;

// Interface for receiving complete frames. A complete frame is a frame which
// has received all its packets and all its references are known.
class OnCompleteFrameCallback {
 public:
  virtual ~OnCompleteFrameCallback() = default;

  // Called with a complete frame. |frame| is passed as a std::unique_ptr by
  // value, so ownership is transferred to the implementation.
  virtual void OnCompleteFrame(std::unique_ptr<EncodedFrame> frame) = 0;
};
- class RtpFrameReferenceFinder {
- public:
- explicit RtpFrameReferenceFinder(OnCompleteFrameCallback* frame_callback);
- explicit RtpFrameReferenceFinder(OnCompleteFrameCallback* frame_callback,
- int64_t picture_id_offset);
- ~RtpFrameReferenceFinder();
- // Manage this frame until:
- // - We have all information needed to determine its references, after
- // which |frame_callback_| is called with the completed frame, or
- // - We have too many stashed frames (determined by |kMaxStashedFrames|)
- // so we drop this frame, or
- // - It gets cleared by ClearTo, which also means we drop it.
- void ManageFrame(std::unique_ptr<RtpFrameObject> frame);
- // Notifies that padding has been received, which the reference finder
- // might need to calculate the references of a frame.
- void PaddingReceived(uint16_t seq_num);
- // Clear all stashed frames that include packets older than |seq_num|.
- void ClearTo(uint16_t seq_num);
- private:
- static const uint16_t kPicIdLength = 1 << 15;
- static const uint8_t kMaxTemporalLayers = 5;
- static const int kMaxLayerInfo = 50;
- static const int kMaxStashedFrames = 100;
- static const int kMaxNotYetReceivedFrames = 100;
- static const int kMaxGofSaved = 50;
- static const int kMaxPaddingAge = 100;
- enum FrameDecision { kStash, kHandOff, kDrop };
- struct GofInfo {
- GofInfo(GofInfoVP9* gof, uint16_t last_picture_id)
- : gof(gof), last_picture_id(last_picture_id) {}
- GofInfoVP9* gof;
- uint16_t last_picture_id;
- };
- // Find the relevant group of pictures and update its "last-picture-id-with
- // padding" sequence number.
- void UpdateLastPictureIdWithPadding(uint16_t seq_num);
- // Retry stashed frames until no more complete frames are found.
- void RetryStashedFrames();
- void HandOffFrame(std::unique_ptr<RtpFrameObject> frame);
- FrameDecision ManageFrameInternal(RtpFrameObject* frame);
- FrameDecision ManageFrameGeneric(
- RtpFrameObject* frame,
- const RTPVideoHeader::GenericDescriptorInfo& descriptor);
- // Find references for frames with no or very limited information in the
- // descriptor. If |picture_id| is unspecified then packet sequence numbers
- // will be used to determine the references of the frames.
- FrameDecision ManageFramePidOrSeqNum(RtpFrameObject* frame, int picture_id);
- // Find references for Vp8 frames
- FrameDecision ManageFrameVp8(RtpFrameObject* frame);
- // Updates necessary layer info state used to determine frame references for
- // Vp8.
- void UpdateLayerInfoVp8(RtpFrameObject* frame,
- int64_t unwrapped_tl0,
- uint8_t temporal_idx);
- // Find references for Vp9 frames
- FrameDecision ManageFrameVp9(RtpFrameObject* frame);
- // Check if we are missing a frame necessary to determine the references
- // for this frame.
- bool MissingRequiredFrameVp9(uint16_t picture_id, const GofInfo& info);
- // Updates which frames that have been received. If there is a gap,
- // missing frames will be added to |missing_frames_for_layer_| or
- // if this is an already missing frame then it will be removed.
- void FrameReceivedVp9(uint16_t picture_id, GofInfo* info);
- // Check if there is a frame with the up-switch flag set in the interval
- // (|pid_ref|, |picture_id|) with temporal layer smaller than |temporal_idx|.
- bool UpSwitchInIntervalVp9(uint16_t picture_id,
- uint8_t temporal_idx,
- uint16_t pid_ref);
- // Unwrap |frame|s picture id and its references to 16 bits.
- void UnwrapPictureIds(RtpFrameObject* frame);
- // Find references for H264 frames
- FrameDecision ManageFrameH264(RtpFrameObject* frame);
- // Update "last-picture-id-with-padding" sequence number for H264.
- void UpdateLastPictureIdWithPaddingH264();
- // Update H264 layer info state used to determine frame references.
- void UpdateLayerInfoH264(RtpFrameObject* frame,
- int64_t unwrapped_tl0,
- uint8_t temporal_idx);
- // Update H264 state for decodeable frames.
- void UpdateDataH264(RtpFrameObject* frame,
- int64_t unwrapped_tl0,
- uint8_t temporal_idx);
- // For every group of pictures, hold two sequence numbers. The first being
- // the sequence number of the last packet of the last completed frame, and
- // the second being the sequence number of the last packet of the last
- // completed frame advanced by any potential continuous packets of padding.
- std::map<uint16_t,
- std::pair<uint16_t, uint16_t>,
- DescendingSeqNumComp<uint16_t>>
- last_seq_num_gop_;
- // Save the last picture id in order to detect when there is a gap in frames
- // that have not yet been fully received.
- int last_picture_id_;
- // Padding packets that have been received but that are not yet continuous
- // with any group of pictures.
- std::set<uint16_t, DescendingSeqNumComp<uint16_t>> stashed_padding_;
- // Frames earlier than the last received frame that have not yet been
- // fully received.
- std::set<uint16_t, DescendingSeqNumComp<uint16_t, kPicIdLength>>
- not_yet_received_frames_;
- // Sequence numbers of frames earlier than the last received frame that
- // have not yet been fully received.
- std::set<uint16_t, DescendingSeqNumComp<uint16_t>> not_yet_received_seq_num_;
- // Frames that have been fully received but didn't have all the information
- // needed to determine their references.
- std::deque<std::unique_ptr<RtpFrameObject>> stashed_frames_;
- // Holds the information about the last completed frame for a given temporal
- // layer given an unwrapped Tl0 picture index.
- std::map<int64_t, std::array<int64_t, kMaxTemporalLayers>> layer_info_;
- // Where the current scalability structure is in the
- // |scalability_structures_| array.
- uint8_t current_ss_idx_;
- // Holds received scalability structures.
- std::array<GofInfoVP9, kMaxGofSaved> scalability_structures_;
- // Holds the the Gof information for a given unwrapped TL0 picture index.
- std::map<int64_t, GofInfo> gof_info_;
- // Keep track of which picture id and which temporal layer that had the
- // up switch flag set.
- std::map<uint16_t, uint8_t, DescendingSeqNumComp<uint16_t, kPicIdLength>>
- up_switch_;
- // For every temporal layer, keep a set of which frames that are missing.
- std::array<std::set<uint16_t, DescendingSeqNumComp<uint16_t, kPicIdLength>>,
- kMaxTemporalLayers>
- missing_frames_for_layer_;
- // How far frames have been cleared by sequence number. A frame will be
- // cleared if it contains a packet with a sequence number older than
- // |cleared_to_seq_num_|.
- int cleared_to_seq_num_;
- OnCompleteFrameCallback* frame_callback_;
- // Unwrapper used to unwrap generic RTP streams. In a generic stream we derive
- // a picture id from the packet sequence number.
- SeqNumUnwrapper<uint16_t> rtp_seq_num_unwrapper_;
- // Unwrapper used to unwrap VP8/VP9 streams which have their picture id
- // specified.
- SeqNumUnwrapper<uint16_t, kPicIdLength> unwrapper_;
- SeqNumUnwrapper<uint8_t> tl0_unwrapper_;
- const int64_t picture_id_offset_;
- };
- } // namespace video_coding
- } // namespace webrtc
- #endif // MODULES_VIDEO_CODING_RTP_FRAME_REFERENCE_FINDER_H_
|