/* * Copyright (c) 2014 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. * */ #ifndef MODULES_VIDEO_CODING_CODECS_VP9_VP9_IMPL_H_ #define MODULES_VIDEO_CODING_CODECS_VP9_VP9_IMPL_H_ #ifdef RTC_ENABLE_VP9 #include #include #include #include #include "api/fec_controller_override.h" #include "api/video_codecs/video_encoder.h" #include "common_video/include/video_frame_buffer_pool.h" #include "media/base/vp9_profile.h" #include "modules/video_coding/codecs/vp9/include/vp9.h" #include "modules/video_coding/codecs/vp9/vp9_frame_buffer_pool.h" #include "modules/video_coding/utility/framerate_controller.h" #include "vpx/vp8cx.h" #include "vpx/vpx_decoder.h" #include "vpx/vpx_encoder.h" namespace webrtc { class VP9EncoderImpl : public VP9Encoder { public: explicit VP9EncoderImpl(const cricket::VideoCodec& codec); ~VP9EncoderImpl() override; void SetFecControllerOverride( FecControllerOverride* fec_controller_override) override; int Release() override; int InitEncode(const VideoCodec* codec_settings, const Settings& settings) override; int Encode(const VideoFrame& input_image, const std::vector* frame_types) override; int RegisterEncodeCompleteCallback(EncodedImageCallback* callback) override; void SetRates(const RateControlParameters& parameters) override; EncoderInfo GetEncoderInfo() const override; private: // Determine number of encoder threads to use. int NumberOfThreads(int width, int height, int number_of_cores); // Call encoder initialize function and set control settings. int InitAndSetControlSettings(const VideoCodec* inst); void PopulateCodecSpecific(CodecSpecificInfo* codec_specific, absl::optional* spatial_idx, const vpx_codec_cx_pkt& pkt, uint32_t timestamp); void FillReferenceIndices(const vpx_codec_cx_pkt& pkt, const size_t pic_num, const bool inter_layer_predicted, CodecSpecificInfoVP9* vp9_info); void UpdateReferenceBuffers(const vpx_codec_cx_pkt& pkt, const size_t pic_num); vpx_svc_ref_frame_config_t SetReferences( bool is_key_pic, size_t first_active_spatial_layer_id); bool ExplicitlyConfiguredSpatialLayers() const; bool SetSvcRates(const VideoBitrateAllocation& bitrate_allocation); virtual int GetEncodedLayerFrame(const vpx_codec_cx_pkt* pkt); // Callback function for outputting packets per spatial layer. static void EncoderOutputCodedPacketCallback(vpx_codec_cx_pkt* pkt, void* user_data); void DeliverBufferedFrame(bool end_of_picture); bool DropFrame(uint8_t spatial_idx, uint32_t rtp_timestamp); // Determine maximum target for Intra frames // // Input: // - optimal_buffer_size : Optimal buffer size // Return Value : Max target size for Intra frames represented as // percentage of the per frame bandwidth uint32_t MaxIntraTarget(uint32_t optimal_buffer_size); size_t SteadyStateSize(int sid, int tid); void MaybeRewrapRawWithFormat(const vpx_img_fmt fmt); EncodedImage encoded_image_; CodecSpecificInfo codec_specific_; EncodedImageCallback* encoded_complete_callback_; VideoCodec codec_; const VP9Profile profile_; bool inited_; int64_t timestamp_; int cpu_speed_; uint32_t rc_max_intra_target_; vpx_codec_ctx_t* encoder_; vpx_codec_enc_cfg_t* config_; vpx_image_t* raw_; vpx_svc_extra_cfg_t svc_params_; const VideoFrame* input_image_; GofInfoVP9 gof_; // Contains each frame's temporal information for // non-flexible mode. bool force_key_frame_; size_t pics_since_key_; uint8_t num_temporal_layers_; uint8_t num_spatial_layers_; // Number of configured SLs uint8_t num_active_spatial_layers_; // Number of actively encoded SLs uint8_t first_active_layer_; bool layer_deactivation_requires_key_frame_; bool is_svc_; InterLayerPredMode inter_layer_pred_; bool external_ref_control_; const bool trusted_rate_controller_; const bool dynamic_rate_settings_; bool layer_buffering_; const bool full_superframe_drop_; vpx_svc_frame_drop_t svc_drop_frame_; bool first_frame_in_picture_; VideoBitrateAllocation current_bitrate_allocation_; bool ss_info_needed_; bool force_all_active_layers_; std::vector framerate_controller_; // Used for flexible mode. bool is_flexible_mode_; struct RefFrameBuffer { RefFrameBuffer(size_t pic_num, size_t spatial_layer_id, size_t temporal_layer_id) : pic_num(pic_num), spatial_layer_id(spatial_layer_id), temporal_layer_id(temporal_layer_id) {} RefFrameBuffer() {} bool operator==(const RefFrameBuffer& o) { return pic_num == o.pic_num && spatial_layer_id == o.spatial_layer_id && temporal_layer_id == o.temporal_layer_id; } size_t pic_num = 0; size_t spatial_layer_id = 0; size_t temporal_layer_id = 0; }; std::map ref_buf_; // Variable frame-rate related fields and methods. const struct VariableFramerateExperiment { bool enabled; // Framerate is limited to this value in steady state. float framerate_limit; // This qp or below is considered a steady state. int steady_state_qp; // Frames of at least this percentage below ideal for configured bitrate are // considered in a steady state. int steady_state_undershoot_percentage; // Number of consecutive frames with good QP and size required to detect // the steady state. int frames_before_steady_state; } variable_framerate_experiment_; static VariableFramerateExperiment ParseVariableFramerateConfig( std::string group_name); FramerateController variable_framerate_controller_; const struct QualityScalerExperiment { int low_qp; int high_qp; bool enabled; } quality_scaler_experiment_; static QualityScalerExperiment ParseQualityScalerConfig( std::string group_name); int num_steady_state_frames_; // Only set config when this flag is set. bool config_changed_; }; class VP9DecoderImpl : public VP9Decoder { public: VP9DecoderImpl(); virtual ~VP9DecoderImpl(); int InitDecode(const VideoCodec* inst, int number_of_cores) override; int Decode(const EncodedImage& input_image, bool missing_frames, int64_t /*render_time_ms*/) override; int RegisterDecodeCompleteCallback(DecodedImageCallback* callback) override; int Release() override; const char* ImplementationName() const override; private: int ReturnFrame(const vpx_image_t* img, uint32_t timestamp, int qp, const webrtc::ColorSpace* explicit_color_space); // Memory pool used to share buffers between libvpx and webrtc. Vp9FrameBufferPool libvpx_buffer_pool_; // Buffer pool used to allocate additionally needed NV12 buffers. VideoFrameBufferPool output_buffer_pool_; DecodedImageCallback* decode_complete_callback_; bool inited_; vpx_codec_ctx_t* decoder_; bool key_frame_required_; VideoCodec current_codec_; int num_cores_; // Decoder should produce this format if possible. const VideoFrameBuffer::Type preferred_output_format_; }; } // namespace webrtc #endif // RTC_ENABLE_VP9 #endif // MODULES_VIDEO_CODING_CODECS_VP9_VP9_IMPL_H_