libaom_av1_encoder.cc 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623
  1. /*
  2. * Copyright (c) 2020 The WebRTC project authors. All Rights Reserved.
  3. *
  4. * Use of this source code is governed by a BSD-style license
  5. * that can be found in the LICENSE file in the root of the source
  6. * tree. An additional intellectual property rights grant can be found
  7. * in the file PATENTS. All contributing project authors may
  8. * be found in the AUTHORS file in the root of the source tree.
  9. */
  10. #include "modules/video_coding/codecs/av1/libaom_av1_encoder.h"
  11. #include <stddef.h>
  12. #include <stdint.h>
  13. #include <memory>
  14. #include <utility>
  15. #include <vector>
  16. #include "absl/algorithm/container.h"
  17. #include "absl/base/macros.h"
  18. #include "absl/types/optional.h"
  19. #include "api/scoped_refptr.h"
  20. #include "api/video/encoded_image.h"
  21. #include "api/video/i420_buffer.h"
  22. #include "api/video/video_frame.h"
  23. #include "api/video_codecs/video_codec.h"
  24. #include "api/video_codecs/video_encoder.h"
  25. #include "modules/video_coding/codecs/av1/scalable_video_controller.h"
  26. #include "modules/video_coding/codecs/av1/scalable_video_controller_no_layering.h"
  27. #include "modules/video_coding/include/video_codec_interface.h"
  28. #include "modules/video_coding/include/video_error_codes.h"
  29. #include "rtc_base/checks.h"
  30. #include "rtc_base/logging.h"
  31. #include "third_party/libaom/source/libaom/aom/aom_codec.h"
  32. #include "third_party/libaom/source/libaom/aom/aom_encoder.h"
  33. #include "third_party/libaom/source/libaom/aom/aomcx.h"
  34. namespace webrtc {
  35. namespace {
  36. // Encoder configuration parameters
  37. constexpr int kQpMin = 10;
  38. constexpr int kUsageProfile = 1; // 0 = good quality; 1 = real-time.
  39. constexpr int kMinQindex = 58; // Min qindex threshold for QP scaling.
  40. constexpr int kMaxQindex = 180; // Max qindex threshold for QP scaling.
  41. constexpr int kBitDepth = 8;
  42. constexpr int kLagInFrames = 0; // No look ahead.
  43. constexpr int kRtpTicksPerSecond = 90000;
  44. constexpr float kMinimumFrameRate = 1.0;
  45. // Only positive speeds, range for real-time coding currently is: 6 - 8.
  46. // Lower means slower/better quality, higher means fastest/lower quality.
  47. int GetCpuSpeed(int width, int height, int number_of_cores) {
  48. // For smaller resolutions, use lower speed setting (get some coding gain at
  49. // the cost of increased encoding complexity).
  50. if (number_of_cores > 2 && width * height <= 320 * 180)
  51. return 6;
  52. else if (width * height >= 1280 * 720)
  53. return 8;
  54. else
  55. return 7;
  56. }
  57. class LibaomAv1Encoder final : public VideoEncoder {
  58. public:
  59. explicit LibaomAv1Encoder(
  60. std::unique_ptr<ScalableVideoController> svc_controller);
  61. ~LibaomAv1Encoder();
  62. int InitEncode(const VideoCodec* codec_settings,
  63. const Settings& settings) override;
  64. int32_t RegisterEncodeCompleteCallback(
  65. EncodedImageCallback* encoded_image_callback) override;
  66. int32_t Release() override;
  67. int32_t Encode(const VideoFrame& frame,
  68. const std::vector<VideoFrameType>* frame_types) override;
  69. void SetRates(const RateControlParameters& parameters) override;
  70. EncoderInfo GetEncoderInfo() const override;
  71. private:
  72. bool SvcEnabled() const { return svc_params_.has_value(); }
  73. // Fills svc_params_ memeber value. Returns false on error.
  74. bool SetSvcParams(ScalableVideoController::StreamLayersConfig svc_config);
  75. // Configures the encoder with layer for the next frame.
  76. void SetSvcLayerId(
  77. const ScalableVideoController::LayerFrameConfig& layer_frame);
  78. // Configures the encoder which buffers next frame updates and can reference.
  79. void SetSvcRefFrameConfig(
  80. const ScalableVideoController::LayerFrameConfig& layer_frame);
  81. const std::unique_ptr<ScalableVideoController> svc_controller_;
  82. bool inited_;
  83. absl::optional<aom_svc_params_t> svc_params_;
  84. VideoCodec encoder_settings_;
  85. aom_image_t* frame_for_encode_;
  86. aom_codec_ctx_t ctx_;
  87. aom_codec_enc_cfg_t cfg_;
  88. EncodedImageCallback* encoded_image_callback_;
  89. };
  90. int32_t VerifyCodecSettings(const VideoCodec& codec_settings) {
  91. if (codec_settings.width < 1) {
  92. return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
  93. }
  94. if (codec_settings.height < 1) {
  95. return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
  96. }
  97. // maxBitrate == 0 represents an unspecified maxBitRate.
  98. if (codec_settings.maxBitrate > 0 &&
  99. codec_settings.minBitrate > codec_settings.maxBitrate) {
  100. return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
  101. }
  102. if (codec_settings.maxBitrate > 0 &&
  103. codec_settings.startBitrate > codec_settings.maxBitrate) {
  104. return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
  105. }
  106. if (codec_settings.startBitrate < codec_settings.minBitrate) {
  107. return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
  108. }
  109. if (codec_settings.maxFramerate < 1) {
  110. return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
  111. }
  112. return WEBRTC_VIDEO_CODEC_OK;
  113. }
  114. LibaomAv1Encoder::LibaomAv1Encoder(
  115. std::unique_ptr<ScalableVideoController> svc_controller)
  116. : svc_controller_(std::move(svc_controller)),
  117. inited_(false),
  118. frame_for_encode_(nullptr),
  119. encoded_image_callback_(nullptr) {
  120. RTC_DCHECK(svc_controller_);
  121. }
  122. LibaomAv1Encoder::~LibaomAv1Encoder() {
  123. Release();
  124. }
  125. int LibaomAv1Encoder::InitEncode(const VideoCodec* codec_settings,
  126. const Settings& settings) {
  127. if (codec_settings == nullptr) {
  128. RTC_LOG(LS_WARNING) << "No codec settings provided to "
  129. "LibaomAv1Encoder.";
  130. return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
  131. }
  132. if (settings.number_of_cores < 1) {
  133. return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
  134. }
  135. if (inited_) {
  136. RTC_LOG(LS_WARNING) << "Initing LibaomAv1Encoder without first releasing.";
  137. Release();
  138. }
  139. encoder_settings_ = *codec_settings;
  140. // Sanity checks for encoder configuration.
  141. const int32_t result = VerifyCodecSettings(encoder_settings_);
  142. if (result < 0) {
  143. RTC_LOG(LS_WARNING) << "Incorrect codec settings provided to "
  144. "LibaomAv1Encoder.";
  145. return result;
  146. }
  147. if (!SetSvcParams(svc_controller_->StreamConfig())) {
  148. return WEBRTC_VIDEO_CODEC_ERROR;
  149. }
  150. // Initialize encoder configuration structure with default values
  151. aom_codec_err_t ret =
  152. aom_codec_enc_config_default(aom_codec_av1_cx(), &cfg_, 0);
  153. if (ret != AOM_CODEC_OK) {
  154. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  155. << " on aom_codec_enc_config_default.";
  156. return WEBRTC_VIDEO_CODEC_ERROR;
  157. }
  158. // Overwrite default config with input encoder settings & RTC-relevant values.
  159. cfg_.g_w = encoder_settings_.width;
  160. cfg_.g_h = encoder_settings_.height;
  161. cfg_.g_threads = settings.number_of_cores;
  162. cfg_.g_timebase.num = 1;
  163. cfg_.g_timebase.den = kRtpTicksPerSecond;
  164. cfg_.rc_target_bitrate = encoder_settings_.maxBitrate; // kilobits/sec.
  165. cfg_.g_input_bit_depth = kBitDepth;
  166. cfg_.kf_mode = AOM_KF_DISABLED;
  167. cfg_.rc_min_quantizer = kQpMin;
  168. cfg_.rc_max_quantizer = encoder_settings_.qpMax;
  169. cfg_.g_usage = kUsageProfile;
  170. cfg_.g_error_resilient = 0;
  171. // Low-latency settings.
  172. cfg_.rc_end_usage = AOM_CBR; // Constant Bit Rate (CBR) mode
  173. cfg_.g_pass = AOM_RC_ONE_PASS; // One-pass rate control
  174. cfg_.g_lag_in_frames = kLagInFrames; // No look ahead when lag equals 0.
  175. // Creating a wrapper to the image - setting image data to nullptr. Actual
  176. // pointer will be set in encode. Setting align to 1, as it is meaningless
  177. // (actual memory is not allocated).
  178. frame_for_encode_ =
  179. aom_img_alloc(nullptr, AOM_IMG_FMT_I420, cfg_.g_w, cfg_.g_h, 1);
  180. // Flag options: AOM_CODEC_USE_PSNR and AOM_CODEC_USE_HIGHBITDEPTH
  181. aom_codec_flags_t flags = 0;
  182. // Initialize an encoder instance.
  183. ret = aom_codec_enc_init(&ctx_, aom_codec_av1_cx(), &cfg_, flags);
  184. if (ret != AOM_CODEC_OK) {
  185. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  186. << " on aom_codec_enc_init.";
  187. return WEBRTC_VIDEO_CODEC_ERROR;
  188. }
  189. inited_ = true;
  190. // Set control parameters
  191. ret = aom_codec_control(
  192. &ctx_, AOME_SET_CPUUSED,
  193. GetCpuSpeed(cfg_.g_w, cfg_.g_h, settings.number_of_cores));
  194. if (ret != AOM_CODEC_OK) {
  195. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  196. << " on control AV1E_SET_CPUUSED.";
  197. return WEBRTC_VIDEO_CODEC_ERROR;
  198. }
  199. ret = aom_codec_control(&ctx_, AV1E_SET_ENABLE_CDEF, 1);
  200. if (ret != AOM_CODEC_OK) {
  201. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  202. << " on control AV1E_SET_ENABLE_CDEF.";
  203. return WEBRTC_VIDEO_CODEC_ERROR;
  204. }
  205. ret = aom_codec_control(&ctx_, AV1E_SET_ENABLE_TPL_MODEL, 0);
  206. if (ret != AOM_CODEC_OK) {
  207. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  208. << " on control AV1E_SET_ENABLE_TPL_MODEL.";
  209. return WEBRTC_VIDEO_CODEC_ERROR;
  210. }
  211. ret = aom_codec_control(&ctx_, AV1E_SET_DELTAQ_MODE, 0);
  212. if (ret != AOM_CODEC_OK) {
  213. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  214. << " on control AV1E_SET_DELTAQ_MODE.";
  215. return WEBRTC_VIDEO_CODEC_ERROR;
  216. }
  217. ret = aom_codec_control(&ctx_, AV1E_SET_ENABLE_ORDER_HINT, 0);
  218. if (ret != AOM_CODEC_OK) {
  219. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  220. << " on control AV1E_SET_ENABLE_ORDER_HINT.";
  221. return WEBRTC_VIDEO_CODEC_ERROR;
  222. }
  223. ret = aom_codec_control(&ctx_, AV1E_SET_AQ_MODE, 3);
  224. if (ret != AOM_CODEC_OK) {
  225. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  226. << " on control AV1E_SET_AQ_MODE.";
  227. return WEBRTC_VIDEO_CODEC_ERROR;
  228. }
  229. if (SvcEnabled()) {
  230. ret = aom_codec_control(&ctx_, AV1E_SET_SVC_PARAMS, &*svc_params_);
  231. if (ret != AOM_CODEC_OK) {
  232. RTC_LOG(LS_WARNING) << "LibaomAV1Encoder::EncodeInit returned " << ret
  233. << " on control AV1E_SET_SVC_PARAMS.";
  234. return false;
  235. }
  236. }
  237. ret = aom_codec_control(&ctx_, AOME_SET_MAX_INTRA_BITRATE_PCT, 300);
  238. if (ret != AOM_CODEC_OK) {
  239. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  240. << " on control AV1E_SET_MAX_INTRA_BITRATE_PCT.";
  241. return WEBRTC_VIDEO_CODEC_ERROR;
  242. }
  243. ret = aom_codec_control(&ctx_, AV1E_SET_COEFF_COST_UPD_FREQ, 2);
  244. if (ret != AOM_CODEC_OK) {
  245. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  246. << " on control AV1E_SET_COEFF_COST_UPD_FREQ.";
  247. return WEBRTC_VIDEO_CODEC_ERROR;
  248. }
  249. ret = aom_codec_control(&ctx_, AV1E_SET_MODE_COST_UPD_FREQ, 2);
  250. if (ret != AOM_CODEC_OK) {
  251. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  252. << " on control AV1E_SET_MODE_COST_UPD_FREQ.";
  253. return WEBRTC_VIDEO_CODEC_ERROR;
  254. }
  255. ret = aom_codec_control(&ctx_, AV1E_SET_MV_COST_UPD_FREQ, 3);
  256. if (ret != AOM_CODEC_OK) {
  257. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::EncodeInit returned " << ret
  258. << " on control AV1E_SET_MV_COST_UPD_FREQ.";
  259. return WEBRTC_VIDEO_CODEC_ERROR;
  260. }
  261. return WEBRTC_VIDEO_CODEC_OK;
  262. }
  263. bool LibaomAv1Encoder::SetSvcParams(
  264. ScalableVideoController::StreamLayersConfig svc_config) {
  265. bool svc_enabled =
  266. svc_config.num_spatial_layers > 1 || svc_config.num_temporal_layers > 1;
  267. if (!svc_enabled) {
  268. svc_params_ = absl::nullopt;
  269. return true;
  270. }
  271. if (svc_config.num_spatial_layers < 1 || svc_config.num_spatial_layers > 4) {
  272. RTC_LOG(LS_WARNING) << "Av1 supports up to 4 spatial layers. "
  273. << svc_config.num_spatial_layers << " configured.";
  274. return false;
  275. }
  276. if (svc_config.num_temporal_layers < 1 ||
  277. svc_config.num_temporal_layers > 8) {
  278. RTC_LOG(LS_WARNING) << "Av1 supports up to 8 temporal layers. "
  279. << svc_config.num_temporal_layers << " configured.";
  280. return false;
  281. }
  282. aom_svc_params_t& svc_params = svc_params_.emplace();
  283. svc_params.number_spatial_layers = svc_config.num_spatial_layers;
  284. svc_params.number_temporal_layers = svc_config.num_temporal_layers;
  285. int num_layers =
  286. svc_config.num_spatial_layers * svc_config.num_temporal_layers;
  287. for (int i = 0; i < num_layers; ++i) {
  288. svc_params.min_quantizers[i] = kQpMin;
  289. svc_params.max_quantizers[i] = encoder_settings_.qpMax;
  290. }
  291. // Assume each temporal layer doubles framerate.
  292. for (int tid = 0; tid < svc_config.num_temporal_layers; ++tid) {
  293. svc_params.framerate_factor[tid] =
  294. 1 << (svc_config.num_temporal_layers - tid - 1);
  295. }
  296. for (int sid = 0; sid < svc_config.num_spatial_layers; ++sid) {
  297. svc_params.scaling_factor_num[sid] = svc_config.scaling_factor_num[sid];
  298. svc_params.scaling_factor_den[sid] = svc_config.scaling_factor_den[sid];
  299. }
  300. return true;
  301. }
  302. void LibaomAv1Encoder::SetSvcLayerId(
  303. const ScalableVideoController::LayerFrameConfig& layer_frame) {
  304. aom_svc_layer_id_t layer_id = {};
  305. layer_id.spatial_layer_id = layer_frame.SpatialId();
  306. layer_id.temporal_layer_id = layer_frame.TemporalId();
  307. aom_codec_err_t ret =
  308. aom_codec_control(&ctx_, AV1E_SET_SVC_LAYER_ID, &layer_id);
  309. if (ret != AOM_CODEC_OK) {
  310. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::Encode returned " << ret
  311. << " on control AV1E_SET_SVC_LAYER_ID.";
  312. }
  313. }
  314. void LibaomAv1Encoder::SetSvcRefFrameConfig(
  315. const ScalableVideoController::LayerFrameConfig& layer_frame) {
  316. // Buffer name to use for each layer_frame.buffers position. In particular
  317. // when there are 2 buffers are referenced, prefer name them last and golden,
  318. // because av1 bitstream format has dedicated fields for these two names.
  319. // See last_frame_idx and golden_frame_idx in the av1 spec
  320. // https://aomediacodec.github.io/av1-spec/av1-spec.pdf
  321. static constexpr int kPreferedSlotName[] = {0, // Last
  322. 3, // Golden
  323. 1, 2, 4, 5, 6};
  324. static constexpr int kAv1NumBuffers = 8;
  325. aom_svc_ref_frame_config_t ref_frame_config = {};
  326. RTC_CHECK_LE(layer_frame.Buffers().size(), ABSL_ARRAYSIZE(kPreferedSlotName));
  327. for (size_t i = 0; i < layer_frame.Buffers().size(); ++i) {
  328. const CodecBufferUsage& buffer = layer_frame.Buffers()[i];
  329. int slot_name = kPreferedSlotName[i];
  330. RTC_CHECK_GE(buffer.id, 0);
  331. RTC_CHECK_LT(buffer.id, kAv1NumBuffers);
  332. ref_frame_config.ref_idx[slot_name] = buffer.id;
  333. if (buffer.referenced) {
  334. ref_frame_config.reference[slot_name] = 1;
  335. }
  336. if (buffer.updated) {
  337. ref_frame_config.refresh[buffer.id] = 1;
  338. }
  339. }
  340. aom_codec_err_t ret = aom_codec_control(&ctx_, AV1E_SET_SVC_REF_FRAME_CONFIG,
  341. &ref_frame_config);
  342. if (ret != AOM_CODEC_OK) {
  343. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::Encode returned " << ret
  344. << " on control AV1_SET_SVC_REF_FRAME_CONFIG.";
  345. }
  346. }
  347. int32_t LibaomAv1Encoder::RegisterEncodeCompleteCallback(
  348. EncodedImageCallback* encoded_image_callback) {
  349. encoded_image_callback_ = encoded_image_callback;
  350. return WEBRTC_VIDEO_CODEC_OK;
  351. }
  352. int32_t LibaomAv1Encoder::Release() {
  353. if (frame_for_encode_ != nullptr) {
  354. aom_img_free(frame_for_encode_);
  355. frame_for_encode_ = nullptr;
  356. }
  357. if (inited_) {
  358. if (aom_codec_destroy(&ctx_)) {
  359. return WEBRTC_VIDEO_CODEC_MEMORY;
  360. }
  361. inited_ = false;
  362. }
  363. return WEBRTC_VIDEO_CODEC_OK;
  364. }
  365. int32_t LibaomAv1Encoder::Encode(
  366. const VideoFrame& frame,
  367. const std::vector<VideoFrameType>* frame_types) {
  368. if (!inited_ || encoded_image_callback_ == nullptr) {
  369. return WEBRTC_VIDEO_CODEC_UNINITIALIZED;
  370. }
  371. bool keyframe_required =
  372. frame_types != nullptr &&
  373. absl::c_linear_search(*frame_types, VideoFrameType::kVideoFrameKey);
  374. std::vector<ScalableVideoController::LayerFrameConfig> layer_frames =
  375. svc_controller_->NextFrameConfig(keyframe_required);
  376. if (layer_frames.empty()) {
  377. RTC_LOG(LS_ERROR) << "SVCController returned no configuration for a frame.";
  378. return WEBRTC_VIDEO_CODEC_ERROR;
  379. }
  380. // Convert input frame to I420, if needed.
  381. VideoFrame prepped_input_frame = frame;
  382. if (prepped_input_frame.video_frame_buffer()->type() !=
  383. VideoFrameBuffer::Type::kI420) {
  384. rtc::scoped_refptr<I420BufferInterface> converted_buffer(
  385. prepped_input_frame.video_frame_buffer()->ToI420());
  386. prepped_input_frame = VideoFrame(converted_buffer, frame.timestamp(),
  387. frame.render_time_ms(), frame.rotation());
  388. }
  389. // Set frame_for_encode_ data pointers and strides.
  390. auto i420_buffer = prepped_input_frame.video_frame_buffer()->GetI420();
  391. frame_for_encode_->planes[AOM_PLANE_Y] =
  392. const_cast<unsigned char*>(i420_buffer->DataY());
  393. frame_for_encode_->planes[AOM_PLANE_U] =
  394. const_cast<unsigned char*>(i420_buffer->DataU());
  395. frame_for_encode_->planes[AOM_PLANE_V] =
  396. const_cast<unsigned char*>(i420_buffer->DataV());
  397. frame_for_encode_->stride[AOM_PLANE_Y] = i420_buffer->StrideY();
  398. frame_for_encode_->stride[AOM_PLANE_U] = i420_buffer->StrideU();
  399. frame_for_encode_->stride[AOM_PLANE_V] = i420_buffer->StrideV();
  400. const uint32_t duration =
  401. kRtpTicksPerSecond / static_cast<float>(encoder_settings_.maxFramerate);
  402. for (ScalableVideoController::LayerFrameConfig& layer_frame : layer_frames) {
  403. aom_enc_frame_flags_t flags =
  404. layer_frame.IsKeyframe() ? AOM_EFLAG_FORCE_KF : 0;
  405. if (SvcEnabled()) {
  406. SetSvcLayerId(layer_frame);
  407. SetSvcRefFrameConfig(layer_frame);
  408. }
  409. // Encode a frame.
  410. aom_codec_err_t ret = aom_codec_encode(&ctx_, frame_for_encode_,
  411. frame.timestamp(), duration, flags);
  412. if (ret != AOM_CODEC_OK) {
  413. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::Encode returned " << ret
  414. << " on aom_codec_encode.";
  415. return WEBRTC_VIDEO_CODEC_ERROR;
  416. }
  417. // Get encoded image data.
  418. EncodedImage encoded_image;
  419. encoded_image._completeFrame = true;
  420. aom_codec_iter_t iter = nullptr;
  421. int data_pkt_count = 0;
  422. while (const aom_codec_cx_pkt_t* pkt =
  423. aom_codec_get_cx_data(&ctx_, &iter)) {
  424. if (pkt->kind == AOM_CODEC_CX_FRAME_PKT && pkt->data.frame.sz > 0) {
  425. if (data_pkt_count > 0) {
  426. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::Encoder returned more than "
  427. "one data packet for an input video frame.";
  428. Release();
  429. }
  430. encoded_image.SetEncodedData(EncodedImageBuffer::Create(
  431. /*data=*/static_cast<const uint8_t*>(pkt->data.frame.buf),
  432. /*size=*/pkt->data.frame.sz));
  433. if ((pkt->data.frame.flags & AOM_EFLAG_FORCE_KF) != 0) {
  434. layer_frame.Keyframe();
  435. }
  436. encoded_image._frameType = layer_frame.IsKeyframe()
  437. ? VideoFrameType::kVideoFrameKey
  438. : VideoFrameType::kVideoFrameDelta;
  439. encoded_image.SetTimestamp(frame.timestamp());
  440. encoded_image.capture_time_ms_ = frame.render_time_ms();
  441. encoded_image.rotation_ = frame.rotation();
  442. encoded_image.content_type_ = VideoContentType::UNSPECIFIED;
  443. // If encoded image width/height info are added to aom_codec_cx_pkt_t,
  444. // use those values in lieu of the values in frame.
  445. encoded_image._encodedHeight = frame.height();
  446. encoded_image._encodedWidth = frame.width();
  447. encoded_image.timing_.flags = VideoSendTiming::kInvalid;
  448. int qp = -1;
  449. ret = aom_codec_control(&ctx_, AOME_GET_LAST_QUANTIZER, &qp);
  450. if (ret != AOM_CODEC_OK) {
  451. RTC_LOG(LS_WARNING) << "LibaomAv1Encoder::Encode returned " << ret
  452. << " on control AOME_GET_LAST_QUANTIZER.";
  453. return WEBRTC_VIDEO_CODEC_ERROR;
  454. }
  455. encoded_image.qp_ = qp;
  456. encoded_image.SetColorSpace(frame.color_space());
  457. ++data_pkt_count;
  458. }
  459. }
  460. // Deliver encoded image data.
  461. if (encoded_image.size() > 0) {
  462. CodecSpecificInfo codec_specific_info;
  463. codec_specific_info.codecType = kVideoCodecAV1;
  464. bool is_keyframe = layer_frame.IsKeyframe();
  465. codec_specific_info.generic_frame_info =
  466. svc_controller_->OnEncodeDone(std::move(layer_frame));
  467. if (is_keyframe && codec_specific_info.generic_frame_info) {
  468. codec_specific_info.template_structure =
  469. svc_controller_->DependencyStructure();
  470. auto& resolutions = codec_specific_info.template_structure->resolutions;
  471. if (SvcEnabled()) {
  472. resolutions.resize(svc_params_->number_spatial_layers);
  473. for (int sid = 0; sid < svc_params_->number_spatial_layers; ++sid) {
  474. int n = svc_params_->scaling_factor_num[sid];
  475. int d = svc_params_->scaling_factor_den[sid];
  476. resolutions[sid] =
  477. RenderResolution(cfg_.g_w * n / d, cfg_.g_h * n / d);
  478. }
  479. } else {
  480. resolutions = {RenderResolution(cfg_.g_w, cfg_.g_h)};
  481. }
  482. }
  483. encoded_image_callback_->OnEncodedImage(encoded_image,
  484. &codec_specific_info);
  485. }
  486. }
  487. return WEBRTC_VIDEO_CODEC_OK;
  488. }
  489. void LibaomAv1Encoder::SetRates(const RateControlParameters& parameters) {
  490. if (!inited_) {
  491. RTC_LOG(LS_WARNING) << "SetRates() while encoder is not initialized";
  492. return;
  493. }
  494. if (parameters.framerate_fps < kMinimumFrameRate) {
  495. RTC_LOG(LS_WARNING) << "Unsupported framerate (must be >= "
  496. << kMinimumFrameRate
  497. << " ): " << parameters.framerate_fps;
  498. return;
  499. }
  500. if (parameters.bitrate.get_sum_bps() == 0) {
  501. RTC_LOG(LS_WARNING) << "Attempt to set target bit rate to zero";
  502. return;
  503. }
  504. // Check input target bit rate value.
  505. uint32_t rc_target_bitrate_kbps = parameters.bitrate.get_sum_kbps();
  506. if (encoder_settings_.maxBitrate > 0)
  507. RTC_DCHECK_LE(rc_target_bitrate_kbps, encoder_settings_.maxBitrate);
  508. RTC_DCHECK_GE(rc_target_bitrate_kbps, encoder_settings_.minBitrate);
  509. svc_controller_->OnRatesUpdated(parameters.bitrate);
  510. // Set target bit rate.
  511. cfg_.rc_target_bitrate = rc_target_bitrate_kbps;
  512. if (SvcEnabled()) {
  513. for (int sid = 0; sid < svc_params_->number_spatial_layers; ++sid) {
  514. // libaom bitrate for spatial id S and temporal id T means bitrate
  515. // of frames with spatial_id=S and temporal_id<=T
  516. // while `parameters.bitrate` provdies bitrate of frames with
  517. // spatial_id=S and temporal_id=T
  518. int accumulated_bitrate_bps = 0;
  519. for (int tid = 0; tid < svc_params_->number_temporal_layers; ++tid) {
  520. int layer_index = sid * svc_params_->number_temporal_layers + tid;
  521. accumulated_bitrate_bps += parameters.bitrate.GetBitrate(sid, tid);
  522. // `svc_params.layer_target_bitrate` expects bitrate in kbps.
  523. svc_params_->layer_target_bitrate[layer_index] =
  524. accumulated_bitrate_bps / 1000;
  525. }
  526. }
  527. aom_codec_control(&ctx_, AV1E_SET_SVC_PARAMS, &*svc_params_);
  528. }
  529. // Set frame rate to closest integer value.
  530. encoder_settings_.maxFramerate =
  531. static_cast<uint32_t>(parameters.framerate_fps + 0.5);
  532. // Update encoder context.
  533. aom_codec_err_t error_code = aom_codec_enc_config_set(&ctx_, &cfg_);
  534. if (error_code != AOM_CODEC_OK) {
  535. RTC_LOG(LS_WARNING) << "Error configuring encoder, error code: "
  536. << error_code;
  537. }
  538. }
  539. VideoEncoder::EncoderInfo LibaomAv1Encoder::GetEncoderInfo() const {
  540. EncoderInfo info;
  541. info.supports_native_handle = false;
  542. info.implementation_name = "libaom";
  543. info.has_trusted_rate_controller = true;
  544. info.is_hardware_accelerated = false;
  545. info.scaling_settings = VideoEncoder::ScalingSettings(kMinQindex, kMaxQindex);
  546. return info;
  547. }
  548. } // namespace
  549. const bool kIsLibaomAv1EncoderSupported = true;
  550. std::unique_ptr<VideoEncoder> CreateLibaomAv1Encoder() {
  551. return std::make_unique<LibaomAv1Encoder>(
  552. std::make_unique<ScalableVideoControllerNoLayering>());
  553. }
  554. std::unique_ptr<VideoEncoder> CreateLibaomAv1Encoder(
  555. std::unique_ptr<ScalableVideoController> svc_controller) {
  556. return std::make_unique<LibaomAv1Encoder>(std::move(svc_controller));
  557. }
  558. } // namespace webrtc