util.cpp 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402
  1. #include "util.h"
  2. #include <c10/util/Logging.h>
  3. namespace ffmpeg {
  4. namespace Serializer {
  5. // fixed size types
  6. template <typename T>
  7. inline size_t getSize(const T& x) {
  8. return sizeof(x);
  9. }
  10. template <typename T>
  11. inline bool serializeItem(
  12. uint8_t* dest,
  13. size_t len,
  14. size_t& pos,
  15. const T& src) {
  16. VLOG(6) << "Generic serializeItem";
  17. const auto required = sizeof(src);
  18. if (len < pos + required) {
  19. return false;
  20. }
  21. memcpy(dest + pos, &src, required);
  22. pos += required;
  23. return true;
  24. }
  25. template <typename T>
  26. inline bool deserializeItem(
  27. const uint8_t* src,
  28. size_t len,
  29. size_t& pos,
  30. T& dest) {
  31. const auto required = sizeof(dest);
  32. if (len < pos + required) {
  33. return false;
  34. }
  35. memcpy(&dest, src + pos, required);
  36. pos += required;
  37. return true;
  38. }
  39. // AVSubtitleRect specialization
  40. inline size_t getSize(const AVSubtitleRect& x) {
  41. auto rectBytes = [](const AVSubtitleRect& y) -> size_t {
  42. size_t s = 0;
  43. switch (y.type) {
  44. case SUBTITLE_BITMAP:
  45. for (int i = 0; i < y.nb_colors; ++i) {
  46. s += sizeof(y.linesize[i]);
  47. s += y.linesize[i];
  48. }
  49. break;
  50. case SUBTITLE_TEXT:
  51. s += sizeof(size_t);
  52. s += strlen(y.text);
  53. break;
  54. case SUBTITLE_ASS:
  55. s += sizeof(size_t);
  56. s += strlen(y.ass);
  57. break;
  58. default:
  59. break;
  60. }
  61. return s;
  62. };
  63. return getSize(x.x) + getSize(x.y) + getSize(x.w) + getSize(x.h) +
  64. getSize(x.nb_colors) + getSize(x.type) + getSize(x.flags) + rectBytes(x);
  65. }
  66. // AVSubtitle specialization
  67. inline size_t getSize(const AVSubtitle& x) {
  68. auto rectBytes = [](const AVSubtitle& y) -> size_t {
  69. size_t s = getSize(y.num_rects);
  70. for (unsigned i = 0; i < y.num_rects; ++i) {
  71. s += getSize(*y.rects[i]);
  72. }
  73. return s;
  74. };
  75. return getSize(x.format) + getSize(x.start_display_time) +
  76. getSize(x.end_display_time) + getSize(x.pts) + rectBytes(x);
  77. }
  78. inline bool serializeItem(
  79. uint8_t* dest,
  80. size_t len,
  81. size_t& pos,
  82. const AVSubtitleRect& src) {
  83. auto rectSerialize =
  84. [](uint8_t* d, size_t l, size_t& p, const AVSubtitleRect& x) -> size_t {
  85. switch (x.type) {
  86. case SUBTITLE_BITMAP:
  87. for (int i = 0; i < x.nb_colors; ++i) {
  88. if (!serializeItem(d, l, p, x.linesize[i])) {
  89. return false;
  90. }
  91. if (p + x.linesize[i] > l) {
  92. return false;
  93. }
  94. memcpy(d + p, x.data[i], x.linesize[i]);
  95. p += x.linesize[i];
  96. }
  97. return true;
  98. case SUBTITLE_TEXT: {
  99. const size_t s = strlen(x.text);
  100. if (!serializeItem(d, l, p, s)) {
  101. return false;
  102. }
  103. if (p + s > l) {
  104. return false;
  105. }
  106. memcpy(d + p, x.text, s);
  107. p += s;
  108. return true;
  109. }
  110. case SUBTITLE_ASS: {
  111. const size_t s = strlen(x.ass);
  112. if (!serializeItem(d, l, p, s)) {
  113. return false;
  114. }
  115. if (p + s > l) {
  116. return false;
  117. }
  118. memcpy(d + p, x.ass, s);
  119. p += s;
  120. return true;
  121. }
  122. default:
  123. return true;
  124. }
  125. };
  126. return serializeItem(dest, len, pos, src.x) &&
  127. serializeItem(dest, len, pos, src.y) &&
  128. serializeItem(dest, len, pos, src.w) &&
  129. serializeItem(dest, len, pos, src.h) &&
  130. serializeItem(dest, len, pos, src.nb_colors) &&
  131. serializeItem(dest, len, pos, src.type) &&
  132. serializeItem(dest, len, pos, src.flags) &&
  133. rectSerialize(dest, len, pos, src);
  134. }
  135. inline bool serializeItem(
  136. uint8_t* dest,
  137. size_t len,
  138. size_t& pos,
  139. const AVSubtitle& src) {
  140. auto rectSerialize =
  141. [](uint8_t* d, size_t l, size_t& p, const AVSubtitle& x) -> bool {
  142. bool res = serializeItem(d, l, p, x.num_rects);
  143. for (unsigned i = 0; res && i < x.num_rects; ++i) {
  144. res = serializeItem(d, l, p, *(x.rects[i]));
  145. }
  146. return res;
  147. };
  148. VLOG(6) << "AVSubtitle serializeItem";
  149. return serializeItem(dest, len, pos, src.format) &&
  150. serializeItem(dest, len, pos, src.start_display_time) &&
  151. serializeItem(dest, len, pos, src.end_display_time) &&
  152. serializeItem(dest, len, pos, src.pts) &&
  153. rectSerialize(dest, len, pos, src);
  154. }
  155. inline bool deserializeItem(
  156. const uint8_t* src,
  157. size_t len,
  158. size_t& pos,
  159. AVSubtitleRect& dest) {
  160. auto rectDeserialize =
  161. [](const uint8_t* y, size_t l, size_t& p, AVSubtitleRect& x) -> bool {
  162. switch (x.type) {
  163. case SUBTITLE_BITMAP:
  164. for (int i = 0; i < x.nb_colors; ++i) {
  165. if (!deserializeItem(y, l, p, x.linesize[i])) {
  166. return false;
  167. }
  168. if (p + x.linesize[i] > l) {
  169. return false;
  170. }
  171. x.data[i] = (uint8_t*)av_malloc(x.linesize[i]);
  172. memcpy(x.data[i], y + p, x.linesize[i]);
  173. p += x.linesize[i];
  174. }
  175. return true;
  176. case SUBTITLE_TEXT: {
  177. size_t s = 0;
  178. if (!deserializeItem(y, l, p, s)) {
  179. return false;
  180. }
  181. if (p + s > l) {
  182. return false;
  183. }
  184. x.text = (char*)av_malloc(s + 1);
  185. memcpy(x.text, y + p, s);
  186. x.text[s] = 0;
  187. p += s;
  188. return true;
  189. }
  190. case SUBTITLE_ASS: {
  191. size_t s = 0;
  192. if (!deserializeItem(y, l, p, s)) {
  193. return false;
  194. }
  195. if (p + s > l) {
  196. return false;
  197. }
  198. x.ass = (char*)av_malloc(s + 1);
  199. memcpy(x.ass, y + p, s);
  200. x.ass[s] = 0;
  201. p += s;
  202. return true;
  203. }
  204. default:
  205. return true;
  206. }
  207. };
  208. return deserializeItem(src, len, pos, dest.x) &&
  209. deserializeItem(src, len, pos, dest.y) &&
  210. deserializeItem(src, len, pos, dest.w) &&
  211. deserializeItem(src, len, pos, dest.h) &&
  212. deserializeItem(src, len, pos, dest.nb_colors) &&
  213. deserializeItem(src, len, pos, dest.type) &&
  214. deserializeItem(src, len, pos, dest.flags) &&
  215. rectDeserialize(src, len, pos, dest);
  216. }
  217. inline bool deserializeItem(
  218. const uint8_t* src,
  219. size_t len,
  220. size_t& pos,
  221. AVSubtitle& dest) {
  222. auto rectDeserialize =
  223. [](const uint8_t* y, size_t l, size_t& p, AVSubtitle& x) -> bool {
  224. bool res = deserializeItem(y, l, p, x.num_rects);
  225. if (res && x.num_rects) {
  226. x.rects =
  227. (AVSubtitleRect**)av_malloc(x.num_rects * sizeof(AVSubtitleRect*));
  228. }
  229. for (unsigned i = 0; res && i < x.num_rects; ++i) {
  230. x.rects[i] = (AVSubtitleRect*)av_malloc(sizeof(AVSubtitleRect));
  231. memset(x.rects[i], 0, sizeof(AVSubtitleRect));
  232. res = deserializeItem(y, l, p, *x.rects[i]);
  233. }
  234. return res;
  235. };
  236. return deserializeItem(src, len, pos, dest.format) &&
  237. deserializeItem(src, len, pos, dest.start_display_time) &&
  238. deserializeItem(src, len, pos, dest.end_display_time) &&
  239. deserializeItem(src, len, pos, dest.pts) &&
  240. rectDeserialize(src, len, pos, dest);
  241. }
  242. } // namespace Serializer
  243. namespace Util {
  244. std::string generateErrorDesc(int errorCode) {
  245. std::array<char, 1024> buffer;
  246. if (av_strerror(errorCode, buffer.data(), buffer.size()) < 0) {
  247. return std::string("Unknown error code: ") + std::to_string(errorCode);
  248. }
  249. buffer.back() = 0;
  250. return std::string(buffer.data());
  251. }
  252. size_t serialize(const AVSubtitle& sub, ByteStorage* out) {
  253. const auto len = size(sub);
  254. TORCH_CHECK_LE(len, out->tail());
  255. size_t pos = 0;
  256. if (!Serializer::serializeItem(out->writableTail(), len, pos, sub)) {
  257. return 0;
  258. }
  259. out->append(len);
  260. return len;
  261. }
  262. bool deserialize(const ByteStorage& buf, AVSubtitle* sub) {
  263. size_t pos = 0;
  264. return Serializer::deserializeItem(buf.data(), buf.length(), pos, *sub);
  265. }
  266. size_t size(const AVSubtitle& sub) {
  267. return Serializer::getSize(sub);
  268. }
  269. bool validateVideoFormat(const VideoFormat& f) {
  270. // clang-format off
  271. /*
  272. Valid parameters values for decoder
  273. ____________________________________________________________________________________
  274. | W | H | minDimension | maxDimension | cropImage | algorithm |
  275. |__________________________________________________________________________________|
  276. | 0 | 0 | 0 | 0 | N/A | original |
  277. |__________________________________________________________________________________|
  278. | >0 | 0 | N/A | N/A | N/A | scale keeping W |
  279. |__________________________________________________________________________________|
  280. | 0 | >0 | N/A | N/A | N/A | scale keeping H |
  281. |__________________________________________________________________________________|
  282. | >0 | >0 | N/A | N/A | 0 | stretch/scale |
  283. |__________________________________________________________________________________|
  284. | >0 | >0 | N/A | N/A | >0 | scale/crop |
  285. |__________________________________________________________________________________|
  286. | 0 | 0 | >0 | 0 | N/A |scale to min dimension |
  287. |__________________________________________________________________________________|
  288. | 0 | 0 | 0 | >0 | N/A |scale to max dimension |
  289. |__________________________________________________________________________________|
  290. | 0 | 0 | >0 | >0 | N/A |stretch to min/max dimension|
  291. |_____|_____|______________|______________|___________|____________________________|
  292. */
  293. // clang-format on
  294. return (f.width == 0 && // #1, #6, #7 and #8
  295. f.height == 0 && f.cropImage == 0) ||
  296. (f.width != 0 && // #4 and #5
  297. f.height != 0 && f.minDimension == 0 && f.maxDimension == 0) ||
  298. (((f.width != 0 && // #2
  299. f.height == 0) ||
  300. (f.width == 0 && // #3
  301. f.height != 0)) &&
  302. f.minDimension == 0 && f.maxDimension == 0 && f.cropImage == 0);
  303. }
  304. void setFormatDimensions(
  305. size_t& destW,
  306. size_t& destH,
  307. size_t userW,
  308. size_t userH,
  309. size_t srcW,
  310. size_t srcH,
  311. size_t minDimension,
  312. size_t maxDimension,
  313. size_t cropImage) {
  314. // rounding rules
  315. // int -> double -> round up
  316. // if fraction is >= 0.5 or round down if fraction is < 0.5
  317. // int result = double(value) + 0.5
  318. // here we rounding double to int according to the above rule
  319. // #1, #6, #7 and #8
  320. if (userW == 0 && userH == 0) {
  321. if (minDimension > 0 && maxDimension == 0) { // #6
  322. if (srcW > srcH) {
  323. // landscape
  324. destH = minDimension;
  325. destW = round(double(srcW * minDimension) / srcH);
  326. } else {
  327. // portrait
  328. destW = minDimension;
  329. destH = round(double(srcH * minDimension) / srcW);
  330. }
  331. } else if (minDimension == 0 && maxDimension > 0) { // #7
  332. if (srcW > srcH) {
  333. // landscape
  334. destW = maxDimension;
  335. destH = round(double(srcH * maxDimension) / srcW);
  336. } else {
  337. // portrait
  338. destH = maxDimension;
  339. destW = round(double(srcW * maxDimension) / srcH);
  340. }
  341. } else if (minDimension > 0 && maxDimension > 0) { // #8
  342. if (srcW > srcH) {
  343. // landscape
  344. destW = maxDimension;
  345. destH = minDimension;
  346. } else {
  347. // portrait
  348. destW = minDimension;
  349. destH = maxDimension;
  350. }
  351. } else { // #1
  352. destW = srcW;
  353. destH = srcH;
  354. }
  355. } else if (userW != 0 && userH == 0) { // #2
  356. destW = userW;
  357. destH = round(double(srcH * userW) / srcW);
  358. } else if (userW == 0 && userH != 0) { // #3
  359. destW = round(double(srcW * userH) / srcH);
  360. destH = userH;
  361. } else { // userW != 0 && userH != 0
  362. if (cropImage == 0) { // #4
  363. destW = userW;
  364. destH = userH;
  365. } else { // #5
  366. double userSlope = double(userH) / userW;
  367. double srcSlope = double(srcH) / srcW;
  368. if (srcSlope < userSlope) {
  369. destW = round(double(srcW * userH) / srcH);
  370. destH = userH;
  371. } else {
  372. destW = userW;
  373. destH = round(double(srcH * userW) / srcW);
  374. }
  375. }
  376. }
  377. // prevent zeros
  378. destW = std::max(destW, size_t(1UL));
  379. destH = std::max(destH, size_t(1UL));
  380. }
  381. } // namespace Util
  382. } // namespace ffmpeg