You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

492 lines
18KB

  1. /*
  2. * Copyright (c) 2018 Ronald S. Bultje <rsbultje gmail com>
  3. * Copyright (c) 2018 James Almer <jamrial gmail com>
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include <dav1d/dav1d.h>
  22. #include "libavutil/avassert.h"
  23. #include "libavutil/film_grain_params.h"
  24. #include "libavutil/mastering_display_metadata.h"
  25. #include "libavutil/imgutils.h"
  26. #include "libavutil/opt.h"
  27. #include "atsc_a53.h"
  28. #include "avcodec.h"
  29. #include "bytestream.h"
  30. #include "decode.h"
  31. #include "internal.h"
  32. typedef struct Libdav1dContext {
  33. AVClass *class;
  34. Dav1dContext *c;
  35. AVBufferPool *pool;
  36. int pool_size;
  37. Dav1dData data;
  38. int tile_threads;
  39. int frame_threads;
  40. int apply_grain;
  41. int operating_point;
  42. int all_layers;
  43. } Libdav1dContext;
  44. static const enum AVPixelFormat pix_fmt[][3] = {
  45. [DAV1D_PIXEL_LAYOUT_I400] = { AV_PIX_FMT_GRAY8, AV_PIX_FMT_GRAY10, AV_PIX_FMT_GRAY12 },
  46. [DAV1D_PIXEL_LAYOUT_I420] = { AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUV420P10, AV_PIX_FMT_YUV420P12 },
  47. [DAV1D_PIXEL_LAYOUT_I422] = { AV_PIX_FMT_YUV422P, AV_PIX_FMT_YUV422P10, AV_PIX_FMT_YUV422P12 },
  48. [DAV1D_PIXEL_LAYOUT_I444] = { AV_PIX_FMT_YUV444P, AV_PIX_FMT_YUV444P10, AV_PIX_FMT_YUV444P12 },
  49. };
  50. static const enum AVPixelFormat pix_fmt_rgb[3] = {
  51. AV_PIX_FMT_GBRP, AV_PIX_FMT_GBRP10, AV_PIX_FMT_GBRP12,
  52. };
  53. static void libdav1d_log_callback(void *opaque, const char *fmt, va_list vl)
  54. {
  55. AVCodecContext *c = opaque;
  56. av_vlog(c, AV_LOG_ERROR, fmt, vl);
  57. }
  58. static int libdav1d_picture_allocator(Dav1dPicture *p, void *cookie)
  59. {
  60. Libdav1dContext *dav1d = cookie;
  61. enum AVPixelFormat format = pix_fmt[p->p.layout][p->seq_hdr->hbd];
  62. int ret, linesize[4], h = FFALIGN(p->p.h, 128), w = FFALIGN(p->p.w, 128);
  63. uint8_t *aligned_ptr, *data[4];
  64. AVBufferRef *buf;
  65. ret = av_image_get_buffer_size(format, w, h, DAV1D_PICTURE_ALIGNMENT);
  66. if (ret < 0)
  67. return ret;
  68. if (ret != dav1d->pool_size) {
  69. av_buffer_pool_uninit(&dav1d->pool);
  70. // Use twice the amount of required padding bytes for aligned_ptr below.
  71. dav1d->pool = av_buffer_pool_init(ret + DAV1D_PICTURE_ALIGNMENT * 2, NULL);
  72. if (!dav1d->pool) {
  73. dav1d->pool_size = 0;
  74. return AVERROR(ENOMEM);
  75. }
  76. dav1d->pool_size = ret;
  77. }
  78. buf = av_buffer_pool_get(dav1d->pool);
  79. if (!buf)
  80. return AVERROR(ENOMEM);
  81. // libdav1d requires DAV1D_PICTURE_ALIGNMENT aligned buffers, which av_malloc()
  82. // doesn't guarantee for example when AVX is disabled at configure time.
  83. // Use the extra DAV1D_PICTURE_ALIGNMENT padding bytes in the buffer to align it
  84. // if required.
  85. aligned_ptr = (uint8_t *)FFALIGN((uintptr_t)buf->data, DAV1D_PICTURE_ALIGNMENT);
  86. ret = av_image_fill_arrays(data, linesize, aligned_ptr, format, w, h,
  87. DAV1D_PICTURE_ALIGNMENT);
  88. if (ret < 0) {
  89. av_buffer_unref(&buf);
  90. return ret;
  91. }
  92. p->data[0] = data[0];
  93. p->data[1] = data[1];
  94. p->data[2] = data[2];
  95. p->stride[0] = linesize[0];
  96. p->stride[1] = linesize[1];
  97. p->allocator_data = buf;
  98. return 0;
  99. }
  100. static void libdav1d_picture_release(Dav1dPicture *p, void *cookie)
  101. {
  102. AVBufferRef *buf = p->allocator_data;
  103. av_buffer_unref(&buf);
  104. }
  105. static av_cold int libdav1d_init(AVCodecContext *c)
  106. {
  107. Libdav1dContext *dav1d = c->priv_data;
  108. Dav1dSettings s;
  109. int threads = (c->thread_count ? c->thread_count : av_cpu_count()) * 3 / 2;
  110. int res;
  111. av_log(c, AV_LOG_INFO, "libdav1d %s\n", dav1d_version());
  112. dav1d_default_settings(&s);
  113. s.logger.cookie = c;
  114. s.logger.callback = libdav1d_log_callback;
  115. s.allocator.cookie = dav1d;
  116. s.allocator.alloc_picture_callback = libdav1d_picture_allocator;
  117. s.allocator.release_picture_callback = libdav1d_picture_release;
  118. s.frame_size_limit = c->max_pixels;
  119. if (dav1d->apply_grain >= 0)
  120. s.apply_grain = dav1d->apply_grain;
  121. else if (c->export_side_data & AV_CODEC_EXPORT_DATA_FILM_GRAIN)
  122. s.apply_grain = 0;
  123. s.all_layers = dav1d->all_layers;
  124. if (dav1d->operating_point >= 0)
  125. s.operating_point = dav1d->operating_point;
  126. s.n_tile_threads = dav1d->tile_threads
  127. ? dav1d->tile_threads
  128. : FFMIN(floor(sqrt(threads)), DAV1D_MAX_TILE_THREADS);
  129. s.n_frame_threads = dav1d->frame_threads
  130. ? dav1d->frame_threads
  131. : FFMIN(ceil(threads / s.n_tile_threads), DAV1D_MAX_FRAME_THREADS);
  132. av_log(c, AV_LOG_DEBUG, "Using %d frame threads, %d tile threads\n",
  133. s.n_frame_threads, s.n_tile_threads);
  134. res = dav1d_open(&dav1d->c, &s);
  135. if (res < 0)
  136. return AVERROR(ENOMEM);
  137. return 0;
  138. }
  139. static void libdav1d_flush(AVCodecContext *c)
  140. {
  141. Libdav1dContext *dav1d = c->priv_data;
  142. dav1d_data_unref(&dav1d->data);
  143. dav1d_flush(dav1d->c);
  144. }
  145. static void libdav1d_data_free(const uint8_t *data, void *opaque) {
  146. AVBufferRef *buf = opaque;
  147. av_buffer_unref(&buf);
  148. }
  /**
   * Free callback registered with dav1d_data_wrap_user_data(): frees the
   * heap copy of reordered_opaque. The same pointer is registered both as
   * the data and as the opaque argument, which is asserted here.
   *
   * @param data   user data pointer
   * @param opaque must be the same pointer as data
   */
  static void libdav1d_user_data_free(const uint8_t *data, void *opaque)
  {
      av_assert0(data == opaque);

      av_free(opaque);
  }
  153. static int libdav1d_receive_frame(AVCodecContext *c, AVFrame *frame)
  154. {
  155. Libdav1dContext *dav1d = c->priv_data;
  156. Dav1dData *data = &dav1d->data;
  157. Dav1dPicture pic = { 0 }, *p = &pic;
  158. int res;
  159. if (!data->sz) {
  160. AVPacket pkt = { 0 };
  161. res = ff_decode_get_packet(c, &pkt);
  162. if (res < 0 && res != AVERROR_EOF)
  163. return res;
  164. if (pkt.size) {
  165. res = dav1d_data_wrap(data, pkt.data, pkt.size, libdav1d_data_free, pkt.buf);
  166. if (res < 0) {
  167. av_packet_unref(&pkt);
  168. return res;
  169. }
  170. data->m.timestamp = pkt.pts;
  171. data->m.offset = pkt.pos;
  172. data->m.duration = pkt.duration;
  173. pkt.buf = NULL;
  174. av_packet_unref(&pkt);
  175. if (c->reordered_opaque != AV_NOPTS_VALUE) {
  176. uint8_t *reordered_opaque = av_malloc(sizeof(c->reordered_opaque));
  177. if (!reordered_opaque) {
  178. dav1d_data_unref(data);
  179. return AVERROR(ENOMEM);
  180. }
  181. memcpy(reordered_opaque, &c->reordered_opaque, sizeof(c->reordered_opaque));
  182. res = dav1d_data_wrap_user_data(data, reordered_opaque,
  183. libdav1d_user_data_free, reordered_opaque);
  184. if (res < 0) {
  185. av_free(reordered_opaque);
  186. dav1d_data_unref(data);
  187. return res;
  188. }
  189. }
  190. }
  191. }
  192. res = dav1d_send_data(dav1d->c, data);
  193. if (res < 0) {
  194. if (res == AVERROR(EINVAL))
  195. res = AVERROR_INVALIDDATA;
  196. if (res != AVERROR(EAGAIN))
  197. return res;
  198. }
  199. res = dav1d_get_picture(dav1d->c, p);
  200. if (res < 0) {
  201. if (res == AVERROR(EINVAL))
  202. res = AVERROR_INVALIDDATA;
  203. else if (res == AVERROR(EAGAIN) && c->internal->draining)
  204. res = AVERROR_EOF;
  205. return res;
  206. }
  207. av_assert0(p->data[0] && p->allocator_data);
  208. // This requires the custom allocator above
  209. frame->buf[0] = av_buffer_ref(p->allocator_data);
  210. if (!frame->buf[0]) {
  211. dav1d_picture_unref(p);
  212. return AVERROR(ENOMEM);
  213. }
  214. frame->data[0] = p->data[0];
  215. frame->data[1] = p->data[1];
  216. frame->data[2] = p->data[2];
  217. frame->linesize[0] = p->stride[0];
  218. frame->linesize[1] = p->stride[1];
  219. frame->linesize[2] = p->stride[1];
  220. c->profile = p->seq_hdr->profile;
  221. c->level = ((p->seq_hdr->operating_points[0].major_level - 2) << 2)
  222. | p->seq_hdr->operating_points[0].minor_level;
  223. frame->width = p->p.w;
  224. frame->height = p->p.h;
  225. if (c->width != p->p.w || c->height != p->p.h) {
  226. res = ff_set_dimensions(c, p->p.w, p->p.h);
  227. if (res < 0)
  228. goto fail;
  229. }
  230. av_reduce(&frame->sample_aspect_ratio.num,
  231. &frame->sample_aspect_ratio.den,
  232. frame->height * (int64_t)p->frame_hdr->render_width,
  233. frame->width * (int64_t)p->frame_hdr->render_height,
  234. INT_MAX);
  235. ff_set_sar(c, frame->sample_aspect_ratio);
  236. switch (p->seq_hdr->chr) {
  237. case DAV1D_CHR_VERTICAL:
  238. frame->chroma_location = c->chroma_sample_location = AVCHROMA_LOC_LEFT;
  239. break;
  240. case DAV1D_CHR_COLOCATED:
  241. frame->chroma_location = c->chroma_sample_location = AVCHROMA_LOC_TOPLEFT;
  242. break;
  243. }
  244. frame->colorspace = c->colorspace = (enum AVColorSpace) p->seq_hdr->mtrx;
  245. frame->color_primaries = c->color_primaries = (enum AVColorPrimaries) p->seq_hdr->pri;
  246. frame->color_trc = c->color_trc = (enum AVColorTransferCharacteristic) p->seq_hdr->trc;
  247. frame->color_range = c->color_range = p->seq_hdr->color_range ? AVCOL_RANGE_JPEG : AVCOL_RANGE_MPEG;
  248. if (p->p.layout == DAV1D_PIXEL_LAYOUT_I444 &&
  249. p->seq_hdr->mtrx == DAV1D_MC_IDENTITY &&
  250. p->seq_hdr->pri == DAV1D_COLOR_PRI_BT709 &&
  251. p->seq_hdr->trc == DAV1D_TRC_SRGB)
  252. frame->format = c->pix_fmt = pix_fmt_rgb[p->seq_hdr->hbd];
  253. else
  254. frame->format = c->pix_fmt = pix_fmt[p->p.layout][p->seq_hdr->hbd];
  255. if (p->m.user_data.data)
  256. memcpy(&frame->reordered_opaque, p->m.user_data.data, sizeof(frame->reordered_opaque));
  257. else
  258. frame->reordered_opaque = AV_NOPTS_VALUE;
  259. if (p->seq_hdr->num_units_in_tick && p->seq_hdr->time_scale) {
  260. av_reduce(&c->framerate.den, &c->framerate.num,
  261. p->seq_hdr->num_units_in_tick, p->seq_hdr->time_scale, INT_MAX);
  262. if (p->seq_hdr->equal_picture_interval)
  263. c->ticks_per_frame = p->seq_hdr->num_ticks_per_picture;
  264. }
  265. // match timestamps and packet size
  266. frame->pts = frame->best_effort_timestamp = p->m.timestamp;
  267. #if FF_API_PKT_PTS
  268. FF_DISABLE_DEPRECATION_WARNINGS
  269. frame->pkt_pts = p->m.timestamp;
  270. FF_ENABLE_DEPRECATION_WARNINGS
  271. #endif
  272. frame->pkt_dts = p->m.timestamp;
  273. frame->pkt_pos = p->m.offset;
  274. frame->pkt_size = p->m.size;
  275. frame->pkt_duration = p->m.duration;
  276. frame->key_frame = p->frame_hdr->frame_type == DAV1D_FRAME_TYPE_KEY;
  277. switch (p->frame_hdr->frame_type) {
  278. case DAV1D_FRAME_TYPE_KEY:
  279. case DAV1D_FRAME_TYPE_INTRA:
  280. frame->pict_type = AV_PICTURE_TYPE_I;
  281. break;
  282. case DAV1D_FRAME_TYPE_INTER:
  283. frame->pict_type = AV_PICTURE_TYPE_P;
  284. break;
  285. case DAV1D_FRAME_TYPE_SWITCH:
  286. frame->pict_type = AV_PICTURE_TYPE_SP;
  287. break;
  288. default:
  289. res = AVERROR_INVALIDDATA;
  290. goto fail;
  291. }
  292. if (p->mastering_display) {
  293. AVMasteringDisplayMetadata *mastering = av_mastering_display_metadata_create_side_data(frame);
  294. if (!mastering) {
  295. res = AVERROR(ENOMEM);
  296. goto fail;
  297. }
  298. for (int i = 0; i < 3; i++) {
  299. mastering->display_primaries[i][0] = av_make_q(p->mastering_display->primaries[i][0], 1 << 16);
  300. mastering->display_primaries[i][1] = av_make_q(p->mastering_display->primaries[i][1], 1 << 16);
  301. }
  302. mastering->white_point[0] = av_make_q(p->mastering_display->white_point[0], 1 << 16);
  303. mastering->white_point[1] = av_make_q(p->mastering_display->white_point[1], 1 << 16);
  304. mastering->max_luminance = av_make_q(p->mastering_display->max_luminance, 1 << 8);
  305. mastering->min_luminance = av_make_q(p->mastering_display->min_luminance, 1 << 14);
  306. mastering->has_primaries = 1;
  307. mastering->has_luminance = 1;
  308. }
  309. if (p->content_light) {
  310. AVContentLightMetadata *light = av_content_light_metadata_create_side_data(frame);
  311. if (!light) {
  312. res = AVERROR(ENOMEM);
  313. goto fail;
  314. }
  315. light->MaxCLL = p->content_light->max_content_light_level;
  316. light->MaxFALL = p->content_light->max_frame_average_light_level;
  317. }
  318. if (p->itut_t35) {
  319. GetByteContext gb;
  320. unsigned int user_identifier;
  321. bytestream2_init(&gb, p->itut_t35->payload, p->itut_t35->payload_size);
  322. bytestream2_skip(&gb, 1); // terminal provider code
  323. bytestream2_skip(&gb, 1); // terminal provider oriented code
  324. user_identifier = bytestream2_get_be32(&gb);
  325. switch (user_identifier) {
  326. case MKBETAG('G', 'A', '9', '4'): { // closed captions
  327. AVBufferRef *buf = NULL;
  328. res = ff_parse_a53_cc(&buf, gb.buffer, bytestream2_get_bytes_left(&gb));
  329. if (res < 0)
  330. goto fail;
  331. if (!res)
  332. break;
  333. if (!av_frame_new_side_data_from_buf(frame, AV_FRAME_DATA_A53_CC, buf))
  334. av_buffer_unref(&buf);
  335. c->properties |= FF_CODEC_PROPERTY_CLOSED_CAPTIONS;
  336. break;
  337. }
  338. default: // ignore unsupported identifiers
  339. break;
  340. }
  341. }
  342. if (p->frame_hdr->film_grain.present && (!dav1d->apply_grain ||
  343. (c->export_side_data & AV_CODEC_EXPORT_DATA_FILM_GRAIN))) {
  344. AVFilmGrainParams *fgp = av_film_grain_params_create_side_data(frame);
  345. if (!fgp) {
  346. res = AVERROR(ENOMEM);
  347. goto fail;
  348. }
  349. fgp->type = AV_FILM_GRAIN_PARAMS_AV1;
  350. fgp->seed = p->frame_hdr->film_grain.data.seed;
  351. fgp->codec.aom.num_y_points = p->frame_hdr->film_grain.data.num_y_points;
  352. fgp->codec.aom.chroma_scaling_from_luma = p->frame_hdr->film_grain.data.chroma_scaling_from_luma;
  353. fgp->codec.aom.scaling_shift = p->frame_hdr->film_grain.data.scaling_shift;
  354. fgp->codec.aom.ar_coeff_lag = p->frame_hdr->film_grain.data.ar_coeff_lag;
  355. fgp->codec.aom.ar_coeff_shift = p->frame_hdr->film_grain.data.ar_coeff_shift;
  356. fgp->codec.aom.grain_scale_shift = p->frame_hdr->film_grain.data.grain_scale_shift;
  357. fgp->codec.aom.overlap_flag = p->frame_hdr->film_grain.data.overlap_flag;
  358. fgp->codec.aom.limit_output_range = p->frame_hdr->film_grain.data.clip_to_restricted_range;
  359. memcpy(&fgp->codec.aom.y_points, &p->frame_hdr->film_grain.data.y_points,
  360. sizeof(fgp->codec.aom.y_points));
  361. memcpy(&fgp->codec.aom.num_uv_points, &p->frame_hdr->film_grain.data.num_uv_points,
  362. sizeof(fgp->codec.aom.num_uv_points));
  363. memcpy(&fgp->codec.aom.uv_points, &p->frame_hdr->film_grain.data.uv_points,
  364. sizeof(fgp->codec.aom.uv_points));
  365. memcpy(&fgp->codec.aom.ar_coeffs_y, &p->frame_hdr->film_grain.data.ar_coeffs_y,
  366. sizeof(fgp->codec.aom.ar_coeffs_y));
  367. memcpy(&fgp->codec.aom.ar_coeffs_uv[0], &p->frame_hdr->film_grain.data.ar_coeffs_uv[0],
  368. sizeof(fgp->codec.aom.ar_coeffs_uv[0]));
  369. memcpy(&fgp->codec.aom.ar_coeffs_uv[1], &p->frame_hdr->film_grain.data.ar_coeffs_uv[1],
  370. sizeof(fgp->codec.aom.ar_coeffs_uv[1]));
  371. memcpy(&fgp->codec.aom.uv_mult, &p->frame_hdr->film_grain.data.uv_mult,
  372. sizeof(fgp->codec.aom.uv_mult));
  373. memcpy(&fgp->codec.aom.uv_mult_luma, &p->frame_hdr->film_grain.data.uv_luma_mult,
  374. sizeof(fgp->codec.aom.uv_mult_luma));
  375. memcpy(&fgp->codec.aom.uv_offset, &p->frame_hdr->film_grain.data.uv_offset,
  376. sizeof(fgp->codec.aom.uv_offset));
  377. }
  378. res = 0;
  379. fail:
  380. dav1d_picture_unref(p);
  381. if (res < 0)
  382. av_frame_unref(frame);
  383. return res;
  384. }
  385. static av_cold int libdav1d_close(AVCodecContext *c)
  386. {
  387. Libdav1dContext *dav1d = c->priv_data;
  388. av_buffer_pool_uninit(&dav1d->pool);
  389. dav1d_data_unref(&dav1d->data);
  390. dav1d_close(&dav1d->c);
  391. return 0;
  392. }
  393. #define OFFSET(x) offsetof(Libdav1dContext, x)
  394. #define VD AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_DECODING_PARAM
  395. static const AVOption libdav1d_options[] = {
  396. { "tilethreads", "Tile threads", OFFSET(tile_threads), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, DAV1D_MAX_TILE_THREADS, VD },
  397. { "framethreads", "Frame threads", OFFSET(frame_threads), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, DAV1D_MAX_FRAME_THREADS, VD },
  398. { "filmgrain", "Apply Film Grain", OFFSET(apply_grain), AV_OPT_TYPE_BOOL, { .i64 = -1 }, -1, 1, VD | AV_OPT_FLAG_DEPRECATED },
  399. { "oppoint", "Select an operating point of the scalable bitstream", OFFSET(operating_point), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 31, VD },
  400. { "alllayers", "Output all spatial layers", OFFSET(all_layers), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, VD },
  401. { NULL }
  402. };
  403. static const AVClass libdav1d_class = {
  404. .class_name = "libdav1d decoder",
  405. .item_name = av_default_item_name,
  406. .option = libdav1d_options,
  407. .version = LIBAVUTIL_VERSION_INT,
  408. };
  409. AVCodec ff_libdav1d_decoder = {
  410. .name = "libdav1d",
  411. .long_name = NULL_IF_CONFIG_SMALL("dav1d AV1 decoder by VideoLAN"),
  412. .type = AVMEDIA_TYPE_VIDEO,
  413. .id = AV_CODEC_ID_AV1,
  414. .priv_data_size = sizeof(Libdav1dContext),
  415. .init = libdav1d_init,
  416. .close = libdav1d_close,
  417. .flush = libdav1d_flush,
  418. .receive_frame = libdav1d_receive_frame,
  419. .capabilities = AV_CODEC_CAP_DELAY | AV_CODEC_CAP_AUTO_THREADS,
  420. .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE | FF_CODEC_CAP_SETS_PKT_DTS,
  421. .priv_class = &libdav1d_class,
  422. .wrapper_name = "libdav1d",
  423. };