You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

357 lines
11KB

  1. /*
  2. * Copyright (c) 2018 Ronald S. Bultje <rsbultje gmail com>
  3. * Copyright (c) 2018 James Almer <jamrial gmail com>
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include <dav1d/dav1d.h>
  22. #include "libavutil/avassert.h"
  23. #include "libavutil/mastering_display_metadata.h"
  24. #include "libavutil/imgutils.h"
  25. #include "libavutil/opt.h"
  26. #include "avcodec.h"
  27. #include "decode.h"
  28. #include "internal.h"
  29. typedef struct Libdav1dContext {
  30. AVClass *class;
  31. Dav1dContext *c;
  32. AVBufferPool *pool;
  33. int pool_size;
  34. Dav1dData data;
  35. int tile_threads;
  36. int apply_grain;
  37. } Libdav1dContext;
  38. static const enum AVPixelFormat pix_fmt[][3] = {
  39. [DAV1D_PIXEL_LAYOUT_I400] = { AV_PIX_FMT_GRAY8, AV_PIX_FMT_GRAY10, AV_PIX_FMT_GRAY12 },
  40. [DAV1D_PIXEL_LAYOUT_I420] = { AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUV420P10, AV_PIX_FMT_YUV420P12 },
  41. [DAV1D_PIXEL_LAYOUT_I422] = { AV_PIX_FMT_YUV422P, AV_PIX_FMT_YUV422P10, AV_PIX_FMT_YUV422P12 },
  42. [DAV1D_PIXEL_LAYOUT_I444] = { AV_PIX_FMT_YUV444P, AV_PIX_FMT_YUV444P10, AV_PIX_FMT_YUV444P12 },
  43. };
  44. static void libdav1d_log_callback(void *opaque, const char *fmt, va_list vl)
  45. {
  46. AVCodecContext *c = opaque;
  47. av_vlog(c, AV_LOG_ERROR, fmt, vl);
  48. }
  49. static int libdav1d_picture_allocator(Dav1dPicture *p, void *cookie)
  50. {
  51. Libdav1dContext *dav1d = cookie;
  52. enum AVPixelFormat format = pix_fmt[p->p.layout][p->seq_hdr->hbd];
  53. int ret, linesize[4], h = FFALIGN(p->p.h, 128);
  54. uint8_t *aligned_ptr, *data[4];
  55. AVBufferRef *buf;
  56. ret = av_image_fill_arrays(data, linesize, NULL, format, FFALIGN(p->p.w, 128),
  57. h, DAV1D_PICTURE_ALIGNMENT);
  58. if (ret < 0)
  59. return ret;
  60. if (ret != dav1d->pool_size) {
  61. av_buffer_pool_uninit(&dav1d->pool);
  62. // Use twice the amount of required padding bytes for aligned_ptr below.
  63. dav1d->pool = av_buffer_pool_init(ret + DAV1D_PICTURE_ALIGNMENT * 2, NULL);
  64. if (!dav1d->pool)
  65. return AVERROR(ENOMEM);
  66. dav1d->pool_size = ret;
  67. }
  68. buf = av_buffer_pool_get(dav1d->pool);
  69. if (!buf)
  70. return AVERROR(ENOMEM);
  71. // libdav1d requires DAV1D_PICTURE_ALIGNMENT aligned buffers, which av_malloc()
  72. // doesn't guarantee for example when AVX is disabled at configure time.
  73. // Use the extra DAV1D_PICTURE_ALIGNMENT padding bytes in the buffer to align it
  74. // if required.
  75. aligned_ptr = (uint8_t *)FFALIGN((uintptr_t)buf->data, DAV1D_PICTURE_ALIGNMENT);
  76. ret = av_image_fill_pointers(data, format, h, aligned_ptr, linesize);
  77. if (ret < 0) {
  78. av_buffer_unref(&buf);
  79. return ret;
  80. }
  81. p->data[0] = data[0];
  82. p->data[1] = data[1];
  83. p->data[2] = data[2];
  84. p->stride[0] = linesize[0];
  85. p->stride[1] = linesize[1];
  86. p->allocator_data = buf;
  87. return 0;
  88. }
  89. static void libdav1d_picture_release(Dav1dPicture *p, void *cookie)
  90. {
  91. AVBufferRef *buf = p->allocator_data;
  92. av_buffer_unref(&buf);
  93. }
  94. static av_cold int libdav1d_init(AVCodecContext *c)
  95. {
  96. Libdav1dContext *dav1d = c->priv_data;
  97. Dav1dSettings s;
  98. int res;
  99. av_log(c, AV_LOG_INFO, "libdav1d %s\n", dav1d_version());
  100. dav1d_default_settings(&s);
  101. s.logger.cookie = c;
  102. s.logger.callback = libdav1d_log_callback;
  103. s.allocator.cookie = dav1d;
  104. s.allocator.alloc_picture_callback = libdav1d_picture_allocator;
  105. s.allocator.release_picture_callback = libdav1d_picture_release;
  106. s.n_tile_threads = dav1d->tile_threads;
  107. s.apply_grain = dav1d->apply_grain;
  108. s.n_frame_threads = FFMIN(c->thread_count ? c->thread_count : av_cpu_count(), DAV1D_MAX_FRAME_THREADS);
  109. res = dav1d_open(&dav1d->c, &s);
  110. if (res < 0)
  111. return AVERROR(ENOMEM);
  112. return 0;
  113. }
  114. static void libdav1d_flush(AVCodecContext *c)
  115. {
  116. Libdav1dContext *dav1d = c->priv_data;
  117. dav1d_data_unref(&dav1d->data);
  118. dav1d_flush(dav1d->c);
  119. }
  120. static void libdav1d_data_free(const uint8_t *data, void *opaque) {
  121. AVBufferRef *buf = opaque;
  122. av_buffer_unref(&buf);
  123. }
  124. static void libdav1d_frame_free(void *opaque, uint8_t *data) {
  125. Dav1dPicture *p = opaque;
  126. dav1d_picture_unref(p);
  127. av_free(p);
  128. }
  129. static int libdav1d_receive_frame(AVCodecContext *c, AVFrame *frame)
  130. {
  131. Libdav1dContext *dav1d = c->priv_data;
  132. Dav1dData *data = &dav1d->data;
  133. Dav1dPicture *p;
  134. int res;
  135. if (!data->sz) {
  136. AVPacket pkt = { 0 };
  137. res = ff_decode_get_packet(c, &pkt);
  138. if (res < 0 && res != AVERROR_EOF)
  139. return res;
  140. if (pkt.size) {
  141. res = dav1d_data_wrap(data, pkt.data, pkt.size, libdav1d_data_free, pkt.buf);
  142. if (res < 0) {
  143. av_packet_unref(&pkt);
  144. return res;
  145. }
  146. data->m.timestamp = pkt.pts;
  147. data->m.offset = pkt.pos;
  148. data->m.duration = pkt.duration;
  149. pkt.buf = NULL;
  150. av_packet_unref(&pkt);
  151. }
  152. }
  153. res = dav1d_send_data(dav1d->c, data);
  154. if (res < 0) {
  155. if (res == AVERROR(EINVAL))
  156. res = AVERROR_INVALIDDATA;
  157. if (res != AVERROR(EAGAIN))
  158. return res;
  159. }
  160. p = av_mallocz(sizeof(*p));
  161. if (!p)
  162. return AVERROR(ENOMEM);
  163. res = dav1d_get_picture(dav1d->c, p);
  164. if (res < 0) {
  165. if (res == AVERROR(EINVAL))
  166. res = AVERROR_INVALIDDATA;
  167. else if (res == AVERROR(EAGAIN) && c->internal->draining)
  168. res = AVERROR_EOF;
  169. av_free(p);
  170. return res;
  171. }
  172. av_assert0(p->data[0] != NULL);
  173. frame->buf[0] = av_buffer_create(NULL, 0, libdav1d_frame_free,
  174. p, AV_BUFFER_FLAG_READONLY);
  175. if (!frame->buf[0]) {
  176. dav1d_picture_unref(p);
  177. av_free(p);
  178. return AVERROR(ENOMEM);
  179. }
  180. frame->data[0] = p->data[0];
  181. frame->data[1] = p->data[1];
  182. frame->data[2] = p->data[2];
  183. frame->linesize[0] = p->stride[0];
  184. frame->linesize[1] = p->stride[1];
  185. frame->linesize[2] = p->stride[1];
  186. c->profile = p->seq_hdr->profile;
  187. frame->format = c->pix_fmt = pix_fmt[p->p.layout][p->seq_hdr->hbd];
  188. frame->width = p->p.w;
  189. frame->height = p->p.h;
  190. if (c->width != p->p.w || c->height != p->p.h) {
  191. res = ff_set_dimensions(c, p->p.w, p->p.h);
  192. if (res < 0)
  193. goto fail;
  194. }
  195. switch (p->seq_hdr->chr) {
  196. case DAV1D_CHR_VERTICAL:
  197. frame->chroma_location = c->chroma_sample_location = AVCHROMA_LOC_LEFT;
  198. break;
  199. case DAV1D_CHR_COLOCATED:
  200. frame->chroma_location = c->chroma_sample_location = AVCHROMA_LOC_TOPLEFT;
  201. break;
  202. }
  203. frame->colorspace = c->colorspace = (enum AVColorSpace) p->seq_hdr->mtrx;
  204. frame->color_primaries = c->color_primaries = (enum AVColorPrimaries) p->seq_hdr->pri;
  205. frame->color_trc = c->color_trc = (enum AVColorTransferCharacteristic) p->seq_hdr->trc;
  206. frame->color_range = c->color_range = p->seq_hdr->color_range ? AVCOL_RANGE_JPEG : AVCOL_RANGE_MPEG;
  207. // match timestamps and packet size
  208. frame->pts = frame->best_effort_timestamp = p->m.timestamp;
  209. #if FF_API_PKT_PTS
  210. FF_DISABLE_DEPRECATION_WARNINGS
  211. frame->pkt_pts = p->m.timestamp;
  212. FF_ENABLE_DEPRECATION_WARNINGS
  213. #endif
  214. frame->pkt_dts = p->m.timestamp;
  215. frame->pkt_pos = p->m.offset;
  216. frame->pkt_size = p->m.size;
  217. frame->pkt_duration = p->m.duration;
  218. frame->key_frame = p->frame_hdr->frame_type == DAV1D_FRAME_TYPE_KEY;
  219. switch (p->frame_hdr->frame_type) {
  220. case DAV1D_FRAME_TYPE_KEY:
  221. case DAV1D_FRAME_TYPE_INTRA:
  222. frame->pict_type = AV_PICTURE_TYPE_I;
  223. break;
  224. case DAV1D_FRAME_TYPE_INTER:
  225. frame->pict_type = AV_PICTURE_TYPE_P;
  226. break;
  227. case DAV1D_FRAME_TYPE_SWITCH:
  228. frame->pict_type = AV_PICTURE_TYPE_SP;
  229. break;
  230. default:
  231. res = AVERROR_INVALIDDATA;
  232. goto fail;
  233. }
  234. if (p->mastering_display) {
  235. AVMasteringDisplayMetadata *mastering = av_mastering_display_metadata_create_side_data(frame);
  236. if (!mastering) {
  237. res = AVERROR(ENOMEM);
  238. goto fail;
  239. }
  240. for (int i = 0; i < 3; i++) {
  241. mastering->display_primaries[i][0] = av_make_q(p->mastering_display->primaries[i][0], 1 << 16);
  242. mastering->display_primaries[i][1] = av_make_q(p->mastering_display->primaries[i][1], 1 << 16);
  243. }
  244. mastering->white_point[0] = av_make_q(p->mastering_display->white_point[0], 1 << 16);
  245. mastering->white_point[1] = av_make_q(p->mastering_display->white_point[1], 1 << 16);
  246. mastering->max_luminance = av_make_q(p->mastering_display->max_luminance, 1 << 8);
  247. mastering->min_luminance = av_make_q(p->mastering_display->min_luminance, 1 << 14);
  248. mastering->has_primaries = 1;
  249. mastering->has_luminance = 1;
  250. }
  251. if (p->content_light) {
  252. AVContentLightMetadata *light = av_content_light_metadata_create_side_data(frame);
  253. if (!light) {
  254. res = AVERROR(ENOMEM);
  255. goto fail;
  256. }
  257. light->MaxCLL = p->content_light->max_content_light_level;
  258. light->MaxFALL = p->content_light->max_frame_average_light_level;
  259. }
  260. res = 0;
  261. fail:
  262. if (res < 0)
  263. av_frame_unref(frame);
  264. return res;
  265. }
  266. static av_cold int libdav1d_close(AVCodecContext *c)
  267. {
  268. Libdav1dContext *dav1d = c->priv_data;
  269. av_buffer_pool_uninit(&dav1d->pool);
  270. dav1d_data_unref(&dav1d->data);
  271. dav1d_close(&dav1d->c);
  272. return 0;
  273. }
  274. #define OFFSET(x) offsetof(Libdav1dContext, x)
  275. #define VD AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_DECODING_PARAM
  276. static const AVOption libdav1d_options[] = {
  277. { "tilethreads", "Tile threads", OFFSET(tile_threads), AV_OPT_TYPE_INT, { .i64 = 1 }, 1, DAV1D_MAX_TILE_THREADS, VD },
  278. { "filmgrain", "Apply Film Grain", OFFSET(apply_grain), AV_OPT_TYPE_BOOL, { .i64 = 1 }, 0, 1, VD },
  279. { NULL }
  280. };
  281. static const AVClass libdav1d_class = {
  282. .class_name = "libdav1d decoder",
  283. .item_name = av_default_item_name,
  284. .option = libdav1d_options,
  285. .version = LIBAVUTIL_VERSION_INT,
  286. };
  287. AVCodec ff_libdav1d_decoder = {
  288. .name = "libdav1d",
  289. .long_name = NULL_IF_CONFIG_SMALL("dav1d AV1 decoder by VideoLAN"),
  290. .type = AVMEDIA_TYPE_VIDEO,
  291. .id = AV_CODEC_ID_AV1,
  292. .priv_data_size = sizeof(Libdav1dContext),
  293. .init = libdav1d_init,
  294. .close = libdav1d_close,
  295. .flush = libdav1d_flush,
  296. .receive_frame = libdav1d_receive_frame,
  297. .capabilities = AV_CODEC_CAP_DELAY | AV_CODEC_CAP_AUTO_THREADS,
  298. .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE | FF_CODEC_CAP_SETS_PKT_DTS,
  299. .priv_class = &libdav1d_class,
  300. .wrapper_name = "libdav1d",
  301. };