You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

268 lines
8.3KB

  1. /*
  2. * V210 encoder
  3. *
  4. * Copyright (C) 2009 Michael Niedermayer <michaelni@gmx.at>
  5. * Copyright (c) 2009 Baptiste Coudurier <baptiste dot coudurier at gmail dot com>
  6. *
  7. * This file is part of FFmpeg.
  8. *
  9. * FFmpeg is free software; you can redistribute it and/or
  10. * modify it under the terms of the GNU Lesser General Public
  11. * License as published by the Free Software Foundation; either
  12. * version 2.1 of the License, or (at your option) any later version.
  13. *
  14. * FFmpeg is distributed in the hope that it will be useful,
  15. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  16. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  17. * Lesser General Public License for more details.
  18. *
  19. * You should have received a copy of the GNU Lesser General Public
  20. * License along with FFmpeg; if not, write to the Free Software
  21. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  22. */
  23. #include "avcodec.h"
  24. #include "bytestream.h"
  25. #include "internal.h"
  26. #include "v210enc.h"
  /* Clamp a 10-bit sample with av_clip() to the range [4, 1019]. */
  #define CLIP(v) av_clip(v, 4, 1019)
  /* Clamp an 8-bit sample with av_clip() to the range [1, 254]. */
  #define CLIP8(v) av_clip(v, 1, 254)

  /*
   * Pack three 10-bit samples into one 32-bit word and store it at dst.
   *
   * a, b and c are sample pointers; each is dereferenced once and advanced
   * by one element. The samples land in bits 0-9, 10-19 and 20-29.
   *
   * The macro relies on two names from the calling scope:
   *   val - uint32_t scratch variable
   *   dst - uint8_t output cursor, advanced by 4 bytes
   *
   * a may alias b or c (it is consumed in its own statement), but b and c
   * must be different pointers because both are advanced within a single
   * expression.
   */
  #define WRITE_PIXELS(a, b, c)               \
      do {                                    \
          val  =  CLIP(*(a)++);               \
          val |= (CLIP(*(b)++) << 10) |       \
                 (CLIP(*(c)++) << 20);        \
          AV_WL32(dst, val);                  \
          dst += 4;                           \
      } while (0)

  /*
   * 8-bit variant of WRITE_PIXELS: every sample is clamped with CLIP8 and
   * shifted left by two extra bits, so it occupies the top 8 bits of its
   * 10-bit slot (bit offsets 2, 12 and 22).
   *
   * Same requirements as WRITE_PIXELS: val and dst must exist in the calling
   * scope, and b and c must be different pointers.
   */
  #define WRITE_PIXELS8(a, b, c)              \
      do {                                    \
          val  = (CLIP8(*(a)++) << 2);        \
          val |= (CLIP8(*(b)++) << 12) |      \
                 (CLIP8(*(c)++) << 22);       \
          AV_WL32(dst, val);                  \
          dst += 4;                           \
      } while (0)
  /*
   * Pack planar 8-bit samples into v210 words (C reference implementation).
   *
   * y, u, v - source sample pointers for the three planes
   * dst     - output cursor; 32 bytes are written per group of 12 pixels
   * width   - number of luma samples to pack; only complete groups of 12 are
   *           processed, any remainder is left untouched
   */
  static void v210_planar_pack_8_c(const uint8_t *y, const uint8_t *u,
                                   const uint8_t *v, uint8_t *dst,
                                   ptrdiff_t width)
  {
      uint32_t val;          /* scratch word used by WRITE_PIXELS8 */
      ptrdiff_t remaining;

      /*
       * One pass consumes 12 luma and 6 + 6 chroma samples and emits eight
       * 32-bit words. The body is unrolled twice to match the assembly.
       */
      for (remaining = width; remaining >= 12; remaining -= 12) {
          /* first six pixels */
          WRITE_PIXELS8(u, y, v);
          WRITE_PIXELS8(y, u, y);
          WRITE_PIXELS8(v, y, u);
          WRITE_PIXELS8(y, v, y);
          /* second six pixels */
          WRITE_PIXELS8(u, y, v);
          WRITE_PIXELS8(y, u, y);
          WRITE_PIXELS8(v, y, u);
          WRITE_PIXELS8(y, v, y);
      }
  }
  /*
   * Pack planar 10-bit samples into v210 words (C reference implementation).
   *
   * y, u, v - source sample pointers for the three planes
   * dst     - output cursor; 16 bytes are written per group of 6 pixels
   * width   - number of luma samples to pack; only complete groups of 6 are
   *           processed, any remainder is left untouched
   */
  static void v210_planar_pack_10_c(const uint16_t *y, const uint16_t *u,
                                    const uint16_t *v, uint8_t *dst,
                                    ptrdiff_t width)
  {
      uint32_t val;          /* scratch word used by WRITE_PIXELS */
      ptrdiff_t remaining;

      /* One pass consumes 6 luma and 3 + 3 chroma samples -> four words. */
      for (remaining = width; remaining >= 6; remaining -= 6) {
          WRITE_PIXELS(u, y, v);
          WRITE_PIXELS(y, u, y);
          WRITE_PIXELS(v, y, u);
          WRITE_PIXELS(y, v, y);
      }
  }
  76. av_cold void ff_v210enc_init(V210EncContext *s)
  77. {
  78. s->pack_line_8 = v210_planar_pack_8_c;
  79. s->pack_line_10 = v210_planar_pack_10_c;
  80. s->sample_factor_8 = 1;
  81. s->sample_factor_10 = 1;
  82. if (ARCH_X86)
  83. ff_v210enc_init_x86(s);
  84. }
  85. static av_cold int encode_init(AVCodecContext *avctx)
  86. {
  87. V210EncContext *s = avctx->priv_data;
  88. if (avctx->width & 1) {
  89. av_log(avctx, AV_LOG_ERROR, "v210 needs even width\n");
  90. return AVERROR(EINVAL);
  91. }
  92. #if FF_API_CODED_FRAME
  93. FF_DISABLE_DEPRECATION_WARNINGS
  94. avctx->coded_frame->pict_type = AV_PICTURE_TYPE_I;
  95. FF_ENABLE_DEPRECATION_WARNINGS
  96. #endif
  97. ff_v210enc_init(s);
  98. avctx->bits_per_coded_sample = 20;
  99. avctx->bit_rate = ff_guess_coded_bitrate(avctx) * 16 / 15;
  100. return 0;
  101. }
  102. static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
  103. const AVFrame *pic, int *got_packet)
  104. {
  105. V210EncContext *s = avctx->priv_data;
  106. int aligned_width = ((avctx->width + 47) / 48) * 48;
  107. int stride = aligned_width * 8 / 3;
  108. int line_padding = stride - ((avctx->width * 8 + 11) / 12) * 4;
  109. AVFrameSideData *side_data;
  110. int h, w, ret;
  111. uint8_t *dst;
  112. ret = ff_alloc_packet2(avctx, pkt, avctx->height * stride, avctx->height * stride);
  113. if (ret < 0) {
  114. av_log(avctx, AV_LOG_ERROR, "Error getting output packet.\n");
  115. return ret;
  116. }
  117. dst = pkt->data;
  118. if (pic->format == AV_PIX_FMT_YUV422P10) {
  119. const uint16_t *y = (const uint16_t *)pic->data[0];
  120. const uint16_t *u = (const uint16_t *)pic->data[1];
  121. const uint16_t *v = (const uint16_t *)pic->data[2];
  122. const int sample_size = 6 * s->sample_factor_10;
  123. const int sample_w = avctx->width / sample_size;
  124. for (h = 0; h < avctx->height; h++) {
  125. uint32_t val;
  126. w = sample_w * sample_size;
  127. s->pack_line_10(y, u, v, dst, w);
  128. y += w;
  129. u += w >> 1;
  130. v += w >> 1;
  131. dst += sample_w * 16 * s->sample_factor_10;
  132. for (; w < avctx->width - 5; w += 6) {
  133. WRITE_PIXELS(u, y, v);
  134. WRITE_PIXELS(y, u, y);
  135. WRITE_PIXELS(v, y, u);
  136. WRITE_PIXELS(y, v, y);
  137. }
  138. if (w < avctx->width - 1) {
  139. WRITE_PIXELS(u, y, v);
  140. val = CLIP(*y++);
  141. if (w == avctx->width - 2) {
  142. AV_WL32(dst, val);
  143. dst += 4;
  144. }
  145. }
  146. if (w < avctx->width - 3) {
  147. val |= (CLIP(*u++) << 10) | (CLIP(*y++) << 20);
  148. AV_WL32(dst, val);
  149. dst += 4;
  150. val = CLIP(*v++) | (CLIP(*y++) << 10);
  151. AV_WL32(dst, val);
  152. dst += 4;
  153. }
  154. memset(dst, 0, line_padding);
  155. dst += line_padding;
  156. y += pic->linesize[0] / 2 - avctx->width;
  157. u += pic->linesize[1] / 2 - avctx->width / 2;
  158. v += pic->linesize[2] / 2 - avctx->width / 2;
  159. }
  160. } else if(pic->format == AV_PIX_FMT_YUV422P) {
  161. const uint8_t *y = pic->data[0];
  162. const uint8_t *u = pic->data[1];
  163. const uint8_t *v = pic->data[2];
  164. const int sample_size = 12 * s->sample_factor_8;
  165. const int sample_w = avctx->width / sample_size;
  166. for (h = 0; h < avctx->height; h++) {
  167. uint32_t val;
  168. w = sample_w * sample_size;
  169. s->pack_line_8(y, u, v, dst, w);
  170. y += w;
  171. u += w >> 1;
  172. v += w >> 1;
  173. dst += sample_w * 32 * s->sample_factor_8;
  174. for (; w < avctx->width - 5; w += 6) {
  175. WRITE_PIXELS8(u, y, v);
  176. WRITE_PIXELS8(y, u, y);
  177. WRITE_PIXELS8(v, y, u);
  178. WRITE_PIXELS8(y, v, y);
  179. }
  180. if (w < avctx->width - 1) {
  181. WRITE_PIXELS8(u, y, v);
  182. val = CLIP8(*y++) << 2;
  183. if (w == avctx->width - 2) {
  184. AV_WL32(dst, val);
  185. dst += 4;
  186. }
  187. }
  188. if (w < avctx->width - 3) {
  189. val |= (CLIP8(*u++) << 12) | (CLIP8(*y++) << 22);
  190. AV_WL32(dst, val);
  191. dst += 4;
  192. val = (CLIP8(*v++) << 2) | (CLIP8(*y++) << 12);
  193. AV_WL32(dst, val);
  194. dst += 4;
  195. }
  196. memset(dst, 0, line_padding);
  197. dst += line_padding;
  198. y += pic->linesize[0] - avctx->width;
  199. u += pic->linesize[1] - avctx->width / 2;
  200. v += pic->linesize[2] - avctx->width / 2;
  201. }
  202. }
  203. side_data = av_frame_get_side_data(pic, AV_FRAME_DATA_A53_CC);
  204. if (side_data && side_data->size) {
  205. uint8_t *buf = av_packet_new_side_data(pkt, AV_PKT_DATA_A53_CC, side_data->size);
  206. if (!buf)
  207. return AVERROR(ENOMEM);
  208. memcpy(buf, side_data->data, side_data->size);
  209. }
  210. side_data = av_frame_get_side_data(pic, AV_FRAME_DATA_AFD);
  211. if (side_data && side_data->size) {
  212. uint8_t *buf = av_packet_new_side_data(pkt, AV_PKT_DATA_AFD, side_data->size);
  213. if (!buf)
  214. return AVERROR(ENOMEM);
  215. memcpy(buf, side_data->data, side_data->size);
  216. }
  217. pkt->flags |= AV_PKT_FLAG_KEY;
  218. *got_packet = 1;
  219. return 0;
  220. }
  221. AVCodec ff_v210_encoder = {
  222. .name = "v210",
  223. .long_name = NULL_IF_CONFIG_SMALL("Uncompressed 4:2:2 10-bit"),
  224. .type = AVMEDIA_TYPE_VIDEO,
  225. .id = AV_CODEC_ID_V210,
  226. .priv_data_size = sizeof(V210EncContext),
  227. .init = encode_init,
  228. .encode2 = encode_frame,
  229. .pix_fmts = (const enum AVPixelFormat[]){ AV_PIX_FMT_YUV422P10, AV_PIX_FMT_YUV422P, AV_PIX_FMT_NONE },
  230. };