You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

1073 lines
38KB

  1. /*
  2. * huffyuv decoder
  3. *
  4. * Copyright (c) 2002-2003 Michael Niedermayer <michaelni@gmx.at>
  5. *
  6. * see http://www.pcisys.net/~melanson/codecs/huffyuv.txt for a description of
  7. * the algorithm used
  8. *
  9. * This file is part of FFmpeg.
  10. *
  11. * FFmpeg is free software; you can redistribute it and/or
  12. * modify it under the terms of the GNU Lesser General Public
  13. * License as published by the Free Software Foundation; either
  14. * version 2.1 of the License, or (at your option) any later version.
  15. *
  16. * FFmpeg is distributed in the hope that it will be useful,
  17. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  18. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  19. * Lesser General Public License for more details.
  20. *
  21. * You should have received a copy of the GNU Lesser General Public
  22. * License along with FFmpeg; if not, write to the Free Software
  23. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  24. *
  25. * yuva, gray, 4:4:4, 4:1:1, 4:1:0 and >8 bit per sample support sponsored by NOA
  26. */
  27. /**
  28. * @file
  29. * huffyuv decoder
  30. */
  31. #include "avcodec.h"
  32. #include "get_bits.h"
  33. #include "huffyuv.h"
  34. #include "thread.h"
  35. #include "libavutil/pixdesc.h"
  /* Payload size, in bytes, of classic_shift_luma. read_old_huffman_tables()
   * passes this value times 8 to init_get_bits() as the bit count. */
  36. #define classic_shift_luma_table_size 42
  /* Built-in bitstream that read_old_huffman_tables() feeds to
   * read_len_table() to fill the first code-length table, s->len[0].
   * The array is declared FF_INPUT_BUFFER_PADDING_SIZE bytes longer than the
   * payload; elements without an explicit initializer are zero. */
  37. static const unsigned char classic_shift_luma[classic_shift_luma_table_size + FF_INPUT_BUFFER_PADDING_SIZE] = {
  38. 34,36,35,69,135,232,9,16,10,24,11,23,12,16,13,10,14,8,15,8,
  39. 16,8,17,20,16,10,207,206,205,236,11,8,10,21,9,23,8,8,199,70,
  40. 69,68, 0,
  41. 0,0,0,0,0,0,0,0,
  42. };
  /* Payload size, in bytes, of classic_shift_chroma. read_old_huffman_tables()
   * passes this value times 8 to init_get_bits() as the bit count. */
  43. #define classic_shift_chroma_table_size 59
  /* Built-in bitstream that read_old_huffman_tables() feeds to
   * read_len_table() to fill the second code-length table, s->len[1].
   * The array is declared FF_INPUT_BUFFER_PADDING_SIZE bytes longer than the
   * payload; elements without an explicit initializer are zero. */
  44. static const unsigned char classic_shift_chroma[classic_shift_chroma_table_size + FF_INPUT_BUFFER_PADDING_SIZE] = {
  45. 66,36,37,38,39,40,41,75,76,77,110,239,144,81,82,83,84,85,118,183,
  46. 56,57,88,89,56,89,154,57,58,57,26,141,57,56,58,57,58,57,184,119,
  47. 214,245,116,83,82,49,80,79,78,77,44,75,41,40,39,38,37,36,34, 0,
  48. 0,0,0,0,0,0,0,0,
  49. };
  /* Built-in code values for the first table: read_old_huffman_tables()
   * copies the 256 entries element by element into s->bits[0]. The matching
   * code lengths come from classic_shift_luma. */
  50. static const unsigned char classic_add_luma[256] = {
  51. 3, 9, 5, 12, 10, 35, 32, 29, 27, 50, 48, 45, 44, 41, 39, 37,
  52. 73, 70, 68, 65, 64, 61, 58, 56, 53, 50, 49, 46, 44, 41, 38, 36,
  53. 68, 65, 63, 61, 58, 55, 53, 51, 48, 46, 45, 43, 41, 39, 38, 36,
  54. 35, 33, 32, 30, 29, 27, 26, 25, 48, 47, 46, 44, 43, 41, 40, 39,
  55. 37, 36, 35, 34, 32, 31, 30, 28, 27, 26, 24, 23, 22, 20, 19, 37,
  56. 35, 34, 33, 31, 30, 29, 27, 26, 24, 23, 21, 20, 18, 17, 15, 29,
  57. 27, 26, 24, 22, 21, 19, 17, 16, 14, 26, 25, 23, 21, 19, 18, 16,
  58. 15, 27, 25, 23, 21, 19, 17, 16, 14, 26, 25, 23, 21, 18, 17, 14,
  59. 12, 17, 19, 13, 4, 9, 2, 11, 1, 7, 8, 0, 16, 3, 14, 6,
  60. 12, 10, 5, 15, 18, 11, 10, 13, 15, 16, 19, 20, 22, 24, 27, 15,
  61. 18, 20, 22, 24, 26, 14, 17, 20, 22, 24, 27, 15, 18, 20, 23, 25,
  62. 28, 16, 19, 22, 25, 28, 32, 36, 21, 25, 29, 33, 38, 42, 45, 49,
  63. 28, 31, 34, 37, 40, 42, 44, 47, 49, 50, 52, 54, 56, 57, 59, 60,
  64. 62, 64, 66, 67, 69, 35, 37, 39, 40, 42, 43, 45, 47, 48, 51, 52,
  65. 54, 55, 57, 59, 60, 62, 63, 66, 67, 69, 71, 72, 38, 40, 42, 43,
  66. 46, 47, 49, 51, 26, 28, 30, 31, 33, 34, 18, 19, 11, 13, 7, 8,
  67. };
  /* Built-in code values for the second table: read_old_huffman_tables()
   * copies the 256 entries element by element into s->bits[1] (and then
   * overwrites them with the first table when bitstream_bpp >= 24). The
   * matching code lengths come from classic_shift_chroma. */
  68. static const unsigned char classic_add_chroma[256] = {
  69. 3, 1, 2, 2, 2, 2, 3, 3, 7, 5, 7, 5, 8, 6, 11, 9,
  70. 7, 13, 11, 10, 9, 8, 7, 5, 9, 7, 6, 4, 7, 5, 8, 7,
  71. 11, 8, 13, 11, 19, 15, 22, 23, 20, 33, 32, 28, 27, 29, 51, 77,
  72. 43, 45, 76, 81, 46, 82, 75, 55, 56,144, 58, 80, 60, 74,147, 63,
  73. 143, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79,
  74. 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 27, 30, 21, 22,
  75. 17, 14, 5, 6,100, 54, 47, 50, 51, 53,106,107,108,109,110,111,
  76. 112,113,114,115, 4,117,118, 92, 94,121,122, 3,124,103, 2, 1,
  77. 0,129,130,131,120,119,126,125,136,137,138,139,140,141,142,134,
  78. 135,132,133,104, 64,101, 62, 57,102, 95, 93, 59, 61, 28, 97, 96,
  79. 52, 49, 48, 29, 32, 25, 24, 46, 23, 98, 45, 44, 43, 20, 42, 41,
  80. 19, 18, 99, 40, 15, 39, 38, 16, 13, 12, 11, 37, 10, 9, 8, 36,
  81. 7,128,127,105,123,116, 35, 34, 33,145, 31, 79, 42,146, 78, 26,
  82. 83, 48, 49, 50, 44, 47, 26, 31, 30, 18, 17, 19, 21, 24, 25, 13,
  83. 14, 16, 17, 18, 20, 21, 12, 14, 15, 9, 10, 6, 9, 6, 5, 8,
  84. 6, 12, 8, 10, 7, 9, 6, 4, 6, 2, 2, 3, 3, 3, 3, 2,
  85. };
  86. static int read_len_table(uint8_t *dst, GetBitContext *gb, int n)
  87. {
  88. int i, val, repeat;
  89. for (i = 0; i < n;) {
  90. repeat = get_bits(gb, 3);
  91. val = get_bits(gb, 5);
  92. if (repeat == 0)
  93. repeat = get_bits(gb, 8);
  94. if (i + repeat > n || get_bits_left(gb) < 0) {
  95. av_log(NULL, AV_LOG_ERROR, "Error reading huffman table\n");
  96. return -1;
  97. }
  98. while (repeat--)
  99. dst[i++] = val;
  100. }
  101. return 0;
  102. }
  103. static int generate_joint_tables(HYuvContext *s)
  104. {
  105. uint16_t symbols[1 << VLC_BITS];
  106. uint16_t bits[1 << VLC_BITS];
  107. uint8_t len[1 << VLC_BITS];
  108. int ret;
  109. if (s->bitstream_bpp < 24 || s->version > 2) {
  110. int p, i, y, u;
  111. for (p = 0; p < 4; p++) {
  112. int p0 = s->version > 2 ? p : 0;
  113. for (i = y = 0; y < s->n; y++) {
  114. int len0 = s->len[p0][y];
  115. int limit = VLC_BITS - len0;
  116. if(limit <= 0 || !len0)
  117. continue;
  118. for (u = 0; u < s->n; u++) {
  119. int len1 = s->len[p][u];
  120. if (len1 > limit || !len1)
  121. continue;
  122. av_assert0(i < (1 << VLC_BITS));
  123. len[i] = len0 + len1;
  124. bits[i] = (s->bits[p0][y] << len1) + s->bits[p][u];
  125. symbols[i] = (y << 8) + u; //FIXME
  126. if(symbols[i] != 0xffff) // reserved to mean "invalid"
  127. i++;
  128. }
  129. }
  130. ff_free_vlc(&s->vlc[4 + p]);
  131. if ((ret = ff_init_vlc_sparse(&s->vlc[4 + p], VLC_BITS, i, len, 1, 1,
  132. bits, 2, 2, symbols, 2, 2, 0)) < 0)
  133. return ret;
  134. }
  135. } else {
  136. uint8_t (*map)[4] = (uint8_t(*)[4])s->pix_bgr_map;
  137. int i, b, g, r, code;
  138. int p0 = s->decorrelate;
  139. int p1 = !s->decorrelate;
  140. // restrict the range to +/-16 because that's pretty much guaranteed to
  141. // cover all the combinations that fit in 11 bits total, and it doesn't
  142. // matter if we miss a few rare codes.
  143. for (i = 0, g = -16; g < 16; g++) {
  144. int len0 = s->len[p0][g & 255];
  145. int limit0 = VLC_BITS - len0;
  146. if (limit0 < 2 || !len0)
  147. continue;
  148. for (b = -16; b < 16; b++) {
  149. int len1 = s->len[p1][b & 255];
  150. int limit1 = limit0 - len1;
  151. if (limit1 < 1 || !len1)
  152. continue;
  153. code = (s->bits[p0][g & 255] << len1) + s->bits[p1][b & 255];
  154. for (r = -16; r < 16; r++) {
  155. int len2 = s->len[2][r & 255];
  156. if (len2 > limit1 || !len2)
  157. continue;
  158. av_assert0(i < (1 << VLC_BITS));
  159. len[i] = len0 + len1 + len2;
  160. bits[i] = (code << len2) + s->bits[2][r & 255];
  161. if (s->decorrelate) {
  162. map[i][G] = g;
  163. map[i][B] = g + b;
  164. map[i][R] = g + r;
  165. } else {
  166. map[i][B] = g;
  167. map[i][G] = b;
  168. map[i][R] = r;
  169. }
  170. i++;
  171. }
  172. }
  173. }
  174. ff_free_vlc(&s->vlc[4]);
  175. if ((ret = init_vlc(&s->vlc[4], VLC_BITS, i, len, 1, 1, bits, 2, 2, 0)) < 0)
  176. return ret;
  177. }
  178. return 0;
  179. }
  180. static int read_huffman_tables(HYuvContext *s, const uint8_t *src, int length)
  181. {
  182. GetBitContext gb;
  183. int i;
  184. int ret;
  185. int count = 3;
  186. init_get_bits(&gb, src, length * 8);
  187. if (s->version > 2)
  188. count = 1 + s->alpha + 2*s->chroma;
  189. for (i = 0; i < count; i++) {
  190. if (read_len_table(s->len[i], &gb, s->n) < 0)
  191. return -1;
  192. if (ff_huffyuv_generate_bits_table(s->bits[i], s->len[i], s->n) < 0) {
  193. return -1;
  194. }
  195. ff_free_vlc(&s->vlc[i]);
  196. if ((ret = init_vlc(&s->vlc[i], VLC_BITS, s->n, s->len[i], 1, 1,
  197. s->bits[i], 4, 4, 0)) < 0)
  198. return ret;
  199. }
  200. if ((ret = generate_joint_tables(s)) < 0)
  201. return ret;
  202. return (get_bits_count(&gb) + 7) / 8;
  203. }
  204. static int read_old_huffman_tables(HYuvContext *s)
  205. {
  206. GetBitContext gb;
  207. int i;
  208. int ret;
  209. init_get_bits(&gb, classic_shift_luma,
  210. classic_shift_luma_table_size * 8);
  211. if (read_len_table(s->len[0], &gb, 256) < 0)
  212. return -1;
  213. init_get_bits(&gb, classic_shift_chroma,
  214. classic_shift_chroma_table_size * 8);
  215. if (read_len_table(s->len[1], &gb, 256) < 0)
  216. return -1;
  217. for(i=0; i<256; i++) s->bits[0][i] = classic_add_luma [i];
  218. for(i=0; i<256; i++) s->bits[1][i] = classic_add_chroma[i];
  219. if (s->bitstream_bpp >= 24) {
  220. memcpy(s->bits[1], s->bits[0], 256 * sizeof(uint32_t));
  221. memcpy(s->len[1] , s->len [0], 256 * sizeof(uint8_t));
  222. }
  223. memcpy(s->bits[2], s->bits[1], 256 * sizeof(uint32_t));
  224. memcpy(s->len[2] , s->len [1], 256 * sizeof(uint8_t));
  225. for (i = 0; i < 4; i++) {
  226. ff_free_vlc(&s->vlc[i]);
  227. if ((ret = init_vlc(&s->vlc[i], VLC_BITS, 256, s->len[i], 1, 1,
  228. s->bits[i], 4, 4, 0)) < 0)
  229. return ret;
  230. }
  231. if ((ret = generate_joint_tables(s)) < 0)
  232. return ret;
  233. return 0;
  234. }
  235. static av_cold int decode_init(AVCodecContext *avctx)
  236. {
  237. HYuvContext *s = avctx->priv_data;
  238. ff_huffyuv_common_init(avctx);
  239. memset(s->vlc, 0, 4 * sizeof(VLC));
  240. s->interlaced = s->height > 288;
  241. s->bgr32 = 1;
  242. if (avctx->extradata_size) {
  243. if ((avctx->bits_per_coded_sample & 7) &&
  244. avctx->bits_per_coded_sample != 12)
  245. s->version = 1; // do such files exist at all?
  246. else if (avctx->extradata_size > 3 && avctx->extradata[3] == 0)
  247. s->version = 2;
  248. else
  249. s->version = 3;
  250. } else
  251. s->version = 0;
  252. s->bps = 8;
  253. s->n = 1<<s->bps;
  254. s->chroma = 1;
  255. if (s->version >= 2) {
  256. int method, interlace;
  257. if (avctx->extradata_size < 4)
  258. return -1;
  259. method = ((uint8_t*)avctx->extradata)[0];
  260. s->decorrelate = method & 64 ? 1 : 0;
  261. s->predictor = method & 63;
  262. if (s->version == 2) {
  263. s->bitstream_bpp = ((uint8_t*)avctx->extradata)[1];
  264. if (s->bitstream_bpp == 0)
  265. s->bitstream_bpp = avctx->bits_per_coded_sample & ~7;
  266. } else {
  267. s->bps = (avctx->extradata[1] >> 4) + 1;
  268. s->n = 1<<s->bps;
  269. s->chroma_h_shift = avctx->extradata[1] & 3;
  270. s->chroma_v_shift = (avctx->extradata[1] >> 2) & 3;
  271. s->yuv = !!(((uint8_t*)avctx->extradata)[2] & 1);
  272. s->chroma= !!(((uint8_t*)avctx->extradata)[2] & 3);
  273. s->alpha = !!(((uint8_t*)avctx->extradata)[2] & 4);
  274. }
  275. interlace = (((uint8_t*)avctx->extradata)[2] & 0x30) >> 4;
  276. s->interlaced = (interlace == 1) ? 1 : (interlace == 2) ? 0 : s->interlaced;
  277. s->context = ((uint8_t*)avctx->extradata)[2] & 0x40 ? 1 : 0;
  278. if ( read_huffman_tables(s, ((uint8_t*)avctx->extradata) + 4,
  279. avctx->extradata_size - 4) < 0)
  280. return AVERROR_INVALIDDATA;
  281. }else{
  282. switch (avctx->bits_per_coded_sample & 7) {
  283. case 1:
  284. s->predictor = LEFT;
  285. s->decorrelate = 0;
  286. break;
  287. case 2:
  288. s->predictor = LEFT;
  289. s->decorrelate = 1;
  290. break;
  291. case 3:
  292. s->predictor = PLANE;
  293. s->decorrelate = avctx->bits_per_coded_sample >= 24;
  294. break;
  295. case 4:
  296. s->predictor = MEDIAN;
  297. s->decorrelate = 0;
  298. break;
  299. default:
  300. s->predictor = LEFT; //OLD
  301. s->decorrelate = 0;
  302. break;
  303. }
  304. s->bitstream_bpp = avctx->bits_per_coded_sample & ~7;
  305. s->context = 0;
  306. if (read_old_huffman_tables(s) < 0)
  307. return AVERROR_INVALIDDATA;
  308. }
  309. if (s->version <= 2) {
  310. switch (s->bitstream_bpp) {
  311. case 12:
  312. avctx->pix_fmt = AV_PIX_FMT_YUV420P;
  313. s->yuv = 1;
  314. break;
  315. case 16:
  316. if (s->yuy2) {
  317. avctx->pix_fmt = AV_PIX_FMT_YUYV422;
  318. } else {
  319. avctx->pix_fmt = AV_PIX_FMT_YUV422P;
  320. }
  321. s->yuv = 1;
  322. break;
  323. case 24:
  324. case 32:
  325. if (s->bgr32) {
  326. avctx->pix_fmt = AV_PIX_FMT_RGB32;
  327. s->alpha = 1;
  328. } else {
  329. avctx->pix_fmt = AV_PIX_FMT_BGR24;
  330. }
  331. break;
  332. default:
  333. return AVERROR_INVALIDDATA;
  334. }
  335. av_pix_fmt_get_chroma_sub_sample(avctx->pix_fmt,
  336. &s->chroma_h_shift,
  337. &s->chroma_v_shift);
  338. } else {
  339. switch ( (s->chroma<<10) | (s->yuv<<9) | (s->alpha<<8) | ((s->bps-1)<<4) | s->chroma_h_shift | (s->chroma_v_shift<<2)) {
  340. case 0x070:
  341. avctx->pix_fmt = AV_PIX_FMT_GRAY8;
  342. break;
  343. case 0x170:
  344. avctx->pix_fmt = AV_PIX_FMT_GRAY8A;
  345. break;
  346. case 0x470:
  347. avctx->pix_fmt = AV_PIX_FMT_GBRP;
  348. break;
  349. case 0x570:
  350. avctx->pix_fmt = AV_PIX_FMT_GBRAP;
  351. break;
  352. case 0x670:
  353. avctx->pix_fmt = AV_PIX_FMT_YUV444P;
  354. break;
  355. case 0x680:
  356. avctx->pix_fmt = AV_PIX_FMT_YUV444P9;
  357. break;
  358. case 0x690:
  359. avctx->pix_fmt = AV_PIX_FMT_YUV444P10;
  360. break;
  361. case 0x6B0:
  362. avctx->pix_fmt = AV_PIX_FMT_YUV444P12;
  363. break;
  364. case 0x6D0:
  365. avctx->pix_fmt = AV_PIX_FMT_YUV444P14;
  366. break;
  367. case 0x671:
  368. avctx->pix_fmt = AV_PIX_FMT_YUV422P;
  369. break;
  370. case 0x681:
  371. avctx->pix_fmt = AV_PIX_FMT_YUV422P9;
  372. break;
  373. case 0x691:
  374. avctx->pix_fmt = AV_PIX_FMT_YUV422P10;
  375. break;
  376. case 0x6B1:
  377. avctx->pix_fmt = AV_PIX_FMT_YUV422P12;
  378. break;
  379. case 0x6D1:
  380. avctx->pix_fmt = AV_PIX_FMT_YUV422P14;
  381. break;
  382. case 0x672:
  383. avctx->pix_fmt = AV_PIX_FMT_YUV411P;
  384. break;
  385. case 0x674:
  386. avctx->pix_fmt = AV_PIX_FMT_YUV440P;
  387. break;
  388. case 0x675:
  389. avctx->pix_fmt = AV_PIX_FMT_YUV420P;
  390. break;
  391. case 0x685:
  392. avctx->pix_fmt = AV_PIX_FMT_YUV420P9;
  393. break;
  394. case 0x695:
  395. avctx->pix_fmt = AV_PIX_FMT_YUV420P10;
  396. break;
  397. case 0x6B5:
  398. avctx->pix_fmt = AV_PIX_FMT_YUV420P12;
  399. break;
  400. case 0x6D5:
  401. avctx->pix_fmt = AV_PIX_FMT_YUV420P14;
  402. break;
  403. case 0x67A:
  404. avctx->pix_fmt = AV_PIX_FMT_YUV410P;
  405. break;
  406. case 0x770:
  407. avctx->pix_fmt = AV_PIX_FMT_YUVA444P;
  408. break;
  409. case 0x771:
  410. avctx->pix_fmt = AV_PIX_FMT_YUVA422P;
  411. break;
  412. case 0x775:
  413. avctx->pix_fmt = AV_PIX_FMT_YUVA420P;
  414. break;
  415. case 0x795:
  416. avctx->pix_fmt = AV_PIX_FMT_YUVA420P10;
  417. break;
  418. default:
  419. return AVERROR_INVALIDDATA;
  420. }
  421. }
  422. if ((avctx->pix_fmt == AV_PIX_FMT_YUV422P || avctx->pix_fmt == AV_PIX_FMT_YUV420P) && avctx->width & 1) {
  423. av_log(avctx, AV_LOG_ERROR, "width must be even for this colorspace\n");
  424. return AVERROR_INVALIDDATA;
  425. }
  426. if (s->predictor == MEDIAN && avctx->pix_fmt == AV_PIX_FMT_YUV422P && avctx->width%4) {
  427. av_log(avctx, AV_LOG_ERROR, "width must be a multiple of 4 this colorspace and predictor\n");
  428. return AVERROR_INVALIDDATA;
  429. }
  430. if (ff_huffyuv_alloc_temp(s)) {
  431. ff_huffyuv_common_end(s);
  432. return AVERROR(ENOMEM);
  433. }
  434. return 0;
  435. }
  436. static av_cold int decode_init_thread_copy(AVCodecContext *avctx)
  437. {
  438. HYuvContext *s = avctx->priv_data;
  439. int i;
  440. if (ff_huffyuv_alloc_temp(s)) {
  441. ff_huffyuv_common_end(s);
  442. return AVERROR(ENOMEM);
  443. }
  444. for (i = 0; i < 8; i++)
  445. s->vlc[i].table = NULL;
  446. if (s->version >= 2) {
  447. if (read_huffman_tables(s, ((uint8_t*)avctx->extradata) + 4,
  448. avctx->extradata_size) < 0)
  449. return AVERROR_INVALIDDATA;
  450. } else {
  451. if (read_old_huffman_tables(s) < 0)
  452. return AVERROR_INVALIDDATA;
  453. }
  454. return 0;
  455. }
  456. /* TODO instead of restarting the read when the code isn't in the first level
  457. * of the joint table, jump into the 2nd level of the individual table. */
  /* READ_2PIX(dst0, dst1, plane1): decode two symbols from s->gb.
   * A single-level lookup in the joint table s->vlc[4 + plane1] is tried
   * first; unless it yields 0xffff (the value generate_joint_tables() reserves
   * as "invalid"), its high byte goes to dst0 and its low byte to dst1.
   * Otherwise dst0 is decoded from s->vlc[0] and dst1 from s->vlc[plane1].
   * Requires a variable named `s` in scope; expands to a brace block. */
  458. #define READ_2PIX(dst0, dst1, plane1){\
  459. uint16_t code = get_vlc2(&s->gb, s->vlc[4+plane1].table, VLC_BITS, 1);\
  460. if(code != 0xffff){\
  461. dst0 = code>>8;\
  462. dst1 = code;\
  463. }else{\
  464. dst0 = get_vlc2(&s->gb, s->vlc[0].table, VLC_BITS, 3);\
  465. dst1 = get_vlc2(&s->gb, s->vlc[plane1].table, VLC_BITS, 3);\
  466. }\
  467. }
  468. static void decode_422_bitstream(HYuvContext *s, int count)
  469. {
  470. int i;
  471. count /= 2;
  472. if (count >= (get_bits_left(&s->gb)) / (31 * 4)) {
  473. for (i = 0; i < count && get_bits_left(&s->gb) > 0; i++) {
  474. READ_2PIX(s->temp[0][2 * i ], s->temp[1][i], 1);
  475. READ_2PIX(s->temp[0][2 * i + 1], s->temp[2][i], 2);
  476. }
  477. for (; i < count; i++)
  478. s->temp[0][2 * i ] = s->temp[1][i] =
  479. s->temp[0][2 * i + 1] = s->temp[2][i] = 128;
  480. } else {
  481. for (i = 0; i < count; i++) {
  482. READ_2PIX(s->temp[0][2 * i ], s->temp[1][i], 1);
  483. READ_2PIX(s->temp[0][2 * i + 1], s->temp[2][i], 2);
  484. }
  485. }
  486. }
  /* READ_2PIX_PLANE(dst0, dst1, plane): decode two consecutive symbols of the
   * same plane from s->gb. A single-level lookup in the joint table
   * s->vlc[4 + plane] is tried first; unless it yields 0xffff, its high byte
   * goes to dst0 and its low byte to dst1. Otherwise both symbols are decoded
   * one after the other from s->vlc[plane].
   * Requires a variable named `s` in scope; expands to a brace block. */
  487. #define READ_2PIX_PLANE(dst0, dst1, plane){\
  488. uint16_t code = get_vlc2(&s->gb, s->vlc[4+plane].table, VLC_BITS, 1);\
  489. if(code != 0xffff){\
  490. dst0 = code>>8;\
  491. dst1 = code;\
  492. }else{\
  493. dst0 = get_vlc2(&s->gb, s->vlc[plane].table, VLC_BITS, 3);\
  494. dst1 = get_vlc2(&s->gb, s->vlc[plane].table, VLC_BITS, 3);\
  495. }\
  496. }
  /* READ_2PIX_PLANE16(dst0, dst1, plane): decode two consecutive symbols from
   * s->vlc[plane] without consulting a joint table. decode_plane_bitstream()
   * uses it when s->bps > 8. Requires a variable named `s` in scope. */
  497. #define READ_2PIX_PLANE16(dst0, dst1, plane){\
  498. dst0 = get_vlc2(&s->gb, s->vlc[plane].table, VLC_BITS, 3);\
  499. dst1 = get_vlc2(&s->gb, s->vlc[plane].table, VLC_BITS, 3);\
  500. }
  501. static void decode_plane_bitstream(HYuvContext *s, int count, int plane)
  502. {
  503. int i;
  504. count/=2;
  505. if (s->bps <= 8) {
  506. if (count >= (get_bits_left(&s->gb)) / (31 * 2)) {
  507. for (i = 0; i < count && get_bits_left(&s->gb) > 0; i++) {
  508. READ_2PIX_PLANE(s->temp[0][2 * i], s->temp[0][2 * i + 1], plane);
  509. }
  510. } else {
  511. for(i=0; i<count; i++){
  512. READ_2PIX_PLANE(s->temp[0][2 * i], s->temp[0][2 * i + 1], plane);
  513. }
  514. }
  515. } else {
  516. if (count >= (get_bits_left(&s->gb)) / (31 * 2)) {
  517. for (i = 0; i < count && get_bits_left(&s->gb) > 0; i++) {
  518. READ_2PIX_PLANE16(s->temp16[0][2 * i], s->temp16[0][2 * i + 1], plane);
  519. }
  520. } else {
  521. for(i=0; i<count; i++){
  522. READ_2PIX_PLANE16(s->temp16[0][2 * i], s->temp16[0][2 * i + 1], plane);
  523. }
  524. }
  525. }
  526. }
  527. static void decode_gray_bitstream(HYuvContext *s, int count)
  528. {
  529. int i;
  530. count/=2;
  531. if (count >= (get_bits_left(&s->gb)) / (31 * 2)) {
  532. for (i = 0; i < count && get_bits_left(&s->gb) > 0; i++) {
  533. READ_2PIX(s->temp[0][2 * i], s->temp[0][2 * i + 1], 0);
  534. }
  535. } else {
  536. for(i=0; i<count; i++){
  537. READ_2PIX(s->temp[0][2 * i], s->temp[0][2 * i + 1], 0);
  538. }
  539. }
  540. }
  541. static av_always_inline void decode_bgr_1(HYuvContext *s, int count,
  542. int decorrelate, int alpha)
  543. {
  544. int i;
  545. for (i = 0; i < count; i++) {
  546. int code = get_vlc2(&s->gb, s->vlc[4].table, VLC_BITS, 1);
  547. if (code != -1) {
  548. *(uint32_t*)&s->temp[0][4 * i] = s->pix_bgr_map[code];
  549. } else if(decorrelate) {
  550. s->temp[0][4 * i + G] = get_vlc2(&s->gb, s->vlc[1].table, VLC_BITS, 3);
  551. s->temp[0][4 * i + B] = get_vlc2(&s->gb, s->vlc[0].table, VLC_BITS, 3) +
  552. s->temp[0][4 * i + G];
  553. s->temp[0][4 * i + R] = get_vlc2(&s->gb, s->vlc[2].table, VLC_BITS, 3) +
  554. s->temp[0][4 * i + G];
  555. } else {
  556. s->temp[0][4 * i + B] = get_vlc2(&s->gb, s->vlc[0].table, VLC_BITS, 3);
  557. s->temp[0][4 * i + G] = get_vlc2(&s->gb, s->vlc[1].table, VLC_BITS, 3);
  558. s->temp[0][4 * i + R] = get_vlc2(&s->gb, s->vlc[2].table, VLC_BITS, 3);
  559. }
  560. if (alpha)
  561. s->temp[0][4 * i + A] = get_vlc2(&s->gb, s->vlc[2].table, VLC_BITS, 3);
  562. }
  563. }
  564. static void decode_bgr_bitstream(HYuvContext *s, int count)
  565. {
  566. if (s->decorrelate) {
  567. if (s->bitstream_bpp==24)
  568. decode_bgr_1(s, count, 1, 0);
  569. else
  570. decode_bgr_1(s, count, 1, 1);
  571. } else {
  572. if (s->bitstream_bpp==24)
  573. decode_bgr_1(s, count, 0, 0);
  574. else
  575. decode_bgr_1(s, count, 0, 1);
  576. }
  577. }
  578. static void draw_slice(HYuvContext *s, AVFrame *frame, int y)
  579. {
  580. int h, cy, i;
  581. int offset[AV_NUM_DATA_POINTERS];
  582. if (s->avctx->draw_horiz_band==NULL)
  583. return;
  584. h = y - s->last_slice_end;
  585. y -= h;
  586. if (s->bitstream_bpp == 12) {
  587. cy = y>>1;
  588. } else {
  589. cy = y;
  590. }
  591. offset[0] = frame->linesize[0] * y;
  592. offset[1] = frame->linesize[1] * cy;
  593. offset[2] = frame->linesize[2] * cy;
  594. for (i = 3; i < AV_NUM_DATA_POINTERS; i++)
  595. offset[i] = 0;
  596. emms_c();
  597. s->avctx->draw_horiz_band(s->avctx, frame, offset, y, 3, h);
  598. s->last_slice_end = y + h;
  599. }
  600. static int left_prediction(HYuvContext *s, uint8_t *dst, const uint8_t *src, int w, int acc)
  601. {
  602. if (s->bps <= 8) {
  603. return s->dsp.add_hfyu_left_prediction(dst, src, w, acc);
  604. } else {
  605. //FIXME optimize
  606. unsigned mask = s->n-1;
  607. int i;
  608. const uint16_t *src16 = (const uint16_t *)src;
  609. uint16_t *dst16 = ( uint16_t *)dst;
  610. for(i=0; i<w-1; i++){
  611. acc+= src16[i];
  612. dst16[i]= acc & mask;
  613. i++;
  614. acc+= src16[i];
  615. dst16[i]= acc & mask;
  616. }
  617. for(; i<w; i++){
  618. acc+= src16[i];
  619. dst16[i]= acc & mask;
  620. }
  621. return acc;
  622. }
  623. }
  624. static void add_bytes(HYuvContext *s, uint8_t *dst, uint8_t *src, int w)
  625. {
  626. if (s->bps <= 8) {
  627. s->dsp.add_bytes(dst, src, w);
  628. } else {
  629. //FIXME optimize
  630. const uint16_t *src16 = (const uint16_t *)src;
  631. uint16_t *dst16 = ( uint16_t *)dst;
  632. long i;
  633. unsigned long msb = 0x1000100010001ULL << (s->bps-1);
  634. unsigned long lsb = msb - 0x1000100010001ULL;
  635. unsigned long mask = lsb + msb;
  636. for (i = 0; i <= w - (int)sizeof(long)/2; i += sizeof(long)/2) {
  637. long a = *(long*)(src16+i);
  638. long b = *(long*)(dst16+i);
  639. *(long*)(dst16+i) = ((a&lsb) + (b&lsb)) ^ ((a^b)&msb);
  640. }
  641. for(; i<w; i++)
  642. dst16[i] = (dst16[i] + src16[i]) & mask;
  643. }
  644. }
  645. static int decode_frame(AVCodecContext *avctx, void *data, int *got_frame,
  646. AVPacket *avpkt)
  647. {
  648. const uint8_t *buf = avpkt->data;
  649. int buf_size = avpkt->size;
  650. HYuvContext *s = avctx->priv_data;
  651. const int width = s->width;
  652. const int width2 = s->width>>1;
  653. const int height = s->height;
  654. int fake_ystride, fake_ustride, fake_vstride;
  655. ThreadFrame frame = { .f = data };
  656. AVFrame * const p = data;
  657. int table_size = 0, ret;
  658. av_fast_padded_malloc(&s->bitstream_buffer,
  659. &s->bitstream_buffer_size,
  660. buf_size);
  661. if (!s->bitstream_buffer)
  662. return AVERROR(ENOMEM);
  663. s->dsp.bswap_buf((uint32_t*)s->bitstream_buffer,
  664. (const uint32_t*)buf, buf_size / 4);
  665. if ((ret = ff_thread_get_buffer(avctx, &frame, 0)) < 0)
  666. return ret;
  667. if (s->context) {
  668. table_size = read_huffman_tables(s, s->bitstream_buffer, buf_size);
  669. if (table_size < 0)
  670. return AVERROR_INVALIDDATA;
  671. }
  672. if ((unsigned)(buf_size-table_size) >= INT_MAX / 8)
  673. return AVERROR_INVALIDDATA;
  674. init_get_bits(&s->gb, s->bitstream_buffer+table_size,
  675. (buf_size-table_size) * 8);
  676. fake_ystride = s->interlaced ? p->linesize[0] * 2 : p->linesize[0];
  677. fake_ustride = s->interlaced ? p->linesize[1] * 2 : p->linesize[1];
  678. fake_vstride = s->interlaced ? p->linesize[2] * 2 : p->linesize[2];
  679. s->last_slice_end = 0;
  680. if (s->version > 2) {
  681. int plane;
  682. for(plane = 0; plane < 1 + 2*s->chroma + s->alpha; plane++) {
  683. int left, lefttop, y;
  684. int w = width;
  685. int h = height;
  686. int fake_stride = fake_ystride;
  687. if (s->chroma && (plane == 1 || plane == 2)) {
  688. w >>= s->chroma_h_shift;
  689. h >>= s->chroma_v_shift;
  690. fake_stride = plane == 1 ? fake_ustride : fake_vstride;
  691. }
  692. switch (s->predictor) {
  693. case LEFT:
  694. case PLANE:
  695. decode_plane_bitstream(s, w, plane);
  696. left = left_prediction(s, p->data[plane], s->temp[0], w, 0);
  697. for (y = 1; y < h; y++) {
  698. uint8_t *dst = p->data[plane] + p->linesize[plane]*y;
  699. decode_plane_bitstream(s, w, plane);
  700. left = left_prediction(s, dst, s->temp[0], w, left);
  701. if (s->predictor == PLANE) {
  702. if (y > s->interlaced) {
  703. add_bytes(s, dst, dst - fake_stride, w);
  704. }
  705. }
  706. }
  707. break;
  708. case MEDIAN:
  709. decode_plane_bitstream(s, w, plane);
  710. left= left_prediction(s, p->data[plane], s->temp[0], w, 0);
  711. y = 1;
  712. /* second line is left predicted for interlaced case */
  713. if (s->interlaced) {
  714. decode_plane_bitstream(s, w, plane);
  715. left = left_prediction(s, p->data[plane] + p->linesize[plane], s->temp[0], w, left);
  716. y++;
  717. }
  718. lefttop = p->data[plane][0];
  719. decode_plane_bitstream(s, w, plane);
  720. s->dsp.add_hfyu_median_prediction(p->data[plane] + fake_stride, p->data[plane], s->temp[0], w, &left, &lefttop);
  721. y++;
  722. for (; y<h; y++) {
  723. uint8_t *dst;
  724. decode_plane_bitstream(s, w, plane);
  725. dst = p->data[plane] + p->linesize[plane] * y;
  726. s->dsp.add_hfyu_median_prediction(dst, dst - fake_stride, s->temp[0], w, &left, &lefttop);
  727. }
  728. break;
  729. }
  730. }
  731. draw_slice(s, p, height);
  732. } else if (s->bitstream_bpp < 24) {
  733. int y, cy;
  734. int lefty, leftu, leftv;
  735. int lefttopy, lefttopu, lefttopv;
  736. if (s->yuy2) {
  737. p->data[0][3] = get_bits(&s->gb, 8);
  738. p->data[0][2] = get_bits(&s->gb, 8);
  739. p->data[0][1] = get_bits(&s->gb, 8);
  740. p->data[0][0] = get_bits(&s->gb, 8);
  741. av_log(avctx, AV_LOG_ERROR,
  742. "YUY2 output is not implemented yet\n");
  743. return AVERROR_PATCHWELCOME;
  744. } else {
  745. leftv = p->data[2][0] = get_bits(&s->gb, 8);
  746. lefty = p->data[0][1] = get_bits(&s->gb, 8);
  747. leftu = p->data[1][0] = get_bits(&s->gb, 8);
  748. p->data[0][0] = get_bits(&s->gb, 8);
  749. switch (s->predictor) {
  750. case LEFT:
  751. case PLANE:
  752. decode_422_bitstream(s, width-2);
  753. lefty = s->dsp.add_hfyu_left_prediction(p->data[0] + 2, s->temp[0], width-2, lefty);
  754. if (!(s->flags&CODEC_FLAG_GRAY)) {
  755. leftu = s->dsp.add_hfyu_left_prediction(p->data[1] + 1, s->temp[1], width2 - 1, leftu);
  756. leftv = s->dsp.add_hfyu_left_prediction(p->data[2] + 1, s->temp[2], width2 - 1, leftv);
  757. }
  758. for (cy = y = 1; y < s->height; y++, cy++) {
  759. uint8_t *ydst, *udst, *vdst;
  760. if (s->bitstream_bpp == 12) {
  761. decode_gray_bitstream(s, width);
  762. ydst = p->data[0] + p->linesize[0] * y;
  763. lefty = s->dsp.add_hfyu_left_prediction(ydst, s->temp[0], width, lefty);
  764. if (s->predictor == PLANE) {
  765. if (y > s->interlaced)
  766. s->dsp.add_bytes(ydst, ydst - fake_ystride, width);
  767. }
  768. y++;
  769. if (y >= s->height) break;
  770. }
  771. draw_slice(s, p, y);
  772. ydst = p->data[0] + p->linesize[0]*y;
  773. udst = p->data[1] + p->linesize[1]*cy;
  774. vdst = p->data[2] + p->linesize[2]*cy;
  775. decode_422_bitstream(s, width);
  776. lefty = s->dsp.add_hfyu_left_prediction(ydst, s->temp[0], width, lefty);
  777. if (!(s->flags & CODEC_FLAG_GRAY)) {
  778. leftu= s->dsp.add_hfyu_left_prediction(udst, s->temp[1], width2, leftu);
  779. leftv= s->dsp.add_hfyu_left_prediction(vdst, s->temp[2], width2, leftv);
  780. }
  781. if (s->predictor == PLANE) {
  782. if (cy > s->interlaced) {
  783. s->dsp.add_bytes(ydst, ydst - fake_ystride, width);
  784. if (!(s->flags & CODEC_FLAG_GRAY)) {
  785. s->dsp.add_bytes(udst, udst - fake_ustride, width2);
  786. s->dsp.add_bytes(vdst, vdst - fake_vstride, width2);
  787. }
  788. }
  789. }
  790. }
  791. draw_slice(s, p, height);
  792. break;
  793. case MEDIAN:
  794. /* first line except first 2 pixels is left predicted */
  795. decode_422_bitstream(s, width - 2);
  796. lefty= s->dsp.add_hfyu_left_prediction(p->data[0] + 2, s->temp[0], width - 2, lefty);
  797. if (!(s->flags & CODEC_FLAG_GRAY)) {
  798. leftu = s->dsp.add_hfyu_left_prediction(p->data[1] + 1, s->temp[1], width2 - 1, leftu);
  799. leftv = s->dsp.add_hfyu_left_prediction(p->data[2] + 1, s->temp[2], width2 - 1, leftv);
  800. }
  801. cy = y = 1;
  802. /* second line is left predicted for interlaced case */
  803. if (s->interlaced) {
  804. decode_422_bitstream(s, width);
  805. lefty = s->dsp.add_hfyu_left_prediction(p->data[0] + p->linesize[0], s->temp[0], width, lefty);
  806. if (!(s->flags & CODEC_FLAG_GRAY)) {
  807. leftu = s->dsp.add_hfyu_left_prediction(p->data[1] + p->linesize[2], s->temp[1], width2, leftu);
  808. leftv = s->dsp.add_hfyu_left_prediction(p->data[2] + p->linesize[1], s->temp[2], width2, leftv);
  809. }
  810. y++; cy++;
  811. }
  812. /* next 4 pixels are left predicted too */
  813. decode_422_bitstream(s, 4);
  814. lefty = s->dsp.add_hfyu_left_prediction(p->data[0] + fake_ystride, s->temp[0], 4, lefty);
  815. if (!(s->flags&CODEC_FLAG_GRAY)) {
  816. leftu = s->dsp.add_hfyu_left_prediction(p->data[1] + fake_ustride, s->temp[1], 2, leftu);
  817. leftv = s->dsp.add_hfyu_left_prediction(p->data[2] + fake_vstride, s->temp[2], 2, leftv);
  818. }
  819. /* next line except the first 4 pixels is median predicted */
  820. lefttopy = p->data[0][3];
  821. decode_422_bitstream(s, width - 4);
  822. s->dsp.add_hfyu_median_prediction(p->data[0] + fake_ystride+4, p->data[0]+4, s->temp[0], width-4, &lefty, &lefttopy);
  823. if (!(s->flags&CODEC_FLAG_GRAY)) {
  824. lefttopu = p->data[1][1];
  825. lefttopv = p->data[2][1];
  826. s->dsp.add_hfyu_median_prediction(p->data[1] + fake_ustride+2, p->data[1] + 2, s->temp[1], width2 - 2, &leftu, &lefttopu);
  827. s->dsp.add_hfyu_median_prediction(p->data[2] + fake_vstride+2, p->data[2] + 2, s->temp[2], width2 - 2, &leftv, &lefttopv);
  828. }
  829. y++; cy++;
  830. for (; y<height; y++, cy++) {
  831. uint8_t *ydst, *udst, *vdst;
  832. if (s->bitstream_bpp == 12) {
  833. while (2 * cy > y) {
  834. decode_gray_bitstream(s, width);
  835. ydst = p->data[0] + p->linesize[0] * y;
  836. s->dsp.add_hfyu_median_prediction(ydst, ydst - fake_ystride, s->temp[0], width, &lefty, &lefttopy);
  837. y++;
  838. }
  839. if (y >= height) break;
  840. }
  841. draw_slice(s, p, y);
  842. decode_422_bitstream(s, width);
  843. ydst = p->data[0] + p->linesize[0] * y;
  844. udst = p->data[1] + p->linesize[1] * cy;
  845. vdst = p->data[2] + p->linesize[2] * cy;
  846. s->dsp.add_hfyu_median_prediction(ydst, ydst - fake_ystride, s->temp[0], width, &lefty, &lefttopy);
  847. if (!(s->flags & CODEC_FLAG_GRAY)) {
  848. s->dsp.add_hfyu_median_prediction(udst, udst - fake_ustride, s->temp[1], width2, &leftu, &lefttopu);
  849. s->dsp.add_hfyu_median_prediction(vdst, vdst - fake_vstride, s->temp[2], width2, &leftv, &lefttopv);
  850. }
  851. }
  852. draw_slice(s, p, height);
  853. break;
  854. }
  855. }
  856. } else {
  857. int y;
  858. int leftr, leftg, leftb, lefta;
  859. const int last_line = (height - 1) * p->linesize[0];
  860. if (s->bitstream_bpp == 32) {
  861. lefta = p->data[0][last_line+A] = get_bits(&s->gb, 8);
  862. leftr = p->data[0][last_line+R] = get_bits(&s->gb, 8);
  863. leftg = p->data[0][last_line+G] = get_bits(&s->gb, 8);
  864. leftb = p->data[0][last_line+B] = get_bits(&s->gb, 8);
  865. } else {
  866. leftr = p->data[0][last_line+R] = get_bits(&s->gb, 8);
  867. leftg = p->data[0][last_line+G] = get_bits(&s->gb, 8);
  868. leftb = p->data[0][last_line+B] = get_bits(&s->gb, 8);
  869. lefta = p->data[0][last_line+A] = 255;
  870. skip_bits(&s->gb, 8);
  871. }
  872. if (s->bgr32) {
  873. switch (s->predictor) {
  874. case LEFT:
  875. case PLANE:
  876. decode_bgr_bitstream(s, width - 1);
  877. s->dsp.add_hfyu_left_prediction_bgr32(p->data[0] + last_line+4, s->temp[0], width - 1, &leftr, &leftg, &leftb, &lefta);
  878. for (y = s->height - 2; y >= 0; y--) { //Yes it is stored upside down.
  879. decode_bgr_bitstream(s, width);
  880. s->dsp.add_hfyu_left_prediction_bgr32(p->data[0] + p->linesize[0]*y, s->temp[0], width, &leftr, &leftg, &leftb, &lefta);
  881. if (s->predictor == PLANE) {
  882. if (s->bitstream_bpp != 32) lefta = 0;
  883. if ((y & s->interlaced) == 0 &&
  884. y < s->height - 1 - s->interlaced) {
  885. s->dsp.add_bytes(p->data[0] + p->linesize[0] * y,
  886. p->data[0] + p->linesize[0] * y +
  887. fake_ystride, fake_ystride);
  888. }
  889. }
  890. }
  891. // just 1 large slice as this is not possible in reverse order
  892. draw_slice(s, p, height);
  893. break;
  894. default:
  895. av_log(avctx, AV_LOG_ERROR,
  896. "prediction type not supported!\n");
  897. }
  898. }else{
  899. av_log(avctx, AV_LOG_ERROR,
  900. "BGR24 output is not implemented yet\n");
  901. return AVERROR_PATCHWELCOME;
  902. }
  903. }
  904. emms_c();
  905. *got_frame = 1;
  906. return (get_bits_count(&s->gb) + 31) / 32 * 4 + table_size;
  907. }
  908. static av_cold int decode_end(AVCodecContext *avctx)
  909. {
  910. HYuvContext *s = avctx->priv_data;
  911. int i;
  912. ff_huffyuv_common_end(s);
  913. av_freep(&s->bitstream_buffer);
  914. for (i = 0; i < 8; i++) {
  915. ff_free_vlc(&s->vlc[i]);
  916. }
  917. return 0;
  918. }
  /* Codec descriptor for the "huffyuv" decoder (AV_CODEC_ID_HUFFYUV), compiled
   * only when CONFIG_HUFFYUV_DECODER is enabled. It wires decode_init,
   * decode_end and decode_frame as the init/close/decode callbacks and uses
   * decode_init_thread_copy for per-thread setup when threads are enabled. */
  919. #if CONFIG_HUFFYUV_DECODER
  920. AVCodec ff_huffyuv_decoder = {
  921. .name = "huffyuv",
  922. .long_name = NULL_IF_CONFIG_SMALL("Huffyuv / HuffYUV"),
  923. .type = AVMEDIA_TYPE_VIDEO,
  924. .id = AV_CODEC_ID_HUFFYUV,
  925. .priv_data_size = sizeof(HYuvContext),
  926. .init = decode_init,
  927. .close = decode_end,
  928. .decode = decode_frame,
  929. .capabilities = CODEC_CAP_DR1 | CODEC_CAP_DRAW_HORIZ_BAND |
  930. CODEC_CAP_FRAME_THREADS,
  931. .init_thread_copy = ONLY_IF_THREADS_ENABLED(decode_init_thread_copy),
  932. };
  933. #endif
  /* Codec descriptor for the "ffvhuff" decoder (AV_CODEC_ID_FFVHUFF), compiled
   * only when CONFIG_FFVHUFF_DECODER is enabled. It shares every callback
   * (decode_init, decode_end, decode_frame, decode_init_thread_copy) and the
   * same capability flags with the "huffyuv" descriptor; only the name,
   * long name and codec id differ. */
  934. #if CONFIG_FFVHUFF_DECODER
  935. AVCodec ff_ffvhuff_decoder = {
  936. .name = "ffvhuff",
  937. .long_name = NULL_IF_CONFIG_SMALL("Huffyuv FFmpeg variant"),
  938. .type = AVMEDIA_TYPE_VIDEO,
  939. .id = AV_CODEC_ID_FFVHUFF,
  940. .priv_data_size = sizeof(HYuvContext),
  941. .init = decode_init,
  942. .close = decode_end,
  943. .decode = decode_frame,
  944. .capabilities = CODEC_CAP_DR1 | CODEC_CAP_DRAW_HORIZ_BAND |
  945. CODEC_CAP_FRAME_THREADS,
  946. .init_thread_copy = ONLY_IF_THREADS_ENABLED(decode_init_thread_copy),
  947. };
  948. #endif