You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1731 lines
59KB

  1. /*
  2. * MJPEG decoder
  3. * Copyright (c) 2000, 2001 Fabrice Bellard
  4. * Copyright (c) 2003 Alex Beregszaszi
  5. * Copyright (c) 2003-2004 Michael Niedermayer
  6. *
  7. * Support for external huffman table, various fixes (AVID workaround),
  8. * aspecting, new decode_frame mechanism and apple mjpeg-b support
  9. * by Alex Beregszaszi
  10. *
  11. * This file is part of Libav.
  12. *
  13. * Libav is free software; you can redistribute it and/or
  14. * modify it under the terms of the GNU Lesser General Public
  15. * License as published by the Free Software Foundation; either
  16. * version 2.1 of the License, or (at your option) any later version.
  17. *
  18. * Libav is distributed in the hope that it will be useful,
  19. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  20. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  21. * Lesser General Public License for more details.
  22. *
  23. * You should have received a copy of the GNU Lesser General Public
  24. * License along with Libav; if not, write to the Free Software
  25. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  26. */
  27. /**
  28. * @file
  29. * MJPEG decoder.
  30. */
  31. #include <assert.h>
  32. #include "libavutil/imgutils.h"
  33. #include "libavutil/opt.h"
  34. #include "avcodec.h"
  35. #include "blockdsp.h"
  36. #include "idctdsp.h"
  37. #include "internal.h"
  38. #include "mjpeg.h"
  39. #include "mjpegdec.h"
  40. #include "jpeglsdec.h"
  41. static int build_vlc(VLC *vlc, const uint8_t *bits_table,
  42. const uint8_t *val_table, int nb_codes,
  43. int use_static, int is_ac)
  44. {
  45. uint8_t huff_size[256] = { 0 };
  46. uint16_t huff_code[256];
  47. uint16_t huff_sym[256];
  48. int i;
  49. assert(nb_codes <= 256);
  50. ff_mjpeg_build_huffman_codes(huff_size, huff_code, bits_table, val_table);
  51. for (i = 0; i < 256; i++)
  52. huff_sym[i] = i + 16 * is_ac;
  53. if (is_ac)
  54. huff_sym[0] = 16 * 256;
  55. return ff_init_vlc_sparse(vlc, 9, nb_codes, huff_size, 1, 1,
  56. huff_code, 2, 2, huff_sym, 2, 2, use_static);
  57. }
  58. static void build_basic_mjpeg_vlc(MJpegDecodeContext *s)
  59. {
  60. build_vlc(&s->vlcs[0][0], avpriv_mjpeg_bits_dc_luminance,
  61. avpriv_mjpeg_val_dc, 12, 0, 0);
  62. build_vlc(&s->vlcs[0][1], avpriv_mjpeg_bits_dc_chrominance,
  63. avpriv_mjpeg_val_dc, 12, 0, 0);
  64. build_vlc(&s->vlcs[1][0], avpriv_mjpeg_bits_ac_luminance,
  65. avpriv_mjpeg_val_ac_luminance, 251, 0, 1);
  66. build_vlc(&s->vlcs[1][1], avpriv_mjpeg_bits_ac_chrominance,
  67. avpriv_mjpeg_val_ac_chrominance, 251, 0, 1);
  68. build_vlc(&s->vlcs[2][0], avpriv_mjpeg_bits_ac_luminance,
  69. avpriv_mjpeg_val_ac_luminance, 251, 0, 0);
  70. build_vlc(&s->vlcs[2][1], avpriv_mjpeg_bits_ac_chrominance,
  71. avpriv_mjpeg_val_ac_chrominance, 251, 0, 0);
  72. }
  73. av_cold int ff_mjpeg_decode_init(AVCodecContext *avctx)
  74. {
  75. MJpegDecodeContext *s = avctx->priv_data;
  76. if (!s->picture_ptr) {
  77. s->picture = av_frame_alloc();
  78. if (!s->picture)
  79. return AVERROR(ENOMEM);
  80. s->picture_ptr = s->picture;
  81. }
  82. s->avctx = avctx;
  83. ff_blockdsp_init(&s->bdsp, avctx);
  84. ff_hpeldsp_init(&s->hdsp, avctx->flags);
  85. ff_idctdsp_init(&s->idsp, avctx);
  86. ff_init_scantable(s->idsp.idct_permutation, &s->scantable,
  87. ff_zigzag_direct);
  88. s->buffer_size = 0;
  89. s->buffer = NULL;
  90. s->start_code = -1;
  91. s->first_picture = 1;
  92. s->org_height = avctx->coded_height;
  93. avctx->chroma_sample_location = AVCHROMA_LOC_CENTER;
  94. avctx->colorspace = AVCOL_SPC_BT470BG;
  95. build_basic_mjpeg_vlc(s);
  96. if (s->extern_huff) {
  97. int ret;
  98. av_log(avctx, AV_LOG_INFO, "mjpeg: using external huffman table\n");
  99. init_get_bits(&s->gb, avctx->extradata, avctx->extradata_size * 8);
  100. if ((ret = ff_mjpeg_decode_dht(s))) {
  101. av_log(avctx, AV_LOG_ERROR,
  102. "mjpeg: error using external huffman table\n");
  103. return ret;
  104. }
  105. }
  106. if (avctx->field_order == AV_FIELD_BB) { /* quicktime icefloe 019 */
  107. s->interlace_polarity = 1; /* bottom field first */
  108. av_log(avctx, AV_LOG_DEBUG, "mjpeg bottom field first\n");
  109. }
  110. if (avctx->codec->id == AV_CODEC_ID_AMV)
  111. s->flipped = 1;
  112. return 0;
  113. }
  114. /* quantize tables */
  115. int ff_mjpeg_decode_dqt(MJpegDecodeContext *s)
  116. {
  117. int len, index, i, j;
  118. len = get_bits(&s->gb, 16) - 2;
  119. while (len >= 65) {
  120. /* only 8 bit precision handled */
  121. if (get_bits(&s->gb, 4) != 0) {
  122. av_log(s->avctx, AV_LOG_ERROR, "dqt: 16bit precision\n");
  123. return -1;
  124. }
  125. index = get_bits(&s->gb, 4);
  126. if (index >= 4)
  127. return -1;
  128. av_log(s->avctx, AV_LOG_DEBUG, "index=%d\n", index);
  129. /* read quant table */
  130. for (i = 0; i < 64; i++) {
  131. j = s->scantable.permutated[i];
  132. s->quant_matrixes[index][j] = get_bits(&s->gb, 8);
  133. }
  134. // XXX FIXME finetune, and perhaps add dc too
  135. s->qscale[index] = FFMAX(s->quant_matrixes[index][s->scantable.permutated[1]],
  136. s->quant_matrixes[index][s->scantable.permutated[8]]) >> 1;
  137. av_log(s->avctx, AV_LOG_DEBUG, "qscale[%d]: %d\n",
  138. index, s->qscale[index]);
  139. len -= 65;
  140. }
  141. return 0;
  142. }
  143. /* decode huffman tables and build VLC decoders */
  144. int ff_mjpeg_decode_dht(MJpegDecodeContext *s)
  145. {
  146. int len, index, i, class, n, v, code_max;
  147. uint8_t bits_table[17];
  148. uint8_t val_table[256];
  149. int ret = 0;
  150. len = get_bits(&s->gb, 16) - 2;
  151. while (len > 0) {
  152. if (len < 17)
  153. return AVERROR_INVALIDDATA;
  154. class = get_bits(&s->gb, 4);
  155. if (class >= 2)
  156. return AVERROR_INVALIDDATA;
  157. index = get_bits(&s->gb, 4);
  158. if (index >= 4)
  159. return AVERROR_INVALIDDATA;
  160. n = 0;
  161. for (i = 1; i <= 16; i++) {
  162. bits_table[i] = get_bits(&s->gb, 8);
  163. n += bits_table[i];
  164. }
  165. len -= 17;
  166. if (len < n || n > 256)
  167. return AVERROR_INVALIDDATA;
  168. code_max = 0;
  169. for (i = 0; i < n; i++) {
  170. v = get_bits(&s->gb, 8);
  171. if (v > code_max)
  172. code_max = v;
  173. val_table[i] = v;
  174. }
  175. len -= n;
  176. /* build VLC and flush previous vlc if present */
  177. ff_free_vlc(&s->vlcs[class][index]);
  178. av_log(s->avctx, AV_LOG_DEBUG, "class=%d index=%d nb_codes=%d\n",
  179. class, index, code_max + 1);
  180. if ((ret = build_vlc(&s->vlcs[class][index], bits_table, val_table,
  181. code_max + 1, 0, class > 0)) < 0)
  182. return ret;
  183. if (class > 0) {
  184. ff_free_vlc(&s->vlcs[2][index]);
  185. if ((ret = build_vlc(&s->vlcs[2][index], bits_table, val_table,
  186. code_max + 1, 0, 0)) < 0)
  187. return ret;
  188. }
  189. }
  190. return 0;
  191. }
  192. int ff_mjpeg_decode_sof(MJpegDecodeContext *s)
  193. {
  194. int len, nb_components, i, width, height, pix_fmt_id, ret;
  195. /* XXX: verify len field validity */
  196. len = get_bits(&s->gb, 16);
  197. s->bits = get_bits(&s->gb, 8);
  198. if (s->pegasus_rct)
  199. s->bits = 9;
  200. if (s->bits == 9 && !s->pegasus_rct)
  201. s->rct = 1; // FIXME ugly
  202. if (s->bits != 8 && !s->lossless) {
  203. av_log(s->avctx, AV_LOG_ERROR, "only 8 bits/component accepted\n");
  204. return -1;
  205. }
  206. height = get_bits(&s->gb, 16);
  207. width = get_bits(&s->gb, 16);
  208. // HACK for odd_height.mov
  209. if (s->interlaced && s->width == width && s->height == height + 1)
  210. height= s->height;
  211. av_log(s->avctx, AV_LOG_DEBUG, "sof0: picture: %dx%d\n", width, height);
  212. if (av_image_check_size(width, height, 0, s->avctx))
  213. return AVERROR_INVALIDDATA;
  214. nb_components = get_bits(&s->gb, 8);
  215. if (nb_components <= 0 ||
  216. nb_components > MAX_COMPONENTS)
  217. return -1;
  218. if (s->interlaced && (s->bottom_field == !s->interlace_polarity)) {
  219. if (nb_components != s->nb_components) {
  220. av_log(s->avctx, AV_LOG_ERROR,
  221. "nb_components changing in interlaced picture\n");
  222. return AVERROR_INVALIDDATA;
  223. }
  224. }
  225. if (s->ls && !(s->bits <= 8 || nb_components == 1)) {
  226. avpriv_report_missing_feature(s->avctx,
  227. "JPEG-LS that is not <= 8 "
  228. "bits/component or 16-bit gray");
  229. return AVERROR_PATCHWELCOME;
  230. }
  231. s->nb_components = nb_components;
  232. s->h_max = 1;
  233. s->v_max = 1;
  234. for (i = 0; i < nb_components; i++) {
  235. /* component id */
  236. s->component_id[i] = get_bits(&s->gb, 8) - 1;
  237. s->h_count[i] = get_bits(&s->gb, 4);
  238. s->v_count[i] = get_bits(&s->gb, 4);
  239. /* compute hmax and vmax (only used in interleaved case) */
  240. if (s->h_count[i] > s->h_max)
  241. s->h_max = s->h_count[i];
  242. if (s->v_count[i] > s->v_max)
  243. s->v_max = s->v_count[i];
  244. s->quant_index[i] = get_bits(&s->gb, 8);
  245. if (s->quant_index[i] >= 4)
  246. return AVERROR_INVALIDDATA;
  247. if (!s->h_count[i] || !s->v_count[i]) {
  248. av_log(s->avctx, AV_LOG_ERROR,
  249. "Invalid sampling factor in component %d %d:%d\n",
  250. i, s->h_count[i], s->v_count[i]);
  251. return AVERROR_INVALIDDATA;
  252. }
  253. av_log(s->avctx, AV_LOG_DEBUG, "component %d %d:%d id: %d quant:%d\n",
  254. i, s->h_count[i], s->v_count[i],
  255. s->component_id[i], s->quant_index[i]);
  256. }
  257. if (s->ls && (s->h_max > 1 || s->v_max > 1)) {
  258. avpriv_report_missing_feature(s->avctx, "Subsampling in JPEG-LS");
  259. return AVERROR_PATCHWELCOME;
  260. }
  261. if (s->v_max == 1 && s->h_max == 1 && s->lossless == 1)
  262. s->rgb = 1;
  263. /* if different size, realloc/alloc picture */
  264. /* XXX: also check h_count and v_count */
  265. if (width != s->width || height != s->height) {
  266. s->width = width;
  267. s->height = height;
  268. s->interlaced = 0;
  269. /* test interlaced mode */
  270. if (s->first_picture &&
  271. s->org_height != 0 &&
  272. s->height < ((s->org_height * 3) / 4)) {
  273. s->interlaced = 1;
  274. s->bottom_field = s->interlace_polarity;
  275. s->picture_ptr->interlaced_frame = 1;
  276. s->picture_ptr->top_field_first = !s->interlace_polarity;
  277. height *= 2;
  278. }
  279. ret = ff_set_dimensions(s->avctx, width, height);
  280. if (ret < 0)
  281. return ret;
  282. s->first_picture = 0;
  283. }
  284. if (!(s->interlaced && (s->bottom_field == !s->interlace_polarity))) {
  285. /* XXX: not complete test ! */
  286. pix_fmt_id = (s->h_count[0] << 28) | (s->v_count[0] << 24) |
  287. (s->h_count[1] << 20) | (s->v_count[1] << 16) |
  288. (s->h_count[2] << 12) | (s->v_count[2] << 8) |
  289. (s->h_count[3] << 4) | s->v_count[3];
  290. av_log(s->avctx, AV_LOG_DEBUG, "pix fmt id %x\n", pix_fmt_id);
  291. /* NOTE we do not allocate pictures large enough for the possible
  292. * padding of h/v_count being 4 */
  293. if (!(pix_fmt_id & 0xD0D0D0D0))
  294. pix_fmt_id -= (pix_fmt_id & 0xF0F0F0F0) >> 1;
  295. if (!(pix_fmt_id & 0x0D0D0D0D))
  296. pix_fmt_id -= (pix_fmt_id & 0x0F0F0F0F) >> 1;
  297. switch (pix_fmt_id) {
  298. case 0x11111100:
  299. if (s->rgb)
  300. s->avctx->pix_fmt = AV_PIX_FMT_BGRA;
  301. else {
  302. s->avctx->pix_fmt = s->cs_itu601 ? AV_PIX_FMT_YUV444P : AV_PIX_FMT_YUVJ444P;
  303. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  304. }
  305. assert(s->nb_components == 3);
  306. break;
  307. case 0x11000000:
  308. s->avctx->pix_fmt = AV_PIX_FMT_GRAY8;
  309. break;
  310. case 0x12111100:
  311. s->avctx->pix_fmt = s->cs_itu601 ? AV_PIX_FMT_YUV440P : AV_PIX_FMT_YUVJ440P;
  312. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  313. break;
  314. case 0x21111100:
  315. s->avctx->pix_fmt = s->cs_itu601 ? AV_PIX_FMT_YUV422P : AV_PIX_FMT_YUVJ422P;
  316. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  317. break;
  318. case 0x22111100:
  319. s->avctx->pix_fmt = s->cs_itu601 ? AV_PIX_FMT_YUV420P : AV_PIX_FMT_YUVJ420P;
  320. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  321. break;
  322. default:
  323. av_log(s->avctx, AV_LOG_ERROR, "Unhandled pixel format 0x%x\n", pix_fmt_id);
  324. return AVERROR_PATCHWELCOME;
  325. }
  326. if (s->ls) {
  327. if (s->nb_components > 1)
  328. s->avctx->pix_fmt = AV_PIX_FMT_RGB24;
  329. else if (s->bits <= 8)
  330. s->avctx->pix_fmt = AV_PIX_FMT_GRAY8;
  331. else
  332. s->avctx->pix_fmt = AV_PIX_FMT_GRAY16;
  333. }
  334. s->pix_desc = av_pix_fmt_desc_get(s->avctx->pix_fmt);
  335. if (!s->pix_desc) {
  336. av_log(s->avctx, AV_LOG_ERROR, "Could not get a pixel format descriptor.\n");
  337. return AVERROR_BUG;
  338. }
  339. av_frame_unref(s->picture_ptr);
  340. if (ff_get_buffer(s->avctx, s->picture_ptr, AV_GET_BUFFER_FLAG_REF) < 0) {
  341. av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed\n");
  342. return -1;
  343. }
  344. s->picture_ptr->pict_type = AV_PICTURE_TYPE_I;
  345. s->picture_ptr->key_frame = 1;
  346. s->got_picture = 1;
  347. for (i = 0; i < 3; i++)
  348. s->linesize[i] = s->picture_ptr->linesize[i] << s->interlaced;
  349. av_dlog(s->avctx, "%d %d %d %d %d %d\n",
  350. s->width, s->height, s->linesize[0], s->linesize[1],
  351. s->interlaced, s->avctx->height);
  352. if (len != (8 + (3 * nb_components)))
  353. av_log(s->avctx, AV_LOG_DEBUG, "decode_sof0: error, len(%d) mismatch\n", len);
  354. }
  355. /* totally blank picture as progressive JPEG will only add details to it */
  356. if (s->progressive) {
  357. int bw = (width + s->h_max * 8 - 1) / (s->h_max * 8);
  358. int bh = (height + s->v_max * 8 - 1) / (s->v_max * 8);
  359. for (i = 0; i < s->nb_components; i++) {
  360. int size = bw * bh * s->h_count[i] * s->v_count[i];
  361. av_freep(&s->blocks[i]);
  362. av_freep(&s->last_nnz[i]);
  363. s->blocks[i] = av_malloc(size * sizeof(**s->blocks));
  364. s->last_nnz[i] = av_mallocz(size * sizeof(**s->last_nnz));
  365. s->block_stride[i] = bw * s->h_count[i];
  366. }
  367. memset(s->coefs_finished, 0, sizeof(s->coefs_finished));
  368. }
  369. return 0;
  370. }
  371. static inline int mjpeg_decode_dc(MJpegDecodeContext *s, int dc_index)
  372. {
  373. int code;
  374. code = get_vlc2(&s->gb, s->vlcs[0][dc_index].table, 9, 2);
  375. if (code < 0) {
  376. av_log(s->avctx, AV_LOG_WARNING,
  377. "mjpeg_decode_dc: bad vlc: %d:%d (%p)\n",
  378. 0, dc_index, &s->vlcs[0][dc_index]);
  379. return 0xffff;
  380. }
  381. if (code)
  382. return get_xbits(&s->gb, code);
  383. else
  384. return 0;
  385. }
/**
 * Decode and dequantize one baseline (sequential) 8x8 block.
 *
 * @param s            decoder context; s->gb is the bitstream being read
 * @param block        64 output coefficients; only decoded positions are
 *                     written, so the caller must pass a cleared block
 * @param component    index into s->last_dc holding the DC predictor
 * @param dc_index     DC Huffman table, s->vlcs[0][dc_index]
 * @param ac_index     AC Huffman table, s->vlcs[1][ac_index]
 * @param quant_matrix dequantisation factors, indexed like block
 * @return 0 on success, AVERROR_INVALIDDATA on a bad DC code or when the
 *         coefficient index runs past 63
 */
static int decode_block(MJpegDecodeContext *s, int16_t *block, int component,
                        int dc_index, int ac_index, int16_t *quant_matrix)
{
    int code, i, j, level, val;
    /* DC coef */
    val = mjpeg_decode_dc(s, dc_index);
    if (val == 0xffff) {
        av_log(s->avctx, AV_LOG_ERROR, "error dc\n");
        return AVERROR_INVALIDDATA;
    }
    /* the DC value is coded as a difference from the previous block */
    val = val * quant_matrix[0] + s->last_dc[component];
    s->last_dc[component] = val;
    block[0] = val;
    /* AC coefs */
    i = 0;
    {OPEN_READER(re, &s->gb);
    do {
        UPDATE_CACHE(re, &s->gb);
        GET_VLC(code, re, &s->gb, s->vlcs[1][ac_index].table, 9, 2);
        /* s->vlcs[1] symbols carry a +16 bias (see build_vlc), so the upper
         * bits advance i by run + 1; the end-of-block symbol is stored as
         * 16 * 256 and therefore pushes i far beyond 63 */
        i += ((unsigned)code) >> 4;
        /* low nibble: number of bits of the coefficient value that follows */
        code &= 0xf;
        if (code) {
            if (code > MIN_CACHE_BITS - 16)
                UPDATE_CACHE(re, &s->gb);
            {
                /* read 'code' bits; a leading 0 bit marks a negative value */
                int cache = GET_CACHE(re, &s->gb);
                int sign = (~cache) >> 31;
                level = (NEG_USR32(sign ^ cache,code) ^ sign) - sign;
            }
            LAST_SKIP_BITS(re, &s->gb, code);
            if (i > 63) {
                av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);
                return AVERROR_INVALIDDATA;
            }
            /* map the scan position to its place in the block */
            j = s->scantable.permutated[i];
            block[j] = level * quant_matrix[j];
        }
    } while (i < 63);
    CLOSE_READER(re, &s->gb);}
    return 0;
}
  428. static int decode_dc_progressive(MJpegDecodeContext *s, int16_t *block,
  429. int component, int dc_index,
  430. int16_t *quant_matrix, int Al)
  431. {
  432. int val;
  433. s->bdsp.clear_block(block);
  434. val = mjpeg_decode_dc(s, dc_index);
  435. if (val == 0xffff) {
  436. av_log(s->avctx, AV_LOG_ERROR, "error dc\n");
  437. return AVERROR_INVALIDDATA;
  438. }
  439. val = (val * quant_matrix[0] << Al) + s->last_dc[component];
  440. s->last_dc[component] = val;
  441. block[0] = val;
  442. return 0;
  443. }
/**
 * Decode and dequantize the AC coefficients of one block in a first
 * (non-refinement) progressive scan.
 *
 * @param s            decoder context; s->gb is the bitstream being read
 * @param block        64 coefficients updated in place
 * @param last_nnz     in/out: highest scan position reached for this block;
 *                     only ever raised
 * @param ac_index     AC Huffman table, s->vlcs[2][ac_index]
 * @param quant_matrix dequantisation factors, indexed like block
 * @param ss           first scan position covered by this scan
 * @param se           last scan position covered by this scan
 * @param Al           successive-approximation shift applied to each value
 * @param EOBRUN       in/out: number of following blocks that are entirely
 *                     end-of-band; when non-zero on entry it is decremented
 *                     and the block is left untouched
 * @return 0 on success, AVERROR_INVALIDDATA when a run passes se
 */
static int decode_block_progressive(MJpegDecodeContext *s, int16_t *block,
                                    uint8_t *last_nnz, int ac_index,
                                    int16_t *quant_matrix,
                                    int ss, int se, int Al, int *EOBRUN)
{
    int code, i, j, level, val, run;
    /* still inside an end-of-band run started by an earlier block */
    if (*EOBRUN) {
        (*EOBRUN)--;
        return 0;
    }
    {
        OPEN_READER(re, &s->gb);
        for (i = ss; ; i++) {
            UPDATE_CACHE(re, &s->gb);
            GET_VLC(code, re, &s->gb, s->vlcs[2][ac_index].table, 9, 2);
            /* s->vlcs[2] is built without the AC symbol bias, so the high
             * nibble is the plain run and the low nibble the value size */
            run = ((unsigned) code) >> 4;
            code &= 0xF;
            if (code) {
                i += run;
                if (code > MIN_CACHE_BITS - 16)
                    UPDATE_CACHE(re, &s->gb);
                {
                    /* read 'code' bits; a leading 0 bit marks a negative value */
                    int cache = GET_CACHE(re, &s->gb);
                    int sign = (~cache) >> 31;
                    level = (NEG_USR32(sign ^ cache,code) ^ sign) - sign;
                }
                LAST_SKIP_BITS(re, &s->gb, code);
                if (i >= se) {
                    /* a coefficient exactly at se ends the band; anything
                     * beyond se is an error */
                    if (i == se) {
                        j = s->scantable.permutated[se];
                        block[j] = level * quant_matrix[j] << Al;
                        break;
                    }
                    av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);
                    return AVERROR_INVALIDDATA;
                }
                j = s->scantable.permutated[i];
                block[j] = level * quant_matrix[j] << Al;
            } else {
                if (run == 0xF) {// ZRL - skip 15 coefficients
                    /* the loop increment accounts for the 16th position */
                    i += 15;
                    if (i >= se) {
                        av_log(s->avctx, AV_LOG_ERROR, "ZRL overflow: %d\n", i);
                        return AVERROR_INVALIDDATA;
                    }
                } else {
                    /* end-of-band: the run length is 2^run plus 'run' extra
                     * bits; this block counts as the first of the run */
                    val = (1 << run);
                    if (run) {
                        UPDATE_CACHE(re, &s->gb);
                        val += NEG_USR32(GET_CACHE(re, &s->gb), run);
                        LAST_SKIP_BITS(re, &s->gb, run);
                    }
                    *EOBRUN = val - 1;
                    break;
                }
            }
        }
        CLOSE_READER(re, &s->gb);
    }
    /* remember how far this block has been populated */
    if (i > *last_nnz)
        *last_nnz = i;
    return 0;
}
/*
 * Helper macros for decode_block_refinement(). Both expand in place and use
 * the enclosing function's locals: s, re (the open bit reader), block,
 * quant_matrix, Al, sign, and for ZERO_RUN also i, j, run, last and se.
 *
 * REFINE_BIT(j): read one correction bit for the already non-zero
 * coefficient block[j]. sign becomes 0 or -1 depending on the coefficient's
 * sign, so when the bit is set the quantiser (scaled by 2^Al) is added with
 * the same sign as the coefficient.
 */
#define REFINE_BIT(j) { \
    UPDATE_CACHE(re, &s->gb); \
    sign = block[j] >> 15; \
    block[j] += SHOW_UBITS(re, &s->gb, 1) * \
                ((quant_matrix[j] ^ sign) - sign) << Al; \
    LAST_SKIP_BITS(re, &s->gb, 1); \
}
/*
 * ZERO_RUN: advance i over the scan, applying REFINE_BIT to every non-zero
 * coefficient met and counting zero coefficients against run; stops on the
 * zero coefficient reached once run is exhausted. Positions beyond last are
 * not inspected: the remaining run is added to i in one step, and the
 * enclosing function returns -1 if that passes se.
 */
#define ZERO_RUN \
for (; ; i++) { \
    if (i > last) { \
        i += run; \
        if (i > se) { \
            av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i); \
            return -1; \
        } \
        break; \
    } \
    j = s->scantable.permutated[i]; \
    if (block[j]) \
        REFINE_BIT(j) \
    else if (run-- == 0) \
        break; \
}
/**
 * Decode one block of a progressive AC refinement scan: existing non-zero
 * coefficients each receive one correction bit, and newly significant
 * coefficients are set to plus or minus the quantiser scaled by 2^Al.
 *
 * @param s            decoder context; s->gb is the bitstream being read
 * @param block        64 coefficients updated in place
 * @param last_nnz     in/out: highest scan position reached for this block;
 *                     only ever raised
 * @param ac_index     AC Huffman table, s->vlcs[2][ac_index]
 * @param quant_matrix dequantisation factors, indexed like block
 * @param ss           first scan position covered by this scan
 * @param se           last scan position covered by this scan
 * @param Al           successive-approximation bit position being refined
 * @param EOBRUN       in/out: remaining end-of-band run length
 * @return 0 on success, -1 when a zero run passes se (from ZERO_RUN)
 */
static int decode_block_refinement(MJpegDecodeContext *s, int16_t *block,
                                   uint8_t *last_nnz,
                                   int ac_index, int16_t *quant_matrix,
                                   int ss, int se, int Al, int *EOBRUN)
{
    int code, i = ss, j, sign, val, run;
    /* positions above this are treated as zero without being inspected */
    int last = FFMIN(se, *last_nnz);
    OPEN_READER(re, &s->gb);
    if (*EOBRUN) {
        /* inside an end-of-band run: only the correction bits at the bottom
         * of the function are read for this block */
        (*EOBRUN)--;
    } else {
        for (; ; i++) {
            UPDATE_CACHE(re, &s->gb);
            GET_VLC(code, re, &s->gb, s->vlcs[2][ac_index].table, 9, 2);
            if (code & 0xF) {
                /* a coefficient becomes non-zero after 'run' zero positions */
                run = ((unsigned) code) >> 4;
                UPDATE_CACHE(re, &s->gb);
                /* sign bit of the new coefficient: 1 = positive */
                val = SHOW_UBITS(re, &s->gb, 1);
                LAST_SKIP_BITS(re, &s->gb, 1);
                ZERO_RUN;
                j = s->scantable.permutated[i];
                /* val becomes 0 (positive) or -1 (negative) */
                val--;
                block[j] = ((quant_matrix[j]^val) - val) << Al;
                if (i == se) {
                    if (i > *last_nnz)
                        *last_nnz = i;
                    CLOSE_READER(re, &s->gb);
                    return 0;
                }
            } else {
                run = ((unsigned) code) >> 4;
                if (run == 0xF) {
                    /* run of zero positions with no new coefficient */
                    ZERO_RUN;
                } else {
                    /* end-of-band: the run length is 2^run plus 'run' extra
                     * bits; this block counts as the first of the run */
                    val = run;
                    run = (1 << run);
                    if (val) {
                        UPDATE_CACHE(re, &s->gb);
                        run += SHOW_UBITS(re, &s->gb, val);
                        LAST_SKIP_BITS(re, &s->gb, val);
                    }
                    *EOBRUN = run - 1;
                    break;
                }
            }
        }
        if (i > *last_nnz)
            *last_nnz = i;
    }
    /* correction bits for the remaining non-zero coefficients up to last */
    for (; i <= last; i++) {
        j = s->scantable.permutated[i];
        if (block[j])
            REFINE_BIT(j)
    }
    CLOSE_READER(re, &s->gb);
    return 0;
}
#undef REFINE_BIT
#undef ZERO_RUN
  591. static int ljpeg_decode_rgb_scan(MJpegDecodeContext *s, int predictor,
  592. int point_transform)
  593. {
  594. int i, mb_x, mb_y;
  595. uint16_t (*buffer)[4];
  596. int left[3], top[3], topleft[3];
  597. const int linesize = s->linesize[0];
  598. const int mask = (1 << s->bits) - 1;
  599. av_fast_malloc(&s->ljpeg_buffer, &s->ljpeg_buffer_size,
  600. (unsigned)s->mb_width * 4 * sizeof(s->ljpeg_buffer[0][0]));
  601. buffer = s->ljpeg_buffer;
  602. for (i = 0; i < 3; i++)
  603. buffer[0][i] = 1 << (s->bits + point_transform - 1);
  604. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  605. const int modified_predictor = mb_y ? predictor : 1;
  606. uint8_t *ptr = s->picture_ptr->data[0] + (linesize * mb_y);
  607. if (s->interlaced && s->bottom_field)
  608. ptr += linesize >> 1;
  609. for (i = 0; i < 3; i++)
  610. top[i] = left[i] = topleft[i] = buffer[0][i];
  611. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  612. if (s->restart_interval && !s->restart_count)
  613. s->restart_count = s->restart_interval;
  614. for (i = 0; i < 3; i++) {
  615. int pred;
  616. topleft[i] = top[i];
  617. top[i] = buffer[mb_x][i];
  618. PREDICT(pred, topleft[i], top[i], left[i], modified_predictor);
  619. left[i] = buffer[mb_x][i] =
  620. mask & (pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform));
  621. }
  622. if (s->restart_interval && !--s->restart_count) {
  623. align_get_bits(&s->gb);
  624. skip_bits(&s->gb, 16); /* skip RSTn */
  625. }
  626. }
  627. if (s->rct) {
  628. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  629. ptr[4 * mb_x + 1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2] - 0x200) >> 2);
  630. ptr[4 * mb_x + 0] = buffer[mb_x][1] + ptr[4 * mb_x + 1];
  631. ptr[4 * mb_x + 2] = buffer[mb_x][2] + ptr[4 * mb_x + 1];
  632. }
  633. } else if (s->pegasus_rct) {
  634. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  635. ptr[4 * mb_x + 1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2]) >> 2);
  636. ptr[4 * mb_x + 0] = buffer[mb_x][1] + ptr[4 * mb_x + 1];
  637. ptr[4 * mb_x + 2] = buffer[mb_x][2] + ptr[4 * mb_x + 1];
  638. }
  639. } else {
  640. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  641. ptr[4 * mb_x + 0] = buffer[mb_x][2];
  642. ptr[4 * mb_x + 1] = buffer[mb_x][1];
  643. ptr[4 * mb_x + 2] = buffer[mb_x][0];
  644. }
  645. }
  646. }
  647. return 0;
  648. }
  649. static int ljpeg_decode_yuv_scan(MJpegDecodeContext *s, int predictor,
  650. int point_transform, int nb_components)
  651. {
  652. int i, mb_x, mb_y;
  653. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  654. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  655. if (s->restart_interval && !s->restart_count)
  656. s->restart_count = s->restart_interval;
  657. if (mb_x == 0 || mb_y == 0 || s->interlaced) {
  658. for (i = 0; i < nb_components; i++) {
  659. uint8_t *ptr;
  660. int n, h, v, x, y, c, j, linesize;
  661. n = s->nb_blocks[i];
  662. c = s->comp_index[i];
  663. h = s->h_scount[i];
  664. v = s->v_scount[i];
  665. x = 0;
  666. y = 0;
  667. linesize = s->linesize[c];
  668. for (j = 0; j < n; j++) {
  669. int pred;
  670. // FIXME optimize this crap
  671. ptr = s->picture_ptr->data[c] +
  672. (linesize * (v * mb_y + y)) +
  673. (h * mb_x + x);
  674. if (y == 0 && mb_y == 0) {
  675. if (x == 0 && mb_x == 0)
  676. pred = 128 << point_transform;
  677. else
  678. pred = ptr[-1];
  679. } else {
  680. if (x == 0 && mb_x == 0)
  681. pred = ptr[-linesize];
  682. else
  683. PREDICT(pred, ptr[-linesize - 1],
  684. ptr[-linesize], ptr[-1], predictor);
  685. }
  686. if (s->interlaced && s->bottom_field)
  687. ptr += linesize >> 1;
  688. *ptr = pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform);
  689. if (++x == h) {
  690. x = 0;
  691. y++;
  692. }
  693. }
  694. }
  695. } else {
  696. for (i = 0; i < nb_components; i++) {
  697. uint8_t *ptr;
  698. int n, h, v, x, y, c, j, linesize;
  699. n = s->nb_blocks[i];
  700. c = s->comp_index[i];
  701. h = s->h_scount[i];
  702. v = s->v_scount[i];
  703. x = 0;
  704. y = 0;
  705. linesize = s->linesize[c];
  706. for (j = 0; j < n; j++) {
  707. int pred;
  708. // FIXME optimize this crap
  709. ptr = s->picture_ptr->data[c] +
  710. (linesize * (v * mb_y + y)) +
  711. (h * mb_x + x);
  712. PREDICT(pred, ptr[-linesize - 1],
  713. ptr[-linesize], ptr[-1], predictor);
  714. *ptr = pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform);
  715. if (++x == h) {
  716. x = 0;
  717. y++;
  718. }
  719. }
  720. }
  721. }
  722. if (s->restart_interval && !--s->restart_count) {
  723. align_get_bits(&s->gb);
  724. skip_bits(&s->gb, 16); /* skip RSTn */
  725. }
  726. }
  727. }
  728. return 0;
  729. }
  730. static int mjpeg_decode_scan(MJpegDecodeContext *s, int nb_components, int Ah,
  731. int Al, const uint8_t *mb_bitmask,
  732. const AVFrame *reference)
  733. {
  734. int i, mb_x, mb_y;
  735. uint8_t *data[MAX_COMPONENTS];
  736. const uint8_t *reference_data[MAX_COMPONENTS];
  737. int linesize[MAX_COMPONENTS];
  738. GetBitContext mb_bitmask_gb;
  739. if (mb_bitmask)
  740. init_get_bits(&mb_bitmask_gb, mb_bitmask, s->mb_width * s->mb_height);
  741. for (i = 0; i < nb_components; i++) {
  742. int c = s->comp_index[i];
  743. data[c] = s->picture_ptr->data[c];
  744. reference_data[c] = reference ? reference->data[c] : NULL;
  745. linesize[c] = s->linesize[c];
  746. s->coefs_finished[c] |= 1;
  747. }
  748. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  749. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  750. const int copy_mb = mb_bitmask && !get_bits1(&mb_bitmask_gb);
  751. if (s->restart_interval && !s->restart_count)
  752. s->restart_count = s->restart_interval;
  753. if (get_bits_left(&s->gb) < 0) {
  754. av_log(s->avctx, AV_LOG_ERROR, "overread %d\n",
  755. -get_bits_left(&s->gb));
  756. return AVERROR_INVALIDDATA;
  757. }
  758. for (i = 0; i < nb_components; i++) {
  759. uint8_t *ptr;
  760. int n, h, v, x, y, c, j;
  761. int block_offset;
  762. n = s->nb_blocks[i];
  763. c = s->comp_index[i];
  764. h = s->h_scount[i];
  765. v = s->v_scount[i];
  766. x = 0;
  767. y = 0;
  768. for (j = 0; j < n; j++) {
  769. block_offset = ((linesize[c] * (v * mb_y + y) * 8) +
  770. (h * mb_x + x) * 8);
  771. if (s->interlaced && s->bottom_field)
  772. block_offset += linesize[c] >> 1;
  773. ptr = data[c] + block_offset;
  774. if (!s->progressive) {
  775. if (copy_mb)
  776. s->hdsp.put_pixels_tab[1][0](ptr,
  777. reference_data[c] + block_offset,
  778. linesize[c], 8);
  779. else {
  780. s->bdsp.clear_block(s->block);
  781. if (decode_block(s, s->block, i,
  782. s->dc_index[i], s->ac_index[i],
  783. s->quant_matrixes[s->quant_index[c]]) < 0) {
  784. av_log(s->avctx, AV_LOG_ERROR,
  785. "error y=%d x=%d\n", mb_y, mb_x);
  786. return AVERROR_INVALIDDATA;
  787. }
  788. s->idsp.idct_put(ptr, linesize[c], s->block);
  789. }
  790. } else {
  791. int block_idx = s->block_stride[c] * (v * mb_y + y) +
  792. (h * mb_x + x);
  793. int16_t *block = s->blocks[c][block_idx];
  794. if (Ah)
  795. block[0] += get_bits1(&s->gb) *
  796. s->quant_matrixes[s->quant_index[c]][0] << Al;
  797. else if (decode_dc_progressive(s, block, i, s->dc_index[i],
  798. s->quant_matrixes[s->quant_index[c]],
  799. Al) < 0) {
  800. av_log(s->avctx, AV_LOG_ERROR,
  801. "error y=%d x=%d\n", mb_y, mb_x);
  802. return AVERROR_INVALIDDATA;
  803. }
  804. }
  805. av_dlog(s->avctx, "mb: %d %d processed\n", mb_y, mb_x);
  806. av_dlog(s->avctx, "%d %d %d %d %d %d %d %d \n",
  807. mb_x, mb_y, x, y, c, s->bottom_field,
  808. (v * mb_y + y) * 8, (h * mb_x + x) * 8);
  809. if (++x == h) {
  810. x = 0;
  811. y++;
  812. }
  813. }
  814. }
  815. if (s->restart_interval) {
  816. s->restart_count--;
  817. i = 8 + ((-get_bits_count(&s->gb)) & 7);
  818. /* skip RSTn */
  819. if (show_bits(&s->gb, i) == (1 << i) - 1) {
  820. int pos = get_bits_count(&s->gb);
  821. align_get_bits(&s->gb);
  822. while (get_bits_left(&s->gb) >= 8 && show_bits(&s->gb, 8) == 0xFF)
  823. skip_bits(&s->gb, 8);
  824. if ((get_bits(&s->gb, 8) & 0xF8) == 0xD0) {
  825. for (i = 0; i < nb_components; i++) /* reset dc */
  826. s->last_dc[i] = 1024;
  827. } else
  828. skip_bits_long(&s->gb, pos - get_bits_count(&s->gb));
  829. }
  830. }
  831. }
  832. }
  833. return 0;
  834. }
  835. static int mjpeg_decode_scan_progressive_ac(MJpegDecodeContext *s, int ss,
  836. int se, int Ah, int Al,
  837. const uint8_t *mb_bitmask,
  838. const AVFrame *reference)
  839. {
  840. int mb_x, mb_y;
  841. int EOBRUN = 0;
  842. int c = s->comp_index[0];
  843. uint8_t *data = s->picture_ptr->data[c];
  844. const uint8_t *reference_data = reference ? reference->data[c] : NULL;
  845. int linesize = s->linesize[c];
  846. int last_scan = 0;
  847. int16_t *quant_matrix = s->quant_matrixes[s->quant_index[c]];
  848. GetBitContext mb_bitmask_gb;
  849. if (ss < 0 || ss >= 64 ||
  850. se < ss || se >= 64 ||
  851. Ah < 0 || Al < 0)
  852. return AVERROR_INVALIDDATA;
  853. if (mb_bitmask)
  854. init_get_bits(&mb_bitmask_gb, mb_bitmask, s->mb_width * s->mb_height);
  855. if (!Al) {
  856. s->coefs_finished[c] |= (1LL << (se + 1)) - (1LL << ss);
  857. last_scan = !~s->coefs_finished[c];
  858. }
  859. if (s->interlaced && s->bottom_field) {
  860. int offset = linesize >> 1;
  861. data += offset;
  862. reference_data += offset;
  863. }
  864. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  865. int block_offset = mb_y * linesize * 8;
  866. uint8_t *ptr = data + block_offset;
  867. int block_idx = mb_y * s->block_stride[c];
  868. int16_t (*block)[64] = &s->blocks[c][block_idx];
  869. uint8_t *last_nnz = &s->last_nnz[c][block_idx];
  870. for (mb_x = 0; mb_x < s->mb_width; mb_x++, block++, last_nnz++) {
  871. const int copy_mb = mb_bitmask && !get_bits1(&mb_bitmask_gb);
  872. if (!copy_mb) {
  873. int ret;
  874. if (Ah)
  875. ret = decode_block_refinement(s, *block, last_nnz, s->ac_index[0],
  876. quant_matrix, ss, se, Al, &EOBRUN);
  877. else
  878. ret = decode_block_progressive(s, *block, last_nnz, s->ac_index[0],
  879. quant_matrix, ss, se, Al, &EOBRUN);
  880. if (ret < 0) {
  881. av_log(s->avctx, AV_LOG_ERROR,
  882. "error y=%d x=%d\n", mb_y, mb_x);
  883. return AVERROR_INVALIDDATA;
  884. }
  885. }
  886. if (last_scan) {
  887. if (copy_mb) {
  888. s->hdsp.put_pixels_tab[1][0](ptr,
  889. reference_data + block_offset,
  890. linesize, 8);
  891. } else {
  892. s->idsp.idct_put(ptr, linesize, *block);
  893. ptr += 8;
  894. }
  895. }
  896. }
  897. }
  898. return 0;
  899. }
  900. int ff_mjpeg_decode_sos(MJpegDecodeContext *s, const uint8_t *mb_bitmask,
  901. const AVFrame *reference)
  902. {
  903. int len, nb_components, i, h, v, predictor, point_transform;
  904. int index, id, ret;
  905. const int block_size = s->lossless ? 1 : 8;
  906. int ilv, prev_shift;
  907. /* XXX: verify len field validity */
  908. len = get_bits(&s->gb, 16);
  909. nb_components = get_bits(&s->gb, 8);
  910. if (nb_components == 0 || nb_components > MAX_COMPONENTS) {
  911. av_log(s->avctx, AV_LOG_ERROR,
  912. "decode_sos: nb_components (%d) unsupported\n", nb_components);
  913. return AVERROR_PATCHWELCOME;
  914. }
  915. if (len != 6 + 2 * nb_components) {
  916. av_log(s->avctx, AV_LOG_ERROR, "decode_sos: invalid len (%d)\n", len);
  917. return AVERROR_INVALIDDATA;
  918. }
  919. for (i = 0; i < nb_components; i++) {
  920. id = get_bits(&s->gb, 8) - 1;
  921. av_log(s->avctx, AV_LOG_DEBUG, "component: %d\n", id);
  922. /* find component index */
  923. for (index = 0; index < s->nb_components; index++)
  924. if (id == s->component_id[index])
  925. break;
  926. if (index == s->nb_components) {
  927. av_log(s->avctx, AV_LOG_ERROR,
  928. "decode_sos: index(%d) out of components\n", index);
  929. return AVERROR_INVALIDDATA;
  930. }
  931. /* Metasoft MJPEG codec has Cb and Cr swapped */
  932. if (s->avctx->codec_tag == MKTAG('M', 'T', 'S', 'J')
  933. && nb_components == 3 && s->nb_components == 3 && i)
  934. index = 3 - i;
  935. s->comp_index[i] = index;
  936. s->nb_blocks[i] = s->h_count[index] * s->v_count[index];
  937. s->h_scount[i] = s->h_count[index];
  938. s->v_scount[i] = s->v_count[index];
  939. s->dc_index[i] = get_bits(&s->gb, 4);
  940. s->ac_index[i] = get_bits(&s->gb, 4);
  941. if (s->dc_index[i] < 0 || s->ac_index[i] < 0 ||
  942. s->dc_index[i] >= 4 || s->ac_index[i] >= 4)
  943. goto out_of_range;
  944. if (!s->vlcs[0][s->dc_index[i]].table ||
  945. !s->vlcs[1][s->ac_index[i]].table)
  946. goto out_of_range;
  947. }
  948. predictor = get_bits(&s->gb, 8); /* JPEG Ss / lossless JPEG predictor /JPEG-LS NEAR */
  949. ilv = get_bits(&s->gb, 8); /* JPEG Se / JPEG-LS ILV */
  950. prev_shift = get_bits(&s->gb, 4); /* Ah */
  951. point_transform = get_bits(&s->gb, 4); /* Al */
  952. if (nb_components > 1) {
  953. /* interleaved stream */
  954. s->mb_width = (s->width + s->h_max * block_size - 1) / (s->h_max * block_size);
  955. s->mb_height = (s->height + s->v_max * block_size - 1) / (s->v_max * block_size);
  956. } else if (!s->ls) { /* skip this for JPEG-LS */
  957. h = s->h_max / s->h_scount[0];
  958. v = s->v_max / s->v_scount[0];
  959. s->mb_width = (s->width + h * block_size - 1) / (h * block_size);
  960. s->mb_height = (s->height + v * block_size - 1) / (v * block_size);
  961. s->nb_blocks[0] = 1;
  962. s->h_scount[0] = 1;
  963. s->v_scount[0] = 1;
  964. }
  965. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  966. av_log(s->avctx, AV_LOG_DEBUG, "%s %s p:%d >>:%d ilv:%d bits:%d %s\n",
  967. s->lossless ? "lossless" : "sequential DCT", s->rgb ? "RGB" : "",
  968. predictor, point_transform, ilv, s->bits,
  969. s->pegasus_rct ? "PRCT" : (s->rct ? "RCT" : ""));
  970. /* mjpeg-b can have padding bytes between sos and image data, skip them */
  971. for (i = s->mjpb_skiptosod; i > 0; i--)
  972. skip_bits(&s->gb, 8);
  973. next_field:
  974. for (i = 0; i < nb_components; i++)
  975. s->last_dc[i] = 1024;
  976. if (s->lossless) {
  977. if (CONFIG_JPEGLS_DECODER && s->ls) {
  978. // for () {
  979. // reset_ls_coding_parameters(s, 0);
  980. if ((ret = ff_jpegls_decode_picture(s, predictor,
  981. point_transform, ilv)) < 0)
  982. return ret;
  983. } else {
  984. if (s->rgb) {
  985. if ((ret = ljpeg_decode_rgb_scan(s, predictor,
  986. point_transform)) < 0)
  987. return ret;
  988. } else {
  989. if ((ret = ljpeg_decode_yuv_scan(s, predictor,
  990. point_transform,
  991. nb_components)) < 0)
  992. return ret;
  993. }
  994. }
  995. } else {
  996. if (s->progressive && predictor) {
  997. if ((ret = mjpeg_decode_scan_progressive_ac(s, predictor,
  998. ilv, prev_shift,
  999. point_transform,
  1000. mb_bitmask,
  1001. reference)) < 0)
  1002. return ret;
  1003. } else {
  1004. if ((ret = mjpeg_decode_scan(s, nb_components,
  1005. prev_shift, point_transform,
  1006. mb_bitmask, reference)) < 0)
  1007. return ret;
  1008. }
  1009. }
  1010. if (s->interlaced &&
  1011. get_bits_left(&s->gb) > 32 &&
  1012. show_bits(&s->gb, 8) == 0xFF) {
  1013. GetBitContext bak = s->gb;
  1014. align_get_bits(&bak);
  1015. if (show_bits(&bak, 16) == 0xFFD1) {
  1016. av_dlog(s->avctx, "AVRn interlaced picture marker found\n");
  1017. s->gb = bak;
  1018. skip_bits(&s->gb, 16);
  1019. s->bottom_field ^= 1;
  1020. goto next_field;
  1021. }
  1022. }
  1023. emms_c();
  1024. return 0;
  1025. out_of_range:
  1026. av_log(s->avctx, AV_LOG_ERROR, "decode_sos: ac/dc index out of range\n");
  1027. return AVERROR_INVALIDDATA;
  1028. }
  1029. static int mjpeg_decode_dri(MJpegDecodeContext *s)
  1030. {
  1031. if (get_bits(&s->gb, 16) != 4)
  1032. return AVERROR_INVALIDDATA;
  1033. s->restart_interval = get_bits(&s->gb, 16);
  1034. s->restart_count = 0;
  1035. av_log(s->avctx, AV_LOG_DEBUG, "restart interval: %d\n",
  1036. s->restart_interval);
  1037. return 0;
  1038. }
  1039. static int mjpeg_decode_app(MJpegDecodeContext *s)
  1040. {
  1041. int len, id, i;
  1042. len = get_bits(&s->gb, 16);
  1043. if (len < 5)
  1044. return AVERROR_INVALIDDATA;
  1045. if (8 * len > get_bits_left(&s->gb))
  1046. return AVERROR_INVALIDDATA;
  1047. id = get_bits_long(&s->gb, 32);
  1048. id = av_be2ne32(id);
  1049. len -= 6;
  1050. if (s->avctx->debug & FF_DEBUG_STARTCODE)
  1051. av_log(s->avctx, AV_LOG_DEBUG, "APPx %8X\n", id);
  1052. /* Buggy AVID, it puts EOI only at every 10th frame. */
  1053. /* Also, this fourcc is used by non-avid files too, it holds some
  1054. information, but it's always present in AVID-created files. */
  1055. if (id == AV_RL32("AVI1")) {
  1056. /* structure:
  1057. 4bytes AVI1
  1058. 1bytes polarity
  1059. 1bytes always zero
  1060. 4bytes field_size
  1061. 4bytes field_size_less_padding
  1062. */
  1063. s->buggy_avid = 1;
  1064. i = get_bits(&s->gb, 8);
  1065. if (i == 2)
  1066. s->bottom_field = 1;
  1067. else if (i == 1)
  1068. s->bottom_field = 0;
  1069. #if 0
  1070. skip_bits(&s->gb, 8);
  1071. skip_bits(&s->gb, 32);
  1072. skip_bits(&s->gb, 32);
  1073. len -= 10;
  1074. #endif
  1075. goto out;
  1076. }
  1077. // len -= 2;
  1078. if (id == AV_RL32("JFIF")) {
  1079. int t_w, t_h, v1, v2;
  1080. skip_bits(&s->gb, 8); /* the trailing zero-byte */
  1081. v1 = get_bits(&s->gb, 8);
  1082. v2 = get_bits(&s->gb, 8);
  1083. skip_bits(&s->gb, 8);
  1084. s->avctx->sample_aspect_ratio.num = get_bits(&s->gb, 16);
  1085. s->avctx->sample_aspect_ratio.den = get_bits(&s->gb, 16);
  1086. ff_set_sar(s->avctx, s->avctx->sample_aspect_ratio);
  1087. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1088. av_log(s->avctx, AV_LOG_INFO,
  1089. "mjpeg: JFIF header found (version: %x.%x) SAR=%d/%d\n",
  1090. v1, v2,
  1091. s->avctx->sample_aspect_ratio.num,
  1092. s->avctx->sample_aspect_ratio.den);
  1093. t_w = get_bits(&s->gb, 8);
  1094. t_h = get_bits(&s->gb, 8);
  1095. if (t_w && t_h) {
  1096. /* skip thumbnail */
  1097. if (len -10 - (t_w * t_h * 3) > 0)
  1098. len -= t_w * t_h * 3;
  1099. }
  1100. len -= 10;
  1101. goto out;
  1102. }
  1103. if (id == AV_RL32("Adob") && (get_bits(&s->gb, 8) == 'e')) {
  1104. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1105. av_log(s->avctx, AV_LOG_INFO, "mjpeg: Adobe header found\n");
  1106. skip_bits(&s->gb, 16); /* version */
  1107. skip_bits(&s->gb, 16); /* flags0 */
  1108. skip_bits(&s->gb, 16); /* flags1 */
  1109. skip_bits(&s->gb, 8); /* transform */
  1110. len -= 7;
  1111. goto out;
  1112. }
  1113. if (id == AV_RL32("LJIF")) {
  1114. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1115. av_log(s->avctx, AV_LOG_INFO,
  1116. "Pegasus lossless jpeg header found\n");
  1117. skip_bits(&s->gb, 16); /* version ? */
  1118. skip_bits(&s->gb, 16); /* unknwon always 0? */
  1119. skip_bits(&s->gb, 16); /* unknwon always 0? */
  1120. skip_bits(&s->gb, 16); /* unknwon always 0? */
  1121. switch (get_bits(&s->gb, 8)) {
  1122. case 1:
  1123. s->rgb = 1;
  1124. s->pegasus_rct = 0;
  1125. break;
  1126. case 2:
  1127. s->rgb = 1;
  1128. s->pegasus_rct = 1;
  1129. break;
  1130. default:
  1131. av_log(s->avctx, AV_LOG_ERROR, "unknown colorspace\n");
  1132. }
  1133. len -= 9;
  1134. goto out;
  1135. }
  1136. /* Apple MJPEG-A */
  1137. if ((s->start_code == APP1) && (len > (0x28 - 8))) {
  1138. id = get_bits_long(&s->gb, 32);
  1139. id = av_be2ne32(id);
  1140. len -= 4;
  1141. /* Apple MJPEG-A */
  1142. if (id == AV_RL32("mjpg")) {
  1143. #if 0
  1144. skip_bits(&s->gb, 32); /* field size */
  1145. skip_bits(&s->gb, 32); /* pad field size */
  1146. skip_bits(&s->gb, 32); /* next off */
  1147. skip_bits(&s->gb, 32); /* quant off */
  1148. skip_bits(&s->gb, 32); /* huff off */
  1149. skip_bits(&s->gb, 32); /* image off */
  1150. skip_bits(&s->gb, 32); /* scan off */
  1151. skip_bits(&s->gb, 32); /* data off */
  1152. #endif
  1153. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1154. av_log(s->avctx, AV_LOG_INFO, "mjpeg: Apple MJPEG-A header found\n");
  1155. }
  1156. }
  1157. out:
  1158. /* slow but needed for extreme adobe jpegs */
  1159. if (len < 0)
  1160. av_log(s->avctx, AV_LOG_ERROR,
  1161. "mjpeg: error, decode_app parser read over the end\n");
  1162. while (--len > 0)
  1163. skip_bits(&s->gb, 8);
  1164. return 0;
  1165. }
  1166. static int mjpeg_decode_com(MJpegDecodeContext *s)
  1167. {
  1168. int len = get_bits(&s->gb, 16);
  1169. if (len >= 2 && 8 * len - 16 <= get_bits_left(&s->gb)) {
  1170. char *cbuf = av_malloc(len - 1);
  1171. if (cbuf) {
  1172. int i;
  1173. for (i = 0; i < len - 2; i++)
  1174. cbuf[i] = get_bits(&s->gb, 8);
  1175. if (i > 0 && cbuf[i - 1] == '\n')
  1176. cbuf[i - 1] = 0;
  1177. else
  1178. cbuf[i] = 0;
  1179. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1180. av_log(s->avctx, AV_LOG_INFO, "mjpeg comment: '%s'\n", cbuf);
  1181. /* buggy avid, it puts EOI only at every 10th frame */
  1182. if (!strcmp(cbuf, "AVID")) {
  1183. s->buggy_avid = 1;
  1184. } else if (!strcmp(cbuf, "CS=ITU601"))
  1185. s->cs_itu601 = 1;
  1186. else if ((len > 20 && !strncmp(cbuf, "Intel(R) JPEG Library", 21)) ||
  1187. (len > 19 && !strncmp(cbuf, "Metasoft MJPEG Codec", 20)))
  1188. s->flipped = 1;
  1189. av_free(cbuf);
  1190. }
  1191. }
  1192. return 0;
  1193. }
  /**
   * Scan forward for the next marker: an 0xff byte followed by a code in the
   * range 0xc0..0xfe.
   *
   * @param pbuf_ptr in: position to start scanning from; out: the byte after
   *                 the marker code, or the position where scanning stopped
   *                 (buf_end) when no marker was found
   * @param buf_end  one past the last readable byte
   * @return the 8 bit marker code, or -1 if no marker was found
   */
  static int find_marker(const uint8_t **pbuf_ptr, const uint8_t *buf_end)
  {
      const uint8_t *buf_ptr = *pbuf_ptr;
      int val = -1;
  #ifdef DEBUG
      int skipped = 0;
  #endif

      while (buf_ptr < buf_end) {
          const unsigned int v = *buf_ptr++;

          /* Only look at the following byte when it lies inside the buffer;
           * a lone 0xff at the very end cannot start a marker. */
          if (v == 0xff && buf_ptr < buf_end) {
              const unsigned int v2 = *buf_ptr;

              if (v2 >= 0xc0 && v2 <= 0xfe) {
                  val = v2;
                  buf_ptr++;
                  break;
              }
          }
  #ifdef DEBUG
          skipped++;
  #endif
      }

      /* 'skipped' exists only in DEBUG builds, so the trace is guarded too */
  #ifdef DEBUG
      av_dlog(NULL, "find_marker skipped %d bytes\n", skipped);
  #endif
      *pbuf_ptr = buf_ptr;
      return val;
  }
  1222. int ff_mjpeg_find_marker(MJpegDecodeContext *s,
  1223. const uint8_t **buf_ptr, const uint8_t *buf_end,
  1224. const uint8_t **unescaped_buf_ptr,
  1225. int *unescaped_buf_size)
  1226. {
  1227. int start_code;
  1228. start_code = find_marker(buf_ptr, buf_end);
  1229. av_fast_padded_malloc(&s->buffer, &s->buffer_size, buf_end - *buf_ptr);
  1230. if (!s->buffer)
  1231. return AVERROR(ENOMEM);
  1232. /* unescape buffer of SOS, use special treatment for JPEG-LS */
  1233. if (start_code == SOS && !s->ls) {
  1234. const uint8_t *src = *buf_ptr;
  1235. uint8_t *dst = s->buffer;
  1236. while (src < buf_end) {
  1237. uint8_t x = *(src++);
  1238. *(dst++) = x;
  1239. if (s->avctx->codec_id != AV_CODEC_ID_THP) {
  1240. if (x == 0xff) {
  1241. while (src < buf_end && x == 0xff)
  1242. x = *(src++);
  1243. if (x >= 0xd0 && x <= 0xd7)
  1244. *(dst++) = x;
  1245. else if (x)
  1246. break;
  1247. }
  1248. }
  1249. }
  1250. *unescaped_buf_ptr = s->buffer;
  1251. *unescaped_buf_size = dst - s->buffer;
  1252. memset(s->buffer + *unescaped_buf_size, 0,
  1253. FF_INPUT_BUFFER_PADDING_SIZE);
  1254. av_log(s->avctx, AV_LOG_DEBUG, "escaping removed %td bytes\n",
  1255. (buf_end - *buf_ptr) - (dst - s->buffer));
  1256. } else if (start_code == SOS && s->ls) {
  1257. const uint8_t *src = *buf_ptr;
  1258. uint8_t *dst = s->buffer;
  1259. int bit_count = 0;
  1260. int t = 0, b = 0;
  1261. PutBitContext pb;
  1262. s->cur_scan++;
  1263. /* find marker */
  1264. while (src + t < buf_end) {
  1265. uint8_t x = src[t++];
  1266. if (x == 0xff) {
  1267. while ((src + t < buf_end) && x == 0xff)
  1268. x = src[t++];
  1269. if (x & 0x80) {
  1270. t -= 2;
  1271. break;
  1272. }
  1273. }
  1274. }
  1275. bit_count = t * 8;
  1276. init_put_bits(&pb, dst, t);
  1277. /* unescape bitstream */
  1278. while (b < t) {
  1279. uint8_t x = src[b++];
  1280. put_bits(&pb, 8, x);
  1281. if (x == 0xFF) {
  1282. x = src[b++];
  1283. put_bits(&pb, 7, x);
  1284. bit_count--;
  1285. }
  1286. }
  1287. flush_put_bits(&pb);
  1288. *unescaped_buf_ptr = dst;
  1289. *unescaped_buf_size = (bit_count + 7) >> 3;
  1290. memset(s->buffer + *unescaped_buf_size, 0,
  1291. FF_INPUT_BUFFER_PADDING_SIZE);
  1292. } else {
  1293. *unescaped_buf_ptr = *buf_ptr;
  1294. *unescaped_buf_size = buf_end - *buf_ptr;
  1295. }
  1296. return start_code;
  1297. }
  1298. int ff_mjpeg_decode_frame(AVCodecContext *avctx, void *data, int *got_frame,
  1299. AVPacket *avpkt)
  1300. {
  1301. AVFrame *frame = data;
  1302. const uint8_t *buf = avpkt->data;
  1303. int buf_size = avpkt->size;
  1304. MJpegDecodeContext *s = avctx->priv_data;
  1305. const uint8_t *buf_end, *buf_ptr;
  1306. const uint8_t *unescaped_buf_ptr;
  1307. int unescaped_buf_size;
  1308. int start_code;
  1309. int ret = 0;
  1310. s->got_picture = 0; // picture from previous image can not be reused
  1311. buf_ptr = buf;
  1312. buf_end = buf + buf_size;
  1313. while (buf_ptr < buf_end) {
  1314. /* find start next marker */
  1315. start_code = ff_mjpeg_find_marker(s, &buf_ptr, buf_end,
  1316. &unescaped_buf_ptr,
  1317. &unescaped_buf_size);
  1318. /* EOF */
  1319. if (start_code < 0) {
  1320. goto the_end;
  1321. } else if (unescaped_buf_size > INT_MAX / 8) {
  1322. av_log(avctx, AV_LOG_ERROR,
  1323. "MJPEG packet 0x%x too big (%d/%d), corrupt data?\n",
  1324. start_code, unescaped_buf_size, buf_size);
  1325. return AVERROR_INVALIDDATA;
  1326. }
  1327. av_log(avctx, AV_LOG_DEBUG, "marker=%x avail_size_in_buf=%td\n",
  1328. start_code, buf_end - buf_ptr);
  1329. ret = init_get_bits(&s->gb, unescaped_buf_ptr,
  1330. unescaped_buf_size * 8);
  1331. if (ret < 0)
  1332. return ret;
  1333. s->start_code = start_code;
  1334. if (s->avctx->debug & FF_DEBUG_STARTCODE)
  1335. av_log(avctx, AV_LOG_DEBUG, "startcode: %X\n", start_code);
  1336. /* process markers */
  1337. if (start_code >= 0xd0 && start_code <= 0xd7)
  1338. av_log(avctx, AV_LOG_DEBUG,
  1339. "restart marker: %d\n", start_code & 0x0f);
  1340. /* APP fields */
  1341. else if (start_code >= APP0 && start_code <= APP15)
  1342. mjpeg_decode_app(s);
  1343. /* Comment */
  1344. else if (start_code == COM)
  1345. mjpeg_decode_com(s);
  1346. if (!CONFIG_JPEGLS_DECODER &&
  1347. (start_code == SOF48 || start_code == LSE)) {
  1348. av_log(avctx, AV_LOG_ERROR, "JPEG-LS support not enabled.\n");
  1349. return AVERROR(ENOSYS);
  1350. }
  1351. switch (start_code) {
  1352. case SOI:
  1353. s->restart_interval = 0;
  1354. s->restart_count = 0;
  1355. /* nothing to do on SOI */
  1356. break;
  1357. case DQT:
  1358. ff_mjpeg_decode_dqt(s);
  1359. break;
  1360. case DHT:
  1361. if ((ret = ff_mjpeg_decode_dht(s)) < 0) {
  1362. av_log(avctx, AV_LOG_ERROR, "huffman table decode error\n");
  1363. return ret;
  1364. }
  1365. break;
  1366. case SOF0:
  1367. case SOF1:
  1368. s->lossless = 0;
  1369. s->ls = 0;
  1370. s->progressive = 0;
  1371. if ((ret = ff_mjpeg_decode_sof(s)) < 0)
  1372. return ret;
  1373. break;
  1374. case SOF2:
  1375. s->lossless = 0;
  1376. s->ls = 0;
  1377. s->progressive = 1;
  1378. if ((ret = ff_mjpeg_decode_sof(s)) < 0)
  1379. return ret;
  1380. break;
  1381. case SOF3:
  1382. s->lossless = 1;
  1383. s->ls = 0;
  1384. s->progressive = 0;
  1385. if ((ret = ff_mjpeg_decode_sof(s)) < 0)
  1386. return ret;
  1387. break;
  1388. case SOF48:
  1389. s->lossless = 1;
  1390. s->ls = 1;
  1391. s->progressive = 0;
  1392. if ((ret = ff_mjpeg_decode_sof(s)) < 0)
  1393. return ret;
  1394. break;
  1395. case LSE:
  1396. if (!CONFIG_JPEGLS_DECODER ||
  1397. (ret = ff_jpegls_decode_lse(s)) < 0)
  1398. return ret;
  1399. break;
  1400. case EOI:
  1401. s->cur_scan = 0;
  1402. if ((s->buggy_avid && !s->interlaced) || s->restart_interval)
  1403. break;
  1404. eoi_parser:
  1405. if (!s->got_picture) {
  1406. av_log(avctx, AV_LOG_WARNING,
  1407. "Found EOI before any SOF, ignoring\n");
  1408. break;
  1409. }
  1410. if (s->interlaced) {
  1411. s->bottom_field ^= 1;
  1412. /* if not bottom field, do not output image yet */
  1413. if (s->bottom_field == !s->interlace_polarity)
  1414. goto not_the_end;
  1415. }
  1416. if ((ret = av_frame_ref(frame, s->picture_ptr)) < 0)
  1417. return ret;
  1418. if (s->flipped) {
  1419. int i;
  1420. for (i = 0; frame->data[i]; i++) {
  1421. int h = frame->height >> ((i == 1 || i == 2) ?
  1422. s->pix_desc->log2_chroma_h : 0);
  1423. frame->data[i] += frame->linesize[i] * (h - 1);
  1424. frame->linesize[i] *= -1;
  1425. }
  1426. }
  1427. *got_frame = 1;
  1428. if (!s->lossless &&
  1429. avctx->debug & FF_DEBUG_QP) {
  1430. av_log(avctx, AV_LOG_DEBUG,
  1431. "QP: %d\n", FFMAX3(s->qscale[0],
  1432. s->qscale[1],
  1433. s->qscale[2]));
  1434. }
  1435. goto the_end;
  1436. case SOS:
  1437. if (!s->got_picture) {
  1438. av_log(avctx, AV_LOG_WARNING,
  1439. "Can not process SOS before SOF, skipping\n");
  1440. break;
  1441. }
  1442. if ((ret = ff_mjpeg_decode_sos(s, NULL, NULL)) < 0 &&
  1443. (avctx->err_recognition & AV_EF_EXPLODE))
  1444. return ret;
  1445. /* buggy avid puts EOI every 10-20th frame */
  1446. /* if restart period is over process EOI */
  1447. if ((s->buggy_avid && !s->interlaced) || s->restart_interval)
  1448. goto eoi_parser;
  1449. break;
  1450. case DRI:
  1451. mjpeg_decode_dri(s);
  1452. break;
  1453. case SOF5:
  1454. case SOF6:
  1455. case SOF7:
  1456. case SOF9:
  1457. case SOF10:
  1458. case SOF11:
  1459. case SOF13:
  1460. case SOF14:
  1461. case SOF15:
  1462. case JPG:
  1463. av_log(avctx, AV_LOG_ERROR,
  1464. "mjpeg: unsupported coding type (%x)\n", start_code);
  1465. break;
  1466. }
  1467. not_the_end:
  1468. /* eof process start code */
  1469. buf_ptr += (get_bits_count(&s->gb) + 7) / 8;
  1470. av_log(avctx, AV_LOG_DEBUG,
  1471. "marker parser used %d bytes (%d bits)\n",
  1472. (get_bits_count(&s->gb) + 7) / 8, get_bits_count(&s->gb));
  1473. }
  1474. if (s->got_picture) {
  1475. av_log(avctx, AV_LOG_WARNING, "EOI missing, emulating\n");
  1476. goto eoi_parser;
  1477. }
  1478. av_log(avctx, AV_LOG_FATAL, "No JPEG data found in image\n");
  1479. return AVERROR_INVALIDDATA;
  1480. the_end:
  1481. av_log(avctx, AV_LOG_DEBUG, "mjpeg decode frame unused %td bytes\n",
  1482. buf_end - buf_ptr);
  1483. // return buf_end - buf_ptr;
  1484. return buf_ptr - buf;
  1485. }
  1486. av_cold int ff_mjpeg_decode_end(AVCodecContext *avctx)
  1487. {
  1488. MJpegDecodeContext *s = avctx->priv_data;
  1489. int i, j;
  1490. if (s->picture) {
  1491. av_frame_free(&s->picture);
  1492. s->picture_ptr = NULL;
  1493. } else if (s->picture_ptr)
  1494. av_frame_unref(s->picture_ptr);
  1495. av_free(s->buffer);
  1496. av_freep(&s->ljpeg_buffer);
  1497. s->ljpeg_buffer_size = 0;
  1498. for (i = 0; i < 3; i++) {
  1499. for (j = 0; j < 4; j++)
  1500. ff_free_vlc(&s->vlcs[i][j]);
  1501. }
  1502. for (i = 0; i < MAX_COMPONENTS; i++) {
  1503. av_freep(&s->blocks[i]);
  1504. av_freep(&s->last_nnz[i]);
  1505. }
  1506. return 0;
  1507. }
  1508. #define OFFSET(x) offsetof(MJpegDecodeContext, x)
  1509. #define VD AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_DECODING_PARAM
  1510. static const AVOption options[] = {
  1511. { "extern_huff", "Use external huffman table.",
  1512. OFFSET(extern_huff), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, VD },
  1513. { NULL },
  1514. };
  1515. static const AVClass mjpegdec_class = {
  1516. .class_name = "MJPEG decoder",
  1517. .item_name = av_default_item_name,
  1518. .option = options,
  1519. .version = LIBAVUTIL_VERSION_INT,
  1520. };
  1521. AVCodec ff_mjpeg_decoder = {
  1522. .name = "mjpeg",
  1523. .long_name = NULL_IF_CONFIG_SMALL("MJPEG (Motion JPEG)"),
  1524. .type = AVMEDIA_TYPE_VIDEO,
  1525. .id = AV_CODEC_ID_MJPEG,
  1526. .priv_data_size = sizeof(MJpegDecodeContext),
  1527. .init = ff_mjpeg_decode_init,
  1528. .close = ff_mjpeg_decode_end,
  1529. .decode = ff_mjpeg_decode_frame,
  1530. .capabilities = CODEC_CAP_DR1,
  1531. .priv_class = &mjpegdec_class,
  1532. };
  1533. AVCodec ff_thp_decoder = {
  1534. .name = "thp",
  1535. .long_name = NULL_IF_CONFIG_SMALL("Nintendo Gamecube THP video"),
  1536. .type = AVMEDIA_TYPE_VIDEO,
  1537. .id = AV_CODEC_ID_THP,
  1538. .priv_data_size = sizeof(MJpegDecodeContext),
  1539. .init = ff_mjpeg_decode_init,
  1540. .close = ff_mjpeg_decode_end,
  1541. .decode = ff_mjpeg_decode_frame,
  1542. .capabilities = CODEC_CAP_DR1,
  1543. };