You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1760 lines
60KB

  1. /*
  2. * MJPEG decoder
  3. * Copyright (c) 2000, 2001 Fabrice Bellard
  4. * Copyright (c) 2003 Alex Beregszaszi
  5. * Copyright (c) 2003-2004 Michael Niedermayer
  6. *
  7. * Support for external huffman table, various fixes (AVID workaround),
  8. * aspecting, new decode_frame mechanism and apple mjpeg-b support
  9. * by Alex Beregszaszi
  10. *
  11. * This file is part of Libav.
  12. *
  13. * Libav is free software; you can redistribute it and/or
  14. * modify it under the terms of the GNU Lesser General Public
  15. * License as published by the Free Software Foundation; either
  16. * version 2.1 of the License, or (at your option) any later version.
  17. *
  18. * Libav is distributed in the hope that it will be useful,
  19. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  20. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  21. * Lesser General Public License for more details.
  22. *
  23. * You should have received a copy of the GNU Lesser General Public
  24. * License along with Libav; if not, write to the Free Software
  25. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  26. */
  27. /**
  28. * @file
  29. * MJPEG decoder.
  30. */
  31. #include <assert.h>
  32. #include "libavutil/imgutils.h"
  33. #include "libavutil/opt.h"
  34. #include "avcodec.h"
  35. #include "blockdsp.h"
  36. #include "idctdsp.h"
  37. #include "internal.h"
  38. #include "jpegtables.h"
  39. #include "mjpeg.h"
  40. #include "mjpegdec.h"
  41. #include "jpeglsdec.h"
  42. #include "put_bits.h"
  43. static int build_vlc(VLC *vlc, const uint8_t *bits_table,
  44. const uint8_t *val_table, int nb_codes,
  45. int use_static, int is_ac)
  46. {
  47. uint8_t huff_size[256] = { 0 };
  48. uint16_t huff_code[256];
  49. uint16_t huff_sym[256];
  50. int i;
  51. assert(nb_codes <= 256);
  52. ff_mjpeg_build_huffman_codes(huff_size, huff_code, bits_table, val_table);
  53. for (i = 0; i < 256; i++)
  54. huff_sym[i] = i + 16 * is_ac;
  55. if (is_ac)
  56. huff_sym[0] = 16 * 256;
  57. return ff_init_vlc_sparse(vlc, 9, nb_codes, huff_size, 1, 1,
  58. huff_code, 2, 2, huff_sym, 2, 2, use_static);
  59. }
  60. static int build_basic_mjpeg_vlc(MJpegDecodeContext *s)
  61. {
  62. int ret;
  63. if ((ret = build_vlc(&s->vlcs[0][0], avpriv_mjpeg_bits_dc_luminance,
  64. avpriv_mjpeg_val_dc, 12, 0, 0)) < 0)
  65. return ret;
  66. if ((ret = build_vlc(&s->vlcs[0][1], avpriv_mjpeg_bits_dc_chrominance,
  67. avpriv_mjpeg_val_dc, 12, 0, 0)) < 0)
  68. return ret;
  69. if ((ret = build_vlc(&s->vlcs[1][0], avpriv_mjpeg_bits_ac_luminance,
  70. avpriv_mjpeg_val_ac_luminance, 251, 0, 1)) < 0)
  71. return ret;
  72. if ((ret = build_vlc(&s->vlcs[1][1], avpriv_mjpeg_bits_ac_chrominance,
  73. avpriv_mjpeg_val_ac_chrominance, 251, 0, 1)) < 0)
  74. return ret;
  75. if ((ret = build_vlc(&s->vlcs[2][0], avpriv_mjpeg_bits_ac_luminance,
  76. avpriv_mjpeg_val_ac_luminance, 251, 0, 0)) < 0)
  77. return ret;
  78. if ((ret = build_vlc(&s->vlcs[2][1], avpriv_mjpeg_bits_ac_chrominance,
  79. avpriv_mjpeg_val_ac_chrominance, 251, 0, 0)) < 0)
  80. return ret;
  81. return 0;
  82. }
  83. av_cold int ff_mjpeg_decode_init(AVCodecContext *avctx)
  84. {
  85. MJpegDecodeContext *s = avctx->priv_data;
  86. int ret;
  87. if (!s->picture_ptr) {
  88. s->picture = av_frame_alloc();
  89. if (!s->picture)
  90. return AVERROR(ENOMEM);
  91. s->picture_ptr = s->picture;
  92. }
  93. s->avctx = avctx;
  94. ff_blockdsp_init(&s->bdsp);
  95. ff_hpeldsp_init(&s->hdsp, avctx->flags);
  96. ff_idctdsp_init(&s->idsp, avctx);
  97. ff_init_scantable(s->idsp.idct_permutation, &s->scantable,
  98. ff_zigzag_direct);
  99. s->buffer_size = 0;
  100. s->buffer = NULL;
  101. s->start_code = -1;
  102. s->first_picture = 1;
  103. s->org_height = avctx->coded_height;
  104. avctx->chroma_sample_location = AVCHROMA_LOC_CENTER;
  105. avctx->colorspace = AVCOL_SPC_BT470BG;
  106. if ((ret = build_basic_mjpeg_vlc(s)) < 0)
  107. return ret;
  108. if (s->extern_huff) {
  109. av_log(avctx, AV_LOG_INFO, "mjpeg: using external huffman table\n");
  110. if ((ret = init_get_bits(&s->gb, avctx->extradata, avctx->extradata_size * 8)) < 0)
  111. return ret;
  112. if ((ret = ff_mjpeg_decode_dht(s))) {
  113. av_log(avctx, AV_LOG_ERROR,
  114. "mjpeg: error using external huffman table\n");
  115. return ret;
  116. }
  117. }
  118. if (avctx->field_order == AV_FIELD_BB) { /* quicktime icefloe 019 */
  119. s->interlace_polarity = 1; /* bottom field first */
  120. av_log(avctx, AV_LOG_DEBUG, "mjpeg bottom field first\n");
  121. }
  122. if (avctx->codec->id == AV_CODEC_ID_AMV)
  123. s->flipped = 1;
  124. return 0;
  125. }
  126. /* quantize tables */
  127. int ff_mjpeg_decode_dqt(MJpegDecodeContext *s)
  128. {
  129. int len, index, i, j;
  130. len = get_bits(&s->gb, 16) - 2;
  131. while (len >= 65) {
  132. /* only 8-bit precision handled */
  133. if (get_bits(&s->gb, 4) != 0) {
  134. av_log(s->avctx, AV_LOG_ERROR, "dqt: 16-bit precision\n");
  135. return -1;
  136. }
  137. index = get_bits(&s->gb, 4);
  138. if (index >= 4)
  139. return -1;
  140. av_log(s->avctx, AV_LOG_DEBUG, "index=%d\n", index);
  141. /* read quant table */
  142. for (i = 0; i < 64; i++) {
  143. j = s->scantable.permutated[i];
  144. s->quant_matrixes[index][j] = get_bits(&s->gb, 8);
  145. }
  146. // XXX FIXME fine-tune, and perhaps add dc too
  147. s->qscale[index] = FFMAX(s->quant_matrixes[index][s->scantable.permutated[1]],
  148. s->quant_matrixes[index][s->scantable.permutated[8]]) >> 1;
  149. av_log(s->avctx, AV_LOG_DEBUG, "qscale[%d]: %d\n",
  150. index, s->qscale[index]);
  151. len -= 65;
  152. }
  153. return 0;
  154. }
  155. /* decode huffman tables and build VLC decoders */
  156. int ff_mjpeg_decode_dht(MJpegDecodeContext *s)
  157. {
  158. int len, index, i, class, n, v, code_max;
  159. uint8_t bits_table[17];
  160. uint8_t val_table[256];
  161. int ret = 0;
  162. len = get_bits(&s->gb, 16) - 2;
  163. while (len > 0) {
  164. if (len < 17)
  165. return AVERROR_INVALIDDATA;
  166. class = get_bits(&s->gb, 4);
  167. if (class >= 2)
  168. return AVERROR_INVALIDDATA;
  169. index = get_bits(&s->gb, 4);
  170. if (index >= 4)
  171. return AVERROR_INVALIDDATA;
  172. n = 0;
  173. for (i = 1; i <= 16; i++) {
  174. bits_table[i] = get_bits(&s->gb, 8);
  175. n += bits_table[i];
  176. }
  177. len -= 17;
  178. if (len < n || n > 256)
  179. return AVERROR_INVALIDDATA;
  180. code_max = 0;
  181. for (i = 0; i < n; i++) {
  182. v = get_bits(&s->gb, 8);
  183. if (v > code_max)
  184. code_max = v;
  185. val_table[i] = v;
  186. }
  187. len -= n;
  188. /* build VLC and flush previous vlc if present */
  189. ff_free_vlc(&s->vlcs[class][index]);
  190. av_log(s->avctx, AV_LOG_DEBUG, "class=%d index=%d nb_codes=%d\n",
  191. class, index, code_max + 1);
  192. if ((ret = build_vlc(&s->vlcs[class][index], bits_table, val_table,
  193. code_max + 1, 0, class > 0)) < 0)
  194. return ret;
  195. if (class > 0) {
  196. ff_free_vlc(&s->vlcs[2][index]);
  197. if ((ret = build_vlc(&s->vlcs[2][index], bits_table, val_table,
  198. code_max + 1, 0, 0)) < 0)
  199. return ret;
  200. }
  201. }
  202. return 0;
  203. }
  204. int ff_mjpeg_decode_sof(MJpegDecodeContext *s)
  205. {
  206. int h_count[MAX_COMPONENTS] = { 0 };
  207. int v_count[MAX_COMPONENTS] = { 0 };
  208. int len, nb_components, i, width, height, bits, pix_fmt_id, ret;
  209. /* XXX: verify len field validity */
  210. len = get_bits(&s->gb, 16);
  211. bits = get_bits(&s->gb, 8);
  212. if (s->pegasus_rct)
  213. bits = 9;
  214. if (bits == 9 && !s->pegasus_rct)
  215. s->rct = 1; // FIXME ugly
  216. if (bits != 8 && !s->lossless) {
  217. av_log(s->avctx, AV_LOG_ERROR, "only 8 bits/component accepted\n");
  218. return -1;
  219. }
  220. height = get_bits(&s->gb, 16);
  221. width = get_bits(&s->gb, 16);
  222. // HACK for odd_height.mov
  223. if (s->interlaced && s->width == width && s->height == height + 1)
  224. height= s->height;
  225. av_log(s->avctx, AV_LOG_DEBUG, "sof0: picture: %dx%d\n", width, height);
  226. if (av_image_check_size(width, height, 0, s->avctx) < 0)
  227. return AVERROR_INVALIDDATA;
  228. nb_components = get_bits(&s->gb, 8);
  229. if (nb_components <= 0 ||
  230. nb_components > MAX_COMPONENTS)
  231. return -1;
  232. if (s->interlaced && (s->bottom_field == !s->interlace_polarity)) {
  233. if (nb_components != s->nb_components) {
  234. av_log(s->avctx, AV_LOG_ERROR,
  235. "nb_components changing in interlaced picture\n");
  236. return AVERROR_INVALIDDATA;
  237. }
  238. }
  239. if (s->ls && !(bits <= 8 || nb_components == 1)) {
  240. avpriv_report_missing_feature(s->avctx,
  241. "JPEG-LS that is not <= 8 "
  242. "bits/component or 16-bit gray");
  243. return AVERROR_PATCHWELCOME;
  244. }
  245. s->nb_components = nb_components;
  246. s->h_max = 1;
  247. s->v_max = 1;
  248. for (i = 0; i < nb_components; i++) {
  249. /* component id */
  250. s->component_id[i] = get_bits(&s->gb, 8) - 1;
  251. h_count[i] = get_bits(&s->gb, 4);
  252. v_count[i] = get_bits(&s->gb, 4);
  253. /* compute hmax and vmax (only used in interleaved case) */
  254. if (h_count[i] > s->h_max)
  255. s->h_max = h_count[i];
  256. if (v_count[i] > s->v_max)
  257. s->v_max = v_count[i];
  258. s->quant_index[i] = get_bits(&s->gb, 8);
  259. if (s->quant_index[i] >= 4)
  260. return AVERROR_INVALIDDATA;
  261. if (!h_count[i] || !v_count[i]) {
  262. av_log(s->avctx, AV_LOG_ERROR,
  263. "Invalid sampling factor in component %d %d:%d\n",
  264. i, h_count[i], v_count[i]);
  265. return AVERROR_INVALIDDATA;
  266. }
  267. av_log(s->avctx, AV_LOG_DEBUG, "component %d %d:%d id: %d quant:%d\n",
  268. i, h_count[i], v_count[i],
  269. s->component_id[i], s->quant_index[i]);
  270. }
  271. if (s->ls && (s->h_max > 1 || s->v_max > 1)) {
  272. avpriv_report_missing_feature(s->avctx, "Subsampling in JPEG-LS");
  273. return AVERROR_PATCHWELCOME;
  274. }
  275. if (s->v_max == 1 && s->h_max == 1 && s->lossless == 1)
  276. s->rgb = 1;
  277. /* if different size, realloc/alloc picture */
  278. if (width != s->width || height != s->height || bits != s->bits ||
  279. memcmp(s->h_count, h_count, sizeof(h_count)) ||
  280. memcmp(s->v_count, v_count, sizeof(v_count))) {
  281. s->width = width;
  282. s->height = height;
  283. s->bits = bits;
  284. memcpy(s->h_count, h_count, sizeof(h_count));
  285. memcpy(s->v_count, v_count, sizeof(v_count));
  286. s->interlaced = 0;
  287. /* test interlaced mode */
  288. if (s->first_picture &&
  289. s->org_height != 0 &&
  290. s->height < ((s->org_height * 3) / 4)) {
  291. s->interlaced = 1;
  292. s->bottom_field = s->interlace_polarity;
  293. s->picture_ptr->interlaced_frame = 1;
  294. s->picture_ptr->top_field_first = !s->interlace_polarity;
  295. height *= 2;
  296. }
  297. ret = ff_set_dimensions(s->avctx, width, height);
  298. if (ret < 0)
  299. return ret;
  300. s->first_picture = 0;
  301. }
  302. if (!(s->interlaced && (s->bottom_field == !s->interlace_polarity))) {
  303. /* XXX: not complete test ! */
  304. pix_fmt_id = (s->h_count[0] << 28) | (s->v_count[0] << 24) |
  305. (s->h_count[1] << 20) | (s->v_count[1] << 16) |
  306. (s->h_count[2] << 12) | (s->v_count[2] << 8) |
  307. (s->h_count[3] << 4) | s->v_count[3];
  308. av_log(s->avctx, AV_LOG_DEBUG, "pix fmt id %x\n", pix_fmt_id);
  309. /* NOTE we do not allocate pictures large enough for the possible
  310. * padding of h/v_count being 4 */
  311. if (!(pix_fmt_id & 0xD0D0D0D0))
  312. pix_fmt_id -= (pix_fmt_id & 0xF0F0F0F0) >> 1;
  313. if (!(pix_fmt_id & 0x0D0D0D0D))
  314. pix_fmt_id -= (pix_fmt_id & 0x0F0F0F0F) >> 1;
  315. switch (pix_fmt_id) {
  316. case 0x11111100:
  317. if (s->rgb)
  318. s->avctx->pix_fmt = AV_PIX_FMT_BGRA;
  319. else {
  320. s->avctx->pix_fmt = s->cs_itu601 ? AV_PIX_FMT_YUV444P : AV_PIX_FMT_YUVJ444P;
  321. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  322. }
  323. assert(s->nb_components == 3);
  324. break;
  325. case 0x11000000:
  326. s->avctx->pix_fmt = AV_PIX_FMT_GRAY8;
  327. break;
  328. case 0x12111100:
  329. s->avctx->pix_fmt = s->cs_itu601 ? AV_PIX_FMT_YUV440P : AV_PIX_FMT_YUVJ440P;
  330. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  331. break;
  332. case 0x21111100:
  333. s->avctx->pix_fmt = s->cs_itu601 ? AV_PIX_FMT_YUV422P : AV_PIX_FMT_YUVJ422P;
  334. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  335. break;
  336. case 0x22111100:
  337. s->avctx->pix_fmt = s->cs_itu601 ? AV_PIX_FMT_YUV420P : AV_PIX_FMT_YUVJ420P;
  338. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  339. break;
  340. default:
  341. avpriv_report_missing_feature(s->avctx, "Pixel format 0x%x", pix_fmt_id);
  342. return AVERROR_PATCHWELCOME;
  343. }
  344. if (s->ls) {
  345. if (s->nb_components > 1)
  346. s->avctx->pix_fmt = AV_PIX_FMT_RGB24;
  347. else if (s->bits <= 8)
  348. s->avctx->pix_fmt = AV_PIX_FMT_GRAY8;
  349. else
  350. s->avctx->pix_fmt = AV_PIX_FMT_GRAY16;
  351. }
  352. s->pix_desc = av_pix_fmt_desc_get(s->avctx->pix_fmt);
  353. if (!s->pix_desc) {
  354. av_log(s->avctx, AV_LOG_ERROR, "Could not get a pixel format descriptor.\n");
  355. return AVERROR_BUG;
  356. }
  357. av_frame_unref(s->picture_ptr);
  358. if (ff_get_buffer(s->avctx, s->picture_ptr, AV_GET_BUFFER_FLAG_REF) < 0) {
  359. av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed\n");
  360. return -1;
  361. }
  362. s->picture_ptr->pict_type = AV_PICTURE_TYPE_I;
  363. s->picture_ptr->key_frame = 1;
  364. s->got_picture = 1;
  365. for (i = 0; i < 3; i++)
  366. s->linesize[i] = s->picture_ptr->linesize[i] << s->interlaced;
  367. ff_dlog(s->avctx, "%d %d %d %d %d %d\n",
  368. s->width, s->height, s->linesize[0], s->linesize[1],
  369. s->interlaced, s->avctx->height);
  370. if (len != (8 + (3 * nb_components)))
  371. av_log(s->avctx, AV_LOG_DEBUG, "decode_sof0: error, len(%d) mismatch\n", len);
  372. }
  373. /* totally blank picture as progressive JPEG will only add details to it */
  374. if (s->progressive) {
  375. int bw = (width + s->h_max * 8 - 1) / (s->h_max * 8);
  376. int bh = (height + s->v_max * 8 - 1) / (s->v_max * 8);
  377. for (i = 0; i < s->nb_components; i++) {
  378. int size = bw * bh * s->h_count[i] * s->v_count[i];
  379. av_freep(&s->blocks[i]);
  380. av_freep(&s->last_nnz[i]);
  381. s->blocks[i] = av_malloc(size * sizeof(**s->blocks));
  382. s->last_nnz[i] = av_mallocz(size * sizeof(**s->last_nnz));
  383. s->block_stride[i] = bw * s->h_count[i];
  384. }
  385. memset(s->coefs_finished, 0, sizeof(s->coefs_finished));
  386. }
  387. return 0;
  388. }
  389. static inline int mjpeg_decode_dc(MJpegDecodeContext *s, int dc_index)
  390. {
  391. int code;
  392. code = get_vlc2(&s->gb, s->vlcs[0][dc_index].table, 9, 2);
  393. if (code < 0) {
  394. av_log(s->avctx, AV_LOG_WARNING,
  395. "mjpeg_decode_dc: bad vlc: %d:%d (%p)\n",
  396. 0, dc_index, &s->vlcs[0][dc_index]);
  397. return 0xffff;
  398. }
  399. if (code)
  400. return get_xbits(&s->gb, code);
  401. else
  402. return 0;
  403. }
  404. /* decode block and dequantize */
  405. static int decode_block(MJpegDecodeContext *s, int16_t *block, int component,
  406. int dc_index, int ac_index, int16_t *quant_matrix)
  407. {
  408. int code, i, j, level, val;
  409. /* DC coef */
  410. val = mjpeg_decode_dc(s, dc_index);
  411. if (val == 0xffff) {
  412. av_log(s->avctx, AV_LOG_ERROR, "error dc\n");
  413. return AVERROR_INVALIDDATA;
  414. }
  415. val = val * quant_matrix[0] + s->last_dc[component];
  416. s->last_dc[component] = val;
  417. block[0] = val;
  418. /* AC coefs */
  419. i = 0;
  420. {OPEN_READER(re, &s->gb);
  421. do {
  422. UPDATE_CACHE(re, &s->gb);
  423. GET_VLC(code, re, &s->gb, s->vlcs[1][ac_index].table, 9, 2);
  424. i += ((unsigned)code) >> 4;
  425. code &= 0xf;
  426. if (code) {
  427. if (code > MIN_CACHE_BITS - 16)
  428. UPDATE_CACHE(re, &s->gb);
  429. {
  430. int cache = GET_CACHE(re, &s->gb);
  431. int sign = (~cache) >> 31;
  432. level = (NEG_USR32(sign ^ cache,code) ^ sign) - sign;
  433. }
  434. LAST_SKIP_BITS(re, &s->gb, code);
  435. if (i > 63) {
  436. av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);
  437. return AVERROR_INVALIDDATA;
  438. }
  439. j = s->scantable.permutated[i];
  440. block[j] = level * quant_matrix[j];
  441. }
  442. } while (i < 63);
  443. CLOSE_READER(re, &s->gb);}
  444. return 0;
  445. }
  446. static int decode_dc_progressive(MJpegDecodeContext *s, int16_t *block,
  447. int component, int dc_index,
  448. int16_t *quant_matrix, int Al)
  449. {
  450. int val;
  451. s->bdsp.clear_block(block);
  452. val = mjpeg_decode_dc(s, dc_index);
  453. if (val == 0xffff) {
  454. av_log(s->avctx, AV_LOG_ERROR, "error dc\n");
  455. return AVERROR_INVALIDDATA;
  456. }
  457. val = (val * quant_matrix[0] << Al) + s->last_dc[component];
  458. s->last_dc[component] = val;
  459. block[0] = val;
  460. return 0;
  461. }
  462. /* decode block and dequantize - progressive JPEG version */
  463. static int decode_block_progressive(MJpegDecodeContext *s, int16_t *block,
  464. uint8_t *last_nnz, int ac_index,
  465. int16_t *quant_matrix,
  466. int ss, int se, int Al, int *EOBRUN)
  467. {
  468. int code, i, j, level, val, run;
  469. if (*EOBRUN) {
  470. (*EOBRUN)--;
  471. return 0;
  472. }
  473. {
  474. OPEN_READER(re, &s->gb);
  475. for (i = ss; ; i++) {
  476. UPDATE_CACHE(re, &s->gb);
  477. GET_VLC(code, re, &s->gb, s->vlcs[2][ac_index].table, 9, 2);
  478. run = ((unsigned) code) >> 4;
  479. code &= 0xF;
  480. if (code) {
  481. i += run;
  482. if (code > MIN_CACHE_BITS - 16)
  483. UPDATE_CACHE(re, &s->gb);
  484. {
  485. int cache = GET_CACHE(re, &s->gb);
  486. int sign = (~cache) >> 31;
  487. level = (NEG_USR32(sign ^ cache,code) ^ sign) - sign;
  488. }
  489. LAST_SKIP_BITS(re, &s->gb, code);
  490. if (i >= se) {
  491. if (i == se) {
  492. j = s->scantable.permutated[se];
  493. block[j] = level * quant_matrix[j] << Al;
  494. break;
  495. }
  496. av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);
  497. return AVERROR_INVALIDDATA;
  498. }
  499. j = s->scantable.permutated[i];
  500. block[j] = level * quant_matrix[j] << Al;
  501. } else {
  502. if (run == 0xF) {// ZRL - skip 15 coefficients
  503. i += 15;
  504. if (i >= se) {
  505. av_log(s->avctx, AV_LOG_ERROR, "ZRL overflow: %d\n", i);
  506. return AVERROR_INVALIDDATA;
  507. }
  508. } else {
  509. val = (1 << run);
  510. if (run) {
  511. UPDATE_CACHE(re, &s->gb);
  512. val += NEG_USR32(GET_CACHE(re, &s->gb), run);
  513. LAST_SKIP_BITS(re, &s->gb, run);
  514. }
  515. *EOBRUN = val - 1;
  516. break;
  517. }
  518. }
  519. }
  520. CLOSE_READER(re, &s->gb);
  521. }
  522. if (i > *last_nnz)
  523. *last_nnz = i;
  524. return 0;
  525. }
  526. #define REFINE_BIT(j) { \
  527. UPDATE_CACHE(re, &s->gb); \
  528. sign = block[j] >> 15; \
  529. block[j] += SHOW_UBITS(re, &s->gb, 1) * \
  530. ((quant_matrix[j] ^ sign) - sign) << Al; \
  531. LAST_SKIP_BITS(re, &s->gb, 1); \
  532. }
  533. #define ZERO_RUN \
  534. for (; ; i++) { \
  535. if (i > last) { \
  536. i += run; \
  537. if (i > se) { \
  538. av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i); \
  539. return -1; \
  540. } \
  541. break; \
  542. } \
  543. j = s->scantable.permutated[i]; \
  544. if (block[j]) \
  545. REFINE_BIT(j) \
  546. else if (run-- == 0) \
  547. break; \
  548. }
  549. /* decode block and dequantize - progressive JPEG refinement pass */
  550. static int decode_block_refinement(MJpegDecodeContext *s, int16_t *block,
  551. uint8_t *last_nnz,
  552. int ac_index, int16_t *quant_matrix,
  553. int ss, int se, int Al, int *EOBRUN)
  554. {
  555. int code, i = ss, j, sign, val, run;
  556. int last = FFMIN(se, *last_nnz);
  557. OPEN_READER(re, &s->gb);
  558. if (*EOBRUN) {
  559. (*EOBRUN)--;
  560. } else {
  561. for (; ; i++) {
  562. UPDATE_CACHE(re, &s->gb);
  563. GET_VLC(code, re, &s->gb, s->vlcs[2][ac_index].table, 9, 2);
  564. if (code & 0xF) {
  565. run = ((unsigned) code) >> 4;
  566. UPDATE_CACHE(re, &s->gb);
  567. val = SHOW_UBITS(re, &s->gb, 1);
  568. LAST_SKIP_BITS(re, &s->gb, 1);
  569. ZERO_RUN;
  570. j = s->scantable.permutated[i];
  571. val--;
  572. block[j] = ((quant_matrix[j]^val) - val) << Al;
  573. if (i == se) {
  574. if (i > *last_nnz)
  575. *last_nnz = i;
  576. CLOSE_READER(re, &s->gb);
  577. return 0;
  578. }
  579. } else {
  580. run = ((unsigned) code) >> 4;
  581. if (run == 0xF) {
  582. ZERO_RUN;
  583. } else {
  584. val = run;
  585. run = (1 << run);
  586. if (val) {
  587. UPDATE_CACHE(re, &s->gb);
  588. run += SHOW_UBITS(re, &s->gb, val);
  589. LAST_SKIP_BITS(re, &s->gb, val);
  590. }
  591. *EOBRUN = run - 1;
  592. break;
  593. }
  594. }
  595. }
  596. if (i > *last_nnz)
  597. *last_nnz = i;
  598. }
  599. for (; i <= last; i++) {
  600. j = s->scantable.permutated[i];
  601. if (block[j])
  602. REFINE_BIT(j)
  603. }
  604. CLOSE_READER(re, &s->gb);
  605. return 0;
  606. }
  607. #undef REFINE_BIT
  608. #undef ZERO_RUN
  609. static int ljpeg_decode_rgb_scan(MJpegDecodeContext *s, int predictor,
  610. int point_transform)
  611. {
  612. int i, mb_x, mb_y;
  613. uint16_t (*buffer)[4];
  614. int left[3], top[3], topleft[3];
  615. const int linesize = s->linesize[0];
  616. const int mask = (1 << s->bits) - 1;
  617. av_fast_malloc(&s->ljpeg_buffer, &s->ljpeg_buffer_size,
  618. (unsigned)s->mb_width * 4 * sizeof(s->ljpeg_buffer[0][0]));
  619. if (!s->ljpeg_buffer)
  620. return AVERROR(ENOMEM);
  621. buffer = s->ljpeg_buffer;
  622. for (i = 0; i < 3; i++)
  623. buffer[0][i] = 1 << (s->bits + point_transform - 1);
  624. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  625. const int modified_predictor = mb_y ? predictor : 1;
  626. uint8_t *ptr = s->picture_ptr->data[0] + (linesize * mb_y);
  627. if (s->interlaced && s->bottom_field)
  628. ptr += linesize >> 1;
  629. for (i = 0; i < 3; i++)
  630. top[i] = left[i] = topleft[i] = buffer[0][i];
  631. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  632. if (s->restart_interval && !s->restart_count)
  633. s->restart_count = s->restart_interval;
  634. for (i = 0; i < 3; i++) {
  635. int pred;
  636. topleft[i] = top[i];
  637. top[i] = buffer[mb_x][i];
  638. PREDICT(pred, topleft[i], top[i], left[i], modified_predictor);
  639. left[i] = buffer[mb_x][i] =
  640. mask & (pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform));
  641. }
  642. if (s->restart_interval && !--s->restart_count) {
  643. align_get_bits(&s->gb);
  644. skip_bits(&s->gb, 16); /* skip RSTn */
  645. }
  646. }
  647. if (s->rct) {
  648. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  649. ptr[4 * mb_x + 1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2] - 0x200) >> 2);
  650. ptr[4 * mb_x + 0] = buffer[mb_x][1] + ptr[4 * mb_x + 1];
  651. ptr[4 * mb_x + 2] = buffer[mb_x][2] + ptr[4 * mb_x + 1];
  652. }
  653. } else if (s->pegasus_rct) {
  654. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  655. ptr[4 * mb_x + 1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2]) >> 2);
  656. ptr[4 * mb_x + 0] = buffer[mb_x][1] + ptr[4 * mb_x + 1];
  657. ptr[4 * mb_x + 2] = buffer[mb_x][2] + ptr[4 * mb_x + 1];
  658. }
  659. } else {
  660. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  661. ptr[4 * mb_x + 0] = buffer[mb_x][2];
  662. ptr[4 * mb_x + 1] = buffer[mb_x][1];
  663. ptr[4 * mb_x + 2] = buffer[mb_x][0];
  664. }
  665. }
  666. }
  667. return 0;
  668. }
  669. static int ljpeg_decode_yuv_scan(MJpegDecodeContext *s, int predictor,
  670. int point_transform, int nb_components)
  671. {
  672. int i, mb_x, mb_y;
  673. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  674. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  675. if (s->restart_interval && !s->restart_count)
  676. s->restart_count = s->restart_interval;
  677. if (mb_x == 0 || mb_y == 0 || s->interlaced) {
  678. for (i = 0; i < nb_components; i++) {
  679. uint8_t *ptr;
  680. int n, h, v, x, y, c, j, linesize;
  681. n = s->nb_blocks[i];
  682. c = s->comp_index[i];
  683. h = s->h_scount[i];
  684. v = s->v_scount[i];
  685. x = 0;
  686. y = 0;
  687. linesize = s->linesize[c];
  688. for (j = 0; j < n; j++) {
  689. int pred;
  690. // FIXME optimize this crap
  691. ptr = s->picture_ptr->data[c] +
  692. (linesize * (v * mb_y + y)) +
  693. (h * mb_x + x);
  694. if (y == 0 && mb_y == 0) {
  695. if (x == 0 && mb_x == 0)
  696. pred = 128 << point_transform;
  697. else
  698. pred = ptr[-1];
  699. } else {
  700. if (x == 0 && mb_x == 0)
  701. pred = ptr[-linesize];
  702. else
  703. PREDICT(pred, ptr[-linesize - 1],
  704. ptr[-linesize], ptr[-1], predictor);
  705. }
  706. if (s->interlaced && s->bottom_field)
  707. ptr += linesize >> 1;
  708. *ptr = pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform);
  709. if (++x == h) {
  710. x = 0;
  711. y++;
  712. }
  713. }
  714. }
  715. } else {
  716. for (i = 0; i < nb_components; i++) {
  717. uint8_t *ptr;
  718. int n, h, v, x, y, c, j, linesize;
  719. n = s->nb_blocks[i];
  720. c = s->comp_index[i];
  721. h = s->h_scount[i];
  722. v = s->v_scount[i];
  723. x = 0;
  724. y = 0;
  725. linesize = s->linesize[c];
  726. for (j = 0; j < n; j++) {
  727. int pred;
  728. // FIXME optimize this crap
  729. ptr = s->picture_ptr->data[c] +
  730. (linesize * (v * mb_y + y)) +
  731. (h * mb_x + x);
  732. PREDICT(pred, ptr[-linesize - 1],
  733. ptr[-linesize], ptr[-1], predictor);
  734. *ptr = pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform);
  735. if (++x == h) {
  736. x = 0;
  737. y++;
  738. }
  739. }
  740. }
  741. }
  742. if (s->restart_interval && !--s->restart_count) {
  743. align_get_bits(&s->gb);
  744. skip_bits(&s->gb, 16); /* skip RSTn */
  745. }
  746. }
  747. }
  748. return 0;
  749. }
  750. static int mjpeg_decode_scan(MJpegDecodeContext *s, int nb_components, int Ah,
  751. int Al, const uint8_t *mb_bitmask,
  752. const AVFrame *reference)
  753. {
  754. int i, mb_x, mb_y;
  755. uint8_t *data[MAX_COMPONENTS];
  756. const uint8_t *reference_data[MAX_COMPONENTS];
  757. int linesize[MAX_COMPONENTS];
  758. GetBitContext mb_bitmask_gb;
  759. if (mb_bitmask)
  760. init_get_bits(&mb_bitmask_gb, mb_bitmask, s->mb_width * s->mb_height);
  761. for (i = 0; i < nb_components; i++) {
  762. int c = s->comp_index[i];
  763. data[c] = s->picture_ptr->data[c];
  764. reference_data[c] = reference ? reference->data[c] : NULL;
  765. linesize[c] = s->linesize[c];
  766. s->coefs_finished[c] |= 1;
  767. }
  768. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  769. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  770. const int copy_mb = mb_bitmask && !get_bits1(&mb_bitmask_gb);
  771. if (s->restart_interval && !s->restart_count)
  772. s->restart_count = s->restart_interval;
  773. if (get_bits_left(&s->gb) < 0) {
  774. av_log(s->avctx, AV_LOG_ERROR, "overread %d\n",
  775. -get_bits_left(&s->gb));
  776. return AVERROR_INVALIDDATA;
  777. }
  778. for (i = 0; i < nb_components; i++) {
  779. uint8_t *ptr;
  780. int n, h, v, x, y, c, j;
  781. int block_offset;
  782. n = s->nb_blocks[i];
  783. c = s->comp_index[i];
  784. h = s->h_scount[i];
  785. v = s->v_scount[i];
  786. x = 0;
  787. y = 0;
  788. for (j = 0; j < n; j++) {
  789. block_offset = ((linesize[c] * (v * mb_y + y) * 8) +
  790. (h * mb_x + x) * 8);
  791. if (s->interlaced && s->bottom_field)
  792. block_offset += linesize[c] >> 1;
  793. ptr = data[c] + block_offset;
  794. if (!s->progressive) {
  795. if (copy_mb)
  796. s->hdsp.put_pixels_tab[1][0](ptr,
  797. reference_data[c] + block_offset,
  798. linesize[c], 8);
  799. else {
  800. s->bdsp.clear_block(s->block);
  801. if (decode_block(s, s->block, i,
  802. s->dc_index[i], s->ac_index[i],
  803. s->quant_matrixes[s->quant_index[c]]) < 0) {
  804. av_log(s->avctx, AV_LOG_ERROR,
  805. "error y=%d x=%d\n", mb_y, mb_x);
  806. return AVERROR_INVALIDDATA;
  807. }
  808. s->idsp.idct_put(ptr, linesize[c], s->block);
  809. }
  810. } else {
  811. int block_idx = s->block_stride[c] * (v * mb_y + y) +
  812. (h * mb_x + x);
  813. int16_t *block = s->blocks[c][block_idx];
  814. if (Ah)
  815. block[0] += get_bits1(&s->gb) *
  816. s->quant_matrixes[s->quant_index[c]][0] << Al;
  817. else if (decode_dc_progressive(s, block, i, s->dc_index[i],
  818. s->quant_matrixes[s->quant_index[c]],
  819. Al) < 0) {
  820. av_log(s->avctx, AV_LOG_ERROR,
  821. "error y=%d x=%d\n", mb_y, mb_x);
  822. return AVERROR_INVALIDDATA;
  823. }
  824. }
  825. ff_dlog(s->avctx, "mb: %d %d processed\n", mb_y, mb_x);
  826. ff_dlog(s->avctx, "%d %d %d %d %d %d %d %d \n",
  827. mb_x, mb_y, x, y, c, s->bottom_field,
  828. (v * mb_y + y) * 8, (h * mb_x + x) * 8);
  829. if (++x == h) {
  830. x = 0;
  831. y++;
  832. }
  833. }
  834. }
  835. if (s->restart_interval) {
  836. s->restart_count--;
  837. i = 8 + ((-get_bits_count(&s->gb)) & 7);
  838. /* skip RSTn */
  839. if (show_bits(&s->gb, i) == (1 << i) - 1) {
  840. int pos = get_bits_count(&s->gb);
  841. align_get_bits(&s->gb);
  842. while (get_bits_left(&s->gb) >= 8 && show_bits(&s->gb, 8) == 0xFF)
  843. skip_bits(&s->gb, 8);
  844. if ((get_bits(&s->gb, 8) & 0xF8) == 0xD0) {
  845. for (i = 0; i < nb_components; i++) /* reset dc */
  846. s->last_dc[i] = 1024;
  847. } else
  848. skip_bits_long(&s->gb, pos - get_bits_count(&s->gb));
  849. }
  850. }
  851. }
  852. }
  853. return 0;
  854. }
  855. static int mjpeg_decode_scan_progressive_ac(MJpegDecodeContext *s, int ss,
  856. int se, int Ah, int Al,
  857. const uint8_t *mb_bitmask,
  858. const AVFrame *reference)
  859. {
  860. int mb_x, mb_y;
  861. int EOBRUN = 0;
  862. int c = s->comp_index[0];
  863. uint8_t *data = s->picture_ptr->data[c];
  864. const uint8_t *reference_data = reference ? reference->data[c] : NULL;
  865. int linesize = s->linesize[c];
  866. int last_scan = 0;
  867. int16_t *quant_matrix = s->quant_matrixes[s->quant_index[c]];
  868. GetBitContext mb_bitmask_gb;
  869. if (ss < 0 || ss >= 64 ||
  870. se < ss || se >= 64 ||
  871. Ah < 0 || Al < 0)
  872. return AVERROR_INVALIDDATA;
  873. if (mb_bitmask)
  874. init_get_bits(&mb_bitmask_gb, mb_bitmask, s->mb_width * s->mb_height);
  875. if (!Al) {
  876. // s->coefs_finished is a bitmask for coefficients coded
  877. // ss and se are parameters telling start and end coefficients
  878. s->coefs_finished[c] |= (~0ULL >> (63 - (se - ss))) << ss;
  879. last_scan = !~s->coefs_finished[c];
  880. }
  881. if (s->interlaced && s->bottom_field) {
  882. int offset = linesize >> 1;
  883. data += offset;
  884. reference_data += offset;
  885. }
  886. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  887. int block_offset = mb_y * linesize * 8;
  888. uint8_t *ptr = data + block_offset;
  889. int block_idx = mb_y * s->block_stride[c];
  890. int16_t (*block)[64] = &s->blocks[c][block_idx];
  891. uint8_t *last_nnz = &s->last_nnz[c][block_idx];
  892. for (mb_x = 0; mb_x < s->mb_width; mb_x++, block++, last_nnz++) {
  893. const int copy_mb = mb_bitmask && !get_bits1(&mb_bitmask_gb);
  894. if (!copy_mb) {
  895. int ret;
  896. if (Ah)
  897. ret = decode_block_refinement(s, *block, last_nnz, s->ac_index[0],
  898. quant_matrix, ss, se, Al, &EOBRUN);
  899. else
  900. ret = decode_block_progressive(s, *block, last_nnz, s->ac_index[0],
  901. quant_matrix, ss, se, Al, &EOBRUN);
  902. if (ret < 0) {
  903. av_log(s->avctx, AV_LOG_ERROR,
  904. "error y=%d x=%d\n", mb_y, mb_x);
  905. return AVERROR_INVALIDDATA;
  906. }
  907. }
  908. if (last_scan) {
  909. if (copy_mb) {
  910. s->hdsp.put_pixels_tab[1][0](ptr,
  911. reference_data + block_offset,
  912. linesize, 8);
  913. } else {
  914. s->idsp.idct_put(ptr, linesize, *block);
  915. ptr += 8;
  916. }
  917. }
  918. }
  919. }
  920. return 0;
  921. }
  922. int ff_mjpeg_decode_sos(MJpegDecodeContext *s, const uint8_t *mb_bitmask,
  923. const AVFrame *reference)
  924. {
  925. int len, nb_components, i, h, v, predictor, point_transform;
  926. int index, id, ret;
  927. const int block_size = s->lossless ? 1 : 8;
  928. int ilv, prev_shift;
  929. /* XXX: verify len field validity */
  930. len = get_bits(&s->gb, 16);
  931. nb_components = get_bits(&s->gb, 8);
  932. if (nb_components == 0 || nb_components > MAX_COMPONENTS) {
  933. avpriv_report_missing_feature(s->avctx,
  934. "decode_sos: nb_components (%d)",
  935. nb_components);
  936. return AVERROR_PATCHWELCOME;
  937. }
  938. if (len != 6 + 2 * nb_components) {
  939. av_log(s->avctx, AV_LOG_ERROR, "decode_sos: invalid len (%d)\n", len);
  940. return AVERROR_INVALIDDATA;
  941. }
  942. for (i = 0; i < nb_components; i++) {
  943. id = get_bits(&s->gb, 8) - 1;
  944. av_log(s->avctx, AV_LOG_DEBUG, "component: %d\n", id);
  945. /* find component index */
  946. for (index = 0; index < s->nb_components; index++)
  947. if (id == s->component_id[index])
  948. break;
  949. if (index == s->nb_components) {
  950. av_log(s->avctx, AV_LOG_ERROR,
  951. "decode_sos: index(%d) out of components\n", index);
  952. return AVERROR_INVALIDDATA;
  953. }
  954. /* Metasoft MJPEG codec has Cb and Cr swapped */
  955. if (s->avctx->codec_tag == MKTAG('M', 'T', 'S', 'J')
  956. && nb_components == 3 && s->nb_components == 3 && i)
  957. index = 3 - i;
  958. s->comp_index[i] = index;
  959. s->nb_blocks[i] = s->h_count[index] * s->v_count[index];
  960. s->h_scount[i] = s->h_count[index];
  961. s->v_scount[i] = s->v_count[index];
  962. s->dc_index[i] = get_bits(&s->gb, 4);
  963. s->ac_index[i] = get_bits(&s->gb, 4);
  964. if (s->dc_index[i] < 0 || s->ac_index[i] < 0 ||
  965. s->dc_index[i] >= 4 || s->ac_index[i] >= 4)
  966. goto out_of_range;
  967. if (!s->vlcs[0][s->dc_index[i]].table ||
  968. !s->vlcs[1][s->ac_index[i]].table)
  969. goto out_of_range;
  970. }
  971. predictor = get_bits(&s->gb, 8); /* JPEG Ss / lossless JPEG predictor /JPEG-LS NEAR */
  972. ilv = get_bits(&s->gb, 8); /* JPEG Se / JPEG-LS ILV */
  973. prev_shift = get_bits(&s->gb, 4); /* Ah */
  974. point_transform = get_bits(&s->gb, 4); /* Al */
  975. if (nb_components > 1) {
  976. /* interleaved stream */
  977. s->mb_width = (s->width + s->h_max * block_size - 1) / (s->h_max * block_size);
  978. s->mb_height = (s->height + s->v_max * block_size - 1) / (s->v_max * block_size);
  979. } else if (!s->ls) { /* skip this for JPEG-LS */
  980. h = s->h_max / s->h_scount[0];
  981. v = s->v_max / s->v_scount[0];
  982. s->mb_width = (s->width + h * block_size - 1) / (h * block_size);
  983. s->mb_height = (s->height + v * block_size - 1) / (v * block_size);
  984. s->nb_blocks[0] = 1;
  985. s->h_scount[0] = 1;
  986. s->v_scount[0] = 1;
  987. }
  988. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  989. av_log(s->avctx, AV_LOG_DEBUG, "%s %s p:%d >>:%d ilv:%d bits:%d %s\n",
  990. s->lossless ? "lossless" : "sequential DCT", s->rgb ? "RGB" : "",
  991. predictor, point_transform, ilv, s->bits,
  992. s->pegasus_rct ? "PRCT" : (s->rct ? "RCT" : ""));
  993. /* mjpeg-b can have padding bytes between sos and image data, skip them */
  994. for (i = s->mjpb_skiptosod; i > 0; i--)
  995. skip_bits(&s->gb, 8);
  996. if (s->lossless && s->rgb && nb_components != 3) {
  997. avpriv_request_sample(s->avctx,
  998. "Lossless RGB image without 3 components");
  999. return AVERROR_PATCHWELCOME;
  1000. }
  1001. next_field:
  1002. for (i = 0; i < nb_components; i++)
  1003. s->last_dc[i] = 1024;
  1004. if (s->lossless) {
  1005. if (CONFIG_JPEGLS_DECODER && s->ls) {
  1006. // for () {
  1007. // reset_ls_coding_parameters(s, 0);
  1008. if ((ret = ff_jpegls_decode_picture(s, predictor,
  1009. point_transform, ilv)) < 0)
  1010. return ret;
  1011. } else {
  1012. if (s->rgb) {
  1013. if ((ret = ljpeg_decode_rgb_scan(s, predictor,
  1014. point_transform)) < 0)
  1015. return ret;
  1016. } else {
  1017. if ((ret = ljpeg_decode_yuv_scan(s, predictor,
  1018. point_transform,
  1019. nb_components)) < 0)
  1020. return ret;
  1021. }
  1022. }
  1023. } else {
  1024. if (s->progressive && predictor) {
  1025. if ((ret = mjpeg_decode_scan_progressive_ac(s, predictor,
  1026. ilv, prev_shift,
  1027. point_transform,
  1028. mb_bitmask,
  1029. reference)) < 0)
  1030. return ret;
  1031. } else {
  1032. if ((ret = mjpeg_decode_scan(s, nb_components,
  1033. prev_shift, point_transform,
  1034. mb_bitmask, reference)) < 0)
  1035. return ret;
  1036. }
  1037. }
  1038. if (s->interlaced &&
  1039. get_bits_left(&s->gb) > 32 &&
  1040. show_bits(&s->gb, 8) == 0xFF) {
  1041. GetBitContext bak = s->gb;
  1042. align_get_bits(&bak);
  1043. if (show_bits(&bak, 16) == 0xFFD1) {
  1044. ff_dlog(s->avctx, "AVRn interlaced picture marker found\n");
  1045. s->gb = bak;
  1046. skip_bits(&s->gb, 16);
  1047. s->bottom_field ^= 1;
  1048. goto next_field;
  1049. }
  1050. }
  1051. emms_c();
  1052. return 0;
  1053. out_of_range:
  1054. av_log(s->avctx, AV_LOG_ERROR, "decode_sos: ac/dc index out of range\n");
  1055. return AVERROR_INVALIDDATA;
  1056. }
  1057. static int mjpeg_decode_dri(MJpegDecodeContext *s)
  1058. {
  1059. if (get_bits(&s->gb, 16) != 4)
  1060. return AVERROR_INVALIDDATA;
  1061. s->restart_interval = get_bits(&s->gb, 16);
  1062. s->restart_count = 0;
  1063. av_log(s->avctx, AV_LOG_DEBUG, "restart interval: %d\n",
  1064. s->restart_interval);
  1065. return 0;
  1066. }
  1067. static int mjpeg_decode_app(MJpegDecodeContext *s)
  1068. {
  1069. int len, id, i;
  1070. len = get_bits(&s->gb, 16);
  1071. if (len < 5)
  1072. return AVERROR_INVALIDDATA;
  1073. if (8 * len > get_bits_left(&s->gb))
  1074. return AVERROR_INVALIDDATA;
  1075. id = get_bits_long(&s->gb, 32);
  1076. id = av_be2ne32(id);
  1077. len -= 6;
  1078. if (s->avctx->debug & FF_DEBUG_STARTCODE)
  1079. av_log(s->avctx, AV_LOG_DEBUG, "APPx %8X\n", id);
  1080. /* Buggy AVID, it puts EOI only at every 10th frame. */
  1081. /* Also, this fourcc is used by non-avid files too, it holds some
  1082. information, but it's always present in AVID-created files. */
  1083. if (id == AV_RL32("AVI1")) {
  1084. /* structure:
  1085. 4bytes AVI1
  1086. 1bytes polarity
  1087. 1bytes always zero
  1088. 4bytes field_size
  1089. 4bytes field_size_less_padding
  1090. */
  1091. s->buggy_avid = 1;
  1092. i = get_bits(&s->gb, 8);
  1093. if (i == 2)
  1094. s->bottom_field = 1;
  1095. else if (i == 1)
  1096. s->bottom_field = 0;
  1097. goto out;
  1098. }
  1099. if (id == AV_RL32("JFIF")) {
  1100. int t_w, t_h, v1, v2;
  1101. skip_bits(&s->gb, 8); /* the trailing zero-byte */
  1102. v1 = get_bits(&s->gb, 8);
  1103. v2 = get_bits(&s->gb, 8);
  1104. skip_bits(&s->gb, 8);
  1105. s->avctx->sample_aspect_ratio.num = get_bits(&s->gb, 16);
  1106. s->avctx->sample_aspect_ratio.den = get_bits(&s->gb, 16);
  1107. ff_set_sar(s->avctx, s->avctx->sample_aspect_ratio);
  1108. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1109. av_log(s->avctx, AV_LOG_INFO,
  1110. "mjpeg: JFIF header found (version: %x.%x) SAR=%d/%d\n",
  1111. v1, v2,
  1112. s->avctx->sample_aspect_ratio.num,
  1113. s->avctx->sample_aspect_ratio.den);
  1114. t_w = get_bits(&s->gb, 8);
  1115. t_h = get_bits(&s->gb, 8);
  1116. if (t_w && t_h) {
  1117. /* skip thumbnail */
  1118. if (len -10 - (t_w * t_h * 3) > 0)
  1119. len -= t_w * t_h * 3;
  1120. }
  1121. len -= 10;
  1122. goto out;
  1123. }
  1124. if (id == AV_RL32("Adob") && (get_bits(&s->gb, 8) == 'e')) {
  1125. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1126. av_log(s->avctx, AV_LOG_INFO, "mjpeg: Adobe header found\n");
  1127. skip_bits(&s->gb, 16); /* version */
  1128. skip_bits(&s->gb, 16); /* flags0 */
  1129. skip_bits(&s->gb, 16); /* flags1 */
  1130. skip_bits(&s->gb, 8); /* transform */
  1131. len -= 7;
  1132. goto out;
  1133. }
  1134. if (id == AV_RL32("LJIF")) {
  1135. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1136. av_log(s->avctx, AV_LOG_INFO,
  1137. "Pegasus lossless jpeg header found\n");
  1138. skip_bits(&s->gb, 16); /* version ? */
  1139. skip_bits(&s->gb, 16); /* unknown always 0? */
  1140. skip_bits(&s->gb, 16); /* unknown always 0? */
  1141. skip_bits(&s->gb, 16); /* unknown always 0? */
  1142. switch (get_bits(&s->gb, 8)) {
  1143. case 1:
  1144. s->rgb = 1;
  1145. s->pegasus_rct = 0;
  1146. break;
  1147. case 2:
  1148. s->rgb = 1;
  1149. s->pegasus_rct = 1;
  1150. break;
  1151. default:
  1152. av_log(s->avctx, AV_LOG_ERROR, "unknown colorspace\n");
  1153. }
  1154. len -= 9;
  1155. goto out;
  1156. }
  1157. /* Apple MJPEG-A */
  1158. if ((s->start_code == APP1) && (len > (0x28 - 8))) {
  1159. id = get_bits_long(&s->gb, 32);
  1160. id = av_be2ne32(id);
  1161. len -= 4;
  1162. /* Apple MJPEG-A */
  1163. if (id == AV_RL32("mjpg")) {
  1164. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1165. av_log(s->avctx, AV_LOG_INFO, "mjpeg: Apple MJPEG-A header found\n");
  1166. }
  1167. }
  1168. out:
  1169. /* slow but needed for extreme adobe jpegs */
  1170. if (len < 0)
  1171. av_log(s->avctx, AV_LOG_ERROR,
  1172. "mjpeg: error, decode_app parser read over the end\n");
  1173. while (--len > 0)
  1174. skip_bits(&s->gb, 8);
  1175. return 0;
  1176. }
  1177. static int mjpeg_decode_com(MJpegDecodeContext *s)
  1178. {
  1179. int len = get_bits(&s->gb, 16);
  1180. if (len >= 2 && 8 * len - 16 <= get_bits_left(&s->gb)) {
  1181. int i;
  1182. char *cbuf = av_malloc(len - 1);
  1183. if (!cbuf)
  1184. return AVERROR(ENOMEM);
  1185. for (i = 0; i < len - 2; i++)
  1186. cbuf[i] = get_bits(&s->gb, 8);
  1187. if (i > 0 && cbuf[i - 1] == '\n')
  1188. cbuf[i - 1] = 0;
  1189. else
  1190. cbuf[i] = 0;
  1191. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1192. av_log(s->avctx, AV_LOG_INFO, "mjpeg comment: '%s'\n", cbuf);
  1193. /* buggy avid, it puts EOI only at every 10th frame */
  1194. if (!strcmp(cbuf, "AVID")) {
  1195. s->buggy_avid = 1;
  1196. } else if (!strcmp(cbuf, "CS=ITU601"))
  1197. s->cs_itu601 = 1;
  1198. else if ((len > 20 && !strncmp(cbuf, "Intel(R) JPEG Library", 21)) ||
  1199. (len > 19 && !strncmp(cbuf, "Metasoft MJPEG Codec", 20)))
  1200. s->flipped = 1;
  1201. av_free(cbuf);
  1202. }
  1203. return 0;
  1204. }
  1205. /* return the 8 bit start code value and update the search
  1206. state. Return -1 if no start code found */
  1207. static int find_marker(const uint8_t **pbuf_ptr, const uint8_t *buf_end)
  1208. {
  1209. const uint8_t *buf_ptr;
  1210. unsigned int v, v2;
  1211. int val;
  1212. #ifdef DEBUG
  1213. int skipped = 0;
  1214. #endif
  1215. buf_ptr = *pbuf_ptr;
  1216. while (buf_ptr < buf_end) {
  1217. v = *buf_ptr++;
  1218. v2 = *buf_ptr;
  1219. if ((v == 0xff) && (v2 >= 0xc0) && (v2 <= 0xfe) && buf_ptr < buf_end) {
  1220. val = *buf_ptr++;
  1221. goto found;
  1222. }
  1223. #ifdef DEBUG
  1224. skipped++;
  1225. #endif
  1226. }
  1227. val = -1;
  1228. found:
  1229. ff_dlog(NULL, "find_marker skipped %d bytes\n", skipped);
  1230. *pbuf_ptr = buf_ptr;
  1231. return val;
  1232. }
  1233. int ff_mjpeg_find_marker(MJpegDecodeContext *s,
  1234. const uint8_t **buf_ptr, const uint8_t *buf_end,
  1235. const uint8_t **unescaped_buf_ptr,
  1236. int *unescaped_buf_size)
  1237. {
  1238. int start_code;
  1239. start_code = find_marker(buf_ptr, buf_end);
  1240. av_fast_padded_malloc(&s->buffer, &s->buffer_size, buf_end - *buf_ptr);
  1241. if (!s->buffer)
  1242. return AVERROR(ENOMEM);
  1243. /* unescape buffer of SOS, use special treatment for JPEG-LS */
  1244. if (start_code == SOS && !s->ls) {
  1245. const uint8_t *src = *buf_ptr;
  1246. uint8_t *dst = s->buffer;
  1247. while (src < buf_end) {
  1248. uint8_t x = *(src++);
  1249. *(dst++) = x;
  1250. if (s->avctx->codec_id != AV_CODEC_ID_THP) {
  1251. if (x == 0xff) {
  1252. while (src < buf_end && x == 0xff)
  1253. x = *(src++);
  1254. if (x >= 0xd0 && x <= 0xd7)
  1255. *(dst++) = x;
  1256. else if (x)
  1257. break;
  1258. }
  1259. }
  1260. }
  1261. *unescaped_buf_ptr = s->buffer;
  1262. *unescaped_buf_size = dst - s->buffer;
  1263. memset(s->buffer + *unescaped_buf_size, 0,
  1264. AV_INPUT_BUFFER_PADDING_SIZE);
  1265. av_log(s->avctx, AV_LOG_DEBUG, "escaping removed %td bytes\n",
  1266. (buf_end - *buf_ptr) - (dst - s->buffer));
  1267. } else if (start_code == SOS && s->ls) {
  1268. const uint8_t *src = *buf_ptr;
  1269. uint8_t *dst = s->buffer;
  1270. int bit_count = 0;
  1271. int t = 0, b = 0;
  1272. PutBitContext pb;
  1273. s->cur_scan++;
  1274. /* find marker */
  1275. while (src + t < buf_end) {
  1276. uint8_t x = src[t++];
  1277. if (x == 0xff) {
  1278. while ((src + t < buf_end) && x == 0xff)
  1279. x = src[t++];
  1280. if (x & 0x80) {
  1281. t -= 2;
  1282. break;
  1283. }
  1284. }
  1285. }
  1286. bit_count = t * 8;
  1287. init_put_bits(&pb, dst, t);
  1288. /* unescape bitstream */
  1289. while (b < t) {
  1290. uint8_t x = src[b++];
  1291. put_bits(&pb, 8, x);
  1292. if (x == 0xFF) {
  1293. x = src[b++];
  1294. put_bits(&pb, 7, x);
  1295. bit_count--;
  1296. }
  1297. }
  1298. flush_put_bits(&pb);
  1299. *unescaped_buf_ptr = dst;
  1300. *unescaped_buf_size = (bit_count + 7) >> 3;
  1301. memset(s->buffer + *unescaped_buf_size, 0,
  1302. AV_INPUT_BUFFER_PADDING_SIZE);
  1303. } else {
  1304. *unescaped_buf_ptr = *buf_ptr;
  1305. *unescaped_buf_size = buf_end - *buf_ptr;
  1306. }
  1307. return start_code;
  1308. }
  1309. int ff_mjpeg_decode_frame(AVCodecContext *avctx, void *data, int *got_frame,
  1310. AVPacket *avpkt)
  1311. {
  1312. AVFrame *frame = data;
  1313. const uint8_t *buf = avpkt->data;
  1314. int buf_size = avpkt->size;
  1315. MJpegDecodeContext *s = avctx->priv_data;
  1316. const uint8_t *buf_end, *buf_ptr;
  1317. const uint8_t *unescaped_buf_ptr;
  1318. int unescaped_buf_size;
  1319. int start_code;
  1320. int ret = 0;
  1321. s->got_picture = 0; // picture from previous image can not be reused
  1322. buf_ptr = buf;
  1323. buf_end = buf + buf_size;
  1324. while (buf_ptr < buf_end) {
  1325. /* find start next marker */
  1326. start_code = ff_mjpeg_find_marker(s, &buf_ptr, buf_end,
  1327. &unescaped_buf_ptr,
  1328. &unescaped_buf_size);
  1329. /* EOF */
  1330. if (start_code < 0) {
  1331. goto the_end;
  1332. } else if (unescaped_buf_size > INT_MAX / 8) {
  1333. av_log(avctx, AV_LOG_ERROR,
  1334. "MJPEG packet 0x%x too big (%d/%d), corrupt data?\n",
  1335. start_code, unescaped_buf_size, buf_size);
  1336. return AVERROR_INVALIDDATA;
  1337. }
  1338. av_log(avctx, AV_LOG_DEBUG, "marker=%x avail_size_in_buf=%td\n",
  1339. start_code, buf_end - buf_ptr);
  1340. ret = init_get_bits(&s->gb, unescaped_buf_ptr,
  1341. unescaped_buf_size * 8);
  1342. if (ret < 0)
  1343. return ret;
  1344. s->start_code = start_code;
  1345. if (s->avctx->debug & FF_DEBUG_STARTCODE)
  1346. av_log(avctx, AV_LOG_DEBUG, "startcode: %X\n", start_code);
  1347. /* process markers */
  1348. if (start_code >= 0xd0 && start_code <= 0xd7) {
  1349. av_log(avctx, AV_LOG_DEBUG,
  1350. "restart marker: %d\n", start_code & 0x0f);
  1351. /* APP fields */
  1352. } else if (start_code >= APP0 && start_code <= APP15) {
  1353. if ((ret = mjpeg_decode_app(s)) < 0)
  1354. return ret;
  1355. /* Comment */
  1356. } else if (start_code == COM) {
  1357. ret = mjpeg_decode_com(s);
  1358. if (ret < 0)
  1359. return ret;
  1360. }
  1361. if (!CONFIG_JPEGLS_DECODER &&
  1362. (start_code == SOF48 || start_code == LSE)) {
  1363. av_log(avctx, AV_LOG_ERROR, "JPEG-LS support not enabled.\n");
  1364. return AVERROR(ENOSYS);
  1365. }
  1366. switch (start_code) {
  1367. case SOI:
  1368. s->restart_interval = 0;
  1369. s->restart_count = 0;
  1370. /* nothing to do on SOI */
  1371. break;
  1372. case DQT:
  1373. if ((ret = ff_mjpeg_decode_dqt(s)) < 0)
  1374. return ret;
  1375. break;
  1376. case DHT:
  1377. if ((ret = ff_mjpeg_decode_dht(s)) < 0) {
  1378. av_log(avctx, AV_LOG_ERROR, "huffman table decode error\n");
  1379. return ret;
  1380. }
  1381. break;
  1382. case SOF0:
  1383. case SOF1:
  1384. s->lossless = 0;
  1385. s->ls = 0;
  1386. s->progressive = 0;
  1387. if ((ret = ff_mjpeg_decode_sof(s)) < 0)
  1388. return ret;
  1389. break;
  1390. case SOF2:
  1391. s->lossless = 0;
  1392. s->ls = 0;
  1393. s->progressive = 1;
  1394. if ((ret = ff_mjpeg_decode_sof(s)) < 0)
  1395. return ret;
  1396. break;
  1397. case SOF3:
  1398. s->lossless = 1;
  1399. s->ls = 0;
  1400. s->progressive = 0;
  1401. if ((ret = ff_mjpeg_decode_sof(s)) < 0)
  1402. return ret;
  1403. break;
  1404. case SOF48:
  1405. s->lossless = 1;
  1406. s->ls = 1;
  1407. s->progressive = 0;
  1408. if ((ret = ff_mjpeg_decode_sof(s)) < 0)
  1409. return ret;
  1410. break;
  1411. case LSE:
  1412. if (!CONFIG_JPEGLS_DECODER ||
  1413. (ret = ff_jpegls_decode_lse(s)) < 0)
  1414. return ret;
  1415. break;
  1416. case EOI:
  1417. s->cur_scan = 0;
  1418. if ((s->buggy_avid && !s->interlaced) || s->restart_interval)
  1419. break;
  1420. eoi_parser:
  1421. if (!s->got_picture) {
  1422. av_log(avctx, AV_LOG_WARNING,
  1423. "Found EOI before any SOF, ignoring\n");
  1424. break;
  1425. }
  1426. if (s->interlaced) {
  1427. s->bottom_field ^= 1;
  1428. /* if not bottom field, do not output image yet */
  1429. if (s->bottom_field == !s->interlace_polarity)
  1430. goto not_the_end;
  1431. }
  1432. if ((ret = av_frame_ref(frame, s->picture_ptr)) < 0)
  1433. return ret;
  1434. if (s->flipped) {
  1435. int i;
  1436. for (i = 0; frame->data[i]; i++) {
  1437. int h = frame->height >> ((i == 1 || i == 2) ?
  1438. s->pix_desc->log2_chroma_h : 0);
  1439. frame->data[i] += frame->linesize[i] * (h - 1);
  1440. frame->linesize[i] *= -1;
  1441. }
  1442. }
  1443. *got_frame = 1;
  1444. if (!s->lossless &&
  1445. avctx->debug & FF_DEBUG_QP) {
  1446. av_log(avctx, AV_LOG_DEBUG,
  1447. "QP: %d\n", FFMAX3(s->qscale[0],
  1448. s->qscale[1],
  1449. s->qscale[2]));
  1450. }
  1451. goto the_end;
  1452. case SOS:
  1453. if (!s->got_picture) {
  1454. av_log(avctx, AV_LOG_WARNING,
  1455. "Can not process SOS before SOF, skipping\n");
  1456. break;
  1457. }
  1458. if ((ret = ff_mjpeg_decode_sos(s, NULL, NULL)) < 0 &&
  1459. (avctx->err_recognition & AV_EF_EXPLODE))
  1460. return ret;
  1461. /* buggy avid puts EOI every 10-20th frame */
  1462. /* if restart period is over process EOI */
  1463. if ((s->buggy_avid && !s->interlaced) || s->restart_interval)
  1464. goto eoi_parser;
  1465. break;
  1466. case DRI:
  1467. if ((ret = mjpeg_decode_dri(s)) < 0)
  1468. return ret;
  1469. break;
  1470. case SOF5:
  1471. case SOF6:
  1472. case SOF7:
  1473. case SOF9:
  1474. case SOF10:
  1475. case SOF11:
  1476. case SOF13:
  1477. case SOF14:
  1478. case SOF15:
  1479. case JPG:
  1480. av_log(avctx, AV_LOG_ERROR,
  1481. "mjpeg: unsupported coding type (%x)\n", start_code);
  1482. break;
  1483. }
  1484. not_the_end:
  1485. /* eof process start code */
  1486. buf_ptr += (get_bits_count(&s->gb) + 7) / 8;
  1487. av_log(avctx, AV_LOG_DEBUG,
  1488. "marker parser used %d bytes (%d bits)\n",
  1489. (get_bits_count(&s->gb) + 7) / 8, get_bits_count(&s->gb));
  1490. }
  1491. if (s->got_picture) {
  1492. av_log(avctx, AV_LOG_WARNING, "EOI missing, emulating\n");
  1493. goto eoi_parser;
  1494. }
  1495. av_log(avctx, AV_LOG_FATAL, "No JPEG data found in image\n");
  1496. return AVERROR_INVALIDDATA;
  1497. the_end:
  1498. av_log(avctx, AV_LOG_DEBUG, "mjpeg decode frame unused %td bytes\n",
  1499. buf_end - buf_ptr);
  1500. // return buf_end - buf_ptr;
  1501. return buf_ptr - buf;
  1502. }
  1503. av_cold int ff_mjpeg_decode_end(AVCodecContext *avctx)
  1504. {
  1505. MJpegDecodeContext *s = avctx->priv_data;
  1506. int i, j;
  1507. if (s->picture) {
  1508. av_frame_free(&s->picture);
  1509. s->picture_ptr = NULL;
  1510. } else if (s->picture_ptr)
  1511. av_frame_unref(s->picture_ptr);
  1512. av_free(s->buffer);
  1513. av_freep(&s->ljpeg_buffer);
  1514. s->ljpeg_buffer_size = 0;
  1515. for (i = 0; i < 3; i++) {
  1516. for (j = 0; j < 4; j++)
  1517. ff_free_vlc(&s->vlcs[i][j]);
  1518. }
  1519. for (i = 0; i < MAX_COMPONENTS; i++) {
  1520. av_freep(&s->blocks[i]);
  1521. av_freep(&s->last_nnz[i]);
  1522. }
  1523. return 0;
  1524. }
  1525. #define OFFSET(x) offsetof(MJpegDecodeContext, x)
  1526. #define VD AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_DECODING_PARAM
  1527. static const AVOption options[] = {
  1528. { "extern_huff", "Use external huffman table.",
  1529. OFFSET(extern_huff), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, VD },
  1530. { NULL },
  1531. };
  1532. static const AVClass mjpegdec_class = {
  1533. .class_name = "MJPEG decoder",
  1534. .item_name = av_default_item_name,
  1535. .option = options,
  1536. .version = LIBAVUTIL_VERSION_INT,
  1537. };
  1538. AVCodec ff_mjpeg_decoder = {
  1539. .name = "mjpeg",
  1540. .long_name = NULL_IF_CONFIG_SMALL("MJPEG (Motion JPEG)"),
  1541. .type = AVMEDIA_TYPE_VIDEO,
  1542. .id = AV_CODEC_ID_MJPEG,
  1543. .priv_data_size = sizeof(MJpegDecodeContext),
  1544. .init = ff_mjpeg_decode_init,
  1545. .close = ff_mjpeg_decode_end,
  1546. .decode = ff_mjpeg_decode_frame,
  1547. .capabilities = AV_CODEC_CAP_DR1,
  1548. .priv_class = &mjpegdec_class,
  1549. .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE,
  1550. };
  1551. AVCodec ff_thp_decoder = {
  1552. .name = "thp",
  1553. .long_name = NULL_IF_CONFIG_SMALL("Nintendo Gamecube THP video"),
  1554. .type = AVMEDIA_TYPE_VIDEO,
  1555. .id = AV_CODEC_ID_THP,
  1556. .priv_data_size = sizeof(MJpegDecodeContext),
  1557. .init = ff_mjpeg_decode_init,
  1558. .close = ff_mjpeg_decode_end,
  1559. .decode = ff_mjpeg_decode_frame,
  1560. .capabilities = AV_CODEC_CAP_DR1,
  1561. .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE,
  1562. };