You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1685 lines
57KB

  1. /*
  2. * MJPEG decoder
  3. * Copyright (c) 2000, 2001 Fabrice Bellard
  4. * Copyright (c) 2003 Alex Beregszaszi
  5. * Copyright (c) 2003-2004 Michael Niedermayer
  6. *
  7. * Support for external huffman table, various fixes (AVID workaround),
  8. * aspecting, new decode_frame mechanism and apple mjpeg-b support
  9. * by Alex Beregszaszi
  10. *
  11. * This file is part of Libav.
  12. *
  13. * Libav is free software; you can redistribute it and/or
  14. * modify it under the terms of the GNU Lesser General Public
  15. * License as published by the Free Software Foundation; either
  16. * version 2.1 of the License, or (at your option) any later version.
  17. *
  18. * Libav is distributed in the hope that it will be useful,
  19. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  20. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  21. * Lesser General Public License for more details.
  22. *
  23. * You should have received a copy of the GNU Lesser General Public
  24. * License along with Libav; if not, write to the Free Software
  25. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  26. */
  27. /**
  28. * @file
  29. * MJPEG decoder.
  30. */
  31. // #define DEBUG
  32. #include <assert.h>
  33. #include "libavutil/imgutils.h"
  34. #include "libavutil/opt.h"
  35. #include "avcodec.h"
  36. #include "dsputil.h"
  37. #include "mjpeg.h"
  38. #include "mjpegdec.h"
  39. #include "jpeglsdec.h"
  40. static int build_vlc(VLC *vlc, const uint8_t *bits_table,
  41. const uint8_t *val_table, int nb_codes,
  42. int use_static, int is_ac)
  43. {
  44. uint8_t huff_size[256];
  45. uint16_t huff_code[256];
  46. uint16_t huff_sym[256];
  47. int i;
  48. assert(nb_codes <= 256);
  49. memset(huff_size, 0, sizeof(huff_size));
  50. ff_mjpeg_build_huffman_codes(huff_size, huff_code, bits_table, val_table);
  51. for (i = 0; i < 256; i++)
  52. huff_sym[i] = i + 16 * is_ac;
  53. if (is_ac)
  54. huff_sym[0] = 16 * 256;
  55. return ff_init_vlc_sparse(vlc, 9, nb_codes, huff_size, 1, 1,
  56. huff_code, 2, 2, huff_sym, 2, 2, use_static);
  57. }
  58. static void build_basic_mjpeg_vlc(MJpegDecodeContext *s)
  59. {
  60. build_vlc(&s->vlcs[0][0], ff_mjpeg_bits_dc_luminance,
  61. ff_mjpeg_val_dc, 12, 0, 0);
  62. build_vlc(&s->vlcs[0][1], ff_mjpeg_bits_dc_chrominance,
  63. ff_mjpeg_val_dc, 12, 0, 0);
  64. build_vlc(&s->vlcs[1][0], ff_mjpeg_bits_ac_luminance,
  65. ff_mjpeg_val_ac_luminance, 251, 0, 1);
  66. build_vlc(&s->vlcs[1][1], ff_mjpeg_bits_ac_chrominance,
  67. ff_mjpeg_val_ac_chrominance, 251, 0, 1);
  68. build_vlc(&s->vlcs[2][0], ff_mjpeg_bits_ac_luminance,
  69. ff_mjpeg_val_ac_luminance, 251, 0, 0);
  70. build_vlc(&s->vlcs[2][1], ff_mjpeg_bits_ac_chrominance,
  71. ff_mjpeg_val_ac_chrominance, 251, 0, 0);
  72. }
  73. av_cold int ff_mjpeg_decode_init(AVCodecContext *avctx)
  74. {
  75. MJpegDecodeContext *s = avctx->priv_data;
  76. if (!s->picture_ptr)
  77. s->picture_ptr = &s->picture;
  78. s->avctx = avctx;
  79. ff_dsputil_init(&s->dsp, avctx);
  80. ff_init_scantable(s->dsp.idct_permutation, &s->scantable, ff_zigzag_direct);
  81. s->buffer_size = 0;
  82. s->buffer = NULL;
  83. s->start_code = -1;
  84. s->first_picture = 1;
  85. s->org_height = avctx->coded_height;
  86. avctx->chroma_sample_location = AVCHROMA_LOC_CENTER;
  87. build_basic_mjpeg_vlc(s);
  88. if (s->extern_huff) {
  89. av_log(avctx, AV_LOG_INFO, "mjpeg: using external huffman table\n");
  90. init_get_bits(&s->gb, avctx->extradata, avctx->extradata_size * 8);
  91. if (ff_mjpeg_decode_dht(s)) {
  92. av_log(avctx, AV_LOG_ERROR,
  93. "mjpeg: error using external huffman table\n");
  94. return AVERROR_INVALIDDATA;
  95. }
  96. }
  97. if (avctx->field_order == AV_FIELD_BB) { /* quicktime icefloe 019 */
  98. s->interlace_polarity = 1; /* bottom field first */
  99. av_log(avctx, AV_LOG_DEBUG, "mjpeg bottom field first\n");
  100. }
  101. if (avctx->codec->id == CODEC_ID_AMV)
  102. s->flipped = 1;
  103. return 0;
  104. }
  105. /* quantize tables */
  106. int ff_mjpeg_decode_dqt(MJpegDecodeContext *s)
  107. {
  108. int len, index, i, j;
  109. len = get_bits(&s->gb, 16) - 2;
  110. while (len >= 65) {
  111. /* only 8 bit precision handled */
  112. if (get_bits(&s->gb, 4) != 0) {
  113. av_log(s->avctx, AV_LOG_ERROR, "dqt: 16bit precision\n");
  114. return -1;
  115. }
  116. index = get_bits(&s->gb, 4);
  117. if (index >= 4)
  118. return -1;
  119. av_log(s->avctx, AV_LOG_DEBUG, "index=%d\n", index);
  120. /* read quant table */
  121. for (i = 0; i < 64; i++) {
  122. j = s->scantable.permutated[i];
  123. s->quant_matrixes[index][j] = get_bits(&s->gb, 8);
  124. }
  125. // XXX FIXME finetune, and perhaps add dc too
  126. s->qscale[index] = FFMAX(s->quant_matrixes[index][s->scantable.permutated[1]],
  127. s->quant_matrixes[index][s->scantable.permutated[8]]) >> 1;
  128. av_log(s->avctx, AV_LOG_DEBUG, "qscale[%d]: %d\n",
  129. index, s->qscale[index]);
  130. len -= 65;
  131. }
  132. return 0;
  133. }
  134. /* decode huffman tables and build VLC decoders */
  135. int ff_mjpeg_decode_dht(MJpegDecodeContext *s)
  136. {
  137. int len, index, i, class, n, v, code_max;
  138. uint8_t bits_table[17];
  139. uint8_t val_table[256];
  140. len = get_bits(&s->gb, 16) - 2;
  141. while (len > 0) {
  142. if (len < 17)
  143. return -1;
  144. class = get_bits(&s->gb, 4);
  145. if (class >= 2)
  146. return -1;
  147. index = get_bits(&s->gb, 4);
  148. if (index >= 4)
  149. return -1;
  150. n = 0;
  151. for (i = 1; i <= 16; i++) {
  152. bits_table[i] = get_bits(&s->gb, 8);
  153. n += bits_table[i];
  154. }
  155. len -= 17;
  156. if (len < n || n > 256)
  157. return -1;
  158. code_max = 0;
  159. for (i = 0; i < n; i++) {
  160. v = get_bits(&s->gb, 8);
  161. if (v > code_max)
  162. code_max = v;
  163. val_table[i] = v;
  164. }
  165. len -= n;
  166. /* build VLC and flush previous vlc if present */
  167. ff_free_vlc(&s->vlcs[class][index]);
  168. av_log(s->avctx, AV_LOG_DEBUG, "class=%d index=%d nb_codes=%d\n",
  169. class, index, code_max + 1);
  170. if (build_vlc(&s->vlcs[class][index], bits_table, val_table,
  171. code_max + 1, 0, class > 0) < 0)
  172. return -1;
  173. if (class > 0) {
  174. ff_free_vlc(&s->vlcs[2][index]);
  175. if (build_vlc(&s->vlcs[2][index], bits_table, val_table,
  176. code_max + 1, 0, 0) < 0)
  177. return -1;
  178. }
  179. }
  180. return 0;
  181. }
  182. int ff_mjpeg_decode_sof(MJpegDecodeContext *s)
  183. {
  184. int len, nb_components, i, width, height, pix_fmt_id;
  185. /* XXX: verify len field validity */
  186. len = get_bits(&s->gb, 16);
  187. s->bits = get_bits(&s->gb, 8);
  188. if (s->pegasus_rct)
  189. s->bits = 9;
  190. if (s->bits == 9 && !s->pegasus_rct)
  191. s->rct = 1; // FIXME ugly
  192. if (s->bits != 8 && !s->lossless) {
  193. av_log(s->avctx, AV_LOG_ERROR, "only 8 bits/component accepted\n");
  194. return -1;
  195. }
  196. height = get_bits(&s->gb, 16);
  197. width = get_bits(&s->gb, 16);
  198. // HACK for odd_height.mov
  199. if (s->interlaced && s->width == width && s->height == height + 1)
  200. height= s->height;
  201. av_log(s->avctx, AV_LOG_DEBUG, "sof0: picture: %dx%d\n", width, height);
  202. if (av_image_check_size(width, height, 0, s->avctx))
  203. return -1;
  204. nb_components = get_bits(&s->gb, 8);
  205. if (nb_components <= 0 ||
  206. nb_components > MAX_COMPONENTS)
  207. return -1;
  208. if (s->ls && !(s->bits <= 8 || nb_components == 1)) {
  209. av_log(s->avctx, AV_LOG_ERROR,
  210. "only <= 8 bits/component or 16-bit gray accepted for JPEG-LS\n");
  211. return -1;
  212. }
  213. s->nb_components = nb_components;
  214. s->h_max = 1;
  215. s->v_max = 1;
  216. for (i = 0; i < nb_components; i++) {
  217. /* component id */
  218. s->component_id[i] = get_bits(&s->gb, 8) - 1;
  219. s->h_count[i] = get_bits(&s->gb, 4);
  220. s->v_count[i] = get_bits(&s->gb, 4);
  221. /* compute hmax and vmax (only used in interleaved case) */
  222. if (s->h_count[i] > s->h_max)
  223. s->h_max = s->h_count[i];
  224. if (s->v_count[i] > s->v_max)
  225. s->v_max = s->v_count[i];
  226. s->quant_index[i] = get_bits(&s->gb, 8);
  227. if (s->quant_index[i] >= 4)
  228. return -1;
  229. av_log(s->avctx, AV_LOG_DEBUG, "component %d %d:%d id: %d quant:%d\n",
  230. i, s->h_count[i], s->v_count[i],
  231. s->component_id[i], s->quant_index[i]);
  232. }
  233. if (s->ls && (s->h_max > 1 || s->v_max > 1)) {
  234. av_log(s->avctx, AV_LOG_ERROR,
  235. "Subsampling in JPEG-LS is not supported.\n");
  236. return -1;
  237. }
  238. if (s->v_max == 1 && s->h_max == 1 && s->lossless == 1)
  239. s->rgb = 1;
  240. /* if different size, realloc/alloc picture */
  241. /* XXX: also check h_count and v_count */
  242. if (width != s->width || height != s->height) {
  243. av_freep(&s->qscale_table);
  244. s->width = width;
  245. s->height = height;
  246. s->interlaced = 0;
  247. /* test interlaced mode */
  248. if (s->first_picture &&
  249. s->org_height != 0 &&
  250. s->height < ((s->org_height * 3) / 4)) {
  251. s->interlaced = 1;
  252. s->bottom_field = s->interlace_polarity;
  253. s->picture_ptr->interlaced_frame = 1;
  254. s->picture_ptr->top_field_first = !s->interlace_polarity;
  255. height *= 2;
  256. }
  257. avcodec_set_dimensions(s->avctx, width, height);
  258. s->qscale_table = av_mallocz((s->width + 15) / 16);
  259. s->first_picture = 0;
  260. }
  261. if (s->interlaced && (s->bottom_field == !s->interlace_polarity))
  262. return 0;
  263. /* XXX: not complete test ! */
  264. pix_fmt_id = (s->h_count[0] << 28) | (s->v_count[0] << 24) |
  265. (s->h_count[1] << 20) | (s->v_count[1] << 16) |
  266. (s->h_count[2] << 12) | (s->v_count[2] << 8) |
  267. (s->h_count[3] << 4) | s->v_count[3];
  268. av_log(s->avctx, AV_LOG_DEBUG, "pix fmt id %x\n", pix_fmt_id);
  269. /* NOTE we do not allocate pictures large enough for the possible
  270. * padding of h/v_count being 4 */
  271. if (!(pix_fmt_id & 0xD0D0D0D0))
  272. pix_fmt_id -= (pix_fmt_id & 0xF0F0F0F0) >> 1;
  273. if (!(pix_fmt_id & 0x0D0D0D0D))
  274. pix_fmt_id -= (pix_fmt_id & 0x0F0F0F0F) >> 1;
  275. switch (pix_fmt_id) {
  276. case 0x11111100:
  277. if (s->rgb)
  278. s->avctx->pix_fmt = PIX_FMT_BGRA;
  279. else
  280. s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV444P : PIX_FMT_YUVJ444P;
  281. assert(s->nb_components == 3);
  282. break;
  283. case 0x11000000:
  284. s->avctx->pix_fmt = PIX_FMT_GRAY8;
  285. break;
  286. case 0x12111100:
  287. s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV440P : PIX_FMT_YUVJ440P;
  288. break;
  289. case 0x21111100:
  290. s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV422P : PIX_FMT_YUVJ422P;
  291. break;
  292. case 0x22111100:
  293. s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV420P : PIX_FMT_YUVJ420P;
  294. break;
  295. default:
  296. av_log(s->avctx, AV_LOG_ERROR, "Unhandled pixel format 0x%x\n", pix_fmt_id);
  297. return -1;
  298. }
  299. if (s->ls) {
  300. if (s->nb_components > 1)
  301. s->avctx->pix_fmt = PIX_FMT_RGB24;
  302. else if (s->bits <= 8)
  303. s->avctx->pix_fmt = PIX_FMT_GRAY8;
  304. else
  305. s->avctx->pix_fmt = PIX_FMT_GRAY16;
  306. }
  307. if (s->picture_ptr->data[0])
  308. s->avctx->release_buffer(s->avctx, s->picture_ptr);
  309. if (s->avctx->get_buffer(s->avctx, s->picture_ptr) < 0) {
  310. av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed\n");
  311. return -1;
  312. }
  313. s->picture_ptr->pict_type = AV_PICTURE_TYPE_I;
  314. s->picture_ptr->key_frame = 1;
  315. s->got_picture = 1;
  316. for (i = 0; i < 3; i++)
  317. s->linesize[i] = s->picture_ptr->linesize[i] << s->interlaced;
  318. // printf("%d %d %d %d %d %d\n",
  319. // s->width, s->height, s->linesize[0], s->linesize[1],
  320. // s->interlaced, s->avctx->height);
  321. if (len != (8 + (3 * nb_components)))
  322. av_log(s->avctx, AV_LOG_DEBUG, "decode_sof0: error, len(%d) mismatch\n", len);
  323. /* totally blank picture as progressive JPEG will only add details to it */
  324. if (s->progressive) {
  325. int bw = (width + s->h_max * 8 - 1) / (s->h_max * 8);
  326. int bh = (height + s->v_max * 8 - 1) / (s->v_max * 8);
  327. for (i = 0; i < s->nb_components; i++) {
  328. int size = bw * bh * s->h_count[i] * s->v_count[i];
  329. av_freep(&s->blocks[i]);
  330. av_freep(&s->last_nnz[i]);
  331. s->blocks[i] = av_malloc(size * sizeof(**s->blocks));
  332. s->last_nnz[i] = av_mallocz(size * sizeof(**s->last_nnz));
  333. s->block_stride[i] = bw * s->h_count[i];
  334. }
  335. memset(s->coefs_finished, 0, sizeof(s->coefs_finished));
  336. }
  337. return 0;
  338. }
  339. static inline int mjpeg_decode_dc(MJpegDecodeContext *s, int dc_index)
  340. {
  341. int code;
  342. code = get_vlc2(&s->gb, s->vlcs[0][dc_index].table, 9, 2);
  343. if (code < 0) {
  344. av_log(s->avctx, AV_LOG_WARNING,
  345. "mjpeg_decode_dc: bad vlc: %d:%d (%p)\n",
  346. 0, dc_index, &s->vlcs[0][dc_index]);
  347. return 0xffff;
  348. }
  349. if (code)
  350. return get_xbits(&s->gb, code);
  351. else
  352. return 0;
  353. }
  354. /* decode block and dequantize */
  /**
   * Decode one sequential 8x8 block and dequantize it.
   *
   * The DC difference is read with mjpeg_decode_dc(), scaled by quant_matrix[0]
   * and added to the running predictor s->last_dc[component]. AC coefficients
   * are then read with the VLC s->vlcs[1][ac_index]; each decoded level is
   * multiplied by its quantiser and stored at the position given by
   * s->scantable.permutated[]. Positions that are not coded are left untouched,
   * so the caller is expected to pass a cleared block.
   *
   * @param s            decoder context
   * @param block        destination coefficient block
   * @param component    index into s->last_dc[]
   * @param dc_index     DC table selector, index into s->vlcs[0][]
   * @param ac_index     AC table selector, index into s->vlcs[1][]
   * @param quant_matrix quantiser values, indexed like block[]
   * @return 0 on success, -1 on a bad DC code or when the coefficient index
   *         exceeds 63
   */
  355. static int decode_block(MJpegDecodeContext *s, DCTELEM *block, int component,
  356. int dc_index, int ac_index, int16_t *quant_matrix)
  357. {
  358. int code, i, j, level, val;
  359. /* DC coef */
  360. val = mjpeg_decode_dc(s, dc_index);
  361. if (val == 0xffff) {
  362. av_log(s->avctx, AV_LOG_ERROR, "error dc\n");
  363. return -1;
  364. }
  /* DC is coded as a difference to the previous block of the same component */
  365. val = val * quant_matrix[0] + s->last_dc[component];
  366. s->last_dc[component] = val;
  367. block[0] = val;
  368. /* AC coefs */
  369. i = 0;
  370. {OPEN_READER(re, &s->gb);
  371. do {
  372. UPDATE_CACHE(re, &s->gb);
  373. GET_VLC(code, re, &s->gb, s->vlcs[1][ac_index].table, 9, 2);
  /* upper part of the symbol: how far to advance the coefficient index
   * (build_vlc() offsets AC symbols by 16, so this already includes the
   * coefficient itself); low 4 bits: number of value bits that follow */
  374. i += ((unsigned)code) >> 4;
  375. code &= 0xf;
  376. if (code) {
  /* make sure enough bits are cached for long values */
  377. if (code > MIN_CACHE_BITS - 16)
  378. UPDATE_CACHE(re, &s->gb);
  379. {
  /* NOTE(review): this looks like the JPEG sign/magnitude expansion of the
   * next 'code' bits taken from the top of the cache - confirm against the
   * definition of NEG_USR32 */
  380. int cache = GET_CACHE(re, &s->gb);
  381. int sign = (~cache) >> 31;
  382. level = (NEG_USR32(sign ^ cache,code) ^ sign) - sign;
  383. }
  384. LAST_SKIP_BITS(re, &s->gb, code);
  /* a run that steps past the last coefficient means corrupt data */
  385. if (i > 63) {
  386. av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);
  387. return -1;
  388. }
  389. j = s->scantable.permutated[i];
  390. block[j] = level * quant_matrix[j];
  391. }
  /* symbol 0 is mapped to 16 * 256 by build_vlc(), which pushes i past 63
   * and ends the loop */
  392. } while (i < 63);
  393. CLOSE_READER(re, &s->gb);}
  394. return 0;
  395. }
  396. static int decode_dc_progressive(MJpegDecodeContext *s, DCTELEM *block,
  397. int component, int dc_index,
  398. int16_t *quant_matrix, int Al)
  399. {
  400. int val;
  401. s->dsp.clear_block(block);
  402. val = mjpeg_decode_dc(s, dc_index);
  403. if (val == 0xffff) {
  404. av_log(s->avctx, AV_LOG_ERROR, "error dc\n");
  405. return -1;
  406. }
  407. val = (val * quant_matrix[0] << Al) + s->last_dc[component];
  408. s->last_dc[component] = val;
  409. block[0] = val;
  410. return 0;
  411. }
  412. /* decode block and dequantize - progressive JPEG version */
  /**
   * Decode the AC coefficients ss..se of one block in a first-pass progressive
   * scan and dequantize them.
   *
   * When *EOBRUN is non-zero the block is part of a pending end-of-band run:
   * the counter is decremented and no bits are read. Otherwise symbols are
   * read from s->vlcs[2][ac_index]; decoded levels are multiplied by their
   * quantiser, shifted left by Al and stored through s->scantable.permutated[].
   *
   * @param s            decoder context
   * @param block        coefficient block to write into
   * @param last_nnz     in/out: raised to the highest coefficient index reached
   * @param ac_index     AC table selector, index into s->vlcs[2][]
   * @param quant_matrix quantiser values, indexed like block[]
   * @param ss           first coefficient index of the band
   * @param se           last coefficient index of the band
   * @param Al           left shift applied to dequantised values
   * @param EOBRUN       in/out: number of following blocks that are empty
   * @return 0 on success, -1 when a run steps past se
   */
  413. static int decode_block_progressive(MJpegDecodeContext *s, DCTELEM *block,
  414. uint8_t *last_nnz, int ac_index,
  415. int16_t *quant_matrix,
  416. int ss, int se, int Al, int *EOBRUN)
  417. {
  418. int code, i, j, level, val, run;
  /* still inside an end-of-band run: nothing is coded for this block */
  419. if (*EOBRUN) {
  420. (*EOBRUN)--;
  421. return 0;
  422. }
  423. {
  424. OPEN_READER(re, &s->gb);
  425. for (i = ss; ; i++) {
  426. UPDATE_CACHE(re, &s->gb);
  427. GET_VLC(code, re, &s->gb, s->vlcs[2][ac_index].table, 9, 2);
  /* upper 4 bits: zero run, lower 4 bits: number of value bits */
  428. run = ((unsigned) code) >> 4;
  429. code &= 0xF;
  430. if (code) {
  431. i += run;
  432. if (code > MIN_CACHE_BITS - 16)
  433. UPDATE_CACHE(re, &s->gb);
  434. {
  /* NOTE(review): same sign/magnitude expansion idiom as in decode_block() -
   * confirm against the definition of NEG_USR32 */
  435. int cache = GET_CACHE(re, &s->gb);
  436. int sign = (~cache) >> 31;
  437. level = (NEG_USR32(sign ^ cache,code) ^ sign) - sign;
  438. }
  439. LAST_SKIP_BITS(re, &s->gb, code);
  /* a coefficient exactly at se finishes the band; beyond se is an error */
  440. if (i >= se) {
  441. if (i == se) {
  442. j = s->scantable.permutated[se];
  443. block[j] = level * quant_matrix[j] << Al;
  444. break;
  445. }
  446. av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);
  447. return -1;
  448. }
  449. j = s->scantable.permutated[i];
  450. block[j] = level * quant_matrix[j] << Al;
  451. } else {
  /* together with the loop's own i++ this advances by 16 positions */
  452. if (run == 0xF) {// ZRL - skip 15 coefficients
  453. i += 15;
  454. if (i >= se) {
  455. av_log(s->avctx, AV_LOG_ERROR, "ZRL overflow: %d\n", i);
  456. return -1;
  457. }
  458. } else {
  /* end of band: the run length is 2^run plus 'run' extra bits; this block
   * counts as the first one of the run, hence the "- 1" below */
  459. val = (1 << run);
  460. if (run) {
  461. UPDATE_CACHE(re, &s->gb);
  462. val += NEG_USR32(GET_CACHE(re, &s->gb), run);
  463. LAST_SKIP_BITS(re, &s->gb, run);
  464. }
  465. *EOBRUN = val - 1;
  466. break;
  467. }
  468. }
  469. }
  470. CLOSE_READER(re, &s->gb);
  471. }
  /* remember how far this block has been populated */
  472. if (i > *last_nnz)
  473. *last_nnz = i;
  474. return 0;
  475. }
  /*
   * Helper macros for decode_block_refinement(). Both rely on the locals of
   * that function (s, re, block, quant_matrix, Al, sign, i, j, run, last, se)
   * and are undefined again right after it.
   *
   * REFINE_BIT(j): read one correction bit for the already non-zero
   * coefficient block[j]; when the bit is set, add the quantiser shifted by Al
   * with the same sign as the coefficient.
   */
  476. #define REFINE_BIT(j) { \
  477. UPDATE_CACHE(re, &s->gb); \
  478. sign = block[j] >> 15; \
  479. block[j] += SHOW_UBITS(re, &s->gb, 1) * \
  480. ((quant_matrix[j] ^ sign) - sign) << Al; \
  481. LAST_SKIP_BITS(re, &s->gb, 1); \
  482. }
  /*
   * ZERO_RUN: advance i over the band. Non-zero coefficients met on the way
   * get a refinement bit; zero coefficients use up 'run', and the walk stops
   * on the zero coefficient reached once 'run' is exhausted. Past 'last' no
   * coefficient can be non-zero, so the rest of the run is added directly and
   * checked against se (returns -1 from the enclosing function on overflow).
   */
  483. #define ZERO_RUN \
  484. for (; ; i++) { \
  485. if (i > last) { \
  486. i += run; \
  487. if (i > se) { \
  488. av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i); \
  489. return -1; \
  490. } \
  491. break; \
  492. } \
  493. j = s->scantable.permutated[i]; \
  494. if (block[j]) \
  495. REFINE_BIT(j) \
  496. else if (run-- == 0) \
  497. break; \
  498. }
  /**
   * Decode one block of a progressive refinement scan (Ah != 0 in the caller)
   * for the band ss..se.
   *
   * Newly significant coefficients are set to +/- quant_matrix[j] << Al;
   * coefficients that are already non-zero receive one correction bit each.
   * While *EOBRUN is non-zero only the correction bits up to
   * min(se, *last_nnz) are read.
   *
   * @param s            decoder context
   * @param block        coefficient block to update
   * @param last_nnz     in/out: highest coefficient index reached so far
   * @param ac_index     AC table selector, index into s->vlcs[2][]
   * @param quant_matrix quantiser values, indexed like block[]
   * @param ss           first coefficient index of the band
   * @param se           last coefficient index of the band
   * @param Al           left shift applied to the values added
   * @param EOBRUN       in/out: number of following blocks without new
   *                     coefficients
   * @return 0 on success, -1 when a run steps past se
   */
  499. /* decode block and dequantize - progressive JPEG refinement pass */
  500. static int decode_block_refinement(MJpegDecodeContext *s, DCTELEM *block,
  501. uint8_t *last_nnz,
  502. int ac_index, int16_t *quant_matrix,
  503. int ss, int se, int Al, int *EOBRUN)
  504. {
  505. int code, i = ss, j, sign, val, run;
  /* beyond this index no coefficient of the block has been set yet */
  506. int last = FFMIN(se, *last_nnz);
  507. OPEN_READER(re, &s->gb);
  508. if (*EOBRUN) {
  509. (*EOBRUN)--;
  510. } else {
  511. for (; ; i++) {
  512. UPDATE_CACHE(re, &s->gb);
  513. GET_VLC(code, re, &s->gb, s->vlcs[2][ac_index].table, 9, 2);
  /* non-zero low nibble: a new coefficient follows after 'run' zero ones */
  514. if (code & 0xF) {
  515. run = ((unsigned) code) >> 4;
  516. UPDATE_CACHE(re, &s->gb);
  /* one bit selects the sign of the new coefficient */
  517. val = SHOW_UBITS(re, &s->gb, 1);
  518. LAST_SKIP_BITS(re, &s->gb, 1);
  519. ZERO_RUN;
  520. j = s->scantable.permutated[i];
  /* val becomes 0 or -1, so the expression below yields +quant or -quant */
  521. val--;
  522. block[j] = ((quant_matrix[j]^val) - val) << Al;
  523. if (i == se) {
  524. if (i > *last_nnz)
  525. *last_nnz = i;
  526. CLOSE_READER(re, &s->gb);
  527. return 0;
  528. }
  529. } else {
  530. run = ((unsigned) code) >> 4;
  /* run of 15 with no new coefficient: skip zero coefficients only */
  531. if (run == 0xF) {
  532. ZERO_RUN;
  533. } else {
  /* end of band: run length is 2^val plus 'val' extra bits; this block is
   * the first one of the run, hence the "- 1" below */
  534. val = run;
  535. run = (1 << run);
  536. if (val) {
  537. UPDATE_CACHE(re, &s->gb);
  538. run += SHOW_UBITS(re, &s->gb, val);
  539. LAST_SKIP_BITS(re, &s->gb, val);
  540. }
  541. *EOBRUN = run - 1;
  542. break;
  543. }
  544. }
  545. }
  546. if (i > *last_nnz)
  547. *last_nnz = i;
  548. }
  /* refine whatever non-zero coefficients remain in the band */
  549. for (; i <= last; i++) {
  550. j = s->scantable.permutated[i];
  551. if (block[j])
  552. REFINE_BIT(j)
  553. }
  554. CLOSE_READER(re, &s->gb);
  555. return 0;
  556. }
  557. #undef REFINE_BIT
  558. #undef ZERO_RUN
  559. static int ljpeg_decode_rgb_scan(MJpegDecodeContext *s, int predictor,
  560. int point_transform)
  561. {
  562. int i, mb_x, mb_y;
  563. uint16_t (*buffer)[4];
  564. int left[3], top[3], topleft[3];
  565. const int linesize = s->linesize[0];
  566. const int mask = (1 << s->bits) - 1;
  567. av_fast_malloc(&s->ljpeg_buffer, &s->ljpeg_buffer_size,
  568. (unsigned)s->mb_width * 4 * sizeof(s->ljpeg_buffer[0][0]));
  569. buffer = s->ljpeg_buffer;
  570. for (i = 0; i < 3; i++)
  571. buffer[0][i] = 1 << (s->bits + point_transform - 1);
  572. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  573. const int modified_predictor = mb_y ? predictor : 1;
  574. uint8_t *ptr = s->picture_ptr->data[0] + (linesize * mb_y);
  575. if (s->interlaced && s->bottom_field)
  576. ptr += linesize >> 1;
  577. for (i = 0; i < 3; i++)
  578. top[i] = left[i] = topleft[i] = buffer[0][i];
  579. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  580. if (s->restart_interval && !s->restart_count)
  581. s->restart_count = s->restart_interval;
  582. for (i = 0; i < 3; i++) {
  583. int pred;
  584. topleft[i] = top[i];
  585. top[i] = buffer[mb_x][i];
  586. PREDICT(pred, topleft[i], top[i], left[i], modified_predictor);
  587. left[i] = buffer[mb_x][i] =
  588. mask & (pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform));
  589. }
  590. if (s->restart_interval && !--s->restart_count) {
  591. align_get_bits(&s->gb);
  592. skip_bits(&s->gb, 16); /* skip RSTn */
  593. }
  594. }
  595. if (s->rct) {
  596. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  597. ptr[4 * mb_x + 1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2] - 0x200) >> 2);
  598. ptr[4 * mb_x + 0] = buffer[mb_x][1] + ptr[4 * mb_x + 1];
  599. ptr[4 * mb_x + 2] = buffer[mb_x][2] + ptr[4 * mb_x + 1];
  600. }
  601. } else if (s->pegasus_rct) {
  602. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  603. ptr[4 * mb_x + 1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2]) >> 2);
  604. ptr[4 * mb_x + 0] = buffer[mb_x][1] + ptr[4 * mb_x + 1];
  605. ptr[4 * mb_x + 2] = buffer[mb_x][2] + ptr[4 * mb_x + 1];
  606. }
  607. } else {
  608. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  609. ptr[4 * mb_x + 0] = buffer[mb_x][2];
  610. ptr[4 * mb_x + 1] = buffer[mb_x][1];
  611. ptr[4 * mb_x + 2] = buffer[mb_x][0];
  612. }
  613. }
  614. }
  615. return 0;
  616. }
  617. static int ljpeg_decode_yuv_scan(MJpegDecodeContext *s, int predictor,
  618. int point_transform)
  619. {
  620. int i, mb_x, mb_y;
  621. const int nb_components = 3;
  622. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  623. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  624. if (s->restart_interval && !s->restart_count)
  625. s->restart_count = s->restart_interval;
  626. if (mb_x == 0 || mb_y == 0 || s->interlaced) {
  627. for (i = 0; i < nb_components; i++) {
  628. uint8_t *ptr;
  629. int n, h, v, x, y, c, j, linesize;
  630. n = s->nb_blocks[i];
  631. c = s->comp_index[i];
  632. h = s->h_scount[i];
  633. v = s->v_scount[i];
  634. x = 0;
  635. y = 0;
  636. linesize = s->linesize[c];
  637. for (j = 0; j < n; j++) {
  638. int pred;
  639. // FIXME optimize this crap
  640. ptr = s->picture_ptr->data[c] +
  641. (linesize * (v * mb_y + y)) +
  642. (h * mb_x + x);
  643. if (y == 0 && mb_y == 0) {
  644. if (x == 0 && mb_x == 0)
  645. pred = 128 << point_transform;
  646. else
  647. pred = ptr[-1];
  648. } else {
  649. if (x == 0 && mb_x == 0)
  650. pred = ptr[-linesize];
  651. else
  652. PREDICT(pred, ptr[-linesize - 1],
  653. ptr[-linesize], ptr[-1], predictor);
  654. }
  655. if (s->interlaced && s->bottom_field)
  656. ptr += linesize >> 1;
  657. *ptr = pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform);
  658. if (++x == h) {
  659. x = 0;
  660. y++;
  661. }
  662. }
  663. }
  664. } else {
  665. for (i = 0; i < nb_components; i++) {
  666. uint8_t *ptr;
  667. int n, h, v, x, y, c, j, linesize;
  668. n = s->nb_blocks[i];
  669. c = s->comp_index[i];
  670. h = s->h_scount[i];
  671. v = s->v_scount[i];
  672. x = 0;
  673. y = 0;
  674. linesize = s->linesize[c];
  675. for (j = 0; j < n; j++) {
  676. int pred;
  677. // FIXME optimize this crap
  678. ptr = s->picture_ptr->data[c] +
  679. (linesize * (v * mb_y + y)) +
  680. (h * mb_x + x);
  681. PREDICT(pred, ptr[-linesize - 1],
  682. ptr[-linesize], ptr[-1], predictor);
  683. *ptr = pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform);
  684. if (++x == h) {
  685. x = 0;
  686. y++;
  687. }
  688. }
  689. }
  690. }
  691. if (s->restart_interval && !--s->restart_count) {
  692. align_get_bits(&s->gb);
  693. skip_bits(&s->gb, 16); /* skip RSTn */
  694. }
  695. }
  696. }
  697. return 0;
  698. }
  699. static av_always_inline void mjpeg_copy_block(uint8_t *dst, const uint8_t *src,
  700. int linesize, int lowres)
  701. {
  702. switch (lowres) {
  703. case 0: copy_block8(dst, src, linesize, linesize, 8);
  704. break;
  705. case 1: copy_block4(dst, src, linesize, linesize, 4);
  706. break;
  707. case 2: copy_block2(dst, src, linesize, linesize, 2);
  708. break;
  709. case 3: *dst = *src;
  710. break;
  711. }
  712. }
  /**
   * Decode one scan of nb_components interleaved components, MCU by MCU.
   *
   * Sequential streams: every block is either decoded with decode_block() and
   * written to the picture through idct_put(), or - when mb_bitmask is given
   * and the bit for the current MCU is 0 - copied from the reference frame.
   *
   * Progressive streams: only the DC coefficient is handled here. With Ah == 0
   * it is decoded with decode_dc_progressive(); otherwise one refinement bit
   * is read and added to the stored coefficient.
   *
   * @param s             decoder context
   * @param nb_components number of components in the scan
   * @param Ah            non-zero selects the DC refinement path (progressive)
   * @param Al            left shift applied to progressive DC values
   * @param mb_bitmask    optional bitmap with one bit per MCU, read in decoding
   *                      order; a 0 bit marks an MCU to be copied
   * @param reference     frame that copied MCUs are taken from; may be NULL
   *                      when mb_bitmask is NULL
   * @return 0 on success, -1 on bitstream overread or block decoding error
   */
  713. static int mjpeg_decode_scan(MJpegDecodeContext *s, int nb_components, int Ah,
  714. int Al, const uint8_t *mb_bitmask,
  715. const AVFrame *reference)
  716. {
  717. int i, mb_x, mb_y;
  718. uint8_t *data[MAX_COMPONENTS];
  719. const uint8_t *reference_data[MAX_COMPONENTS];
  720. int linesize[MAX_COMPONENTS];
  721. GetBitContext mb_bitmask_gb;
  722. if (mb_bitmask)
  723. init_get_bits(&mb_bitmask_gb, mb_bitmask, s->mb_width * s->mb_height);
  /* flipping is given up in this case rather than failing the scan */
  724. if (s->flipped && s->avctx->flags & CODEC_FLAG_EMU_EDGE) {
  725. av_log(s->avctx, AV_LOG_ERROR,
  726. "Can not flip image with CODEC_FLAG_EMU_EDGE set!\n");
  727. s->flipped = 0;
  728. }
  /* per-component plane pointers and strides, indexed by frame component */
  729. for (i = 0; i < nb_components; i++) {
  730. int c = s->comp_index[i];
  731. data[c] = s->picture_ptr->data[c];
  732. reference_data[c] = reference ? reference->data[c] : NULL;
  733. linesize[c] = s->linesize[c];
  734. s->coefs_finished[c] |= 1;
  735. if (s->flipped) {
  736. // picture should be flipped upside-down for this codec
  /* start at a line near the bottom and walk upwards with a negative stride */
  737. int offset = (linesize[c] * (s->v_scount[i] *
  738. (8 * s->mb_height - ((s->height / s->v_max) & 7)) - 1));
  739. data[c] += offset;
  740. reference_data[c] += offset;
  741. linesize[c] *= -1;
  742. }
  743. }
  744. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  745. for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
  /* one bitmask bit is consumed per MCU; 0 means "copy from reference" */
  746. const int copy_mb = mb_bitmask && !get_bits1(&mb_bitmask_gb);
  747. if (s->restart_interval && !s->restart_count)
  748. s->restart_count = s->restart_interval;
  749. if (get_bits_count(&s->gb)>s->gb.size_in_bits) {
  750. av_log(s->avctx, AV_LOG_ERROR, "overread %d\n",
  751. get_bits_count(&s->gb) - s->gb.size_in_bits);
  752. return -1;
  753. }
  754. for (i = 0; i < nb_components; i++) {
  755. uint8_t *ptr;
  756. int n, h, v, x, y, c, j;
  757. int block_offset;
  758. n = s->nb_blocks[i];
  759. c = s->comp_index[i];
  760. h = s->h_scount[i];
  761. v = s->v_scount[i];
  762. x = 0;
  763. y = 0;
  /* walk the h x v blocks of this component inside the MCU, row by row */
  764. for (j = 0; j < n; j++) {
  765. block_offset = (((linesize[c] * (v * mb_y + y) * 8) +
  766. (h * mb_x + x) * 8) >> s->avctx->lowres);
  767. if (s->interlaced && s->bottom_field)
  768. block_offset += linesize[c] >> 1;
  769. ptr = data[c] + block_offset;
  770. if (!s->progressive) {
  771. if (copy_mb)
  772. mjpeg_copy_block(ptr, reference_data[c] + block_offset,
  773. linesize[c], s->avctx->lowres);
  774. else {
  775. s->dsp.clear_block(s->block);
  776. if (decode_block(s, s->block, i,
  777. s->dc_index[i], s->ac_index[i],
  778. s->quant_matrixes[s->quant_index[c]]) < 0) {
  779. av_log(s->avctx, AV_LOG_ERROR,
  780. "error y=%d x=%d\n", mb_y, mb_x);
  781. return -1;
  782. }
  783. s->dsp.idct_put(ptr, linesize[c], s->block);
  784. }
  785. } else {
  /* progressive: coefficients are kept in s->blocks[] across scans */
  786. int block_idx = s->block_stride[c] * (v * mb_y + y) +
  787. (h * mb_x + x);
  788. DCTELEM *block = s->blocks[c][block_idx];
  789. if (Ah)
  790. block[0] += get_bits1(&s->gb) *
  791. s->quant_matrixes[s->quant_index[c]][0] << Al;
  792. else if (decode_dc_progressive(s, block, i, s->dc_index[i],
  793. s->quant_matrixes[s->quant_index[c]],
  794. Al) < 0) {
  795. av_log(s->avctx, AV_LOG_ERROR,
  796. "error y=%d x=%d\n", mb_y, mb_x);
  797. return -1;
  798. }
  799. }
  800. // av_log(s->avctx, AV_LOG_DEBUG, "mb: %d %d processed\n",
  801. // mb_y, mb_x);
  802. // av_log(NULL, AV_LOG_DEBUG, "%d %d %d %d %d %d %d %d \n",
  803. // mb_x, mb_y, x, y, c, s->bottom_field,
  804. // (v * mb_y + y) * 8, (h * mb_x + x) * 8);
  805. if (++x == h) {
  806. x = 0;
  807. y++;
  808. }
  809. }
  810. }
  811. if (s->restart_interval) {
  812. s->restart_count--;
  /* i = bits up to the next byte boundary plus 8: when they are all ones,
   * the padding is followed by a 0xFF byte and a marker may be present */
  813. i = 8 + ((-get_bits_count(&s->gb)) & 7);
  814. /* skip RSTn */
  815. if (show_bits(&s->gb, i) == (1 << i) - 1) {
  816. int pos = get_bits_count(&s->gb);
  817. align_get_bits(&s->gb);
  818. while (get_bits_left(&s->gb) >= 8 && show_bits(&s->gb, 8) == 0xFF)
  819. skip_bits(&s->gb, 8);
  /* 0xD0..0xD7: restart marker, DC prediction starts over; anything else:
   * rewind to where the probe started */
  820. if ((get_bits(&s->gb, 8) & 0xF8) == 0xD0) {
  821. for (i = 0; i < nb_components; i++) /* reset dc */
  822. s->last_dc[i] = 1024;
  823. } else
  824. skip_bits_long(&s->gb, pos - get_bits_count(&s->gb));
  825. }
  826. }
  827. }
  828. }
  829. return 0;
  830. }
  831. static int mjpeg_decode_scan_progressive_ac(MJpegDecodeContext *s, int ss,
  832. int se, int Ah, int Al,
  833. const uint8_t *mb_bitmask,
  834. const AVFrame *reference)
  835. {
  836. int mb_x, mb_y;
  837. int EOBRUN = 0;
  838. int c = s->comp_index[0];
  839. uint8_t *data = s->picture_ptr->data[c];
  840. const uint8_t *reference_data = reference ? reference->data[c] : NULL;
  841. int linesize = s->linesize[c];
  842. int last_scan = 0;
  843. int16_t *quant_matrix = s->quant_matrixes[s->quant_index[c]];
  844. GetBitContext mb_bitmask_gb;
  845. if (mb_bitmask)
  846. init_get_bits(&mb_bitmask_gb, mb_bitmask, s->mb_width * s->mb_height);
  847. if (!Al) {
  848. s->coefs_finished[c] |= (1LL << (se + 1)) - (1LL << ss);
  849. last_scan = !~s->coefs_finished[c];
  850. }
  851. if (s->interlaced && s->bottom_field) {
  852. int offset = linesize >> 1;
  853. data += offset;
  854. reference_data += offset;
  855. }
  856. for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
  857. int block_offset = (mb_y * linesize * 8 >> s->avctx->lowres);
  858. uint8_t *ptr = data + block_offset;
  859. int block_idx = mb_y * s->block_stride[c];
  860. DCTELEM (*block)[64] = &s->blocks[c][block_idx];
  861. uint8_t *last_nnz = &s->last_nnz[c][block_idx];
  862. for (mb_x = 0; mb_x < s->mb_width; mb_x++, block++, last_nnz++) {
  863. const int copy_mb = mb_bitmask && !get_bits1(&mb_bitmask_gb);
  864. if (!copy_mb) {
  865. int ret;
  866. if (Ah)
  867. ret = decode_block_refinement(s, *block, last_nnz, s->ac_index[0],
  868. quant_matrix, ss, se, Al, &EOBRUN);
  869. else
  870. ret = decode_block_progressive(s, *block, last_nnz, s->ac_index[0],
  871. quant_matrix, ss, se, Al, &EOBRUN);
  872. if (ret < 0) {
  873. av_log(s->avctx, AV_LOG_ERROR,
  874. "error y=%d x=%d\n", mb_y, mb_x);
  875. return -1;
  876. }
  877. }
  878. if (last_scan) {
  879. if (copy_mb) {
  880. mjpeg_copy_block(ptr, reference_data + block_offset,
  881. linesize, s->avctx->lowres);
  882. } else {
  883. s->dsp.idct_put(ptr, linesize, *block);
  884. ptr += 8 >> s->avctx->lowres;
  885. }
  886. }
  887. }
  888. }
  889. return 0;
  890. }
  891. int ff_mjpeg_decode_sos(MJpegDecodeContext *s, const uint8_t *mb_bitmask,
  892. const AVFrame *reference)
  893. {
  894. int len, nb_components, i, h, v, predictor, point_transform;
  895. int index, id;
  896. const int block_size = s->lossless ? 1 : 8;
  897. int ilv, prev_shift;
  898. /* XXX: verify len field validity */
  899. len = get_bits(&s->gb, 16);
  900. nb_components = get_bits(&s->gb, 8);
  901. if (nb_components == 0 || nb_components > MAX_COMPONENTS) {
  902. av_log(s->avctx, AV_LOG_ERROR,
  903. "decode_sos: nb_components (%d) unsupported\n", nb_components);
  904. return -1;
  905. }
  906. if (len != 6 + 2 * nb_components) {
  907. av_log(s->avctx, AV_LOG_ERROR, "decode_sos: invalid len (%d)\n", len);
  908. return -1;
  909. }
  910. for (i = 0; i < nb_components; i++) {
  911. id = get_bits(&s->gb, 8) - 1;
  912. av_log(s->avctx, AV_LOG_DEBUG, "component: %d\n", id);
  913. /* find component index */
  914. for (index = 0; index < s->nb_components; index++)
  915. if (id == s->component_id[index])
  916. break;
  917. if (index == s->nb_components) {
  918. av_log(s->avctx, AV_LOG_ERROR,
  919. "decode_sos: index(%d) out of components\n", index);
  920. return -1;
  921. }
  922. /* Metasoft MJPEG codec has Cb and Cr swapped */
  923. if (s->avctx->codec_tag == MKTAG('M', 'T', 'S', 'J')
  924. && nb_components == 3 && s->nb_components == 3 && i)
  925. index = 3 - i;
  926. s->comp_index[i] = index;
  927. s->nb_blocks[i] = s->h_count[index] * s->v_count[index];
  928. s->h_scount[i] = s->h_count[index];
  929. s->v_scount[i] = s->v_count[index];
  930. s->dc_index[i] = get_bits(&s->gb, 4);
  931. s->ac_index[i] = get_bits(&s->gb, 4);
  932. if (s->dc_index[i] < 0 || s->ac_index[i] < 0 ||
  933. s->dc_index[i] >= 4 || s->ac_index[i] >= 4)
  934. goto out_of_range;
  935. if (!s->vlcs[0][s->dc_index[i]].table ||
  936. !s->vlcs[1][s->ac_index[i]].table)
  937. goto out_of_range;
  938. }
  939. predictor = get_bits(&s->gb, 8); /* JPEG Ss / lossless JPEG predictor /JPEG-LS NEAR */
  940. ilv = get_bits(&s->gb, 8); /* JPEG Se / JPEG-LS ILV */
  941. prev_shift = get_bits(&s->gb, 4); /* Ah */
  942. point_transform = get_bits(&s->gb, 4); /* Al */
  943. for (i = 0; i < nb_components; i++)
  944. s->last_dc[i] = 1024;
  945. if (nb_components > 1) {
  946. /* interleaved stream */
  947. s->mb_width = (s->width + s->h_max * block_size - 1) / (s->h_max * block_size);
  948. s->mb_height = (s->height + s->v_max * block_size - 1) / (s->v_max * block_size);
  949. } else if (!s->ls) { /* skip this for JPEG-LS */
  950. h = s->h_max / s->h_scount[0];
  951. v = s->v_max / s->v_scount[0];
  952. s->mb_width = (s->width + h * block_size - 1) / (h * block_size);
  953. s->mb_height = (s->height + v * block_size - 1) / (v * block_size);
  954. s->nb_blocks[0] = 1;
  955. s->h_scount[0] = 1;
  956. s->v_scount[0] = 1;
  957. }
  958. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  959. av_log(s->avctx, AV_LOG_DEBUG, "%s %s p:%d >>:%d ilv:%d bits:%d %s\n",
  960. s->lossless ? "lossless" : "sequential DCT", s->rgb ? "RGB" : "",
  961. predictor, point_transform, ilv, s->bits,
  962. s->pegasus_rct ? "PRCT" : (s->rct ? "RCT" : ""));
  963. /* mjpeg-b can have padding bytes between sos and image data, skip them */
  964. for (i = s->mjpb_skiptosod; i > 0; i--)
  965. skip_bits(&s->gb, 8);
  966. if (s->lossless) {
  967. if (CONFIG_JPEGLS_DECODER && s->ls) {
  968. // for () {
  969. // reset_ls_coding_parameters(s, 0);
  970. if (ff_jpegls_decode_picture(s, predictor, point_transform, ilv) < 0)
  971. return -1;
  972. } else {
  973. if (s->rgb) {
  974. if (ljpeg_decode_rgb_scan(s, predictor, point_transform) < 0)
  975. return -1;
  976. } else {
  977. if (ljpeg_decode_yuv_scan(s, predictor, point_transform) < 0)
  978. return -1;
  979. }
  980. }
  981. } else {
  982. if (s->progressive && predictor) {
  983. if (mjpeg_decode_scan_progressive_ac(s, predictor, ilv, prev_shift,
  984. point_transform,
  985. mb_bitmask, reference) < 0)
  986. return -1;
  987. } else {
  988. if (mjpeg_decode_scan(s, nb_components, prev_shift, point_transform,
  989. mb_bitmask, reference) < 0)
  990. return -1;
  991. }
  992. }
  993. emms_c();
  994. return 0;
  995. out_of_range:
  996. av_log(s->avctx, AV_LOG_ERROR, "decode_sos: ac/dc index out of range\n");
  997. return -1;
  998. }
  999. static int mjpeg_decode_dri(MJpegDecodeContext *s)
  1000. {
  1001. if (get_bits(&s->gb, 16) != 4)
  1002. return -1;
  1003. s->restart_interval = get_bits(&s->gb, 16);
  1004. s->restart_count = 0;
  1005. av_log(s->avctx, AV_LOG_DEBUG, "restart interval: %d\n",
  1006. s->restart_interval);
  1007. return 0;
  1008. }
  1009. static int mjpeg_decode_app(MJpegDecodeContext *s)
  1010. {
  1011. int len, id, i;
  1012. len = get_bits(&s->gb, 16);
  1013. if (len < 5)
  1014. return -1;
  1015. if (8 * len + get_bits_count(&s->gb) > s->gb.size_in_bits)
  1016. return -1;
  1017. id = get_bits_long(&s->gb, 32);
  1018. id = av_be2ne32(id);
  1019. len -= 6;
  1020. if (s->avctx->debug & FF_DEBUG_STARTCODE)
  1021. av_log(s->avctx, AV_LOG_DEBUG, "APPx %8X\n", id);
  1022. /* Buggy AVID, it puts EOI only at every 10th frame. */
  1023. /* Also, this fourcc is used by non-avid files too, it holds some
  1024. information, but it's always present in AVID-created files. */
  1025. if (id == AV_RL32("AVI1")) {
  1026. /* structure:
  1027. 4bytes AVI1
  1028. 1bytes polarity
  1029. 1bytes always zero
  1030. 4bytes field_size
  1031. 4bytes field_size_less_padding
  1032. */
  1033. s->buggy_avid = 1;
  1034. // if (s->first_picture)
  1035. // printf("mjpeg: workarounding buggy AVID\n");
  1036. i = get_bits(&s->gb, 8);
  1037. if (i == 2)
  1038. s->bottom_field = 1;
  1039. else if (i == 1)
  1040. s->bottom_field = 0;
  1041. #if 0
  1042. skip_bits(&s->gb, 8);
  1043. skip_bits(&s->gb, 32);
  1044. skip_bits(&s->gb, 32);
  1045. len -= 10;
  1046. #endif
  1047. // if (s->interlace_polarity)
  1048. // printf("mjpeg: interlace polarity: %d\n", s->interlace_polarity);
  1049. goto out;
  1050. }
  1051. // len -= 2;
  1052. if (id == AV_RL32("JFIF")) {
  1053. int t_w, t_h, v1, v2;
  1054. skip_bits(&s->gb, 8); /* the trailing zero-byte */
  1055. v1 = get_bits(&s->gb, 8);
  1056. v2 = get_bits(&s->gb, 8);
  1057. skip_bits(&s->gb, 8);
  1058. s->avctx->sample_aspect_ratio.num = get_bits(&s->gb, 16);
  1059. s->avctx->sample_aspect_ratio.den = get_bits(&s->gb, 16);
  1060. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1061. av_log(s->avctx, AV_LOG_INFO,
  1062. "mjpeg: JFIF header found (version: %x.%x) SAR=%d/%d\n",
  1063. v1, v2,
  1064. s->avctx->sample_aspect_ratio.num,
  1065. s->avctx->sample_aspect_ratio.den);
  1066. t_w = get_bits(&s->gb, 8);
  1067. t_h = get_bits(&s->gb, 8);
  1068. if (t_w && t_h) {
  1069. /* skip thumbnail */
  1070. if (len -10 - (t_w * t_h * 3) > 0)
  1071. len -= t_w * t_h * 3;
  1072. }
  1073. len -= 10;
  1074. goto out;
  1075. }
  1076. if (id == AV_RL32("Adob") && (get_bits(&s->gb, 8) == 'e')) {
  1077. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1078. av_log(s->avctx, AV_LOG_INFO, "mjpeg: Adobe header found\n");
  1079. skip_bits(&s->gb, 16); /* version */
  1080. skip_bits(&s->gb, 16); /* flags0 */
  1081. skip_bits(&s->gb, 16); /* flags1 */
  1082. skip_bits(&s->gb, 8); /* transform */
  1083. len -= 7;
  1084. goto out;
  1085. }
  1086. if (id == AV_RL32("LJIF")) {
  1087. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1088. av_log(s->avctx, AV_LOG_INFO,
  1089. "Pegasus lossless jpeg header found\n");
  1090. skip_bits(&s->gb, 16); /* version ? */
  1091. skip_bits(&s->gb, 16); /* unknwon always 0? */
  1092. skip_bits(&s->gb, 16); /* unknwon always 0? */
  1093. skip_bits(&s->gb, 16); /* unknwon always 0? */
  1094. switch (get_bits(&s->gb, 8)) {
  1095. case 1:
  1096. s->rgb = 1;
  1097. s->pegasus_rct = 0;
  1098. break;
  1099. case 2:
  1100. s->rgb = 1;
  1101. s->pegasus_rct = 1;
  1102. break;
  1103. default:
  1104. av_log(s->avctx, AV_LOG_ERROR, "unknown colorspace\n");
  1105. }
  1106. len -= 9;
  1107. goto out;
  1108. }
  1109. /* Apple MJPEG-A */
  1110. if ((s->start_code == APP1) && (len > (0x28 - 8))) {
  1111. id = get_bits_long(&s->gb, 32);
  1112. id = av_be2ne32(id);
  1113. len -= 4;
  1114. /* Apple MJPEG-A */
  1115. if (id == AV_RL32("mjpg")) {
  1116. #if 0
  1117. skip_bits(&s->gb, 32); /* field size */
  1118. skip_bits(&s->gb, 32); /* pad field size */
  1119. skip_bits(&s->gb, 32); /* next off */
  1120. skip_bits(&s->gb, 32); /* quant off */
  1121. skip_bits(&s->gb, 32); /* huff off */
  1122. skip_bits(&s->gb, 32); /* image off */
  1123. skip_bits(&s->gb, 32); /* scan off */
  1124. skip_bits(&s->gb, 32); /* data off */
  1125. #endif
  1126. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1127. av_log(s->avctx, AV_LOG_INFO, "mjpeg: Apple MJPEG-A header found\n");
  1128. }
  1129. }
  1130. out:
  1131. /* slow but needed for extreme adobe jpegs */
  1132. if (len < 0)
  1133. av_log(s->avctx, AV_LOG_ERROR,
  1134. "mjpeg: error, decode_app parser read over the end\n");
  1135. while (--len > 0)
  1136. skip_bits(&s->gb, 8);
  1137. return 0;
  1138. }
  1139. static int mjpeg_decode_com(MJpegDecodeContext *s)
  1140. {
  1141. int len = get_bits(&s->gb, 16);
  1142. if (len >= 2 &&
  1143. 8 * len - 16 + get_bits_count(&s->gb) <= s->gb.size_in_bits) {
  1144. char *cbuf = av_malloc(len - 1);
  1145. if (cbuf) {
  1146. int i;
  1147. for (i = 0; i < len - 2; i++)
  1148. cbuf[i] = get_bits(&s->gb, 8);
  1149. if (i > 0 && cbuf[i - 1] == '\n')
  1150. cbuf[i - 1] = 0;
  1151. else
  1152. cbuf[i] = 0;
  1153. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1154. av_log(s->avctx, AV_LOG_INFO, "mjpeg comment: '%s'\n", cbuf);
  1155. /* buggy avid, it puts EOI only at every 10th frame */
  1156. if (!strcmp(cbuf, "AVID")) {
  1157. s->buggy_avid = 1;
  1158. // if (s->first_picture)
  1159. // printf("mjpeg: workarounding buggy AVID\n");
  1160. } else if (!strcmp(cbuf, "CS=ITU601"))
  1161. s->cs_itu601 = 1;
  1162. else if ((len > 20 && !strncmp(cbuf, "Intel(R) JPEG Library", 21)) ||
  1163. (len > 19 && !strncmp(cbuf, "Metasoft MJPEG Codec", 20)))
  1164. s->flipped = 1;
  1165. av_free(cbuf);
  1166. }
  1167. }
  1168. return 0;
  1169. }
  /**
   * Scan forward for the next JPEG marker.
   *
   * A marker is a 0xff byte immediately followed by a byte in 0xc0..0xfe.
   *
   * @param pbuf_ptr in: position to start scanning from; out: position just
   *                 past the marker's second byte, or buf_end if none found
   * @param buf_end  one past the last readable byte
   * @return the 8 bit start code value (second marker byte), or -1 if no start
   *         code was found
   */
  static int find_marker(const uint8_t **pbuf_ptr, const uint8_t *buf_end)
  {
      const uint8_t *buf_ptr;
      unsigned int v, v2;
      int val;
  #ifdef DEBUG
      int skipped = 0;
  #endif

      buf_ptr = *pbuf_ptr;
      while (buf_ptr < buf_end) {
          v = *buf_ptr++;
          /* only look at the following byte when it is still inside the
           * buffer; dereferencing buf_end would be an out-of-bounds read */
          if (v == 0xff && buf_ptr < buf_end) {
              v2 = *buf_ptr;
              if (v2 >= 0xc0 && v2 <= 0xfe) {
                  val = *buf_ptr++;
                  goto found;
              }
          }
  #ifdef DEBUG
          skipped++;
  #endif
      }
      val = -1;
  found:
  #ifdef DEBUG
      /* the counter only exists in DEBUG builds, so keep its user with it */
      av_dlog(NULL, "find_marker skipped %d bytes\n", skipped);
  #endif
      *pbuf_ptr = buf_ptr;
      return val;
  }
  1198. int ff_mjpeg_find_marker(MJpegDecodeContext *s,
  1199. const uint8_t **buf_ptr, const uint8_t *buf_end,
  1200. const uint8_t **unescaped_buf_ptr,
  1201. int *unescaped_buf_size)
  1202. {
  1203. int start_code;
  1204. start_code = find_marker(buf_ptr, buf_end);
  1205. av_fast_padded_malloc(&s->buffer, &s->buffer_size, buf_end - *buf_ptr);
  1206. if (!s->buffer)
  1207. return AVERROR(ENOMEM);
  1208. /* unescape buffer of SOS, use special treatment for JPEG-LS */
  1209. if (start_code == SOS && !s->ls) {
  1210. const uint8_t *src = *buf_ptr;
  1211. uint8_t *dst = s->buffer;
  1212. while (src < buf_end) {
  1213. uint8_t x = *(src++);
  1214. *(dst++) = x;
  1215. if (s->avctx->codec_id != CODEC_ID_THP) {
  1216. if (x == 0xff) {
  1217. while (src < buf_end && x == 0xff)
  1218. x = *(src++);
  1219. if (x >= 0xd0 && x <= 0xd7)
  1220. *(dst++) = x;
  1221. else if (x)
  1222. break;
  1223. }
  1224. }
  1225. }
  1226. *unescaped_buf_ptr = s->buffer;
  1227. *unescaped_buf_size = dst - s->buffer;
  1228. av_log(s->avctx, AV_LOG_DEBUG, "escaping removed %td bytes\n",
  1229. (buf_end - *buf_ptr) - (dst - s->buffer));
  1230. } else if (start_code == SOS && s->ls) {
  1231. const uint8_t *src = *buf_ptr;
  1232. uint8_t *dst = s->buffer;
  1233. int bit_count = 0;
  1234. int t = 0, b = 0;
  1235. PutBitContext pb;
  1236. s->cur_scan++;
  1237. /* find marker */
  1238. while (src + t < buf_end) {
  1239. uint8_t x = src[t++];
  1240. if (x == 0xff) {
  1241. while ((src + t < buf_end) && x == 0xff)
  1242. x = src[t++];
  1243. if (x & 0x80) {
  1244. t -= 2;
  1245. break;
  1246. }
  1247. }
  1248. }
  1249. bit_count = t * 8;
  1250. init_put_bits(&pb, dst, t);
  1251. /* unescape bitstream */
  1252. while (b < t) {
  1253. uint8_t x = src[b++];
  1254. put_bits(&pb, 8, x);
  1255. if (x == 0xFF) {
  1256. x = src[b++];
  1257. put_bits(&pb, 7, x);
  1258. bit_count--;
  1259. }
  1260. }
  1261. flush_put_bits(&pb);
  1262. *unescaped_buf_ptr = dst;
  1263. *unescaped_buf_size = (bit_count + 7) >> 3;
  1264. } else {
  1265. *unescaped_buf_ptr = *buf_ptr;
  1266. *unescaped_buf_size = buf_end - *buf_ptr;
  1267. }
  1268. return start_code;
  1269. }
  1270. int ff_mjpeg_decode_frame(AVCodecContext *avctx, void *data, int *data_size,
  1271. AVPacket *avpkt)
  1272. {
  1273. const uint8_t *buf = avpkt->data;
  1274. int buf_size = avpkt->size;
  1275. MJpegDecodeContext *s = avctx->priv_data;
  1276. const uint8_t *buf_end, *buf_ptr;
  1277. const uint8_t *unescaped_buf_ptr;
  1278. int unescaped_buf_size;
  1279. int start_code;
  1280. AVFrame *picture = data;
  1281. s->got_picture = 0; // picture from previous image can not be reused
  1282. buf_ptr = buf;
  1283. buf_end = buf + buf_size;
  1284. while (buf_ptr < buf_end) {
  1285. /* find start next marker */
  1286. start_code = ff_mjpeg_find_marker(s, &buf_ptr, buf_end,
  1287. &unescaped_buf_ptr,
  1288. &unescaped_buf_size);
  1289. /* EOF */
  1290. if (start_code < 0) {
  1291. goto the_end;
  1292. } else {
  1293. av_log(avctx, AV_LOG_DEBUG, "marker=%x avail_size_in_buf=%td\n",
  1294. start_code, buf_end - buf_ptr);
  1295. init_get_bits(&s->gb, unescaped_buf_ptr, unescaped_buf_size * 8);
  1296. s->start_code = start_code;
  1297. if (s->avctx->debug & FF_DEBUG_STARTCODE)
  1298. av_log(avctx, AV_LOG_DEBUG, "startcode: %X\n", start_code);
  1299. /* process markers */
  1300. if (start_code >= 0xd0 && start_code <= 0xd7)
  1301. av_log(avctx, AV_LOG_DEBUG,
  1302. "restart marker: %d\n", start_code & 0x0f);
  1303. /* APP fields */
  1304. else if (start_code >= APP0 && start_code <= APP15)
  1305. mjpeg_decode_app(s);
  1306. /* Comment */
  1307. else if (start_code == COM)
  1308. mjpeg_decode_com(s);
  1309. switch (start_code) {
  1310. case SOI:
  1311. s->restart_interval = 0;
  1312. s->restart_count = 0;
  1313. /* nothing to do on SOI */
  1314. break;
  1315. case DQT:
  1316. ff_mjpeg_decode_dqt(s);
  1317. break;
  1318. case DHT:
  1319. if (ff_mjpeg_decode_dht(s) < 0) {
  1320. av_log(avctx, AV_LOG_ERROR, "huffman table decode error\n");
  1321. return -1;
  1322. }
  1323. break;
  1324. case SOF0:
  1325. case SOF1:
  1326. s->lossless = 0;
  1327. s->ls = 0;
  1328. s->progressive = 0;
  1329. if (ff_mjpeg_decode_sof(s) < 0)
  1330. return -1;
  1331. break;
  1332. case SOF2:
  1333. s->lossless = 0;
  1334. s->ls = 0;
  1335. s->progressive = 1;
  1336. if (ff_mjpeg_decode_sof(s) < 0)
  1337. return -1;
  1338. break;
  1339. case SOF3:
  1340. s->lossless = 1;
  1341. s->ls = 0;
  1342. s->progressive = 0;
  1343. if (ff_mjpeg_decode_sof(s) < 0)
  1344. return -1;
  1345. break;
  1346. case SOF48:
  1347. s->lossless = 1;
  1348. s->ls = 1;
  1349. s->progressive = 0;
  1350. if (ff_mjpeg_decode_sof(s) < 0)
  1351. return -1;
  1352. break;
  1353. case LSE:
  1354. if (!CONFIG_JPEGLS_DECODER || ff_jpegls_decode_lse(s) < 0)
  1355. return -1;
  1356. break;
  1357. case EOI:
  1358. s->cur_scan = 0;
  1359. if ((s->buggy_avid && !s->interlaced) || s->restart_interval)
  1360. break;
  1361. eoi_parser:
  1362. if (!s->got_picture) {
  1363. av_log(avctx, AV_LOG_WARNING,
  1364. "Found EOI before any SOF, ignoring\n");
  1365. break;
  1366. }
  1367. if (s->interlaced) {
  1368. s->bottom_field ^= 1;
  1369. /* if not bottom field, do not output image yet */
  1370. if (s->bottom_field == !s->interlace_polarity)
  1371. goto not_the_end;
  1372. }
  1373. *picture = *s->picture_ptr;
  1374. *data_size = sizeof(AVFrame);
  1375. if (!s->lossless) {
  1376. picture->quality = FFMAX3(s->qscale[0],
  1377. s->qscale[1],
  1378. s->qscale[2]);
  1379. picture->qstride = 0;
  1380. picture->qscale_table = s->qscale_table;
  1381. memset(picture->qscale_table, picture->quality,
  1382. (s->width + 15) / 16);
  1383. if (avctx->debug & FF_DEBUG_QP)
  1384. av_log(avctx, AV_LOG_DEBUG,
  1385. "QP: %d\n", picture->quality);
  1386. picture->quality *= FF_QP2LAMBDA;
  1387. }
  1388. goto the_end;
  1389. case SOS:
  1390. if (!s->got_picture) {
  1391. av_log(avctx, AV_LOG_WARNING,
  1392. "Can not process SOS before SOF, skipping\n");
  1393. break;
  1394. }
  1395. if (ff_mjpeg_decode_sos(s, NULL, NULL) < 0 &&
  1396. (avctx->err_recognition & AV_EF_EXPLODE))
  1397. return AVERROR_INVALIDDATA;
  1398. /* buggy avid puts EOI every 10-20th frame */
  1399. /* if restart period is over process EOI */
  1400. if ((s->buggy_avid && !s->interlaced) || s->restart_interval)
  1401. goto eoi_parser;
  1402. break;
  1403. case DRI:
  1404. mjpeg_decode_dri(s);
  1405. break;
  1406. case SOF5:
  1407. case SOF6:
  1408. case SOF7:
  1409. case SOF9:
  1410. case SOF10:
  1411. case SOF11:
  1412. case SOF13:
  1413. case SOF14:
  1414. case SOF15:
  1415. case JPG:
  1416. av_log(avctx, AV_LOG_ERROR,
  1417. "mjpeg: unsupported coding type (%x)\n", start_code);
  1418. break;
  1419. // default:
  1420. // printf("mjpeg: unsupported marker (%x)\n", start_code);
  1421. // break;
  1422. }
  1423. not_the_end:
  1424. /* eof process start code */
  1425. buf_ptr += (get_bits_count(&s->gb) + 7) / 8;
  1426. av_log(avctx, AV_LOG_DEBUG,
  1427. "marker parser used %d bytes (%d bits)\n",
  1428. (get_bits_count(&s->gb) + 7) / 8, get_bits_count(&s->gb));
  1429. }
  1430. }
  1431. if (s->got_picture) {
  1432. av_log(avctx, AV_LOG_WARNING, "EOI missing, emulating\n");
  1433. goto eoi_parser;
  1434. }
  1435. av_log(avctx, AV_LOG_FATAL, "No JPEG data found in image\n");
  1436. return -1;
  1437. the_end:
  1438. av_log(avctx, AV_LOG_DEBUG, "mjpeg decode frame unused %td bytes\n",
  1439. buf_end - buf_ptr);
  1440. // return buf_end - buf_ptr;
  1441. return buf_ptr - buf;
  1442. }
  1443. av_cold int ff_mjpeg_decode_end(AVCodecContext *avctx)
  1444. {
  1445. MJpegDecodeContext *s = avctx->priv_data;
  1446. int i, j;
  1447. if (s->picture_ptr && s->picture_ptr->data[0])
  1448. avctx->release_buffer(avctx, s->picture_ptr);
  1449. av_free(s->buffer);
  1450. av_free(s->qscale_table);
  1451. av_freep(&s->ljpeg_buffer);
  1452. s->ljpeg_buffer_size = 0;
  1453. for (i = 0; i < 3; i++) {
  1454. for (j = 0; j < 4; j++)
  1455. ff_free_vlc(&s->vlcs[i][j]);
  1456. }
  1457. for (i = 0; i < MAX_COMPONENTS; i++) {
  1458. av_freep(&s->blocks[i]);
  1459. av_freep(&s->last_nnz[i]);
  1460. }
  1461. return 0;
  1462. }
  1463. #define OFFSET(x) offsetof(MJpegDecodeContext, x)
  1464. #define VD AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_DECODING_PARAM
  1465. static const AVOption options[] = {
  1466. { "extern_huff", "Use external huffman table.",
  1467. OFFSET(extern_huff), AV_OPT_TYPE_INT, { 0 }, 0, 1, VD },
  1468. { NULL },
  1469. };
  1470. static const AVClass mjpegdec_class = {
  1471. .class_name = "MJPEG decoder",
  1472. .item_name = av_default_item_name,
  1473. .option = options,
  1474. .version = LIBAVUTIL_VERSION_INT,
  1475. };
  1476. AVCodec ff_mjpeg_decoder = {
  1477. .name = "mjpeg",
  1478. .type = AVMEDIA_TYPE_VIDEO,
  1479. .id = CODEC_ID_MJPEG,
  1480. .priv_data_size = sizeof(MJpegDecodeContext),
  1481. .init = ff_mjpeg_decode_init,
  1482. .close = ff_mjpeg_decode_end,
  1483. .decode = ff_mjpeg_decode_frame,
  1484. .capabilities = CODEC_CAP_DR1,
  1485. .max_lowres = 3,
  1486. .long_name = NULL_IF_CONFIG_SMALL("MJPEG (Motion JPEG)"),
  1487. .priv_class = &mjpegdec_class,
  1488. };
  1489. AVCodec ff_thp_decoder = {
  1490. .name = "thp",
  1491. .type = AVMEDIA_TYPE_VIDEO,
  1492. .id = CODEC_ID_THP,
  1493. .priv_data_size = sizeof(MJpegDecodeContext),
  1494. .init = ff_mjpeg_decode_init,
  1495. .close = ff_mjpeg_decode_end,
  1496. .decode = ff_mjpeg_decode_frame,
  1497. .capabilities = CODEC_CAP_DR1,
  1498. .max_lowres = 3,
  1499. .long_name = NULL_IF_CONFIG_SMALL("Nintendo Gamecube THP video"),
  1500. };