You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1651 lines
55KB

  1. /*
  2. * MJPEG decoder
  3. * Copyright (c) 2000, 2001 Fabrice Bellard
  4. * Copyright (c) 2003 Alex Beregszaszi
  5. * Copyright (c) 2003-2004 Michael Niedermayer
  6. *
  7. * Support for external huffman table, various fixes (AVID workaround),
  8. * aspecting, new decode_frame mechanism and apple mjpeg-b support
  9. * by Alex Beregszaszi
  10. *
  11. * This file is part of FFmpeg.
  12. *
  13. * FFmpeg is free software; you can redistribute it and/or
  14. * modify it under the terms of the GNU Lesser General Public
  15. * License as published by the Free Software Foundation; either
  16. * version 2.1 of the License, or (at your option) any later version.
  17. *
  18. * FFmpeg is distributed in the hope that it will be useful,
  19. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  20. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  21. * Lesser General Public License for more details.
  22. *
  23. * You should have received a copy of the GNU Lesser General Public
  24. * License along with FFmpeg; if not, write to the Free Software
  25. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  26. */
  27. /**
  28. * @file
  29. * MJPEG decoder.
  30. */
  31. //#define DEBUG
  32. #include <assert.h>
  33. #include "libavutil/imgutils.h"
  34. #include "libavutil/avassert.h"
  35. #include "libavutil/opt.h"
  36. #include "avcodec.h"
  37. #include "dsputil.h"
  38. #include "mjpeg.h"
  39. #include "mjpegdec.h"
  40. #include "jpeglsdec.h"
  41. static int build_vlc(VLC *vlc, const uint8_t *bits_table, const uint8_t *val_table,
  42. int nb_codes, int use_static, int is_ac)
  43. {
  44. uint8_t huff_size[256];
  45. uint16_t huff_code[256];
  46. uint16_t huff_sym[256];
  47. int i;
  48. assert(nb_codes <= 256);
  49. memset(huff_size, 0, sizeof(huff_size));
  50. ff_mjpeg_build_huffman_codes(huff_size, huff_code, bits_table, val_table);
  51. for(i=0; i<256; i++)
  52. huff_sym[i]= i + 16*is_ac;
  53. if(is_ac) huff_sym[0]= 16*256;
  54. return init_vlc_sparse(vlc, 9, nb_codes, huff_size, 1, 1, huff_code, 2, 2, huff_sym, 2, 2, use_static);
  55. }
  56. static void build_basic_mjpeg_vlc(MJpegDecodeContext * s) {
  57. build_vlc(&s->vlcs[0][0], ff_mjpeg_bits_dc_luminance,
  58. ff_mjpeg_val_dc, 12, 0, 0);
  59. build_vlc(&s->vlcs[0][1], ff_mjpeg_bits_dc_chrominance,
  60. ff_mjpeg_val_dc, 12, 0, 0);
  61. build_vlc(&s->vlcs[1][0], ff_mjpeg_bits_ac_luminance,
  62. ff_mjpeg_val_ac_luminance, 251, 0, 1);
  63. build_vlc(&s->vlcs[1][1], ff_mjpeg_bits_ac_chrominance,
  64. ff_mjpeg_val_ac_chrominance, 251, 0, 1);
  65. build_vlc(&s->vlcs[2][0], ff_mjpeg_bits_ac_luminance,
  66. ff_mjpeg_val_ac_luminance, 251, 0, 0);
  67. build_vlc(&s->vlcs[2][1], ff_mjpeg_bits_ac_chrominance,
  68. ff_mjpeg_val_ac_chrominance, 251, 0, 0);
  69. }
  70. av_cold int ff_mjpeg_decode_init(AVCodecContext *avctx)
  71. {
  72. MJpegDecodeContext *s = avctx->priv_data;
  73. if (!s->picture_ptr)
  74. s->picture_ptr = &s->picture;
  75. avcodec_get_frame_defaults(&s->picture);
  76. s->avctx = avctx;
  77. dsputil_init(&s->dsp, avctx);
  78. ff_init_scantable(s->dsp.idct_permutation, &s->scantable, ff_zigzag_direct);
  79. s->buffer_size = 0;
  80. s->buffer = NULL;
  81. s->start_code = -1;
  82. s->first_picture = 1;
  83. s->org_height = avctx->coded_height;
  84. avctx->chroma_sample_location = AVCHROMA_LOC_CENTER;
  85. build_basic_mjpeg_vlc(s);
  86. #if FF_API_MJPEG_GLOBAL_OPTS
  87. if (avctx->flags & CODEC_FLAG_EXTERN_HUFF)
  88. s->extern_huff = 1;
  89. #endif
  90. if (s->extern_huff)
  91. {
  92. av_log(avctx, AV_LOG_INFO, "mjpeg: using external huffman table\n");
  93. init_get_bits(&s->gb, avctx->extradata, avctx->extradata_size*8);
  94. if (ff_mjpeg_decode_dht(s)) {
  95. av_log(avctx, AV_LOG_ERROR, "mjpeg: error using external huffman table, switching back to internal\n");
  96. build_basic_mjpeg_vlc(s);
  97. }
  98. }
  99. if (avctx->field_order == AV_FIELD_BB) { /* quicktime icefloe 019 */
  100. s->interlace_polarity = 1; /* bottom field first */
  101. av_log(avctx, AV_LOG_DEBUG, "mjpeg bottom field first\n");
  102. }
  103. if (avctx->codec->id == CODEC_ID_AMV)
  104. s->flipped = 1;
  105. return 0;
  106. }
  107. /* quantize tables */
  108. int ff_mjpeg_decode_dqt(MJpegDecodeContext *s)
  109. {
  110. int len, index, i, j;
  111. len = get_bits(&s->gb, 16) - 2;
  112. while (len >= 65) {
  113. /* only 8 bit precision handled */
  114. if (get_bits(&s->gb, 4) != 0)
  115. {
  116. av_log(s->avctx, AV_LOG_ERROR, "dqt: 16bit precision\n");
  117. return -1;
  118. }
  119. index = get_bits(&s->gb, 4);
  120. if (index >= 4)
  121. return -1;
  122. av_log(s->avctx, AV_LOG_DEBUG, "index=%d\n", index);
  123. /* read quant table */
  124. for(i=0;i<64;i++) {
  125. j = s->scantable.permutated[i];
  126. s->quant_matrixes[index][j] = get_bits(&s->gb, 8);
  127. }
  128. //XXX FIXME finetune, and perhaps add dc too
  129. s->qscale[index]= FFMAX(
  130. s->quant_matrixes[index][s->scantable.permutated[1]],
  131. s->quant_matrixes[index][s->scantable.permutated[8]]) >> 1;
  132. av_log(s->avctx, AV_LOG_DEBUG, "qscale[%d]: %d\n", index, s->qscale[index]);
  133. len -= 65;
  134. }
  135. return 0;
  136. }
  137. /* decode huffman tables and build VLC decoders */
  138. int ff_mjpeg_decode_dht(MJpegDecodeContext *s)
  139. {
  140. int len, index, i, class, n, v, code_max;
  141. uint8_t bits_table[17];
  142. uint8_t val_table[256];
  143. len = get_bits(&s->gb, 16) - 2;
  144. while (len > 0) {
  145. if (len < 17)
  146. return -1;
  147. class = get_bits(&s->gb, 4);
  148. if (class >= 2)
  149. return -1;
  150. index = get_bits(&s->gb, 4);
  151. if (index >= 4)
  152. return -1;
  153. n = 0;
  154. for(i=1;i<=16;i++) {
  155. bits_table[i] = get_bits(&s->gb, 8);
  156. n += bits_table[i];
  157. }
  158. len -= 17;
  159. if (len < n || n > 256)
  160. return -1;
  161. code_max = 0;
  162. for(i=0;i<n;i++) {
  163. v = get_bits(&s->gb, 8);
  164. if (v > code_max)
  165. code_max = v;
  166. val_table[i] = v;
  167. }
  168. len -= n;
  169. /* build VLC and flush previous vlc if present */
  170. free_vlc(&s->vlcs[class][index]);
  171. av_log(s->avctx, AV_LOG_DEBUG, "class=%d index=%d nb_codes=%d\n",
  172. class, index, code_max + 1);
  173. if(build_vlc(&s->vlcs[class][index], bits_table, val_table, code_max + 1, 0, class > 0) < 0){
  174. return -1;
  175. }
  176. if(class>0){
  177. free_vlc(&s->vlcs[2][index]);
  178. if(build_vlc(&s->vlcs[2][index], bits_table, val_table, code_max + 1, 0, 0) < 0){
  179. return -1;
  180. }
  181. }
  182. }
  183. return 0;
  184. }
  185. int ff_mjpeg_decode_sof(MJpegDecodeContext *s)
  186. {
  187. int len, nb_components, i, width, height, pix_fmt_id;
  188. s->cur_scan = 0;
  189. /* XXX: verify len field validity */
  190. len = get_bits(&s->gb, 16);
  191. s->bits= get_bits(&s->gb, 8);
  192. if(s->pegasus_rct) s->bits=9;
  193. if(s->bits==9 && !s->pegasus_rct) s->rct=1; //FIXME ugly
  194. if (s->bits != 8 && !s->lossless){
  195. av_log(s->avctx, AV_LOG_ERROR, "only 8 bits/component accepted\n");
  196. return -1;
  197. }
  198. if(s->lossless && s->avctx->lowres){
  199. av_log(s->avctx, AV_LOG_ERROR, "lowres is not possible with lossless jpeg\n");
  200. return -1;
  201. }
  202. height = get_bits(&s->gb, 16);
  203. width = get_bits(&s->gb, 16);
  204. //HACK for odd_height.mov
  205. if(s->interlaced && s->width == width && s->height == height + 1)
  206. height= s->height;
  207. av_log(s->avctx, AV_LOG_DEBUG, "sof0: picture: %dx%d\n", width, height);
  208. if(av_image_check_size(width, height, 0, s->avctx))
  209. return -1;
  210. nb_components = get_bits(&s->gb, 8);
  211. if (nb_components <= 0 ||
  212. nb_components > MAX_COMPONENTS)
  213. return -1;
  214. if (s->ls && !(s->bits <= 8 || nb_components == 1)){
  215. av_log(s->avctx, AV_LOG_ERROR, "only <= 8 bits/component or 16-bit gray accepted for JPEG-LS\n");
  216. return -1;
  217. }
  218. s->nb_components = nb_components;
  219. s->h_max = 1;
  220. s->v_max = 1;
  221. for(i=0;i<nb_components;i++) {
  222. /* component id */
  223. s->component_id[i] = get_bits(&s->gb, 8) - 1;
  224. s->h_count[i] = get_bits(&s->gb, 4);
  225. s->v_count[i] = get_bits(&s->gb, 4);
  226. /* compute hmax and vmax (only used in interleaved case) */
  227. if (s->h_count[i] > s->h_max)
  228. s->h_max = s->h_count[i];
  229. if (s->v_count[i] > s->v_max)
  230. s->v_max = s->v_count[i];
  231. s->quant_index[i] = get_bits(&s->gb, 8);
  232. if (s->quant_index[i] >= 4)
  233. return -1;
  234. av_log(s->avctx, AV_LOG_DEBUG, "component %d %d:%d id: %d quant:%d\n", i, s->h_count[i],
  235. s->v_count[i], s->component_id[i], s->quant_index[i]);
  236. }
  237. if(s->ls && (s->h_max > 1 || s->v_max > 1)) {
  238. av_log(s->avctx, AV_LOG_ERROR, "Subsampling in JPEG-LS is not supported.\n");
  239. return -1;
  240. }
  241. if(s->v_max==1 && s->h_max==1 && s->lossless==1) s->rgb=1;
  242. /* if different size, realloc/alloc picture */
  243. /* XXX: also check h_count and v_count */
  244. if (width != s->width || height != s->height) {
  245. av_freep(&s->qscale_table);
  246. s->width = width;
  247. s->height = height;
  248. s->interlaced = 0;
  249. /* test interlaced mode */
  250. if (s->first_picture &&
  251. s->org_height != 0 &&
  252. s->height < ((s->org_height * 3) / 4)) {
  253. s->interlaced = 1;
  254. s->bottom_field = s->interlace_polarity;
  255. s->picture_ptr->interlaced_frame = 1;
  256. s->picture_ptr->top_field_first = !s->interlace_polarity;
  257. height *= 2;
  258. }
  259. avcodec_set_dimensions(s->avctx, width, height);
  260. s->qscale_table= av_mallocz((s->width+15)/16);
  261. s->first_picture = 0;
  262. }
  263. if(s->interlaced && (s->bottom_field == !s->interlace_polarity))
  264. return 0;
  265. /* XXX: not complete test ! */
  266. pix_fmt_id = (s->h_count[0] << 28) | (s->v_count[0] << 24) |
  267. (s->h_count[1] << 20) | (s->v_count[1] << 16) |
  268. (s->h_count[2] << 12) | (s->v_count[2] << 8) |
  269. (s->h_count[3] << 4) | s->v_count[3];
  270. av_log(s->avctx, AV_LOG_DEBUG, "pix fmt id %x\n", pix_fmt_id);
  271. //NOTE we do not allocate pictures large enough for the possible padding of h/v_count being 4
  272. if(!(pix_fmt_id & 0xD0D0D0D0))
  273. pix_fmt_id-= (pix_fmt_id & 0xF0F0F0F0)>>1;
  274. if(!(pix_fmt_id & 0x0D0D0D0D))
  275. pix_fmt_id-= (pix_fmt_id & 0x0F0F0F0F)>>1;
  276. switch(pix_fmt_id){
  277. case 0x11111100:
  278. if(s->rgb){
  279. s->avctx->pix_fmt = PIX_FMT_BGR24;
  280. }else{
  281. if(s->component_id[0] == 'Q' && s->component_id[1] == 'F' && s->component_id[2] == 'A'){
  282. s->avctx->pix_fmt = PIX_FMT_GBR24P;
  283. }else{
  284. s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV444P : PIX_FMT_YUVJ444P;
  285. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  286. }
  287. }
  288. assert(s->nb_components==3);
  289. break;
  290. case 0x11000000:
  291. s->avctx->pix_fmt = PIX_FMT_GRAY8;
  292. break;
  293. case 0x12111100:
  294. s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV440P : PIX_FMT_YUVJ440P;
  295. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  296. break;
  297. case 0x21111100:
  298. s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV422P : PIX_FMT_YUVJ422P;
  299. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  300. break;
  301. case 0x22111100:
  302. s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV420P : PIX_FMT_YUVJ420P;
  303. s->avctx->color_range = s->cs_itu601 ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
  304. break;
  305. default:
  306. av_log(s->avctx, AV_LOG_ERROR, "Unhandled pixel format 0x%x\n", pix_fmt_id);
  307. return -1;
  308. }
  309. if(s->ls){
  310. if(s->nb_components > 1)
  311. s->avctx->pix_fmt = PIX_FMT_RGB24;
  312. else if(s->bits <= 8)
  313. s->avctx->pix_fmt = PIX_FMT_GRAY8;
  314. else
  315. s->avctx->pix_fmt = PIX_FMT_GRAY16;
  316. }
  317. if(s->picture_ptr->data[0])
  318. s->avctx->release_buffer(s->avctx, s->picture_ptr);
  319. if(s->avctx->get_buffer(s->avctx, s->picture_ptr) < 0){
  320. av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed\n");
  321. return -1;
  322. }
  323. s->picture_ptr->pict_type= AV_PICTURE_TYPE_I;
  324. s->picture_ptr->key_frame= 1;
  325. s->got_picture = 1;
  326. for(i=0; i<3; i++){
  327. s->linesize[i]= s->picture_ptr->linesize[i] << s->interlaced;
  328. }
  329. // printf("%d %d %d %d %d %d\n", s->width, s->height, s->linesize[0], s->linesize[1], s->interlaced, s->avctx->height);
  330. if (len != (8+(3*nb_components)))
  331. {
  332. av_log(s->avctx, AV_LOG_DEBUG, "decode_sof0: error, len(%d) mismatch\n", len);
  333. }
  334. /* totally blank picture as progressive JPEG will only add details to it */
  335. if(s->progressive){
  336. int bw = (width + s->h_max*8-1) / (s->h_max*8);
  337. int bh = (height + s->v_max*8-1) / (s->v_max*8);
  338. for(i=0; i<s->nb_components; i++) {
  339. int size = bw * bh * s->h_count[i] * s->v_count[i];
  340. av_freep(&s->blocks[i]);
  341. av_freep(&s->last_nnz[i]);
  342. s->blocks[i] = av_malloc(size * sizeof(**s->blocks));
  343. s->last_nnz[i] = av_mallocz(size * sizeof(**s->last_nnz));
  344. s->block_stride[i] = bw * s->h_count[i];
  345. }
  346. memset(s->coefs_finished, 0, sizeof(s->coefs_finished));
  347. }
  348. return 0;
  349. }
  350. static inline int mjpeg_decode_dc(MJpegDecodeContext *s, int dc_index)
  351. {
  352. int code;
  353. code = get_vlc2(&s->gb, s->vlcs[0][dc_index].table, 9, 2);
  354. if (code < 0)
  355. {
  356. av_log(s->avctx, AV_LOG_WARNING, "mjpeg_decode_dc: bad vlc: %d:%d (%p)\n", 0, dc_index,
  357. &s->vlcs[0][dc_index]);
  358. return 0xffff;
  359. }
  360. if(code)
  361. return get_xbits(&s->gb, code);
  362. else
  363. return 0;
  364. }
  365. /* decode block and dequantize */
  366. static int decode_block(MJpegDecodeContext *s, DCTELEM *block,
  367. int component, int dc_index, int ac_index, int16_t *quant_matrix)
  368. {
  369. int code, i, j, level, val;
  370. /* DC coef */
  371. val = mjpeg_decode_dc(s, dc_index);
  372. if (val == 0xffff) {
  373. av_log(s->avctx, AV_LOG_ERROR, "error dc\n");
  374. return -1;
  375. }
  376. val = val * quant_matrix[0] + s->last_dc[component];
  377. s->last_dc[component] = val;
  378. block[0] = val;
  379. /* AC coefs */
  380. i = 0;
  381. {OPEN_READER(re, &s->gb);
  382. do {
  383. UPDATE_CACHE(re, &s->gb);
  384. GET_VLC(code, re, &s->gb, s->vlcs[1][ac_index].table, 9, 2);
  385. i += ((unsigned)code) >> 4;
  386. code &= 0xf;
  387. if(code){
  388. if(code > MIN_CACHE_BITS - 16){
  389. UPDATE_CACHE(re, &s->gb);
  390. }
  391. {
  392. int cache=GET_CACHE(re,&s->gb);
  393. int sign=(~cache)>>31;
  394. level = (NEG_USR32(sign ^ cache,code) ^ sign) - sign;
  395. }
  396. LAST_SKIP_BITS(re, &s->gb, code);
  397. if (i > 63) {
  398. av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);
  399. return -1;
  400. }
  401. j = s->scantable.permutated[i];
  402. block[j] = level * quant_matrix[j];
  403. }
  404. }while(i<63);
  405. CLOSE_READER(re, &s->gb);}
  406. return 0;
  407. }
  408. static int decode_dc_progressive(MJpegDecodeContext *s, DCTELEM *block, int component,
  409. int dc_index, int16_t *quant_matrix, int Al)
  410. {
  411. int val;
  412. s->dsp.clear_block(block);
  413. val = mjpeg_decode_dc(s, dc_index);
  414. if (val == 0xffff) {
  415. av_log(s->avctx, AV_LOG_ERROR, "error dc\n");
  416. return -1;
  417. }
  418. val = (val * quant_matrix[0] << Al) + s->last_dc[component];
  419. s->last_dc[component] = val;
  420. block[0] = val;
  421. return 0;
  422. }
  423. /* decode block and dequantize - progressive JPEG version */
  424. static int decode_block_progressive(MJpegDecodeContext *s, DCTELEM *block, uint8_t *last_nnz,
  425. int ac_index, int16_t *quant_matrix,
  426. int ss, int se, int Al, int *EOBRUN)
  427. {
  428. int code, i, j, level, val, run;
  429. if(*EOBRUN){
  430. (*EOBRUN)--;
  431. return 0;
  432. }
  433. {OPEN_READER(re, &s->gb);
  434. for(i=ss;;i++) {
  435. UPDATE_CACHE(re, &s->gb);
  436. GET_VLC(code, re, &s->gb, s->vlcs[2][ac_index].table, 9, 2);
  437. run = ((unsigned) code) >> 4;
  438. code &= 0xF;
  439. if(code) {
  440. i += run;
  441. if(code > MIN_CACHE_BITS - 16){
  442. UPDATE_CACHE(re, &s->gb);
  443. }
  444. {
  445. int cache=GET_CACHE(re,&s->gb);
  446. int sign=(~cache)>>31;
  447. level = (NEG_USR32(sign ^ cache,code) ^ sign) - sign;
  448. }
  449. LAST_SKIP_BITS(re, &s->gb, code);
  450. if (i >= se) {
  451. if(i == se){
  452. j = s->scantable.permutated[se];
  453. block[j] = level * quant_matrix[j] << Al;
  454. break;
  455. }
  456. av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);
  457. return -1;
  458. }
  459. j = s->scantable.permutated[i];
  460. block[j] = level * quant_matrix[j] << Al;
  461. }else{
  462. if(run == 0xF){// ZRL - skip 15 coefficients
  463. i += 15;
  464. if (i >= se) {
  465. av_log(s->avctx, AV_LOG_ERROR, "ZRL overflow: %d\n", i);
  466. return -1;
  467. }
  468. }else{
  469. val = (1 << run);
  470. if(run){
  471. UPDATE_CACHE(re, &s->gb);
  472. val += NEG_USR32(GET_CACHE(re, &s->gb), run);
  473. LAST_SKIP_BITS(re, &s->gb, run);
  474. }
  475. *EOBRUN = val - 1;
  476. break;
  477. }
  478. }
  479. }
  480. CLOSE_READER(re, &s->gb);}
  481. if(i > *last_nnz)
  482. *last_nnz = i;
  483. return 0;
  484. }
  485. #define REFINE_BIT(j) {\
  486. UPDATE_CACHE(re, &s->gb);\
  487. sign = block[j]>>15;\
  488. block[j] += SHOW_UBITS(re, &s->gb, 1) * ((quant_matrix[j]^sign)-sign) << Al;\
  489. LAST_SKIP_BITS(re, &s->gb, 1);\
  490. }
  491. #define ZERO_RUN \
  492. for(;;i++) {\
  493. if(i > last) {\
  494. i += run;\
  495. if(i > se) {\
  496. av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);\
  497. return -1;\
  498. }\
  499. break;\
  500. }\
  501. j = s->scantable.permutated[i];\
  502. if(block[j])\
  503. REFINE_BIT(j)\
  504. else if(run-- == 0)\
  505. break;\
  506. }
  507. /* decode block and dequantize - progressive JPEG refinement pass */
  508. static int decode_block_refinement(MJpegDecodeContext *s, DCTELEM *block, uint8_t *last_nnz,
  509. int ac_index, int16_t *quant_matrix,
  510. int ss, int se, int Al, int *EOBRUN)
  511. {
  512. int code, i=ss, j, sign, val, run;
  513. int last = FFMIN(se, *last_nnz);
  514. OPEN_READER(re, &s->gb);
  515. if(*EOBRUN)
  516. (*EOBRUN)--;
  517. else {
  518. for(;;i++) {
  519. UPDATE_CACHE(re, &s->gb);
  520. GET_VLC(code, re, &s->gb, s->vlcs[2][ac_index].table, 9, 2);
  521. if(code & 0xF) {
  522. run = ((unsigned) code) >> 4;
  523. UPDATE_CACHE(re, &s->gb);
  524. val = SHOW_UBITS(re, &s->gb, 1);
  525. LAST_SKIP_BITS(re, &s->gb, 1);
  526. ZERO_RUN;
  527. j = s->scantable.permutated[i];
  528. val--;
  529. block[j] = ((quant_matrix[j]^val)-val) << Al;
  530. if(i == se) {
  531. if(i > *last_nnz)
  532. *last_nnz = i;
  533. CLOSE_READER(re, &s->gb);
  534. return 0;
  535. }
  536. }else{
  537. run = ((unsigned) code) >> 4;
  538. if(run == 0xF){
  539. ZERO_RUN;
  540. }else{
  541. val = run;
  542. run = (1 << run);
  543. if(val) {
  544. UPDATE_CACHE(re, &s->gb);
  545. run += SHOW_UBITS(re, &s->gb, val);
  546. LAST_SKIP_BITS(re, &s->gb, val);
  547. }
  548. *EOBRUN = run - 1;
  549. break;
  550. }
  551. }
  552. }
  553. if(i > *last_nnz)
  554. *last_nnz = i;
  555. }
  556. for(;i<=last;i++) {
  557. j = s->scantable.permutated[i];
  558. if(block[j])
  559. REFINE_BIT(j)
  560. }
  561. CLOSE_READER(re, &s->gb);
  562. return 0;
  563. }
  564. #undef REFINE_BIT
  565. #undef ZERO_RUN
  566. static int ljpeg_decode_rgb_scan(MJpegDecodeContext *s, int predictor, int point_transform){
  567. int i, mb_x, mb_y;
  568. uint16_t (*buffer)[4];
  569. int left[3], top[3], topleft[3];
  570. const int linesize= s->linesize[0];
  571. const int mask= (1<<s->bits)-1;
  572. av_fast_malloc(&s->ljpeg_buffer, &s->ljpeg_buffer_size, (unsigned)s->mb_width * 4 * sizeof(s->ljpeg_buffer[0][0]));
  573. buffer= s->ljpeg_buffer;
  574. for(i=0; i<3; i++){
  575. buffer[0][i]= 1 << (s->bits + point_transform - 1);
  576. }
  577. for(mb_y = 0; mb_y < s->mb_height; mb_y++) {
  578. const int modified_predictor= mb_y ? predictor : 1;
  579. uint8_t *ptr = s->picture.data[0] + (linesize * mb_y);
  580. if (s->interlaced && s->bottom_field)
  581. ptr += linesize >> 1;
  582. for(i=0; i<3; i++){
  583. top[i]= left[i]= topleft[i]= buffer[0][i];
  584. }
  585. for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
  586. if (s->restart_interval && !s->restart_count)
  587. s->restart_count = s->restart_interval;
  588. for(i=0;i<3;i++) {
  589. int pred, dc;
  590. topleft[i]= top[i];
  591. top[i]= buffer[mb_x][i];
  592. PREDICT(pred, topleft[i], top[i], left[i], modified_predictor);
  593. dc = mjpeg_decode_dc(s, s->dc_index[i]);
  594. if(dc == 0xFFFF)
  595. return -1;
  596. left[i]=
  597. buffer[mb_x][i]= mask & (pred + (dc << point_transform));
  598. }
  599. if (s->restart_interval && !--s->restart_count) {
  600. align_get_bits(&s->gb);
  601. skip_bits(&s->gb, 16); /* skip RSTn */
  602. }
  603. }
  604. if(s->rct){
  605. for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
  606. ptr[3*mb_x+1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2] - 0x200)>>2);
  607. ptr[3*mb_x+0] = buffer[mb_x][1] + ptr[3*mb_x+1];
  608. ptr[3*mb_x+2] = buffer[mb_x][2] + ptr[3*mb_x+1];
  609. }
  610. }else if(s->pegasus_rct){
  611. for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
  612. ptr[3*mb_x+1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2])>>2);
  613. ptr[3*mb_x+0] = buffer[mb_x][1] + ptr[3*mb_x+1];
  614. ptr[3*mb_x+2] = buffer[mb_x][2] + ptr[3*mb_x+1];
  615. }
  616. }else{
  617. for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
  618. ptr[3*mb_x+0] = buffer[mb_x][2];
  619. ptr[3*mb_x+1] = buffer[mb_x][1];
  620. ptr[3*mb_x+2] = buffer[mb_x][0];
  621. }
  622. }
  623. }
  624. return 0;
  625. }
  626. static int ljpeg_decode_yuv_scan(MJpegDecodeContext *s, int predictor, int point_transform){
  627. int i, mb_x, mb_y;
  628. const int nb_components=3;
  629. for(mb_y = 0; mb_y < s->mb_height; mb_y++) {
  630. for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
  631. if (s->restart_interval && !s->restart_count)
  632. s->restart_count = s->restart_interval;
  633. if(mb_x==0 || mb_y==0 || s->interlaced){
  634. for(i=0;i<nb_components;i++) {
  635. uint8_t *ptr;
  636. int n, h, v, x, y, c, j, linesize;
  637. n = s->nb_blocks[i];
  638. c = s->comp_index[i];
  639. h = s->h_scount[i];
  640. v = s->v_scount[i];
  641. x = 0;
  642. y = 0;
  643. linesize= s->linesize[c];
  644. for(j=0; j<n; j++) {
  645. int pred, dc;
  646. ptr = s->picture.data[c] + (linesize * (v * mb_y + y)) + (h * mb_x + x); //FIXME optimize this crap
  647. if(y==0 && mb_y==0){
  648. if(x==0 && mb_x==0){
  649. pred= 128 << point_transform;
  650. }else{
  651. pred= ptr[-1];
  652. }
  653. }else{
  654. if(x==0 && mb_x==0){
  655. pred= ptr[-linesize];
  656. }else{
  657. PREDICT(pred, ptr[-linesize-1], ptr[-linesize], ptr[-1], predictor);
  658. }
  659. }
  660. if (s->interlaced && s->bottom_field)
  661. ptr += linesize >> 1;
  662. dc = mjpeg_decode_dc(s, s->dc_index[i]);
  663. if(dc == 0xFFFF)
  664. return -1;
  665. *ptr= pred + (dc << point_transform);
  666. if (++x == h) {
  667. x = 0;
  668. y++;
  669. }
  670. }
  671. }
  672. }else{
  673. for(i=0;i<nb_components;i++) {
  674. uint8_t *ptr;
  675. int n, h, v, x, y, c, j, linesize, dc;
  676. n = s->nb_blocks[i];
  677. c = s->comp_index[i];
  678. h = s->h_scount[i];
  679. v = s->v_scount[i];
  680. x = 0;
  681. y = 0;
  682. linesize= s->linesize[c];
  683. for(j=0; j<n; j++) {
  684. int pred;
  685. ptr = s->picture.data[c] + (linesize * (v * mb_y + y)) + (h * mb_x + x); //FIXME optimize this crap
  686. PREDICT(pred, ptr[-linesize-1], ptr[-linesize], ptr[-1], predictor);
  687. dc = mjpeg_decode_dc(s, s->dc_index[i]);
  688. if(dc == 0xFFFF)
  689. return -1;
  690. *ptr= pred + (dc << point_transform);
  691. if (++x == h) {
  692. x = 0;
  693. y++;
  694. }
  695. }
  696. }
  697. }
  698. if (s->restart_interval && !--s->restart_count) {
  699. align_get_bits(&s->gb);
  700. skip_bits(&s->gb, 16); /* skip RSTn */
  701. }
  702. }
  703. }
  704. return 0;
  705. }
  706. static av_always_inline void mjpeg_copy_block(uint8_t *dst, const uint8_t *src,
  707. int linesize, int lowres)
  708. {
  709. switch (lowres) {
  710. case 0: copy_block8(dst, src, linesize, linesize, 8);
  711. break;
  712. case 1: copy_block4(dst, src, linesize, linesize, 4);
  713. break;
  714. case 2: copy_block2(dst, src, linesize, linesize, 2);
  715. break;
  716. case 3: *dst = *src;
  717. break;
  718. }
  719. }
  720. static int mjpeg_decode_scan(MJpegDecodeContext *s, int nb_components, int Ah, int Al,
  721. const uint8_t *mb_bitmask, const AVFrame *reference){
  722. int i, mb_x, mb_y;
  723. uint8_t* data[MAX_COMPONENTS];
  724. const uint8_t *reference_data[MAX_COMPONENTS];
  725. int linesize[MAX_COMPONENTS];
  726. GetBitContext mb_bitmask_gb;
  727. if (mb_bitmask) {
  728. init_get_bits(&mb_bitmask_gb, mb_bitmask, s->mb_width*s->mb_height);
  729. }
  730. if(s->flipped && s->avctx->flags & CODEC_FLAG_EMU_EDGE) {
  731. av_log(s->avctx, AV_LOG_ERROR, "Can not flip image with CODEC_FLAG_EMU_EDGE set!\n");
  732. s->flipped = 0;
  733. }
  734. for(i=0; i < nb_components; i++) {
  735. int c = s->comp_index[i];
  736. data[c] = s->picture_ptr->data[c];
  737. reference_data[c] = reference ? reference->data[c] : NULL;
  738. linesize[c]=s->linesize[c];
  739. s->coefs_finished[c] |= 1;
  740. if(s->flipped) {
  741. //picture should be flipped upside-down for this codec
  742. int offset = (linesize[c] * (s->v_scount[i] * (8 * s->mb_height -((s->height/s->v_max)&7)) - 1 ));
  743. data[c] += offset;
  744. reference_data[c] += offset;
  745. linesize[c] *= -1;
  746. }
  747. }
  748. for(mb_y = 0; mb_y < s->mb_height; mb_y++) {
  749. for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
  750. const int copy_mb = mb_bitmask && !get_bits1(&mb_bitmask_gb);
  751. if (s->restart_interval && !s->restart_count)
  752. s->restart_count = s->restart_interval;
  753. if(get_bits_count(&s->gb)>s->gb.size_in_bits){
  754. av_log(s->avctx, AV_LOG_ERROR, "overread %d\n", get_bits_count(&s->gb) - s->gb.size_in_bits);
  755. return -1;
  756. }
  757. for(i=0;i<nb_components;i++) {
  758. uint8_t *ptr;
  759. int n, h, v, x, y, c, j;
  760. int block_offset;
  761. n = s->nb_blocks[i];
  762. c = s->comp_index[i];
  763. h = s->h_scount[i];
  764. v = s->v_scount[i];
  765. x = 0;
  766. y = 0;
  767. for(j=0;j<n;j++) {
  768. block_offset = (((linesize[c] * (v * mb_y + y) * 8) +
  769. (h * mb_x + x) * 8) >> s->avctx->lowres);
  770. if(s->interlaced && s->bottom_field)
  771. block_offset += linesize[c] >> 1;
  772. ptr = data[c] + block_offset;
  773. if(!s->progressive) {
  774. if (copy_mb) {
  775. mjpeg_copy_block(ptr, reference_data[c] + block_offset, linesize[c], s->avctx->lowres);
  776. } else {
  777. s->dsp.clear_block(s->block);
  778. if(decode_block(s, s->block, i,
  779. s->dc_index[i], s->ac_index[i],
  780. s->quant_matrixes[ s->quant_index[c] ]) < 0) {
  781. av_log(s->avctx, AV_LOG_ERROR, "error y=%d x=%d\n", mb_y, mb_x);
  782. return -1;
  783. }
  784. s->dsp.idct_put(ptr, linesize[c], s->block);
  785. }
  786. } else {
  787. int block_idx = s->block_stride[c] * (v * mb_y + y) + (h * mb_x + x);
  788. DCTELEM *block = s->blocks[c][block_idx];
  789. if(Ah)
  790. block[0] += get_bits1(&s->gb) * s->quant_matrixes[ s->quant_index[c] ][0] << Al;
  791. else if(decode_dc_progressive(s, block, i, s->dc_index[i], s->quant_matrixes[ s->quant_index[c] ], Al) < 0) {
  792. av_log(s->avctx, AV_LOG_ERROR, "error y=%d x=%d\n", mb_y, mb_x);
  793. return -1;
  794. }
  795. }
  796. // av_log(s->avctx, AV_LOG_DEBUG, "mb: %d %d processed\n", mb_y, mb_x);
  797. //av_log(NULL, AV_LOG_DEBUG, "%d %d %d %d %d %d %d %d \n", mb_x, mb_y, x, y, c, s->bottom_field, (v * mb_y + y) * 8, (h * mb_x + x) * 8);
  798. if (++x == h) {
  799. x = 0;
  800. y++;
  801. }
  802. }
  803. }
  804. if (s->restart_interval) --s->restart_count;
  805. i= 8+((-get_bits_count(&s->gb))&7);
  806. if (s->restart_interval && show_bits(&s->gb, i) == (1<<i)-1){ /* skip RSTn */
  807. int pos= get_bits_count(&s->gb);
  808. align_get_bits(&s->gb);
  809. while(get_bits_count(&s->gb) < s->gb.size_in_bits && show_bits(&s->gb, 8) == 0xFF)
  810. skip_bits(&s->gb, 8);
  811. if(get_bits_count(&s->gb) < s->gb.size_in_bits && (get_bits(&s->gb, 8)&0xF8) == 0xD0){
  812. for (i=0; i<nb_components; i++) /* reset dc */
  813. s->last_dc[i] = 1024;
  814. }else{
  815. skip_bits_long(&s->gb, pos - get_bits_count(&s->gb));
  816. }
  817. }
  818. }
  819. }
  820. return 0;
  821. }
  822. static int mjpeg_decode_scan_progressive_ac(MJpegDecodeContext *s, int ss, int se, int Ah, int Al){
  823. int mb_x, mb_y;
  824. int EOBRUN = 0;
  825. int c = s->comp_index[0];
  826. uint8_t* data = s->picture.data[c];
  827. int linesize = s->linesize[c];
  828. int last_scan = 0;
  829. int16_t *quant_matrix = s->quant_matrixes[ s->quant_index[c] ];
  830. if(!Al) {
  831. s->coefs_finished[c] |= (1LL<<(se+1))-(1LL<<ss);
  832. last_scan = !~s->coefs_finished[c];
  833. }
  834. if(s->interlaced && s->bottom_field)
  835. data += linesize >> 1;
  836. for(mb_y = 0; mb_y < s->mb_height; mb_y++) {
  837. uint8_t *ptr = data + (mb_y*linesize*8 >> s->avctx->lowres);
  838. int block_idx = mb_y * s->block_stride[c];
  839. DCTELEM (*block)[64] = &s->blocks[c][block_idx];
  840. uint8_t *last_nnz = &s->last_nnz[c][block_idx];
  841. for(mb_x = 0; mb_x < s->mb_width; mb_x++, block++, last_nnz++) {
  842. int ret;
  843. if(Ah)
  844. ret = decode_block_refinement(s, *block, last_nnz, s->ac_index[0],
  845. quant_matrix, ss, se, Al, &EOBRUN);
  846. else
  847. ret = decode_block_progressive(s, *block, last_nnz, s->ac_index[0],
  848. quant_matrix, ss, se, Al, &EOBRUN);
  849. if(ret < 0) {
  850. av_log(s->avctx, AV_LOG_ERROR, "error y=%d x=%d\n", mb_y, mb_x);
  851. return -1;
  852. }
  853. if(last_scan) {
  854. s->dsp.idct_put(ptr, linesize, *block);
  855. ptr += 8 >> s->avctx->lowres;
  856. }
  857. }
  858. }
  859. return 0;
  860. }
  861. int ff_mjpeg_decode_sos(MJpegDecodeContext *s,
  862. const uint8_t *mb_bitmask, const AVFrame *reference)
  863. {
  864. int len, nb_components, i, h, v, predictor, point_transform;
  865. int index, id;
  866. const int block_size= s->lossless ? 1 : 8;
  867. int ilv, prev_shift;
  868. /* XXX: verify len field validity */
  869. len = get_bits(&s->gb, 16);
  870. nb_components = get_bits(&s->gb, 8);
  871. if (nb_components == 0 || nb_components > MAX_COMPONENTS){
  872. av_log(s->avctx, AV_LOG_ERROR, "decode_sos: nb_components (%d) unsupported\n", nb_components);
  873. return -1;
  874. }
  875. if (len != 6+2*nb_components)
  876. {
  877. av_log(s->avctx, AV_LOG_ERROR, "decode_sos: invalid len (%d)\n", len);
  878. return -1;
  879. }
  880. for(i=0;i<nb_components;i++) {
  881. id = get_bits(&s->gb, 8) - 1;
  882. av_log(s->avctx, AV_LOG_DEBUG, "component: %d\n", id);
  883. /* find component index */
  884. for(index=0;index<s->nb_components;index++)
  885. if (id == s->component_id[index])
  886. break;
  887. if (index == s->nb_components)
  888. {
  889. av_log(s->avctx, AV_LOG_ERROR, "decode_sos: index(%d) out of components\n", index);
  890. return -1;
  891. }
  892. /* Metasoft MJPEG codec has Cb and Cr swapped */
  893. if (s->avctx->codec_tag == MKTAG('M', 'T', 'S', 'J')
  894. && nb_components == 3 && s->nb_components == 3 && i)
  895. index = 3 - i;
  896. if(nb_components == 3 && s->nb_components == 3 && s->avctx->pix_fmt == PIX_FMT_GBR24P)
  897. index = (i+2)%3;
  898. s->comp_index[i] = index;
  899. s->nb_blocks[i] = s->h_count[index] * s->v_count[index];
  900. s->h_scount[i] = s->h_count[index];
  901. s->v_scount[i] = s->v_count[index];
  902. s->dc_index[i] = get_bits(&s->gb, 4);
  903. s->ac_index[i] = get_bits(&s->gb, 4);
  904. if (s->dc_index[i] < 0 || s->ac_index[i] < 0 ||
  905. s->dc_index[i] >= 4 || s->ac_index[i] >= 4)
  906. goto out_of_range;
  907. if (!s->vlcs[0][s->dc_index[i]].table || !s->vlcs[1][s->ac_index[i]].table)
  908. goto out_of_range;
  909. }
  910. predictor= get_bits(&s->gb, 8); /* JPEG Ss / lossless JPEG predictor /JPEG-LS NEAR */
  911. ilv= get_bits(&s->gb, 8); /* JPEG Se / JPEG-LS ILV */
  912. if(s->avctx->codec_tag != AV_RL32("CJPG")){
  913. prev_shift = get_bits(&s->gb, 4); /* Ah */
  914. point_transform= get_bits(&s->gb, 4); /* Al */
  915. }else
  916. prev_shift= point_transform= 0;
  917. for(i=0;i<nb_components;i++)
  918. s->last_dc[i] = 1024;
  919. if (nb_components > 1) {
  920. /* interleaved stream */
  921. s->mb_width = (s->width + s->h_max * block_size - 1) / (s->h_max * block_size);
  922. s->mb_height = (s->height + s->v_max * block_size - 1) / (s->v_max * block_size);
  923. } else if(!s->ls) { /* skip this for JPEG-LS */
  924. h = s->h_max / s->h_scount[0];
  925. v = s->v_max / s->v_scount[0];
  926. s->mb_width = (s->width + h * block_size - 1) / (h * block_size);
  927. s->mb_height = (s->height + v * block_size - 1) / (v * block_size);
  928. s->nb_blocks[0] = 1;
  929. s->h_scount[0] = 1;
  930. s->v_scount[0] = 1;
  931. }
  932. if(s->avctx->debug & FF_DEBUG_PICT_INFO)
  933. av_log(s->avctx, AV_LOG_DEBUG, "%s %s p:%d >>:%d ilv:%d bits:%d skip:%d %s comp:%d\n", s->lossless ? "lossless" : "sequential DCT", s->rgb ? "RGB" : "",
  934. predictor, point_transform, ilv, s->bits, s->mjpb_skiptosod,
  935. s->pegasus_rct ? "PRCT" : (s->rct ? "RCT" : ""), nb_components);
  936. /* mjpeg-b can have padding bytes between sos and image data, skip them */
  937. for (i = s->mjpb_skiptosod; i > 0; i--)
  938. skip_bits(&s->gb, 8);
  939. if(s->lossless){
  940. av_assert0(s->picture_ptr == &s->picture);
  941. if(CONFIG_JPEGLS_DECODER && s->ls){
  942. // for(){
  943. // reset_ls_coding_parameters(s, 0);
  944. if(ff_jpegls_decode_picture(s, predictor, point_transform, ilv) < 0)
  945. return -1;
  946. }else{
  947. if(s->rgb){
  948. if(ljpeg_decode_rgb_scan(s, predictor, point_transform) < 0)
  949. return -1;
  950. }else{
  951. if(ljpeg_decode_yuv_scan(s, predictor, point_transform) < 0)
  952. return -1;
  953. }
  954. }
  955. }else{
  956. if(s->progressive && predictor) {
  957. av_assert0(s->picture_ptr == &s->picture);
  958. if(mjpeg_decode_scan_progressive_ac(s, predictor, ilv, prev_shift, point_transform) < 0)
  959. return -1;
  960. } else {
  961. if(mjpeg_decode_scan(s, nb_components, prev_shift, point_transform,
  962. mb_bitmask, reference) < 0)
  963. return -1;
  964. }
  965. }
  966. emms_c();
  967. return 0;
  968. out_of_range:
  969. av_log(s->avctx, AV_LOG_ERROR, "decode_sos: ac/dc index out of range\n");
  970. return -1;
  971. }
  972. static int mjpeg_decode_dri(MJpegDecodeContext *s)
  973. {
  974. if (get_bits(&s->gb, 16) != 4)
  975. return -1;
  976. s->restart_interval = get_bits(&s->gb, 16);
  977. s->restart_count = 0;
  978. av_log(s->avctx, AV_LOG_DEBUG, "restart interval: %d\n", s->restart_interval);
  979. return 0;
  980. }
  981. static int mjpeg_decode_app(MJpegDecodeContext *s)
  982. {
  983. int len, id, i;
  984. len = get_bits(&s->gb, 16);
  985. if (len < 5)
  986. return -1;
  987. if(8*len + get_bits_count(&s->gb) > s->gb.size_in_bits)
  988. return -1;
  989. id = get_bits_long(&s->gb, 32);
  990. id = av_be2ne32(id);
  991. len -= 6;
  992. if(s->avctx->debug & FF_DEBUG_STARTCODE){
  993. av_log(s->avctx, AV_LOG_DEBUG, "APPx %8X\n", id);
  994. }
  995. /* Buggy AVID, it puts EOI only at every 10th frame. */
  996. /* Also, this fourcc is used by non-avid files too, it holds some
  997. information, but it's always present in AVID-created files. */
  998. if (id == AV_RL32("AVI1"))
  999. {
  1000. /* structure:
  1001. 4bytes AVI1
  1002. 1bytes polarity
  1003. 1bytes always zero
  1004. 4bytes field_size
  1005. 4bytes field_size_less_padding
  1006. */
  1007. s->buggy_avid = 1;
  1008. // if (s->first_picture)
  1009. // printf("mjpeg: workarounding buggy AVID\n");
  1010. i = get_bits(&s->gb, 8); len--;
  1011. av_log(s->avctx, AV_LOG_DEBUG, "polarity %d\n", i);
  1012. #if 0
  1013. skip_bits(&s->gb, 8);
  1014. skip_bits(&s->gb, 32);
  1015. skip_bits(&s->gb, 32);
  1016. len -= 10;
  1017. #endif
  1018. // if (s->interlace_polarity)
  1019. // printf("mjpeg: interlace polarity: %d\n", s->interlace_polarity);
  1020. goto out;
  1021. }
  1022. // len -= 2;
  1023. if (id == AV_RL32("JFIF"))
  1024. {
  1025. int t_w, t_h, v1, v2;
  1026. skip_bits(&s->gb, 8); /* the trailing zero-byte */
  1027. v1= get_bits(&s->gb, 8);
  1028. v2= get_bits(&s->gb, 8);
  1029. skip_bits(&s->gb, 8);
  1030. s->avctx->sample_aspect_ratio.num= get_bits(&s->gb, 16);
  1031. s->avctx->sample_aspect_ratio.den= get_bits(&s->gb, 16);
  1032. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1033. av_log(s->avctx, AV_LOG_INFO, "mjpeg: JFIF header found (version: %x.%x) SAR=%d/%d\n",
  1034. v1, v2,
  1035. s->avctx->sample_aspect_ratio.num,
  1036. s->avctx->sample_aspect_ratio.den
  1037. );
  1038. t_w = get_bits(&s->gb, 8);
  1039. t_h = get_bits(&s->gb, 8);
  1040. if (t_w && t_h)
  1041. {
  1042. /* skip thumbnail */
  1043. if (len-10-(t_w*t_h*3) > 0)
  1044. len -= t_w*t_h*3;
  1045. }
  1046. len -= 10;
  1047. goto out;
  1048. }
  1049. if (id == AV_RL32("Adob") && (get_bits(&s->gb, 8) == 'e'))
  1050. {
  1051. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1052. av_log(s->avctx, AV_LOG_INFO, "mjpeg: Adobe header found\n");
  1053. skip_bits(&s->gb, 16); /* version */
  1054. skip_bits(&s->gb, 16); /* flags0 */
  1055. skip_bits(&s->gb, 16); /* flags1 */
  1056. skip_bits(&s->gb, 8); /* transform */
  1057. len -= 7;
  1058. goto out;
  1059. }
  1060. if (id == AV_RL32("LJIF")){
  1061. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1062. av_log(s->avctx, AV_LOG_INFO, "Pegasus lossless jpeg header found\n");
  1063. skip_bits(&s->gb, 16); /* version ? */
  1064. skip_bits(&s->gb, 16); /* unknwon always 0? */
  1065. skip_bits(&s->gb, 16); /* unknwon always 0? */
  1066. skip_bits(&s->gb, 16); /* unknwon always 0? */
  1067. switch( get_bits(&s->gb, 8)){
  1068. case 1:
  1069. s->rgb= 1;
  1070. s->pegasus_rct=0;
  1071. break;
  1072. case 2:
  1073. s->rgb= 1;
  1074. s->pegasus_rct=1;
  1075. break;
  1076. default:
  1077. av_log(s->avctx, AV_LOG_ERROR, "unknown colorspace\n");
  1078. }
  1079. len -= 9;
  1080. goto out;
  1081. }
  1082. /* Apple MJPEG-A */
  1083. if ((s->start_code == APP1) && (len > (0x28 - 8)))
  1084. {
  1085. id = get_bits_long(&s->gb, 32);
  1086. id = av_be2ne32(id);
  1087. len -= 4;
  1088. if (id == AV_RL32("mjpg")) /* Apple MJPEG-A */
  1089. {
  1090. #if 0
  1091. skip_bits(&s->gb, 32); /* field size */
  1092. skip_bits(&s->gb, 32); /* pad field size */
  1093. skip_bits(&s->gb, 32); /* next off */
  1094. skip_bits(&s->gb, 32); /* quant off */
  1095. skip_bits(&s->gb, 32); /* huff off */
  1096. skip_bits(&s->gb, 32); /* image off */
  1097. skip_bits(&s->gb, 32); /* scan off */
  1098. skip_bits(&s->gb, 32); /* data off */
  1099. #endif
  1100. if (s->avctx->debug & FF_DEBUG_PICT_INFO)
  1101. av_log(s->avctx, AV_LOG_INFO, "mjpeg: Apple MJPEG-A header found\n");
  1102. }
  1103. }
  1104. out:
  1105. /* slow but needed for extreme adobe jpegs */
  1106. if (len < 0)
  1107. av_log(s->avctx, AV_LOG_ERROR, "mjpeg: error, decode_app parser read over the end\n");
  1108. while(--len > 0)
  1109. skip_bits(&s->gb, 8);
  1110. return 0;
  1111. }
  1112. static int mjpeg_decode_com(MJpegDecodeContext *s)
  1113. {
  1114. int len = get_bits(&s->gb, 16);
  1115. if (len >= 2 && 8*len - 16 + get_bits_count(&s->gb) <= s->gb.size_in_bits) {
  1116. char *cbuf = av_malloc(len - 1);
  1117. if (cbuf) {
  1118. int i;
  1119. for (i = 0; i < len - 2; i++)
  1120. cbuf[i] = get_bits(&s->gb, 8);
  1121. if (i > 0 && cbuf[i-1] == '\n')
  1122. cbuf[i-1] = 0;
  1123. else
  1124. cbuf[i] = 0;
  1125. if(s->avctx->debug & FF_DEBUG_PICT_INFO)
  1126. av_log(s->avctx, AV_LOG_INFO, "mjpeg comment: '%s'\n", cbuf);
  1127. /* buggy avid, it puts EOI only at every 10th frame */
  1128. if (!strcmp(cbuf, "AVID"))
  1129. {
  1130. s->buggy_avid = 1;
  1131. // if (s->first_picture)
  1132. // printf("mjpeg: workarounding buggy AVID\n");
  1133. }
  1134. else if(!strcmp(cbuf, "CS=ITU601")){
  1135. s->cs_itu601= 1;
  1136. }
  1137. else if((len > 20 && !strncmp(cbuf, "Intel(R) JPEG Library", 21)) ||
  1138. (len > 19 && !strncmp(cbuf, "Metasoft MJPEG Codec", 20))){
  1139. s->flipped = 1;
  1140. }
  1141. av_free(cbuf);
  1142. }
  1143. }
  1144. return 0;
  1145. }
  1146. /* return the 8 bit start code value and update the search
  1147. state. Return -1 if no start code found */
  1148. static int find_marker(const uint8_t **pbuf_ptr, const uint8_t *buf_end)
  1149. {
  1150. const uint8_t *buf_ptr;
  1151. unsigned int v, v2;
  1152. int val;
  1153. int skipped=0;
  1154. buf_ptr = *pbuf_ptr;
  1155. while (buf_ptr < buf_end) {
  1156. v = *buf_ptr++;
  1157. v2 = *buf_ptr;
  1158. if ((v == 0xff) && (v2 >= 0xc0) && (v2 <= 0xfe) && buf_ptr < buf_end) {
  1159. val = *buf_ptr++;
  1160. goto found;
  1161. }
  1162. skipped++;
  1163. }
  1164. val = -1;
  1165. found:
  1166. av_dlog(NULL, "find_marker skipped %d bytes\n", skipped);
  1167. *pbuf_ptr = buf_ptr;
  1168. return val;
  1169. }
  1170. int ff_mjpeg_find_marker(MJpegDecodeContext *s,
  1171. const uint8_t **buf_ptr, const uint8_t *buf_end,
  1172. const uint8_t **unescaped_buf_ptr, int *unescaped_buf_size)
  1173. {
  1174. int start_code;
  1175. start_code = find_marker(buf_ptr, buf_end);
  1176. if ((buf_end - *buf_ptr) > s->buffer_size)
  1177. {
  1178. av_free(s->buffer);
  1179. s->buffer_size = buf_end - *buf_ptr;
  1180. s->buffer = av_malloc(s->buffer_size + FF_INPUT_BUFFER_PADDING_SIZE);
  1181. av_log(s->avctx, AV_LOG_DEBUG, "buffer too small, expanding to %d bytes\n",
  1182. s->buffer_size);
  1183. }
  1184. /* unescape buffer of SOS, use special treatment for JPEG-LS */
  1185. if (start_code == SOS && !s->ls)
  1186. {
  1187. const uint8_t *src = *buf_ptr;
  1188. uint8_t *dst = s->buffer;
  1189. while (src<buf_end)
  1190. {
  1191. uint8_t x = *(src++);
  1192. *(dst++) = x;
  1193. if (s->avctx->codec_id != CODEC_ID_THP)
  1194. {
  1195. if (x == 0xff) {
  1196. while (src < buf_end && x == 0xff)
  1197. x = *(src++);
  1198. if (x >= 0xd0 && x <= 0xd7)
  1199. *(dst++) = x;
  1200. else if (x)
  1201. break;
  1202. }
  1203. }
  1204. }
  1205. *unescaped_buf_ptr = s->buffer;
  1206. *unescaped_buf_size = dst - s->buffer;
  1207. av_log(s->avctx, AV_LOG_DEBUG, "escaping removed %td bytes\n",
  1208. (buf_end - *buf_ptr) - (dst - s->buffer));
  1209. }
  1210. else if(start_code == SOS && s->ls){
  1211. const uint8_t *src = *buf_ptr;
  1212. uint8_t *dst = s->buffer;
  1213. int bit_count = 0;
  1214. int t = 0, b = 0;
  1215. PutBitContext pb;
  1216. s->cur_scan++;
  1217. /* find marker */
  1218. while (src + t < buf_end){
  1219. uint8_t x = src[t++];
  1220. if (x == 0xff){
  1221. while((src + t < buf_end) && x == 0xff)
  1222. x = src[t++];
  1223. if (x & 0x80) {
  1224. t -= 2;
  1225. break;
  1226. }
  1227. }
  1228. }
  1229. bit_count = t * 8;
  1230. init_put_bits(&pb, dst, t);
  1231. /* unescape bitstream */
  1232. while(b < t){
  1233. uint8_t x = src[b++];
  1234. put_bits(&pb, 8, x);
  1235. if(x == 0xFF){
  1236. x = src[b++];
  1237. put_bits(&pb, 7, x);
  1238. bit_count--;
  1239. }
  1240. }
  1241. flush_put_bits(&pb);
  1242. *unescaped_buf_ptr = dst;
  1243. *unescaped_buf_size = (bit_count + 7) >> 3;
  1244. }
  1245. else
  1246. {
  1247. *unescaped_buf_ptr = *buf_ptr;
  1248. *unescaped_buf_size = buf_end - *buf_ptr;
  1249. }
  1250. return start_code;
  1251. }
  1252. int ff_mjpeg_decode_frame(AVCodecContext *avctx,
  1253. void *data, int *data_size,
  1254. AVPacket *avpkt)
  1255. {
  1256. const uint8_t *buf = avpkt->data;
  1257. int buf_size = avpkt->size;
  1258. MJpegDecodeContext *s = avctx->priv_data;
  1259. const uint8_t *buf_end, *buf_ptr;
  1260. const uint8_t *unescaped_buf_ptr;
  1261. int unescaped_buf_size;
  1262. int start_code;
  1263. AVFrame *picture = data;
  1264. s->got_picture = 0; // picture from previous image can not be reused
  1265. buf_ptr = buf;
  1266. buf_end = buf + buf_size;
  1267. while (buf_ptr < buf_end) {
  1268. /* find start next marker */
  1269. start_code = ff_mjpeg_find_marker(s, &buf_ptr, buf_end,
  1270. &unescaped_buf_ptr, &unescaped_buf_size);
  1271. {
  1272. /* EOF */
  1273. if (start_code < 0) {
  1274. goto the_end;
  1275. } else {
  1276. av_log(avctx, AV_LOG_DEBUG, "marker=%x avail_size_in_buf=%td\n", start_code, buf_end - buf_ptr);
  1277. init_get_bits(&s->gb, unescaped_buf_ptr, unescaped_buf_size*8);
  1278. s->start_code = start_code;
  1279. if(s->avctx->debug & FF_DEBUG_STARTCODE){
  1280. av_log(avctx, AV_LOG_DEBUG, "startcode: %X\n", start_code);
  1281. }
  1282. /* process markers */
  1283. if (start_code >= 0xd0 && start_code <= 0xd7) {
  1284. av_log(avctx, AV_LOG_DEBUG, "restart marker: %d\n", start_code&0x0f);
  1285. /* APP fields */
  1286. } else if (start_code >= APP0 && start_code <= APP15) {
  1287. mjpeg_decode_app(s);
  1288. /* Comment */
  1289. } else if (start_code == COM){
  1290. mjpeg_decode_com(s);
  1291. }
  1292. switch(start_code) {
  1293. case SOI:
  1294. s->restart_interval = 0;
  1295. s->restart_count = 0;
  1296. /* nothing to do on SOI */
  1297. break;
  1298. case DQT:
  1299. ff_mjpeg_decode_dqt(s);
  1300. break;
  1301. case DHT:
  1302. if(ff_mjpeg_decode_dht(s) < 0){
  1303. av_log(avctx, AV_LOG_ERROR, "huffman table decode error\n");
  1304. return -1;
  1305. }
  1306. break;
  1307. case SOF0:
  1308. case SOF1:
  1309. s->lossless=0;
  1310. s->ls=0;
  1311. s->progressive=0;
  1312. if (ff_mjpeg_decode_sof(s) < 0)
  1313. return -1;
  1314. break;
  1315. case SOF2:
  1316. s->lossless=0;
  1317. s->ls=0;
  1318. s->progressive=1;
  1319. if (ff_mjpeg_decode_sof(s) < 0)
  1320. return -1;
  1321. break;
  1322. case SOF3:
  1323. s->lossless=1;
  1324. s->ls=0;
  1325. s->progressive=0;
  1326. if (ff_mjpeg_decode_sof(s) < 0)
  1327. return -1;
  1328. break;
  1329. case SOF48:
  1330. s->lossless=1;
  1331. s->ls=1;
  1332. s->progressive=0;
  1333. if (ff_mjpeg_decode_sof(s) < 0)
  1334. return -1;
  1335. break;
  1336. case LSE:
  1337. if (!CONFIG_JPEGLS_DECODER || ff_jpegls_decode_lse(s) < 0)
  1338. return -1;
  1339. break;
  1340. case EOI:
  1341. eoi_parser:
  1342. s->cur_scan = 0;
  1343. if (!s->got_picture) {
  1344. av_log(avctx, AV_LOG_WARNING, "Found EOI before any SOF, ignoring\n");
  1345. break;
  1346. }
  1347. if (s->interlaced) {
  1348. s->bottom_field ^= 1;
  1349. /* if not bottom field, do not output image yet */
  1350. if (s->bottom_field == !s->interlace_polarity)
  1351. break;
  1352. }
  1353. *picture = *s->picture_ptr;
  1354. *data_size = sizeof(AVFrame);
  1355. if(!s->lossless){
  1356. picture->quality= FFMAX3(s->qscale[0], s->qscale[1], s->qscale[2]);
  1357. picture->qstride= 0;
  1358. picture->qscale_table= s->qscale_table;
  1359. memset(picture->qscale_table, picture->quality, (s->width+15)/16);
  1360. if(avctx->debug & FF_DEBUG_QP)
  1361. av_log(avctx, AV_LOG_DEBUG, "QP: %d\n", picture->quality);
  1362. picture->quality*= FF_QP2LAMBDA;
  1363. }
  1364. goto the_end;
  1365. case SOS:
  1366. if (!s->got_picture) {
  1367. av_log(avctx, AV_LOG_WARNING, "Can not process SOS before SOF, skipping\n");
  1368. break;
  1369. }
  1370. if (ff_mjpeg_decode_sos(s, NULL, NULL) < 0 &&
  1371. (avctx->err_recognition & AV_EF_EXPLODE))
  1372. return AVERROR_INVALIDDATA;
  1373. break;
  1374. case DRI:
  1375. mjpeg_decode_dri(s);
  1376. break;
  1377. case SOF5:
  1378. case SOF6:
  1379. case SOF7:
  1380. case SOF9:
  1381. case SOF10:
  1382. case SOF11:
  1383. case SOF13:
  1384. case SOF14:
  1385. case SOF15:
  1386. case JPG:
  1387. av_log(avctx, AV_LOG_ERROR, "mjpeg: unsupported coding type (%x)\n", start_code);
  1388. break;
  1389. // default:
  1390. // printf("mjpeg: unsupported marker (%x)\n", start_code);
  1391. // break;
  1392. }
  1393. /* eof process start code */
  1394. buf_ptr += (get_bits_count(&s->gb)+7)/8;
  1395. av_log(avctx, AV_LOG_DEBUG, "marker parser used %d bytes (%d bits)\n",
  1396. (get_bits_count(&s->gb)+7)/8, get_bits_count(&s->gb));
  1397. }
  1398. }
  1399. }
  1400. if (s->got_picture) {
  1401. av_log(avctx, AV_LOG_WARNING, "EOI missing, emulating\n");
  1402. goto eoi_parser;
  1403. }
  1404. av_log(avctx, AV_LOG_FATAL, "No JPEG data found in image\n");
  1405. return -1;
  1406. the_end:
  1407. av_log(avctx, AV_LOG_DEBUG, "mjpeg decode frame unused %td bytes\n", buf_end - buf_ptr);
  1408. // return buf_end - buf_ptr;
  1409. return buf_ptr - buf;
  1410. }
  1411. av_cold int ff_mjpeg_decode_end(AVCodecContext *avctx)
  1412. {
  1413. MJpegDecodeContext *s = avctx->priv_data;
  1414. int i, j;
  1415. if (s->picture_ptr && s->picture_ptr->data[0])
  1416. avctx->release_buffer(avctx, s->picture_ptr);
  1417. av_free(s->buffer);
  1418. av_free(s->qscale_table);
  1419. av_freep(&s->ljpeg_buffer);
  1420. s->ljpeg_buffer_size=0;
  1421. for(i=0;i<3;i++) {
  1422. for(j=0;j<4;j++)
  1423. free_vlc(&s->vlcs[i][j]);
  1424. }
  1425. for(i=0; i<MAX_COMPONENTS; i++) {
  1426. av_freep(&s->blocks[i]);
  1427. av_freep(&s->last_nnz[i]);
  1428. }
  1429. return 0;
  1430. }
  1431. #define OFFSET(x) offsetof(MJpegDecodeContext, x)
  1432. #define VD AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_DECODING_PARAM
  1433. static const AVOption options[] = {
  1434. { "extern_huff", "Use external huffman table.", OFFSET(extern_huff), AV_OPT_TYPE_INT, { 0 }, 0, 1, VD },
  1435. { NULL },
  1436. };
  1437. static const AVClass mjpegdec_class = {
  1438. .class_name = "MJPEG decoder",
  1439. .item_name = av_default_item_name,
  1440. .option = options,
  1441. .version = LIBAVUTIL_VERSION_INT,
  1442. };
  1443. AVCodec ff_mjpeg_decoder = {
  1444. .name = "mjpeg",
  1445. .type = AVMEDIA_TYPE_VIDEO,
  1446. .id = CODEC_ID_MJPEG,
  1447. .priv_data_size = sizeof(MJpegDecodeContext),
  1448. .init = ff_mjpeg_decode_init,
  1449. .close = ff_mjpeg_decode_end,
  1450. .decode = ff_mjpeg_decode_frame,
  1451. .capabilities = CODEC_CAP_DR1,
  1452. .max_lowres = 3,
  1453. .long_name = NULL_IF_CONFIG_SMALL("MJPEG (Motion JPEG)"),
  1454. .priv_class = &mjpegdec_class,
  1455. };
  1456. AVCodec ff_thp_decoder = {
  1457. .name = "thp",
  1458. .type = AVMEDIA_TYPE_VIDEO,
  1459. .id = CODEC_ID_THP,
  1460. .priv_data_size = sizeof(MJpegDecodeContext),
  1461. .init = ff_mjpeg_decode_init,
  1462. .close = ff_mjpeg_decode_end,
  1463. .decode = ff_mjpeg_decode_frame,
  1464. .capabilities = CODEC_CAP_DR1,
  1465. .max_lowres = 3,
  1466. .long_name = NULL_IF_CONFIG_SMALL("Nintendo Gamecube THP video"),
  1467. };