You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

668 lines
19KB

  1. /*
  2. * H261 decoder
  3. * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at>
  4. * Copyright (c) 2004 Maarten Daniels
  5. *
  6. * This file is part of Libav.
  7. *
  8. * Libav is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU Lesser General Public
  10. * License as published by the Free Software Foundation; either
  11. * version 2.1 of the License, or (at your option) any later version.
  12. *
  13. * Libav is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  16. * Lesser General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU Lesser General Public
  19. * License along with Libav; if not, write to the Free Software
  20. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21. */
  22. /**
  23. * @file
  24. * H.261 decoder.
  25. */
  26. #include "avcodec.h"
  27. #include "mpegvideo.h"
  28. #include "h263.h"
  29. #include "h261.h"
/* Bit-width arguments passed to INIT_VLC_STATIC() and/or get_vlc2() for
 * each of the VLC tables used in this file. */
#define H261_MBA_VLC_BITS 9
#define H261_MTYPE_VLC_BITS 6
#define H261_MV_VLC_BITS 7
#define H261_CBP_VLC_BITS 9
#define TCOEFF_VLC_BITS 9
/* Special values of the decoded MBA symbol: h261_decode_mb() treats 33 as
 * stuffing (read another MBA) and 34 as a start code (end of slice). */
#define MBA_STUFFING 33
#define MBA_STARTCODE 34
/* File-scope VLC tables; they are filled in by h261_decode_init_vlc(). */
static VLC h261_mba_vlc;
static VLC h261_mtype_vlc;
static VLC h261_mv_vlc;
static VLC h261_cbp_vlc;
  41. static av_cold void h261_decode_init_vlc(H261Context *h)
  42. {
  43. static int done = 0;
  44. if (!done) {
  45. done = 1;
  46. INIT_VLC_STATIC(&h261_mba_vlc, H261_MBA_VLC_BITS, 35,
  47. ff_h261_mba_bits, 1, 1,
  48. ff_h261_mba_code, 1, 1, 662);
  49. INIT_VLC_STATIC(&h261_mtype_vlc, H261_MTYPE_VLC_BITS, 10,
  50. ff_h261_mtype_bits, 1, 1,
  51. ff_h261_mtype_code, 1, 1, 80);
  52. INIT_VLC_STATIC(&h261_mv_vlc, H261_MV_VLC_BITS, 17,
  53. &ff_h261_mv_tab[0][1], 2, 1,
  54. &ff_h261_mv_tab[0][0], 2, 1, 144);
  55. INIT_VLC_STATIC(&h261_cbp_vlc, H261_CBP_VLC_BITS, 63,
  56. &ff_h261_cbp_tab[0][1], 2, 1,
  57. &ff_h261_cbp_tab[0][0], 2, 1, 512);
  58. INIT_VLC_RL(ff_h261_rl_tcoeff, 552);
  59. }
  60. }
  61. static av_cold int h261_decode_init(AVCodecContext *avctx)
  62. {
  63. H261Context *h = avctx->priv_data;
  64. MpegEncContext *const s = &h->s;
  65. // set defaults
  66. ff_MPV_decode_defaults(s);
  67. s->avctx = avctx;
  68. s->width = s->avctx->coded_width;
  69. s->height = s->avctx->coded_height;
  70. s->codec_id = s->avctx->codec->id;
  71. s->out_format = FMT_H261;
  72. s->low_delay = 1;
  73. avctx->pix_fmt = AV_PIX_FMT_YUV420P;
  74. s->codec_id = avctx->codec->id;
  75. ff_h261_common_init();
  76. h261_decode_init_vlc(h);
  77. h->gob_start_code_skipped = 0;
  78. return 0;
  79. }
  80. /**
  81. * Decode the group of blocks header or slice header.
  82. * @return <0 if an error occurred
  83. */
  84. static int h261_decode_gob_header(H261Context *h)
  85. {
  86. unsigned int val;
  87. MpegEncContext *const s = &h->s;
  88. if (!h->gob_start_code_skipped) {
  89. /* Check for GOB Start Code */
  90. val = show_bits(&s->gb, 15);
  91. if (val)
  92. return -1;
  93. /* We have a GBSC */
  94. skip_bits(&s->gb, 16);
  95. }
  96. h->gob_start_code_skipped = 0;
  97. h->gob_number = get_bits(&s->gb, 4); /* GN */
  98. s->qscale = get_bits(&s->gb, 5); /* GQUANT */
  99. /* Check if gob_number is valid */
  100. if (s->mb_height == 18) { // CIF
  101. if ((h->gob_number <= 0) || (h->gob_number > 12))
  102. return -1;
  103. } else { // QCIF
  104. if ((h->gob_number != 1) && (h->gob_number != 3) &&
  105. (h->gob_number != 5))
  106. return -1;
  107. }
  108. /* GEI */
  109. while (get_bits1(&s->gb) != 0)
  110. skip_bits(&s->gb, 8);
  111. if (s->qscale == 0) {
  112. av_log(s->avctx, AV_LOG_ERROR, "qscale has forbidden 0 value\n");
  113. if (s->avctx->err_recognition & AV_EF_BITSTREAM)
  114. return -1;
  115. }
  116. /* For the first transmitted macroblock in a GOB, MBA is the absolute
  117. * address. For subsequent macroblocks, MBA is the difference between
  118. * the absolute addresses of the macroblock and the last transmitted
  119. * macroblock. */
  120. h->current_mba = 0;
  121. h->mba_diff = 0;
  122. return 0;
  123. }
  124. /**
  125. * Decode the group of blocks / video packet header.
  126. * @return <0 if no resync found
  127. */
  128. static int h261_resync(H261Context *h)
  129. {
  130. MpegEncContext *const s = &h->s;
  131. int left, ret;
  132. if (h->gob_start_code_skipped) {
  133. ret = h261_decode_gob_header(h);
  134. if (ret >= 0)
  135. return 0;
  136. } else {
  137. if (show_bits(&s->gb, 15) == 0) {
  138. ret = h261_decode_gob_header(h);
  139. if (ret >= 0)
  140. return 0;
  141. }
  142. // OK, it is not where it is supposed to be ...
  143. s->gb = s->last_resync_gb;
  144. align_get_bits(&s->gb);
  145. left = get_bits_left(&s->gb);
  146. for (; left > 15 + 1 + 4 + 5; left -= 8) {
  147. if (show_bits(&s->gb, 15) == 0) {
  148. GetBitContext bak = s->gb;
  149. ret = h261_decode_gob_header(h);
  150. if (ret >= 0)
  151. return 0;
  152. s->gb = bak;
  153. }
  154. skip_bits(&s->gb, 8);
  155. }
  156. }
  157. return -1;
  158. }
  159. /**
  160. * Decode skipped macroblocks.
  161. * @return 0
  162. */
  163. static int h261_decode_mb_skipped(H261Context *h, int mba1, int mba2)
  164. {
  165. MpegEncContext *const s = &h->s;
  166. int i;
  167. s->mb_intra = 0;
  168. for (i = mba1; i < mba2; i++) {
  169. int j, xy;
  170. s->mb_x = ((h->gob_number - 1) % 2) * 11 + i % 11;
  171. s->mb_y = ((h->gob_number - 1) / 2) * 3 + i / 11;
  172. xy = s->mb_x + s->mb_y * s->mb_stride;
  173. ff_init_block_index(s);
  174. ff_update_block_index(s);
  175. for (j = 0; j < 6; j++)
  176. s->block_last_index[j] = -1;
  177. s->mv_dir = MV_DIR_FORWARD;
  178. s->mv_type = MV_TYPE_16X16;
  179. s->current_picture.mb_type[xy] = MB_TYPE_SKIP | MB_TYPE_16x16 | MB_TYPE_L0;
  180. s->mv[0][0][0] = 0;
  181. s->mv[0][0][1] = 0;
  182. s->mb_skipped = 1;
  183. h->mtype &= ~MB_TYPE_H261_FIL;
  184. ff_MPV_decode_mb(s, s->block);
  185. }
  186. return 0;
  187. }
  188. static const int mvmap[17] = {
  189. 0, -1, -2, -3, -4, -5, -6, -7, -8, -9, -10, -11, -12, -13, -14, -15, -16
  190. };
  191. static int decode_mv_component(GetBitContext *gb, int v)
  192. {
  193. int mv_diff = get_vlc2(gb, h261_mv_vlc.table, H261_MV_VLC_BITS, 2);
  194. /* check if mv_diff is valid */
  195. if (mv_diff < 0)
  196. return v;
  197. mv_diff = mvmap[mv_diff];
  198. if (mv_diff && !get_bits1(gb))
  199. mv_diff = -mv_diff;
  200. v += mv_diff;
  201. if (v <= -16)
  202. v += 32;
  203. else if (v >= 16)
  204. v -= 32;
  205. return v;
  206. }
  207. /**
  208. * Decode a macroblock.
  209. * @return <0 if an error occurred
  210. */
  211. static int h261_decode_block(H261Context *h, int16_t *block, int n, int coded)
  212. {
  213. MpegEncContext *const s = &h->s;
  214. int code, level, i, j, run;
  215. RLTable *rl = &ff_h261_rl_tcoeff;
  216. const uint8_t *scan_table;
  217. /* For the variable length encoding there are two code tables, one being
  218. * used for the first transmitted LEVEL in INTER, INTER + MC and
  219. * INTER + MC + FIL blocks, the second for all other LEVELs except the
  220. * first one in INTRA blocks which is fixed length coded with 8 bits.
  221. * NOTE: The two code tables only differ in one VLC so we handle that
  222. * manually. */
  223. scan_table = s->intra_scantable.permutated;
  224. if (s->mb_intra) {
  225. /* DC coef */
  226. level = get_bits(&s->gb, 8);
  227. // 0 (00000000b) and -128 (10000000b) are FORBIDDEN
  228. if ((level & 0x7F) == 0) {
  229. av_log(s->avctx, AV_LOG_ERROR, "illegal dc %d at %d %d\n",
  230. level, s->mb_x, s->mb_y);
  231. return -1;
  232. }
  233. /* The code 1000 0000 is not used, the reconstruction level of 1024
  234. * being coded as 1111 1111. */
  235. if (level == 255)
  236. level = 128;
  237. block[0] = level;
  238. i = 1;
  239. } else if (coded) {
  240. // Run Level Code
  241. // EOB Not possible for first level when cbp is available (that's why the table is different)
  242. // 0 1 1s
  243. // * * 0*
  244. int check = show_bits(&s->gb, 2);
  245. i = 0;
  246. if (check & 0x2) {
  247. skip_bits(&s->gb, 2);
  248. block[0] = (check & 0x1) ? -1 : 1;
  249. i = 1;
  250. }
  251. } else {
  252. i = 0;
  253. }
  254. if (!coded) {
  255. s->block_last_index[n] = i - 1;
  256. return 0;
  257. }
  258. for (;;) {
  259. code = get_vlc2(&s->gb, rl->vlc.table, TCOEFF_VLC_BITS, 2);
  260. if (code < 0) {
  261. av_log(s->avctx, AV_LOG_ERROR, "illegal ac vlc code at %dx%d\n",
  262. s->mb_x, s->mb_y);
  263. return -1;
  264. }
  265. if (code == rl->n) {
  266. /* escape */
  267. /* The remaining combinations of (run, level) are encoded with a
  268. * 20-bit word consisting of 6 bits escape, 6 bits run and 8 bits
  269. * level. */
  270. run = get_bits(&s->gb, 6);
  271. level = get_sbits(&s->gb, 8);
  272. } else if (code == 0) {
  273. break;
  274. } else {
  275. run = rl->table_run[code];
  276. level = rl->table_level[code];
  277. if (get_bits1(&s->gb))
  278. level = -level;
  279. }
  280. i += run;
  281. if (i >= 64) {
  282. av_log(s->avctx, AV_LOG_ERROR, "run overflow at %dx%d\n",
  283. s->mb_x, s->mb_y);
  284. return -1;
  285. }
  286. j = scan_table[i];
  287. block[j] = level;
  288. i++;
  289. }
  290. s->block_last_index[n] = i - 1;
  291. return 0;
  292. }
  293. static int h261_decode_mb(H261Context *h)
  294. {
  295. MpegEncContext *const s = &h->s;
  296. int i, cbp, xy;
  297. cbp = 63;
  298. // Read mba
  299. do {
  300. h->mba_diff = get_vlc2(&s->gb, h261_mba_vlc.table,
  301. H261_MBA_VLC_BITS, 2);
  302. /* Check for slice end */
  303. /* NOTE: GOB can be empty (no MB data) or exist only of MBA_stuffing */
  304. if (h->mba_diff == MBA_STARTCODE) { // start code
  305. h->gob_start_code_skipped = 1;
  306. return SLICE_END;
  307. }
  308. } while (h->mba_diff == MBA_STUFFING); // stuffing
  309. if (h->mba_diff < 0) {
  310. if (get_bits_left(&s->gb) <= 7)
  311. return SLICE_END;
  312. av_log(s->avctx, AV_LOG_ERROR, "illegal mba at %d %d\n", s->mb_x, s->mb_y);
  313. return SLICE_ERROR;
  314. }
  315. h->mba_diff += 1;
  316. h->current_mba += h->mba_diff;
  317. if (h->current_mba > MBA_STUFFING)
  318. return SLICE_ERROR;
  319. s->mb_x = ((h->gob_number - 1) % 2) * 11 + ((h->current_mba - 1) % 11);
  320. s->mb_y = ((h->gob_number - 1) / 2) * 3 + ((h->current_mba - 1) / 11);
  321. xy = s->mb_x + s->mb_y * s->mb_stride;
  322. ff_init_block_index(s);
  323. ff_update_block_index(s);
  324. // Read mtype
  325. h->mtype = get_vlc2(&s->gb, h261_mtype_vlc.table, H261_MTYPE_VLC_BITS, 2);
  326. h->mtype = ff_h261_mtype_map[h->mtype];
  327. // Read mquant
  328. if (IS_QUANT(h->mtype))
  329. ff_set_qscale(s, get_bits(&s->gb, 5));
  330. s->mb_intra = IS_INTRA4x4(h->mtype);
  331. // Read mv
  332. if (IS_16X16(h->mtype)) {
  333. /* Motion vector data is included for all MC macroblocks. MVD is
  334. * obtained from the macroblock vector by subtracting the vector
  335. * of the preceding macroblock. For this calculation the vector
  336. * of the preceding macroblock is regarded as zero in the
  337. * following three situations:
  338. * 1) evaluating MVD for macroblocks 1, 12 and 23;
  339. * 2) evaluating MVD for macroblocks in which MBA does not represent a difference of 1;
  340. * 3) MTYPE of the previous macroblock was not MC. */
  341. if ((h->current_mba == 1) || (h->current_mba == 12) ||
  342. (h->current_mba == 23) || (h->mba_diff != 1)) {
  343. h->current_mv_x = 0;
  344. h->current_mv_y = 0;
  345. }
  346. h->current_mv_x = decode_mv_component(&s->gb, h->current_mv_x);
  347. h->current_mv_y = decode_mv_component(&s->gb, h->current_mv_y);
  348. } else {
  349. h->current_mv_x = 0;
  350. h->current_mv_y = 0;
  351. }
  352. // Read cbp
  353. if (HAS_CBP(h->mtype))
  354. cbp = get_vlc2(&s->gb, h261_cbp_vlc.table, H261_CBP_VLC_BITS, 2) + 1;
  355. if (s->mb_intra) {
  356. s->current_picture.mb_type[xy] = MB_TYPE_INTRA;
  357. goto intra;
  358. }
  359. //set motion vectors
  360. s->mv_dir = MV_DIR_FORWARD;
  361. s->mv_type = MV_TYPE_16X16;
  362. s->current_picture.mb_type[xy] = MB_TYPE_16x16 | MB_TYPE_L0;
  363. s->mv[0][0][0] = h->current_mv_x * 2; // gets divided by 2 in motion compensation
  364. s->mv[0][0][1] = h->current_mv_y * 2;
  365. intra:
  366. /* decode each block */
  367. if (s->mb_intra || HAS_CBP(h->mtype)) {
  368. s->dsp.clear_blocks(s->block[0]);
  369. for (i = 0; i < 6; i++) {
  370. if (h261_decode_block(h, s->block[i], i, cbp & 32) < 0)
  371. return SLICE_ERROR;
  372. cbp += cbp;
  373. }
  374. } else {
  375. for (i = 0; i < 6; i++)
  376. s->block_last_index[i] = -1;
  377. }
  378. ff_MPV_decode_mb(s, s->block);
  379. return SLICE_OK;
  380. }
  381. /**
  382. * Decode the H.261 picture header.
  383. * @return <0 if no startcode found
  384. */
  385. static int h261_decode_picture_header(H261Context *h)
  386. {
  387. MpegEncContext *const s = &h->s;
  388. int format, i;
  389. uint32_t startcode = 0;
  390. for (i = get_bits_left(&s->gb); i > 24; i -= 1) {
  391. startcode = ((startcode << 1) | get_bits(&s->gb, 1)) & 0x000FFFFF;
  392. if (startcode == 0x10)
  393. break;
  394. }
  395. if (startcode != 0x10) {
  396. av_log(s->avctx, AV_LOG_ERROR, "Bad picture start code\n");
  397. return -1;
  398. }
  399. /* temporal reference */
  400. i = get_bits(&s->gb, 5); /* picture timestamp */
  401. if (i < (s->picture_number & 31))
  402. i += 32;
  403. s->picture_number = (s->picture_number & ~31) + i;
  404. s->avctx->time_base = (AVRational) { 1001, 30000 };
  405. s->current_picture.f.pts = s->picture_number;
  406. /* PTYPE starts here */
  407. skip_bits1(&s->gb); /* split screen off */
  408. skip_bits1(&s->gb); /* camera off */
  409. skip_bits1(&s->gb); /* freeze picture release off */
  410. format = get_bits1(&s->gb);
  411. // only 2 formats possible
  412. if (format == 0) { // QCIF
  413. s->width = 176;
  414. s->height = 144;
  415. s->mb_width = 11;
  416. s->mb_height = 9;
  417. } else { // CIF
  418. s->width = 352;
  419. s->height = 288;
  420. s->mb_width = 22;
  421. s->mb_height = 18;
  422. }
  423. s->mb_num = s->mb_width * s->mb_height;
  424. skip_bits1(&s->gb); /* still image mode off */
  425. skip_bits1(&s->gb); /* Reserved */
  426. /* PEI */
  427. while (get_bits1(&s->gb) != 0)
  428. skip_bits(&s->gb, 8);
  429. /* H.261 has no I-frames, but if we pass AV_PICTURE_TYPE_I for the first
  430. * frame, the codec crashes if it does not contain all I-blocks
  431. * (e.g. when a packet is lost). */
  432. s->pict_type = AV_PICTURE_TYPE_P;
  433. h->gob_number = 0;
  434. return 0;
  435. }
  436. static int h261_decode_gob(H261Context *h)
  437. {
  438. MpegEncContext *const s = &h->s;
  439. ff_set_qscale(s, s->qscale);
  440. /* decode mb's */
  441. while (h->current_mba <= MBA_STUFFING) {
  442. int ret;
  443. /* DCT & quantize */
  444. ret = h261_decode_mb(h);
  445. if (ret < 0) {
  446. if (ret == SLICE_END) {
  447. h261_decode_mb_skipped(h, h->current_mba, 33);
  448. return 0;
  449. }
  450. av_log(s->avctx, AV_LOG_ERROR, "Error at MB: %d\n",
  451. s->mb_x + s->mb_y * s->mb_stride);
  452. return -1;
  453. }
  454. h261_decode_mb_skipped(h,
  455. h->current_mba - h->mba_diff,
  456. h->current_mba - 1);
  457. }
  458. return -1;
  459. }
  460. /**
  461. * returns the number of bytes consumed for building the current frame
  462. */
  463. static int get_consumed_bytes(MpegEncContext *s, int buf_size)
  464. {
  465. int pos = get_bits_count(&s->gb) >> 3;
  466. if (pos == 0)
  467. pos = 1; // avoid infinite loops (i doubt that is needed but ...)
  468. if (pos + 10 > buf_size)
  469. pos = buf_size; // oops ;)
  470. return pos;
  471. }
  472. static int h261_decode_frame(AVCodecContext *avctx, void *data,
  473. int *got_frame, AVPacket *avpkt)
  474. {
  475. const uint8_t *buf = avpkt->data;
  476. int buf_size = avpkt->size;
  477. H261Context *h = avctx->priv_data;
  478. MpegEncContext *s = &h->s;
  479. int ret;
  480. AVFrame *pict = data;
  481. av_dlog(avctx, "*****frame %d size=%d\n", avctx->frame_number, buf_size);
  482. av_dlog(avctx, "bytes=%x %x %x %x\n", buf[0], buf[1], buf[2], buf[3]);
  483. s->flags = avctx->flags;
  484. s->flags2 = avctx->flags2;
  485. h->gob_start_code_skipped = 0;
  486. retry:
  487. init_get_bits(&s->gb, buf, buf_size * 8);
  488. if (!s->context_initialized)
  489. // we need the IDCT permutaton for reading a custom matrix
  490. if (ff_MPV_common_init(s) < 0)
  491. return -1;
  492. /* We need to set current_picture_ptr before reading the header,
  493. * otherwise we cannot store anything in there. */
  494. if (s->current_picture_ptr == NULL || s->current_picture_ptr->f.data[0]) {
  495. int i = ff_find_unused_picture(s, 0);
  496. if (i < 0)
  497. return i;
  498. s->current_picture_ptr = &s->picture[i];
  499. }
  500. ret = h261_decode_picture_header(h);
  501. /* skip if the header was thrashed */
  502. if (ret < 0) {
  503. av_log(s->avctx, AV_LOG_ERROR, "header damaged\n");
  504. return -1;
  505. }
  506. if (s->width != avctx->coded_width || s->height != avctx->coded_height) {
  507. ParseContext pc = s->parse_context; // FIXME move this demuxing hack to libavformat
  508. s->parse_context.buffer = 0;
  509. ff_MPV_common_end(s);
  510. s->parse_context = pc;
  511. }
  512. if (!s->context_initialized) {
  513. avcodec_set_dimensions(avctx, s->width, s->height);
  514. goto retry;
  515. }
  516. // for skipping the frame
  517. s->current_picture.f.pict_type = s->pict_type;
  518. s->current_picture.f.key_frame = s->pict_type == AV_PICTURE_TYPE_I;
  519. if ((avctx->skip_frame >= AVDISCARD_NONREF && s->pict_type == AV_PICTURE_TYPE_B) ||
  520. (avctx->skip_frame >= AVDISCARD_NONKEY && s->pict_type != AV_PICTURE_TYPE_I) ||
  521. avctx->skip_frame >= AVDISCARD_ALL)
  522. return get_consumed_bytes(s, buf_size);
  523. if (ff_MPV_frame_start(s, avctx) < 0)
  524. return -1;
  525. ff_mpeg_er_frame_start(s);
  526. /* decode each macroblock */
  527. s->mb_x = 0;
  528. s->mb_y = 0;
  529. while (h->gob_number < (s->mb_height == 18 ? 12 : 5)) {
  530. if (h261_resync(h) < 0)
  531. break;
  532. h261_decode_gob(h);
  533. }
  534. ff_MPV_frame_end(s);
  535. assert(s->current_picture.f.pict_type == s->current_picture_ptr->f.pict_type);
  536. assert(s->current_picture.f.pict_type == s->pict_type);
  537. if ((ret = av_frame_ref(pict, &s->current_picture_ptr->f)) < 0)
  538. return ret;
  539. ff_print_debug_info(s, s->current_picture_ptr);
  540. *got_frame = 1;
  541. return get_consumed_bytes(s, buf_size);
  542. }
  543. static av_cold int h261_decode_end(AVCodecContext *avctx)
  544. {
  545. H261Context *h = avctx->priv_data;
  546. MpegEncContext *s = &h->s;
  547. ff_MPV_common_end(s);
  548. return 0;
  549. }
  550. AVCodec ff_h261_decoder = {
  551. .name = "h261",
  552. .type = AVMEDIA_TYPE_VIDEO,
  553. .id = AV_CODEC_ID_H261,
  554. .priv_data_size = sizeof(H261Context),
  555. .init = h261_decode_init,
  556. .close = h261_decode_end,
  557. .decode = h261_decode_frame,
  558. .capabilities = CODEC_CAP_DR1,
  559. .long_name = NULL_IF_CONFIG_SMALL("H.261"),
  560. };